diff --git "a/wandb/run-20220301_200256-37laivn6/files/wandb-summary.json" "b/wandb/run-20220301_200256-37laivn6/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220301_200256-37laivn6/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.7566, "train/learning_rate": 9.94e-05, "train/epoch": 0.56, "train/global_step": 500, "_runtime": 3828, "_timestamp": 1646168804, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [2.0, 31.0, 936.0, 48.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-41.180171966552734, -24.95094108581543, -8.721710205078125, 7.507518768310547, 23.736751556396484, 39.96598434448242, 56.19520950317383, 72.4244384765625, 88.65367126464844, 104.88290405273438, 121.11213684082031, 137.34136962890625, 153.57058715820312, 169.79983520507812, 186.029052734375, 202.25828552246094, 218.48751831054688, 234.7167510986328, 250.94598388671875, 267.1752014160156, 283.4044494628906, 299.6336669921875, 315.8629150390625, 332.0921325683594, 348.3213806152344, 364.55059814453125, 380.77984619140625, 397.0090637207031, 413.2383117675781, 429.467529296875, 445.69677734375, 461.9259948730469, 478.1552734375, 494.3844909667969, 510.6137390136719, 526.8429565429688, 543.0722045898438, 559.3014526367188, 575.5306396484375, 591.7598876953125, 607.9891357421875, 624.2183837890625, 640.4475708007812, 656.6768188476562, 672.9060668945312, 689.1353149414062, 705.364501953125, 721.59375, 737.822998046875, 754.05224609375, 770.2814331054688, 786.5106811523438, 802.7399291992188, 818.9691772460938, 835.1983642578125, 851.4276123046875, 867.6567993164062, 883.8860473632812, 900.115234375, 916.344482421875, 932.57373046875, 948.802978515625, 965.0321655273438, 981.2614135742188, 997.4906616210938]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 9.0, 8.0, 5.0, 17.0, 15.0, 17.0, 15.0, 10.0, 23.0, 24.0, 35.0, 34.0, 28.0, 37.0, 36.0, 42.0, 45.0, 56.0, 52.0, 41.0, 38.0, 42.0, 30.0, 45.0, 36.0, 26.0, 37.0, 28.0, 25.0, 30.0, 21.0, 15.0, 14.0, 20.0, 7.0, 7.0, 9.0, 6.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-68.49124145507812, -66.12571716308594, -63.76018524169922, -61.394657135009766, -59.02912902832031, -56.66360092163086, -54.298072814941406, -51.93254470825195, -49.5670166015625, -47.20148849487305, -44.835960388183594, -42.47043228149414, -40.10490417480469, -37.739376068115234, -35.37384796142578, -33.00831985473633, -30.642791748046875, -28.277263641357422, -25.91173553466797, -23.546207427978516, -21.180679321289062, -18.81515121459961, -16.449623107910156, -14.084095001220703, -11.71856689453125, -9.353038787841797, -6.987510681152344, -4.621982574462891, -2.2564544677734375, 0.10907363891601562, 2.4746017456054688, 4.840129852294922, 7.205650329589844, 9.571178436279297, 11.93670654296875, 14.302234649658203, 16.667762756347656, 19.03329086303711, 21.398818969726562, 23.764347076416016, 26.12987518310547, 28.495403289794922, 30.860931396484375, 33.22645950317383, 35.59198760986328, 37.957515716552734, 40.32304382324219, 42.68857192993164, 45.054100036621094, 47.41962814331055, 49.78515625, 52.15068435668945, 54.516212463378906, 56.88174057006836, 59.24726867675781, 61.612796783447266, 63.97832489013672, 66.34385681152344, 68.70938110351562, 71.07490539550781, 73.44043731689453, 75.80596923828125, 78.17149353027344, 80.53701782226562, 82.90254974365234]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 12.0, 16.0, 28.0, 27.0, 33.0, 47.0, 49.0, 52.0, 57.0, 71.0, 80.0, 75.0, 64.0, 62.0, 56.0, 48.0, 42.0, 52.0, 32.0, 33.0, 26.0, 11.0, 11.0, 6.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.78125, -2.6304931640625, -2.479736328125, -2.3289794921875, -2.17822265625, -2.0274658203125, -1.876708984375, -1.7259521484375, -1.5751953125, -1.4244384765625, -1.273681640625, -1.1229248046875, -0.97216796875, -0.8214111328125, -0.670654296875, -0.5198974609375, -0.369140625, -0.2183837890625, -0.067626953125, 0.0831298828125, 0.23388671875, 0.3846435546875, 0.535400390625, 0.6861572265625, 0.8369140625, 0.9876708984375, 1.138427734375, 1.2891845703125, 1.43994140625, 1.5906982421875, 1.741455078125, 1.8922119140625, 2.04296875, 2.1937255859375, 2.344482421875, 2.4952392578125, 2.64599609375, 2.7967529296875, 2.947509765625, 3.0982666015625, 3.2490234375, 3.3997802734375, 3.550537109375, 3.7012939453125, 3.85205078125, 4.0028076171875, 4.153564453125, 4.3043212890625, 4.455078125, 4.6058349609375, 4.756591796875, 4.9073486328125, 5.05810546875, 5.2088623046875, 5.359619140625, 5.5103759765625, 5.6611328125, 5.8118896484375, 5.962646484375, 6.1134033203125, 6.26416015625, 6.4149169921875, 6.565673828125, 6.7164306640625, 6.8671875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 3.0, 12.0, 24.0, 32.0, 51.0, 76.0, 121.0, 217.0, 350.0, 639.0, 1309.0, 3095.0, 9903.0, 73261.0, 3377109.0, 690712.0, 27187.0, 5746.0, 2129.0, 1003.0, 540.0, 273.0, 178.0, 111.0, 70.0, 44.0, 26.0, 20.0, 9.0, 8.0, 2.0, 10.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.3203125, -13.5584716796875, -12.796630859375, -12.0347900390625, -11.27294921875, -10.5111083984375, -9.749267578125, -8.9874267578125, -8.2255859375, -7.4637451171875, -6.701904296875, -5.9400634765625, -5.17822265625, -4.4163818359375, -3.654541015625, -2.8927001953125, -2.130859375, -1.3690185546875, -0.607177734375, 0.1546630859375, 0.91650390625, 1.6783447265625, 2.440185546875, 3.2020263671875, 3.9638671875, 4.7257080078125, 5.487548828125, 6.2493896484375, 7.01123046875, 7.7730712890625, 8.534912109375, 9.2967529296875, 10.05859375, 10.8204345703125, 11.582275390625, 12.3441162109375, 13.10595703125, 13.8677978515625, 14.629638671875, 15.3914794921875, 16.1533203125, 16.9151611328125, 17.677001953125, 18.4388427734375, 19.20068359375, 19.9625244140625, 20.724365234375, 21.4862060546875, 22.248046875, 23.0098876953125, 23.771728515625, 24.5335693359375, 25.29541015625, 26.0572509765625, 26.819091796875, 27.5809326171875, 28.3427734375, 29.1046142578125, 29.866455078125, 30.6282958984375, 31.39013671875, 32.1519775390625, 32.913818359375, 33.6756591796875, 34.4375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 7.0, 6.0, 14.0, 24.0, 32.0, 37.0, 80.0, 114.0, 156.0, 287.0, 388.0, 630.0, 652.0, 488.0, 367.0, 234.0, 176.0, 112.0, 74.0, 67.0, 39.0, 25.0, 26.0, 7.0, 7.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.765625, -14.3076171875, -13.849609375, -13.3916015625, -12.93359375, -12.4755859375, -12.017578125, -11.5595703125, -11.1015625, -10.6435546875, -10.185546875, -9.7275390625, -9.26953125, -8.8115234375, -8.353515625, -7.8955078125, -7.4375, -6.9794921875, -6.521484375, -6.0634765625, -5.60546875, -5.1474609375, -4.689453125, -4.2314453125, -3.7734375, -3.3154296875, -2.857421875, -2.3994140625, -1.94140625, -1.4833984375, -1.025390625, -0.5673828125, -0.109375, 0.3486328125, 0.806640625, 1.2646484375, 1.72265625, 2.1806640625, 2.638671875, 3.0966796875, 3.5546875, 4.0126953125, 4.470703125, 4.9287109375, 5.38671875, 5.8447265625, 6.302734375, 6.7607421875, 7.21875, 7.6767578125, 8.134765625, 8.5927734375, 9.05078125, 9.5087890625, 9.966796875, 10.4248046875, 10.8828125, 11.3408203125, 11.798828125, 12.2568359375, 12.71484375, 13.1728515625, 13.630859375, 14.0888671875, 14.546875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 9.0, 11.0, 16.0, 25.0, 22.0, 38.0, 69.0, 90.0, 157.0, 256.0, 463.0, 1023.0, 2482.0, 21506.0, 3101100.0, 1051592.0, 11205.0, 1998.0, 875.0, 503.0, 293.0, 179.0, 129.0, 79.0, 54.0, 29.0, 18.0, 15.0, 8.0, 8.0, 8.0, 4.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.5625, -47.08642578125, -45.6103515625, -44.13427734375, -42.658203125, -41.18212890625, -39.7060546875, -38.22998046875, -36.75390625, -35.27783203125, -33.8017578125, -32.32568359375, -30.849609375, -29.37353515625, -27.8974609375, -26.42138671875, -24.9453125, -23.46923828125, -21.9931640625, -20.51708984375, -19.041015625, -17.56494140625, -16.0888671875, -14.61279296875, -13.13671875, -11.66064453125, -10.1845703125, -8.70849609375, -7.232421875, -5.75634765625, -4.2802734375, -2.80419921875, -1.328125, 0.14794921875, 1.6240234375, 3.10009765625, 4.576171875, 6.05224609375, 7.5283203125, 9.00439453125, 10.48046875, 11.95654296875, 13.4326171875, 14.90869140625, 16.384765625, 17.86083984375, 19.3369140625, 20.81298828125, 22.2890625, 23.76513671875, 25.2412109375, 26.71728515625, 28.193359375, 29.66943359375, 31.1455078125, 32.62158203125, 34.09765625, 35.57373046875, 37.0498046875, 38.52587890625, 40.001953125, 41.47802734375, 42.9541015625, 44.43017578125, 45.90625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 292.0, 667.0, 51.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-501.14373779296875, -491.712890625, -482.28204345703125, -472.8511962890625, -463.42034912109375, -453.989501953125, -444.55865478515625, -435.1278076171875, -425.69696044921875, -416.26611328125, -406.83526611328125, -397.4044189453125, -387.97357177734375, -378.542724609375, -369.11187744140625, -359.6810302734375, -350.25018310546875, -340.8193359375, -331.38848876953125, -321.9576416015625, -312.52679443359375, -303.095947265625, -293.66510009765625, -284.2342529296875, -274.8034362792969, -265.3725891113281, -255.94174194335938, -246.51089477539062, -237.08004760742188, -227.64920043945312, -218.21835327148438, -208.78750610351562, -199.35665893554688, -189.92581176757812, -180.49496459960938, -171.06411743164062, -161.63327026367188, -152.20242309570312, -142.77157592773438, -133.34072875976562, -123.90989685058594, -114.47904968261719, -105.04820251464844, -95.61735534667969, -86.18650817871094, -76.75566101074219, -67.32482147216797, -57.89397430419922, -48.46312713623047, -39.03227996826172, -29.6014347076416, -20.170589447021484, -10.739742279052734, -1.3088951110839844, 8.1219482421875, 17.55279541015625, 26.983642578125, 36.41448974609375, 45.8453369140625, 55.276180267333984, 64.70703125, 74.13787841796875, 83.56871795654297, 92.99956512451172, 102.43041229248047]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 14.0, 5.0, 5.0, 14.0, 19.0, 13.0, 23.0, 26.0, 38.0, 32.0, 45.0, 38.0, 37.0, 43.0, 54.0, 50.0, 61.0, 44.0, 67.0, 48.0, 32.0, 45.0, 42.0, 36.0, 40.0, 24.0, 18.0, 19.0, 28.0, 11.0, 8.0, 8.0, 6.0, 8.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-69.6297607421875, -67.7975082397461, -65.96524810791016, -64.13299560546875, -62.30073928833008, -60.46848678588867, -58.63623046875, -56.803977966308594, -54.97172164916992, -53.13946533203125, -51.307212829589844, -49.47495651245117, -47.6427001953125, -45.810447692871094, -43.97819137573242, -42.14593505859375, -40.313682556152344, -38.48142623901367, -36.649173736572266, -34.816917419433594, -32.98466110229492, -31.152408599853516, -29.320152282714844, -27.487897872924805, -25.6556396484375, -23.82338523864746, -21.99112892150879, -20.15887451171875, -18.32662010192871, -16.494365692138672, -14.662109375, -12.829854965209961, -10.997600555419922, -9.165345191955566, -7.333090782165527, -5.500835418701172, -3.6685805320739746, -1.8363256454467773, -0.004070281982421875, 1.8281841278076172, 3.6604394912719727, 5.49269437789917, 7.324949264526367, 9.157204627990723, 10.989459991455078, 12.821714401245117, 14.653969764709473, 16.486225128173828, 18.318479537963867, 20.150733947753906, 21.982990264892578, 23.815244674682617, 25.647499084472656, 27.479755401611328, 29.312009811401367, 31.144264221191406, 32.97652053833008, 34.80877685546875, 36.641029357910156, 38.47328567504883, 40.3055419921875, 42.137794494628906, 43.97005081176758, 45.80230712890625, 47.634559631347656]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 3.0, 1.0, 4.0, 8.0, 7.0, 7.0, 12.0, 24.0, 22.0, 25.0, 29.0, 26.0, 36.0, 46.0, 28.0, 41.0, 41.0, 53.0, 60.0, 63.0, 41.0, 34.0, 47.0, 46.0, 40.0, 47.0, 34.0, 27.0, 24.0, 30.0, 24.0, 19.0, 14.0, 9.0, 11.0, 4.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1328125, -3.01934814453125, -2.9058837890625, -2.79241943359375, -2.678955078125, -2.56549072265625, -2.4520263671875, -2.33856201171875, -2.22509765625, -2.11163330078125, -1.9981689453125, -1.88470458984375, -1.771240234375, -1.65777587890625, -1.5443115234375, -1.43084716796875, -1.3173828125, -1.20391845703125, -1.0904541015625, -0.97698974609375, -0.863525390625, -0.75006103515625, -0.6365966796875, -0.52313232421875, -0.40966796875, -0.29620361328125, -0.1827392578125, -0.06927490234375, 0.044189453125, 0.15765380859375, 0.2711181640625, 0.38458251953125, 0.498046875, 0.61151123046875, 0.7249755859375, 0.83843994140625, 0.951904296875, 1.06536865234375, 1.1788330078125, 1.29229736328125, 1.40576171875, 1.51922607421875, 1.6326904296875, 1.74615478515625, 1.859619140625, 1.97308349609375, 2.0865478515625, 2.20001220703125, 2.3134765625, 2.42694091796875, 2.5404052734375, 2.65386962890625, 2.767333984375, 2.88079833984375, 2.9942626953125, 3.10772705078125, 3.22119140625, 3.33465576171875, 3.4481201171875, 3.56158447265625, 3.675048828125, 3.78851318359375, 3.9019775390625, 4.01544189453125, 4.12890625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 5.0, 13.0, 17.0, 24.0, 57.0, 59.0, 94.0, 170.0, 235.0, 423.0, 695.0, 1180.0, 2001.0, 3514.0, 6137.0, 10986.0, 19304.0, 34704.0, 63973.0, 129890.0, 307578.0, 242847.0, 103923.0, 53137.0, 29461.0, 16333.0, 9309.0, 5193.0, 2973.0, 1754.0, 1013.0, 580.0, 377.0, 202.0, 129.0, 95.0, 53.0, 38.0, 24.0, 22.0, 10.0, 8.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1671142578125, -0.16217803955078125, -0.1572418212890625, -0.15230560302734375, -0.147369384765625, -0.14243316650390625, -0.1374969482421875, -0.13256072998046875, -0.12762451171875, -0.12268829345703125, -0.1177520751953125, -0.11281585693359375, -0.107879638671875, -0.10294342041015625, -0.0980072021484375, -0.09307098388671875, -0.088134765625, -0.08319854736328125, -0.0782623291015625, -0.07332611083984375, -0.068389892578125, -0.06345367431640625, -0.0585174560546875, -0.05358123779296875, -0.04864501953125, -0.04370880126953125, -0.0387725830078125, -0.03383636474609375, -0.028900146484375, -0.02396392822265625, -0.0190277099609375, -0.01409149169921875, -0.0091552734375, -0.00421905517578125, 0.0007171630859375, 0.00565338134765625, 0.010589599609375, 0.01552581787109375, 0.0204620361328125, 0.02539825439453125, 0.03033447265625, 0.03527069091796875, 0.0402069091796875, 0.04514312744140625, 0.050079345703125, 0.05501556396484375, 0.0599517822265625, 0.06488800048828125, 0.06982421875, 0.07476043701171875, 0.0796966552734375, 0.08463287353515625, 0.089569091796875, 0.09450531005859375, 0.0994415283203125, 0.10437774658203125, 0.10931396484375, 0.11425018310546875, 0.1191864013671875, 0.12412261962890625, 0.129058837890625, 0.13399505615234375, 0.1389312744140625, 0.14386749267578125, 0.1488037109375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 7.0, 7.0, 10.0, 3.0, 11.0, 13.0, 13.0, 8.0, 17.0, 25.0, 29.0, 27.0, 31.0, 31.0, 34.0, 26.0, 31.0, 44.0, 44.0, 47.0, 1071.0, 46.0, 39.0, 34.0, 44.0, 51.0, 26.0, 24.0, 45.0, 26.0, 28.0, 24.0, 20.0, 18.0, 10.0, 11.0, 6.0, 9.0, 7.0, 5.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.109375, -2.04718017578125, -1.9849853515625, -1.92279052734375, -1.860595703125, -1.79840087890625, -1.7362060546875, -1.67401123046875, -1.61181640625, -1.54962158203125, -1.4874267578125, -1.42523193359375, -1.363037109375, -1.30084228515625, -1.2386474609375, -1.17645263671875, -1.1142578125, -1.05206298828125, -0.9898681640625, -0.92767333984375, -0.865478515625, -0.80328369140625, -0.7410888671875, -0.67889404296875, -0.61669921875, -0.55450439453125, -0.4923095703125, -0.43011474609375, -0.367919921875, -0.30572509765625, -0.2435302734375, -0.18133544921875, -0.119140625, -0.05694580078125, 0.0052490234375, 0.06744384765625, 0.129638671875, 0.19183349609375, 0.2540283203125, 0.31622314453125, 0.37841796875, 0.44061279296875, 0.5028076171875, 0.56500244140625, 0.627197265625, 0.68939208984375, 0.7515869140625, 0.81378173828125, 0.8759765625, 0.93817138671875, 1.0003662109375, 1.06256103515625, 1.124755859375, 1.18695068359375, 1.2491455078125, 1.31134033203125, 1.37353515625, 1.43572998046875, 1.4979248046875, 1.56011962890625, 1.622314453125, 1.68450927734375, 1.7467041015625, 1.80889892578125, 1.87109375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 10.0, 7.0, 9.0, 10.0, 23.0, 34.0, 48.0, 70.0, 127.0, 143.0, 226.0, 327.0, 487.0, 722.0, 1117.0, 1586.0, 2508.0, 3655.0, 5628.0, 8704.0, 14379.0, 23091.0, 38856.0, 68197.0, 139077.0, 1338477.0, 218588.0, 97789.0, 52251.0, 30376.0, 18444.0, 11461.0, 7106.0, 4522.0, 3011.0, 2015.0, 1293.0, 899.0, 601.0, 399.0, 276.0, 182.0, 145.0, 79.0, 54.0, 42.0, 27.0, 23.0, 17.0, 10.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12225341796875, -0.11840534210205078, -0.11455726623535156, -0.11070919036865234, -0.10686111450195312, -0.1030130386352539, -0.09916496276855469, -0.09531688690185547, -0.09146881103515625, -0.08762073516845703, -0.08377265930175781, -0.0799245834350586, -0.07607650756835938, -0.07222843170166016, -0.06838035583496094, -0.06453227996826172, -0.0606842041015625, -0.05683612823486328, -0.05298805236816406, -0.049139976501464844, -0.045291900634765625, -0.041443824768066406, -0.03759574890136719, -0.03374767303466797, -0.02989959716796875, -0.02605152130126953, -0.022203445434570312, -0.018355369567871094, -0.014507293701171875, -0.010659217834472656, -0.0068111419677734375, -0.0029630661010742188, 0.000885009765625, 0.004733085632324219, 0.008581161499023438, 0.012429237365722656, 0.016277313232421875, 0.020125389099121094, 0.023973464965820312, 0.02782154083251953, 0.03166961669921875, 0.03551769256591797, 0.03936576843261719, 0.043213844299316406, 0.047061920166015625, 0.050909996032714844, 0.05475807189941406, 0.05860614776611328, 0.0624542236328125, 0.06630229949951172, 0.07015037536621094, 0.07399845123291016, 0.07784652709960938, 0.0816946029663086, 0.08554267883300781, 0.08939075469970703, 0.09323883056640625, 0.09708690643310547, 0.10093498229980469, 0.1047830581665039, 0.10863113403320312, 0.11247920989990234, 0.11632728576660156, 0.12017536163330078, 0.1240234375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 7.0, 8.0, 9.0, 17.0, 28.0, 14.0, 19.0, 19.0, 38.0, 40.0, 41.0, 48.0, 47.0, 54.0, 64.0, 61.0, 52.0, 52.0, 45.0, 40.0, 43.0, 38.0, 35.0, 31.0, 24.0, 17.0, 23.0, 12.0, 15.0, 10.0, 8.0, 7.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.996755599975586e-05, -1.931656152009964e-05, -1.866556704044342e-05, -1.80145725607872e-05, -1.736357808113098e-05, -1.6712583601474762e-05, -1.6061589121818542e-05, -1.5410594642162323e-05, -1.4759600162506104e-05, -1.4108605682849884e-05, -1.3457611203193665e-05, -1.2806616723537445e-05, -1.2155622243881226e-05, -1.1504627764225006e-05, -1.0853633284568787e-05, -1.0202638804912567e-05, -9.551644325256348e-06, -8.900649845600128e-06, -8.249655365943909e-06, -7.598660886287689e-06, -6.94766640663147e-06, -6.29667192697525e-06, -5.645677447319031e-06, -4.994682967662811e-06, -4.343688488006592e-06, -3.6926940083503723e-06, -3.041699528694153e-06, -2.3907050490379333e-06, -1.7397105693817139e-06, -1.0887160897254944e-06, -4.377216100692749e-07, 2.1327286958694458e-07, 8.642673492431641e-07, 1.5152618288993835e-06, 2.166256308555603e-06, 2.8172507882118225e-06, 3.468245267868042e-06, 4.1192397475242615e-06, 4.770234227180481e-06, 5.4212287068367004e-06, 6.07222318649292e-06, 6.723217666149139e-06, 7.374212145805359e-06, 8.025206625461578e-06, 8.676201105117798e-06, 9.327195584774017e-06, 9.978190064430237e-06, 1.0629184544086456e-05, 1.1280179023742676e-05, 1.1931173503398895e-05, 1.2582167983055115e-05, 1.3233162462711334e-05, 1.3884156942367554e-05, 1.4535151422023773e-05, 1.5186145901679993e-05, 1.5837140381336212e-05, 1.648813486099243e-05, 1.713912934064865e-05, 1.779012382030487e-05, 1.844111829996109e-05, 1.909211277961731e-05, 1.974310725927353e-05, 2.039410173892975e-05, 2.1045096218585968e-05, 2.1696090698242188e-05]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 9.0, 5.0, 3.0, 9.0, 17.0, 10.0, 16.0, 25.0, 36.0, 29.0, 48.0, 53.0, 59.0, 71.0, 93.0, 141.0, 121.0, 168.0, 233.0, 362.0, 704.0, 57522.0, 985559.0, 1522.0, 442.0, 269.0, 180.0, 158.0, 148.0, 114.0, 70.0, 54.0, 81.0, 37.0, 30.0, 29.0, 32.0, 25.0, 18.0, 9.0, 10.0, 5.0, 8.0, 8.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0], "bins": [-0.0003745555877685547, -0.0003632791340351105, -0.00035200268030166626, -0.00034072622656822205, -0.00032944977283477783, -0.0003181733191013336, -0.0003068968653678894, -0.0002956204116344452, -0.000284343957901001, -0.00027306750416755676, -0.00026179105043411255, -0.00025051459670066833, -0.00023923814296722412, -0.0002279616892337799, -0.0002166852355003357, -0.00020540878176689148, -0.00019413232803344727, -0.00018285587430000305, -0.00017157942056655884, -0.00016030296683311462, -0.0001490265130996704, -0.0001377500593662262, -0.00012647360563278198, -0.00011519715189933777, -0.00010392069816589355, -9.264424443244934e-05, -8.136779069900513e-05, -7.009133696556091e-05, -5.88148832321167e-05, -4.7538429498672485e-05, -3.626197576522827e-05, -2.4985522031784058e-05, -1.3709068298339844e-05, -2.43261456489563e-06, 8.843839168548584e-06, 2.0120292901992798e-05, 3.139674663543701e-05, 4.2673200368881226e-05, 5.394965410232544e-05, 6.522610783576965e-05, 7.650256156921387e-05, 8.777901530265808e-05, 9.90554690361023e-05, 0.00011033192276954651, 0.00012160837650299072, 0.00013288483023643494, 0.00014416128396987915, 0.00015543773770332336, 0.00016671419143676758, 0.0001779906451702118, 0.000189267098903656, 0.00020054355263710022, 0.00021182000637054443, 0.00022309646010398865, 0.00023437291383743286, 0.0002456493675708771, 0.0002569258213043213, 0.0002682022750377655, 0.0002794787287712097, 0.00029075518250465393, 0.00030203163623809814, 0.00031330808997154236, 0.00032458454370498657, 0.0003358609974384308, 0.000347137451171875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 35.0, 408.0, 507.0, 60.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.825990981771611e-05, -4.6654891775688156e-05, -4.5049873733660206e-05, -4.344485205365345e-05, -4.18398340116255e-05, -4.023481596959755e-05, -3.86297979275696e-05, -3.702477988554165e-05, -3.541975820553489e-05, -3.381474016350694e-05, -3.220972212147899e-05, -3.060470044147223e-05, -2.8999682399444282e-05, -2.7394664357416332e-05, -2.578964631538838e-05, -2.4184626454371028e-05, -2.2579608412343077e-05, -2.0974590370315127e-05, -1.9369570509297773e-05, -1.7764552467269823e-05, -1.615953260625247e-05, -1.4554514564224519e-05, -1.2949495612701867e-05, -1.1344476661179215e-05, -9.739457709656563e-06, -8.13443875813391e-06, -6.5294198066112585e-06, -4.924401309835957e-06, -3.3193823583133053e-06, -1.7143638615380041e-06, -1.0934491001535207e-07, 1.4956740415073e-06, 3.100692993029952e-06, 4.705711944552604e-06, 6.310730896075256e-06, 7.915748938103206e-06, 9.52076879912056e-06, 1.112578684114851e-05, 1.2730805792671163e-05, 1.4335824744193815e-05, 1.594084460521117e-05, 1.754586264723912e-05, 1.9150882508256473e-05, 2.0755900550284423e-05, 2.2360920411301777e-05, 2.3965938453329727e-05, 2.5570956495357677e-05, 2.717597635637503e-05, 2.878099439840298e-05, 3.0386012440430932e-05, 3.1991032301448286e-05, 3.3596050343476236e-05, 3.5201068385504186e-05, 3.6806086427532136e-05, 3.8411108107538894e-05, 4.0016126149566844e-05, 4.1621144191594794e-05, 4.3226162233622745e-05, 4.4831180275650695e-05, 4.643620195565745e-05, 4.80412199976854e-05, 4.964623803971335e-05, 5.12512560817413e-05, 5.2856274123769253e-05, 5.446129580377601e-05]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 8.0, 13.0, 3.0, 12.0, 9.0, 19.0, 9.0, 21.0, 17.0, 23.0, 28.0, 22.0, 22.0, 40.0, 32.0, 34.0, 25.0, 33.0, 39.0, 32.0, 44.0, 43.0, 30.0, 50.0, 30.0, 43.0, 27.0, 33.0, 35.0, 21.0, 31.0, 20.0, 28.0, 17.0, 14.0, 21.0, 17.0, 15.0, 10.0, 3.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.138448715209961e-05, -1.1039897799491882e-05, -1.0695308446884155e-05, -1.0350719094276428e-05, -1.0006129741668701e-05, -9.661540389060974e-06, -9.316951036453247e-06, -8.97236168384552e-06, -8.627772331237793e-06, -8.283182978630066e-06, -7.938593626022339e-06, -7.594004273414612e-06, -7.249414920806885e-06, -6.904825568199158e-06, -6.560236215591431e-06, -6.215646862983704e-06, -5.8710575103759766e-06, -5.5264681577682495e-06, -5.1818788051605225e-06, -4.837289452552795e-06, -4.492700099945068e-06, -4.148110747337341e-06, -3.8035213947296143e-06, -3.458932042121887e-06, -3.11434268951416e-06, -2.769753336906433e-06, -2.425163984298706e-06, -2.080574631690979e-06, -1.735985279083252e-06, -1.391395926475525e-06, -1.0468065738677979e-06, -7.022172212600708e-07, -3.5762786865234375e-07, -1.30385160446167e-08, 3.3155083656311035e-07, 6.761401891708374e-07, 1.0207295417785645e-06, 1.3653188943862915e-06, 1.7099082469940186e-06, 2.0544975996017456e-06, 2.3990869522094727e-06, 2.7436763048171997e-06, 3.0882656574249268e-06, 3.432855010032654e-06, 3.777444362640381e-06, 4.122033715248108e-06, 4.466623067855835e-06, 4.811212420463562e-06, 5.155801773071289e-06, 5.500391125679016e-06, 5.844980478286743e-06, 6.18956983089447e-06, 6.534159183502197e-06, 6.878748536109924e-06, 7.223337888717651e-06, 7.567927241325378e-06, 7.912516593933105e-06, 8.257105946540833e-06, 8.60169529914856e-06, 8.946284651756287e-06, 9.290874004364014e-06, 9.63546335697174e-06, 9.980052709579468e-06, 1.0324642062187195e-05, 1.0669231414794922e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 3.0, 1.0, 4.0, 8.0, 7.0, 7.0, 12.0, 24.0, 22.0, 25.0, 29.0, 26.0, 36.0, 46.0, 28.0, 41.0, 41.0, 53.0, 60.0, 63.0, 41.0, 34.0, 47.0, 46.0, 40.0, 47.0, 34.0, 27.0, 24.0, 30.0, 24.0, 19.0, 14.0, 9.0, 11.0, 4.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1328125, -3.01934814453125, -2.9058837890625, -2.79241943359375, -2.678955078125, -2.56549072265625, -2.4520263671875, -2.33856201171875, -2.22509765625, -2.11163330078125, -1.9981689453125, -1.88470458984375, -1.771240234375, -1.65777587890625, -1.5443115234375, -1.43084716796875, -1.3173828125, -1.20391845703125, -1.0904541015625, -0.97698974609375, -0.863525390625, -0.75006103515625, -0.6365966796875, -0.52313232421875, -0.40966796875, -0.29620361328125, -0.1827392578125, -0.06927490234375, 0.044189453125, 0.15765380859375, 0.2711181640625, 0.38458251953125, 0.498046875, 0.61151123046875, 0.7249755859375, 0.83843994140625, 0.951904296875, 1.06536865234375, 1.1788330078125, 1.29229736328125, 1.40576171875, 1.51922607421875, 1.6326904296875, 1.74615478515625, 1.859619140625, 1.97308349609375, 2.0865478515625, 2.20001220703125, 2.3134765625, 2.42694091796875, 2.5404052734375, 2.65386962890625, 2.767333984375, 2.88079833984375, 2.9942626953125, 3.10772705078125, 3.22119140625, 3.33465576171875, 3.4481201171875, 3.56158447265625, 3.675048828125, 3.78851318359375, 3.9019775390625, 4.01544189453125, 4.12890625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 13.0, 22.0, 31.0, 43.0, 58.0, 94.0, 115.0, 167.0, 243.0, 347.0, 514.0, 705.0, 1046.0, 1771.0, 2580.0, 4164.0, 6527.0, 11491.0, 24532.0, 94397.0, 633363.0, 193809.0, 36073.0, 14612.0, 8085.0, 4754.0, 2949.0, 1969.0, 1298.0, 889.0, 623.0, 369.0, 279.0, 184.0, 130.0, 90.0, 59.0, 44.0, 33.0, 29.0, 23.0, 10.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.328125, -11.93896484375, -11.5498046875, -11.16064453125, -10.771484375, -10.38232421875, -9.9931640625, -9.60400390625, -9.21484375, -8.82568359375, -8.4365234375, -8.04736328125, -7.658203125, -7.26904296875, -6.8798828125, -6.49072265625, -6.1015625, -5.71240234375, -5.3232421875, -4.93408203125, -4.544921875, -4.15576171875, -3.7666015625, -3.37744140625, -2.98828125, -2.59912109375, -2.2099609375, -1.82080078125, -1.431640625, -1.04248046875, -0.6533203125, -0.26416015625, 0.125, 0.51416015625, 0.9033203125, 1.29248046875, 1.681640625, 2.07080078125, 2.4599609375, 2.84912109375, 3.23828125, 3.62744140625, 4.0166015625, 4.40576171875, 4.794921875, 5.18408203125, 5.5732421875, 5.96240234375, 6.3515625, 6.74072265625, 7.1298828125, 7.51904296875, 7.908203125, 8.29736328125, 8.6865234375, 9.07568359375, 9.46484375, 9.85400390625, 10.2431640625, 10.63232421875, 11.021484375, 11.41064453125, 11.7998046875, 12.18896484375, 12.578125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 7.0, 8.0, 7.0, 13.0, 13.0, 21.0, 17.0, 8.0, 21.0, 22.0, 31.0, 28.0, 24.0, 27.0, 38.0, 42.0, 55.0, 62.0, 151.0, 1459.0, 382.0, 136.0, 55.0, 51.0, 39.0, 42.0, 25.0, 33.0, 29.0, 29.0, 29.0, 28.0, 18.0, 15.0, 13.0, 12.0, 14.0, 9.0, 11.0, 5.0, 5.0, 5.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.015625, -7.7183837890625, -7.421142578125, -7.1239013671875, -6.82666015625, -6.5294189453125, -6.232177734375, -5.9349365234375, -5.6376953125, -5.3404541015625, -5.043212890625, -4.7459716796875, -4.44873046875, -4.1514892578125, -3.854248046875, -3.5570068359375, -3.259765625, -2.9625244140625, -2.665283203125, -2.3680419921875, -2.07080078125, -1.7735595703125, -1.476318359375, -1.1790771484375, -0.8818359375, -0.5845947265625, -0.287353515625, 0.0098876953125, 0.30712890625, 0.6043701171875, 0.901611328125, 1.1988525390625, 1.49609375, 1.7933349609375, 2.090576171875, 2.3878173828125, 2.68505859375, 2.9822998046875, 3.279541015625, 3.5767822265625, 3.8740234375, 4.1712646484375, 4.468505859375, 4.7657470703125, 5.06298828125, 5.3602294921875, 5.657470703125, 5.9547119140625, 6.251953125, 6.5491943359375, 6.846435546875, 7.1436767578125, 7.44091796875, 7.7381591796875, 8.035400390625, 8.3326416015625, 8.6298828125, 8.9271240234375, 9.224365234375, 9.5216064453125, 9.81884765625, 10.1160888671875, 10.413330078125, 10.7105712890625, 11.0078125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 1.0, 6.0, 5.0, 8.0, 15.0, 9.0, 10.0, 11.0, 12.0, 8.0, 41.0, 17.0, 31.0, 31.0, 36.0, 42.0, 68.0, 118.0, 219.0, 556.0, 5844.0, 3093193.0, 43705.0, 992.0, 243.0, 135.0, 68.0, 46.0, 37.0, 33.0, 29.0, 18.0, 18.0, 14.0, 17.0, 18.0, 12.0, 15.0, 3.0, 5.0, 8.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-51.0625, -49.669921875, -48.27734375, -46.884765625, -45.4921875, -44.099609375, -42.70703125, -41.314453125, -39.921875, -38.529296875, -37.13671875, -35.744140625, -34.3515625, -32.958984375, -31.56640625, -30.173828125, -28.78125, -27.388671875, -25.99609375, -24.603515625, -23.2109375, -21.818359375, -20.42578125, -19.033203125, -17.640625, -16.248046875, -14.85546875, -13.462890625, -12.0703125, -10.677734375, -9.28515625, -7.892578125, -6.5, -5.107421875, -3.71484375, -2.322265625, -0.9296875, 0.462890625, 1.85546875, 3.248046875, 4.640625, 6.033203125, 7.42578125, 8.818359375, 10.2109375, 11.603515625, 12.99609375, 14.388671875, 15.78125, 17.173828125, 18.56640625, 19.958984375, 21.3515625, 22.744140625, 24.13671875, 25.529296875, 26.921875, 28.314453125, 29.70703125, 31.099609375, 32.4921875, 33.884765625, 35.27734375, 36.669921875, 38.0625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 10.0, 45.0, 256.0, 471.0, 194.0, 29.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.984458923339844, -23.45728302001953, -21.930105209350586, -20.402929306030273, -18.87575340270996, -17.348575592041016, -15.821399688720703, -14.29422378540039, -12.767046928405762, -11.239870071411133, -9.71269416809082, -8.185517311096191, -6.658340930938721, -5.13116455078125, -3.603987693786621, -2.0768117904663086, -0.5496349334716797, 0.9775415658950806, 2.504718065261841, 4.031894683837891, 5.559071063995361, 7.086247444152832, 8.613424301147461, 10.140600204467773, 11.667777061462402, 13.194953918457031, 14.722129821777344, 16.249305725097656, 17.7764835357666, 19.303659439086914, 20.83083724975586, 22.358013153076172, 23.885189056396484, 25.412364959716797, 26.939542770385742, 28.466718673706055, 29.993894577026367, 31.521072387695312, 33.048248291015625, 34.57542419433594, 36.10260009765625, 37.62977600097656, 39.156951904296875, 40.68412780761719, 42.211307525634766, 43.73848342895508, 45.26565933227539, 46.7928352355957, 48.32001495361328, 49.847190856933594, 51.374366760253906, 52.90154266357422, 54.4287223815918, 55.95589828491211, 57.48307418823242, 59.010250091552734, 60.53742599487305, 62.06460189819336, 63.59177780151367, 65.11895751953125, 66.64613342285156, 68.17330932617188, 69.70048522949219, 71.2276611328125, 72.75483703613281]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 5.0, 8.0, 12.0, 13.0, 9.0, 16.0, 25.0, 13.0, 13.0, 27.0, 24.0, 30.0, 25.0, 30.0, 26.0, 30.0, 43.0, 35.0, 45.0, 42.0, 39.0, 37.0, 38.0, 27.0, 26.0, 36.0, 32.0, 23.0, 29.0, 24.0, 25.0, 31.0, 18.0, 12.0, 25.0, 11.0, 16.0, 13.0, 10.0, 9.0, 5.0, 4.0, 6.0, 7.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-28.855920791625977, -27.969594955444336, -27.083269119262695, -26.196945190429688, -25.310619354248047, -24.424293518066406, -23.537967681884766, -22.651641845703125, -21.765316009521484, -20.878990173339844, -19.992664337158203, -19.106338500976562, -18.220014572143555, -17.333688735961914, -16.447362899780273, -15.561037063598633, -14.674713134765625, -13.788387298583984, -12.90206241607666, -12.01573657989502, -11.129411697387695, -10.243085861206055, -9.356760025024414, -8.470434188842773, -7.584109306335449, -6.697783946990967, -5.811458587646484, -4.925132751464844, -4.038807392120361, -3.152482032775879, -2.2661561965942383, -1.3798308372497559, -0.49350547790527344, 0.39282000064849854, 1.2791454792022705, 2.165471076965332, 3.0517964363098145, 3.938121795654297, 4.8244476318359375, 5.71077299118042, 6.597098350524902, 7.483423709869385, 8.369749069213867, 9.256074905395508, 10.142400741577148, 11.028725624084473, 11.915051460266113, 12.801376342773438, 13.687702178955078, 14.574028015136719, 15.460352897644043, 16.3466796875, 17.233003616333008, 18.11932945251465, 19.00565528869629, 19.89198112487793, 20.778305053710938, 21.664630889892578, 22.55095672607422, 23.43728256225586, 24.323606491088867, 25.209932327270508, 26.09625816345215, 26.98258399963379, 27.86890983581543]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 8.0, 7.0, 16.0, 7.0, 16.0, 20.0, 24.0, 26.0, 40.0, 31.0, 36.0, 43.0, 38.0, 37.0, 41.0, 58.0, 50.0, 53.0, 39.0, 37.0, 43.0, 42.0, 51.0, 34.0, 29.0, 32.0, 24.0, 26.0, 20.0, 18.0, 7.0, 14.0, 8.0, 6.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.37109375, -3.25457763671875, -3.1380615234375, -3.02154541015625, -2.905029296875, -2.78851318359375, -2.6719970703125, -2.55548095703125, -2.43896484375, -2.32244873046875, -2.2059326171875, -2.08941650390625, -1.972900390625, -1.85638427734375, -1.7398681640625, -1.62335205078125, -1.5068359375, -1.39031982421875, -1.2738037109375, -1.15728759765625, -1.040771484375, -0.92425537109375, -0.8077392578125, -0.69122314453125, -0.57470703125, -0.45819091796875, -0.3416748046875, -0.22515869140625, -0.108642578125, 0.00787353515625, 0.1243896484375, 0.24090576171875, 0.357421875, 0.47393798828125, 0.5904541015625, 0.70697021484375, 0.823486328125, 0.94000244140625, 1.0565185546875, 1.17303466796875, 1.28955078125, 1.40606689453125, 1.5225830078125, 1.63909912109375, 1.755615234375, 1.87213134765625, 1.9886474609375, 2.10516357421875, 2.2216796875, 2.33819580078125, 2.4547119140625, 2.57122802734375, 2.687744140625, 2.80426025390625, 2.9207763671875, 3.03729248046875, 3.15380859375, 3.27032470703125, 3.3868408203125, 3.50335693359375, 3.619873046875, 3.73638916015625, 3.8529052734375, 3.96942138671875, 4.0859375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 12.0, 14.0, 16.0, 23.0, 27.0, 45.0, 68.0, 95.0, 132.0, 182.0, 309.0, 518.0, 1077.0, 2710.0, 10705.0, 69935.0, 1948705.0, 2070589.0, 73329.0, 10596.0, 2770.0, 979.0, 516.0, 317.0, 202.0, 125.0, 76.0, 70.0, 39.0, 27.0, 21.0, 12.0, 8.0, 9.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8046875, -14.1612548828125, -13.517822265625, -12.8743896484375, -12.23095703125, -11.5875244140625, -10.944091796875, -10.3006591796875, -9.6572265625, -9.0137939453125, -8.370361328125, -7.7269287109375, -7.08349609375, -6.4400634765625, -5.796630859375, -5.1531982421875, -4.509765625, -3.8663330078125, -3.222900390625, -2.5794677734375, -1.93603515625, -1.2926025390625, -0.649169921875, -0.0057373046875, 0.6376953125, 1.2811279296875, 1.924560546875, 2.5679931640625, 3.21142578125, 3.8548583984375, 4.498291015625, 5.1417236328125, 5.78515625, 6.4285888671875, 7.072021484375, 7.7154541015625, 8.35888671875, 9.0023193359375, 9.645751953125, 10.2891845703125, 10.9326171875, 11.5760498046875, 12.219482421875, 12.8629150390625, 13.50634765625, 14.1497802734375, 14.793212890625, 15.4366455078125, 16.080078125, 16.7235107421875, 17.366943359375, 18.0103759765625, 18.65380859375, 19.2972412109375, 19.940673828125, 20.5841064453125, 21.2275390625, 21.8709716796875, 22.514404296875, 23.1578369140625, 23.80126953125, 24.4447021484375, 25.088134765625, 25.7315673828125, 26.375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 6.0, 10.0, 21.0, 32.0, 61.0, 91.0, 122.0, 234.0, 350.0, 490.0, 750.0, 683.0, 450.0, 299.0, 171.0, 101.0, 78.0, 48.0, 32.0, 20.0, 8.0, 8.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6796875, -12.1253662109375, -11.571044921875, -11.0167236328125, -10.46240234375, -9.9080810546875, -9.353759765625, -8.7994384765625, -8.2451171875, -7.6907958984375, -7.136474609375, -6.5821533203125, -6.02783203125, -5.4735107421875, -4.919189453125, -4.3648681640625, -3.810546875, -3.2562255859375, -2.701904296875, -2.1475830078125, -1.59326171875, -1.0389404296875, -0.484619140625, 0.0697021484375, 0.6240234375, 1.1783447265625, 1.732666015625, 2.2869873046875, 2.84130859375, 3.3956298828125, 3.949951171875, 4.5042724609375, 5.05859375, 5.6129150390625, 6.167236328125, 6.7215576171875, 7.27587890625, 7.8302001953125, 8.384521484375, 8.9388427734375, 9.4931640625, 10.0474853515625, 10.601806640625, 11.1561279296875, 11.71044921875, 12.2647705078125, 12.819091796875, 13.3734130859375, 13.927734375, 14.4820556640625, 15.036376953125, 15.5906982421875, 16.14501953125, 16.6993408203125, 17.253662109375, 17.8079833984375, 18.3623046875, 18.9166259765625, 19.470947265625, 20.0252685546875, 20.57958984375, 21.1339111328125, 21.688232421875, 22.2425537109375, 22.796875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 5.0, 0.0, 5.0, 7.0, 9.0, 13.0, 12.0, 20.0, 33.0, 36.0, 64.0, 83.0, 121.0, 211.0, 402.0, 1029.0, 4831.0, 103020.0, 3770703.0, 301893.0, 8986.0, 1490.0, 569.0, 277.0, 148.0, 85.0, 65.0, 43.0, 32.0, 28.0, 16.0, 13.0, 8.0, 3.0, 7.0, 8.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.25, -41.9638671875, -40.677734375, -39.3916015625, -38.10546875, -36.8193359375, -35.533203125, -34.2470703125, -32.9609375, -31.6748046875, -30.388671875, -29.1025390625, -27.81640625, -26.5302734375, -25.244140625, -23.9580078125, -22.671875, -21.3857421875, -20.099609375, -18.8134765625, -17.52734375, -16.2412109375, -14.955078125, -13.6689453125, -12.3828125, -11.0966796875, -9.810546875, -8.5244140625, -7.23828125, -5.9521484375, -4.666015625, -3.3798828125, -2.09375, -0.8076171875, 0.478515625, 1.7646484375, 3.05078125, 4.3369140625, 5.623046875, 6.9091796875, 8.1953125, 9.4814453125, 10.767578125, 12.0537109375, 13.33984375, 14.6259765625, 15.912109375, 17.1982421875, 18.484375, 19.7705078125, 21.056640625, 22.3427734375, 23.62890625, 24.9150390625, 26.201171875, 27.4873046875, 28.7734375, 30.0595703125, 31.345703125, 32.6318359375, 33.91796875, 35.2041015625, 36.490234375, 37.7763671875, 39.0625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 17.0, 201.0, 596.0, 180.0, 18.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.39686965942383, -29.84035873413086, -23.28384780883789, -16.72733497619629, -10.17082405090332, -3.6143112182617188, 2.94219970703125, 9.498710632324219, 16.055221557617188, 22.611732482910156, 29.168243408203125, 35.724754333496094, 42.28126525878906, 48.8377799987793, 55.394290924072266, 61.950801849365234, 68.50730895996094, 75.0638198852539, 81.62033081054688, 88.17684173583984, 94.73335266113281, 101.28987121582031, 107.84637451171875, 114.40289306640625, 120.95940399169922, 127.51591491699219, 134.0724334716797, 140.62893676757812, 147.18545532226562, 153.74195861816406, 160.29847717285156, 166.85498046875, 173.41148376464844, 179.96800231933594, 186.52450561523438, 193.08102416992188, 199.6375274658203, 206.1940460205078, 212.75054931640625, 219.30706787109375, 225.8635711669922, 232.4200897216797, 238.97659301757812, 245.53311157226562, 252.08961486816406, 258.6461181640625, 265.20263671875, 271.7591552734375, 278.315673828125, 284.8721923828125, 291.4287109375, 297.9851989746094, 304.5417175292969, 311.0982360839844, 317.6547546386719, 324.21124267578125, 330.76776123046875, 337.32427978515625, 343.88079833984375, 350.4372863769531, 356.9938049316406, 363.5503234863281, 370.1068420410156, 376.663330078125, 383.2198486328125]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 5.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 4.0, 6.0, 14.0, 13.0, 21.0, 25.0, 15.0, 21.0, 20.0, 32.0, 28.0, 28.0, 37.0, 40.0, 40.0, 48.0, 44.0, 54.0, 45.0, 54.0, 35.0, 45.0, 37.0, 39.0, 27.0, 35.0, 19.0, 23.0, 23.0, 13.0, 26.0, 16.0, 12.0, 5.0, 10.0, 8.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.51606750488281, -31.352108001708984, -30.188146591186523, -29.024185180664062, -27.860225677490234, -26.696266174316406, -25.532304763793945, -24.368343353271484, -23.204383850097656, -22.040424346923828, -20.876462936401367, -19.712501525878906, -18.548542022705078, -17.38458251953125, -16.22062110900879, -15.056660652160645, -13.8927001953125, -12.728739738464355, -11.564779281616211, -10.400818824768066, -9.236858367919922, -8.072897911071777, -6.908937454223633, -5.744976997375488, -4.581016540527344, -3.417056083679199, -2.2530956268310547, -1.0891351699829102, 0.07482528686523438, 1.238785743713379, 2.4027462005615234, 3.566706657409668, 4.730663299560547, 5.894623756408691, 7.058584213256836, 8.22254467010498, 9.386505126953125, 10.55046558380127, 11.714426040649414, 12.878386497497559, 14.042346954345703, 15.206307411193848, 16.370267868041992, 17.534229278564453, 18.69818878173828, 19.86214828491211, 21.02610969543457, 22.19007110595703, 23.35403060913086, 24.517990112304688, 25.68195152282715, 26.84591293334961, 28.009872436523438, 29.173831939697266, 30.337793350219727, 31.501754760742188, 32.665714263916016, 33.829673767089844, 34.99363708496094, 36.157596588134766, 37.321556091308594, 38.48551559448242, 39.64947509765625, 40.813438415527344, 41.97739791870117]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 3.0, 6.0, 13.0, 11.0, 25.0, 16.0, 20.0, 23.0, 26.0, 45.0, 22.0, 48.0, 51.0, 44.0, 44.0, 60.0, 58.0, 51.0, 42.0, 36.0, 43.0, 41.0, 40.0, 34.0, 32.0, 35.0, 28.0, 22.0, 14.0, 16.0, 14.0, 11.0, 6.0, 3.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.46875, -3.34417724609375, -3.2196044921875, -3.09503173828125, -2.970458984375, -2.84588623046875, -2.7213134765625, -2.59674072265625, -2.47216796875, -2.34759521484375, -2.2230224609375, -2.09844970703125, -1.973876953125, -1.84930419921875, -1.7247314453125, -1.60015869140625, -1.4755859375, -1.35101318359375, -1.2264404296875, -1.10186767578125, -0.977294921875, -0.85272216796875, -0.7281494140625, -0.60357666015625, -0.47900390625, -0.35443115234375, -0.2298583984375, -0.10528564453125, 0.019287109375, 0.14385986328125, 0.2684326171875, 0.39300537109375, 0.517578125, 0.64215087890625, 0.7667236328125, 0.89129638671875, 1.015869140625, 1.14044189453125, 1.2650146484375, 1.38958740234375, 1.51416015625, 1.63873291015625, 1.7633056640625, 1.88787841796875, 2.012451171875, 2.13702392578125, 2.2615966796875, 2.38616943359375, 2.5107421875, 2.63531494140625, 2.7598876953125, 2.88446044921875, 3.009033203125, 3.13360595703125, 3.2581787109375, 3.38275146484375, 3.50732421875, 3.63189697265625, 3.7564697265625, 3.88104248046875, 4.005615234375, 4.13018798828125, 4.2547607421875, 4.37933349609375, 4.50390625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 6.0, 8.0, 20.0, 15.0, 19.0, 21.0, 52.0, 66.0, 114.0, 133.0, 245.0, 350.0, 556.0, 851.0, 1390.0, 2189.0, 3624.0, 5904.0, 9993.0, 16558.0, 28119.0, 48771.0, 88691.0, 185581.0, 306677.0, 160106.0, 79860.0, 44423.0, 25624.0, 15101.0, 9213.0, 5338.0, 3310.0, 2021.0, 1251.0, 842.0, 518.0, 312.0, 230.0, 133.0, 110.0, 66.0, 29.0, 43.0, 21.0, 15.0, 15.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1529541015625, -0.14837646484375, -0.143798828125, -0.13922119140625, -0.1346435546875, -0.13006591796875, -0.12548828125, -0.12091064453125, -0.1163330078125, -0.11175537109375, -0.107177734375, -0.10260009765625, -0.0980224609375, -0.09344482421875, -0.0888671875, -0.08428955078125, -0.0797119140625, -0.07513427734375, -0.070556640625, -0.06597900390625, -0.0614013671875, -0.05682373046875, -0.05224609375, -0.04766845703125, -0.0430908203125, -0.03851318359375, -0.033935546875, -0.02935791015625, -0.0247802734375, -0.02020263671875, -0.015625, -0.01104736328125, -0.0064697265625, -0.00189208984375, 0.002685546875, 0.00726318359375, 0.0118408203125, 0.01641845703125, 0.02099609375, 0.02557373046875, 0.0301513671875, 0.03472900390625, 0.039306640625, 0.04388427734375, 0.0484619140625, 0.05303955078125, 0.0576171875, 0.06219482421875, 0.0667724609375, 0.07135009765625, 0.075927734375, 0.08050537109375, 0.0850830078125, 0.08966064453125, 0.09423828125, 0.09881591796875, 0.1033935546875, 0.10797119140625, 0.112548828125, 0.11712646484375, 0.1217041015625, 0.12628173828125, 0.130859375, 0.13543701171875, 0.1400146484375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 9.0, 5.0, 10.0, 16.0, 10.0, 15.0, 16.0, 13.0, 20.0, 22.0, 32.0, 20.0, 37.0, 28.0, 34.0, 45.0, 44.0, 54.0, 41.0, 1071.0, 36.0, 38.0, 36.0, 43.0, 37.0, 38.0, 33.0, 26.0, 26.0, 31.0, 19.0, 18.0, 14.0, 13.0, 18.0, 6.0, 14.0, 5.0, 3.0, 7.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.978057861328125, -1.91119384765625, -1.844329833984375, -1.7774658203125, -1.710601806640625, -1.64373779296875, -1.576873779296875, -1.510009765625, -1.443145751953125, -1.37628173828125, -1.309417724609375, -1.2425537109375, -1.175689697265625, -1.10882568359375, -1.041961669921875, -0.97509765625, -0.908233642578125, -0.84136962890625, -0.774505615234375, -0.7076416015625, -0.640777587890625, -0.57391357421875, -0.507049560546875, -0.440185546875, -0.373321533203125, -0.30645751953125, -0.239593505859375, -0.1727294921875, -0.105865478515625, -0.03900146484375, 0.027862548828125, 0.0947265625, 0.161590576171875, 0.22845458984375, 0.295318603515625, 0.3621826171875, 0.429046630859375, 0.49591064453125, 0.562774658203125, 0.629638671875, 0.696502685546875, 0.76336669921875, 0.830230712890625, 0.8970947265625, 0.963958740234375, 1.03082275390625, 1.097686767578125, 1.16455078125, 1.231414794921875, 1.29827880859375, 1.365142822265625, 1.4320068359375, 1.498870849609375, 1.56573486328125, 1.632598876953125, 1.699462890625, 1.766326904296875, 1.83319091796875, 1.900054931640625, 1.9669189453125, 2.033782958984375, 2.10064697265625, 2.167510986328125, 2.234375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 11.0, 12.0, 11.0, 25.0, 36.0, 52.0, 86.0, 108.0, 151.0, 235.0, 348.0, 479.0, 685.0, 1065.0, 1428.0, 2250.0, 3053.0, 4485.0, 6747.0, 9990.0, 15346.0, 23997.0, 38274.0, 65610.0, 124509.0, 1292961.0, 228398.0, 113223.0, 60858.0, 35845.0, 22686.0, 14441.0, 9570.0, 6279.0, 4330.0, 2875.0, 2047.0, 1421.0, 986.0, 678.0, 479.0, 327.0, 236.0, 138.0, 126.0, 67.0, 54.0, 38.0, 23.0, 25.0, 11.0, 6.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.115966796875, -0.11221790313720703, -0.10846900939941406, -0.1047201156616211, -0.10097122192382812, -0.09722232818603516, -0.09347343444824219, -0.08972454071044922, -0.08597564697265625, -0.08222675323486328, -0.07847785949707031, -0.07472896575927734, -0.07098007202148438, -0.0672311782836914, -0.06348228454589844, -0.05973339080810547, -0.0559844970703125, -0.05223560333251953, -0.04848670959472656, -0.044737815856933594, -0.040988922119140625, -0.037240028381347656, -0.03349113464355469, -0.02974224090576172, -0.02599334716796875, -0.02224445343017578, -0.018495559692382812, -0.014746665954589844, -0.010997772216796875, -0.007248878479003906, -0.0034999847412109375, 0.00024890899658203125, 0.003997802734375, 0.007746696472167969, 0.011495590209960938, 0.015244483947753906, 0.018993377685546875, 0.022742271423339844, 0.026491165161132812, 0.03024005889892578, 0.03398895263671875, 0.03773784637451172, 0.04148674011230469, 0.045235633850097656, 0.048984527587890625, 0.052733421325683594, 0.05648231506347656, 0.06023120880126953, 0.0639801025390625, 0.06772899627685547, 0.07147789001464844, 0.0752267837524414, 0.07897567749023438, 0.08272457122802734, 0.08647346496582031, 0.09022235870361328, 0.09397125244140625, 0.09772014617919922, 0.10146903991699219, 0.10521793365478516, 0.10896682739257812, 0.1127157211303711, 0.11646461486816406, 0.12021350860595703, 0.12396240234375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 3.0, 7.0, 7.0, 13.0, 8.0, 16.0, 11.0, 18.0, 17.0, 22.0, 27.0, 25.0, 30.0, 34.0, 26.0, 33.0, 37.0, 44.0, 48.0, 41.0, 46.0, 46.0, 55.0, 42.0, 37.0, 44.0, 47.0, 31.0, 25.0, 26.0, 17.0, 10.0, 13.0, 18.0, 16.0, 12.0, 10.0, 6.0, 8.0, 7.0, 8.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8298625946044922e-05, -1.773238182067871e-05, -1.71661376953125e-05, -1.659989356994629e-05, -1.6033649444580078e-05, -1.5467405319213867e-05, -1.4901161193847656e-05, -1.4334917068481445e-05, -1.3768672943115234e-05, -1.3202428817749023e-05, -1.2636184692382812e-05, -1.2069940567016602e-05, -1.150369644165039e-05, -1.093745231628418e-05, -1.0371208190917969e-05, -9.804964065551758e-06, -9.238719940185547e-06, -8.672475814819336e-06, -8.106231689453125e-06, -7.539987564086914e-06, -6.973743438720703e-06, -6.407499313354492e-06, -5.841255187988281e-06, -5.27501106262207e-06, -4.708766937255859e-06, -4.1425228118896484e-06, -3.5762786865234375e-06, -3.0100345611572266e-06, -2.4437904357910156e-06, -1.8775463104248047e-06, -1.3113021850585938e-06, -7.450580596923828e-07, -1.7881393432617188e-07, 3.8743019104003906e-07, 9.5367431640625e-07, 1.519918441772461e-06, 2.086162567138672e-06, 2.652406692504883e-06, 3.2186508178710938e-06, 3.7848949432373047e-06, 4.351139068603516e-06, 4.9173831939697266e-06, 5.4836273193359375e-06, 6.0498714447021484e-06, 6.616115570068359e-06, 7.18235969543457e-06, 7.748603820800781e-06, 8.314847946166992e-06, 8.881092071533203e-06, 9.447336196899414e-06, 1.0013580322265625e-05, 1.0579824447631836e-05, 1.1146068572998047e-05, 1.1712312698364258e-05, 1.2278556823730469e-05, 1.284480094909668e-05, 1.341104507446289e-05, 1.3977289199829102e-05, 1.4543533325195312e-05, 1.5109777450561523e-05, 1.5676021575927734e-05, 1.6242265701293945e-05, 1.6808509826660156e-05, 1.7374753952026367e-05, 1.7940998077392578e-05]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 7.0, 4.0, 10.0, 8.0, 6.0, 10.0, 9.0, 23.0, 26.0, 34.0, 42.0, 35.0, 66.0, 83.0, 110.0, 113.0, 132.0, 131.0, 197.0, 374.0, 840.0, 15946.0, 1018054.0, 10159.0, 795.0, 329.0, 199.0, 136.0, 125.0, 91.0, 87.0, 70.0, 48.0, 49.0, 37.0, 30.0, 29.0, 22.0, 20.0, 18.0, 7.0, 12.0, 7.0, 4.0, 2.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.0003714561462402344, -0.00036067888140678406, -0.00034990161657333374, -0.0003391243517398834, -0.0003283470869064331, -0.0003175698220729828, -0.00030679255723953247, -0.00029601529240608215, -0.00028523802757263184, -0.0002744607627391815, -0.0002636834979057312, -0.0002529062330722809, -0.00024212896823883057, -0.00023135170340538025, -0.00022057443857192993, -0.00020979717373847961, -0.0001990199089050293, -0.00018824264407157898, -0.00017746537923812866, -0.00016668811440467834, -0.00015591084957122803, -0.0001451335847377777, -0.0001343563199043274, -0.00012357905507087708, -0.00011280179023742676, -0.00010202452540397644, -9.124726057052612e-05, -8.04699957370758e-05, -6.969273090362549e-05, -5.891546607017517e-05, -4.8138201236724854e-05, -3.7360936403274536e-05, -2.658367156982422e-05, -1.58064067363739e-05, -5.029141902923584e-06, 5.748122930526733e-06, 1.652538776397705e-05, 2.7302652597427368e-05, 3.8079917430877686e-05, 4.8857182264328e-05, 5.963444709777832e-05, 7.041171193122864e-05, 8.118897676467896e-05, 9.196624159812927e-05, 0.00010274350643157959, 0.00011352077126502991, 0.00012429803609848022, 0.00013507530093193054, 0.00014585256576538086, 0.00015662983059883118, 0.0001674070954322815, 0.0001781843602657318, 0.00018896162509918213, 0.00019973888993263245, 0.00021051615476608276, 0.00022129341959953308, 0.0002320706844329834, 0.00024284794926643372, 0.00025362521409988403, 0.00026440247893333435, 0.00027517974376678467, 0.000285957008600235, 0.0002967342734336853, 0.0003075115382671356, 0.00031828880310058594]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 50.0, 186.0, 356.0, 271.0, 113.0, 24.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.605738725629635e-05, -1.4894461855874397e-05, -1.3731537364947144e-05, -1.2568612874019891e-05, -1.1405687473597936e-05, -1.0242762073175982e-05, -9.079837582248729e-06, -7.916913091321476e-06, -6.753987690899521e-06, -5.591062745224917e-06, -4.4281377995503135e-06, -3.2652128538757097e-06, -2.102287908201106e-06, -9.393629625265021e-07, 2.2356198314810172e-07, 1.3864864740753546e-06, 2.5494118744973093e-06, 3.712336820171913e-06, 4.875261765846517e-06, 6.038186711521121e-06, 7.2011116571957245e-06, 8.36403705761768e-06, 9.526961548544932e-06, 1.0689886039472185e-05, 1.185281143989414e-05, 1.3015736840316094e-05, 1.4178661331243347e-05, 1.53415858221706e-05, 1.6504511222592555e-05, 1.766743662301451e-05, 1.883036020444706e-05, 1.9993285604869016e-05, 2.1156207367312163e-05, 2.2319132767734118e-05, 2.3482058168156072e-05, 2.4644981749588624e-05, 2.580790715001058e-05, 2.6970832550432533e-05, 2.8133756131865084e-05, 2.929668153228704e-05, 3.0459606932708994e-05, 3.1622530514141545e-05, 3.27854577335529e-05, 3.3948381314985454e-05, 3.5111304896418005e-05, 3.6274232115829363e-05, 3.7437155697261915e-05, 3.860008291667327e-05, 3.9763006498105824e-05, 4.0925930079538375e-05, 4.208885729894973e-05, 4.3251780880382285e-05, 4.441470809979364e-05, 4.5577631681226194e-05, 4.6740555262658745e-05, 4.7903478844091296e-05, 4.9066406063502654e-05, 5.0229329644935206e-05, 5.1392256864346564e-05, 5.2555180445779115e-05, 5.3718104027211666e-05, 5.4881031246623024e-05, 5.6043954828055575e-05, 5.7206882047466934e-05, 5.8369805628899485e-05]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 10.0, 14.0, 9.0, 13.0, 22.0, 20.0, 22.0, 24.0, 23.0, 36.0, 31.0, 27.0, 49.0, 33.0, 38.0, 48.0, 46.0, 48.0, 50.0, 37.0, 34.0, 40.0, 39.0, 42.0, 38.0, 34.0, 23.0, 26.0, 24.0, 15.0, 21.0, 10.0, 14.0, 4.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2814998626708984e-05, -1.2434087693691254e-05, -1.2053176760673523e-05, -1.1672265827655792e-05, -1.1291354894638062e-05, -1.091044396162033e-05, -1.05295330286026e-05, -1.014862209558487e-05, -9.767711162567139e-06, -9.386800229549408e-06, -9.005889296531677e-06, -8.624978363513947e-06, -8.244067430496216e-06, -7.863156497478485e-06, -7.482245564460754e-06, -7.101334631443024e-06, -6.720423698425293e-06, -6.339512765407562e-06, -5.9586018323898315e-06, -5.577690899372101e-06, -5.19677996635437e-06, -4.815869033336639e-06, -4.434958100318909e-06, -4.054047167301178e-06, -3.6731362342834473e-06, -3.2922253012657166e-06, -2.911314368247986e-06, -2.530403435230255e-06, -2.1494925022125244e-06, -1.7685815691947937e-06, -1.387670636177063e-06, -1.0067597031593323e-06, -6.258487701416016e-07, -2.4493783712387085e-07, 1.3597309589385986e-07, 5.168840289115906e-07, 8.977949619293213e-07, 1.278705894947052e-06, 1.6596168279647827e-06, 2.0405277609825134e-06, 2.421438694000244e-06, 2.802349627017975e-06, 3.1832605600357056e-06, 3.5641714930534363e-06, 3.945082426071167e-06, 4.325993359088898e-06, 4.706904292106628e-06, 5.087815225124359e-06, 5.46872615814209e-06, 5.8496370911598206e-06, 6.230548024177551e-06, 6.611458957195282e-06, 6.992369890213013e-06, 7.373280823230743e-06, 7.754191756248474e-06, 8.135102689266205e-06, 8.516013622283936e-06, 8.896924555301666e-06, 9.277835488319397e-06, 9.658746421337128e-06, 1.0039657354354858e-05, 1.0420568287372589e-05, 1.080147922039032e-05, 1.118239015340805e-05, 1.1563301086425781e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 3.0, 6.0, 13.0, 11.0, 25.0, 16.0, 20.0, 23.0, 26.0, 45.0, 22.0, 48.0, 51.0, 44.0, 44.0, 60.0, 58.0, 51.0, 42.0, 36.0, 43.0, 41.0, 40.0, 34.0, 32.0, 35.0, 28.0, 22.0, 14.0, 16.0, 14.0, 11.0, 6.0, 3.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.46875, -3.34417724609375, -3.2196044921875, -3.09503173828125, -2.970458984375, -2.84588623046875, -2.7213134765625, -2.59674072265625, -2.47216796875, -2.34759521484375, -2.2230224609375, -2.09844970703125, -1.973876953125, -1.84930419921875, -1.7247314453125, -1.60015869140625, -1.4755859375, -1.35101318359375, -1.2264404296875, -1.10186767578125, -0.977294921875, -0.85272216796875, -0.7281494140625, -0.60357666015625, -0.47900390625, -0.35443115234375, -0.2298583984375, -0.10528564453125, 0.019287109375, 0.14385986328125, 0.2684326171875, 0.39300537109375, 0.517578125, 0.64215087890625, 0.7667236328125, 0.89129638671875, 1.015869140625, 1.14044189453125, 1.2650146484375, 1.38958740234375, 1.51416015625, 1.63873291015625, 1.7633056640625, 1.88787841796875, 2.012451171875, 2.13702392578125, 2.2615966796875, 2.38616943359375, 2.5107421875, 2.63531494140625, 2.7598876953125, 2.88446044921875, 3.009033203125, 3.13360595703125, 3.2581787109375, 3.38275146484375, 3.50732421875, 3.63189697265625, 3.7564697265625, 3.88104248046875, 4.005615234375, 4.13018798828125, 4.2547607421875, 4.37933349609375, 4.50390625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 8.0, 11.0, 12.0, 15.0, 23.0, 38.0, 30.0, 65.0, 101.0, 133.0, 214.0, 334.0, 511.0, 808.0, 1285.0, 2373.0, 4931.0, 12516.0, 34939.0, 113335.0, 431124.0, 313995.0, 85499.0, 26877.0, 9928.0, 4167.0, 2071.0, 1125.0, 755.0, 439.0, 305.0, 173.0, 147.0, 73.0, 65.0, 37.0, 29.0, 24.0, 13.0, 10.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.56640625, -3.44293212890625, -3.3194580078125, -3.19598388671875, -3.072509765625, -2.94903564453125, -2.8255615234375, -2.70208740234375, -2.57861328125, -2.45513916015625, -2.3316650390625, -2.20819091796875, -2.084716796875, -1.96124267578125, -1.8377685546875, -1.71429443359375, -1.5908203125, -1.46734619140625, -1.3438720703125, -1.22039794921875, -1.096923828125, -0.97344970703125, -0.8499755859375, -0.72650146484375, -0.60302734375, -0.47955322265625, -0.3560791015625, -0.23260498046875, -0.109130859375, 0.01434326171875, 0.1378173828125, 0.26129150390625, 0.384765625, 0.50823974609375, 0.6317138671875, 0.75518798828125, 0.878662109375, 1.00213623046875, 1.1256103515625, 1.24908447265625, 1.37255859375, 1.49603271484375, 1.6195068359375, 1.74298095703125, 1.866455078125, 1.98992919921875, 2.1134033203125, 2.23687744140625, 2.3603515625, 2.48382568359375, 2.6072998046875, 2.73077392578125, 2.854248046875, 2.97772216796875, 3.1011962890625, 3.22467041015625, 3.34814453125, 3.47161865234375, 3.5950927734375, 3.71856689453125, 3.842041015625, 3.96551513671875, 4.0889892578125, 4.21246337890625, 4.3359375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 8.0, 8.0, 8.0, 12.0, 9.0, 16.0, 24.0, 30.0, 15.0, 33.0, 37.0, 34.0, 42.0, 49.0, 52.0, 53.0, 59.0, 134.0, 1776.0, 164.0, 67.0, 49.0, 45.0, 36.0, 43.0, 26.0, 24.0, 31.0, 25.0, 21.0, 14.0, 22.0, 12.0, 18.0, 8.0, 11.0, 4.0, 5.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.4609375, -11.0858154296875, -10.710693359375, -10.3355712890625, -9.96044921875, -9.5853271484375, -9.210205078125, -8.8350830078125, -8.4599609375, -8.0848388671875, -7.709716796875, -7.3345947265625, -6.95947265625, -6.5843505859375, -6.209228515625, -5.8341064453125, -5.458984375, -5.0838623046875, -4.708740234375, -4.3336181640625, -3.95849609375, -3.5833740234375, -3.208251953125, -2.8331298828125, -2.4580078125, -2.0828857421875, -1.707763671875, -1.3326416015625, -0.95751953125, -0.5823974609375, -0.207275390625, 0.1678466796875, 0.54296875, 0.9180908203125, 1.293212890625, 1.6683349609375, 2.04345703125, 2.4185791015625, 2.793701171875, 3.1688232421875, 3.5439453125, 3.9190673828125, 4.294189453125, 4.6693115234375, 5.04443359375, 5.4195556640625, 5.794677734375, 6.1697998046875, 6.544921875, 6.9200439453125, 7.295166015625, 7.6702880859375, 8.04541015625, 8.4205322265625, 8.795654296875, 9.1707763671875, 9.5458984375, 9.9210205078125, 10.296142578125, 10.6712646484375, 11.04638671875, 11.4215087890625, 11.796630859375, 12.1717529296875, 12.546875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 5.0, 7.0, 12.0, 15.0, 11.0, 20.0, 16.0, 23.0, 26.0, 36.0, 42.0, 54.0, 78.0, 115.0, 187.0, 370.0, 939.0, 4763.0, 1852120.0, 1280291.0, 4617.0, 920.0, 319.0, 208.0, 116.0, 77.0, 66.0, 44.0, 40.0, 28.0, 29.0, 25.0, 15.0, 9.0, 10.0, 9.0, 11.0, 4.0, 7.0, 2.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-26.46875, -25.641357421875, -24.81396484375, -23.986572265625, -23.1591796875, -22.331787109375, -21.50439453125, -20.677001953125, -19.849609375, -19.022216796875, -18.19482421875, -17.367431640625, -16.5400390625, -15.712646484375, -14.88525390625, -14.057861328125, -13.23046875, -12.403076171875, -11.57568359375, -10.748291015625, -9.9208984375, -9.093505859375, -8.26611328125, -7.438720703125, -6.611328125, -5.783935546875, -4.95654296875, -4.129150390625, -3.3017578125, -2.474365234375, -1.64697265625, -0.819580078125, 0.0078125, 0.835205078125, 1.66259765625, 2.489990234375, 3.3173828125, 4.144775390625, 4.97216796875, 5.799560546875, 6.626953125, 7.454345703125, 8.28173828125, 9.109130859375, 9.9365234375, 10.763916015625, 11.59130859375, 12.418701171875, 13.24609375, 14.073486328125, 14.90087890625, 15.728271484375, 16.5556640625, 17.383056640625, 18.21044921875, 19.037841796875, 19.865234375, 20.692626953125, 21.52001953125, 22.347412109375, 23.1748046875, 24.002197265625, 24.82958984375, 25.656982421875, 26.484375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 797.0, 218.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.39162063598633, -35.188682556152344, -27.985742568969727, -20.78280258178711, -13.579864501953125, -6.376926422119141, 0.8260154724121094, 8.028953552246094, 15.231891632080078, 22.434829711914062, 29.63776969909668, 36.8407096862793, 44.04364776611328, 51.246585845947266, 58.449527740478516, 65.6524658203125, 72.85540771484375, 80.058349609375, 87.26128387451172, 94.46422576904297, 101.66716003417969, 108.87010192871094, 116.07304382324219, 123.27598571777344, 130.47891235351562, 137.68185424804688, 144.88479614257812, 152.08773803710938, 159.29066467285156, 166.4936065673828, 173.69654846191406, 180.8994903564453, 188.1024169921875, 195.30535888671875, 202.50830078125, 209.71124267578125, 216.91416931152344, 224.1171112060547, 231.32005310058594, 238.5229949951172, 245.72592163085938, 252.92886352539062, 260.1318054199219, 267.3347473144531, 274.5376892089844, 281.7406005859375, 288.94354248046875, 296.146484375, 303.34942626953125, 310.5523681640625, 317.75531005859375, 324.958251953125, 332.16119384765625, 339.3641357421875, 346.56707763671875, 353.7699890136719, 360.97296142578125, 368.1759033203125, 375.37884521484375, 382.581787109375, 389.78472900390625, 396.9876708984375, 404.19061279296875, 411.3935241699219, 418.5964660644531]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 8.0, 6.0, 8.0, 6.0, 21.0, 16.0, 24.0, 23.0, 28.0, 32.0, 27.0, 32.0, 32.0, 30.0, 34.0, 33.0, 49.0, 49.0, 39.0, 39.0, 48.0, 44.0, 50.0, 40.0, 43.0, 32.0, 42.0, 29.0, 20.0, 30.0, 16.0, 14.0, 13.0, 21.0, 5.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.352359771728516, -34.09259796142578, -32.83283615112305, -31.57307243347168, -30.313310623168945, -29.05354881286621, -27.793785095214844, -26.53402328491211, -25.274261474609375, -24.01449966430664, -22.754737854003906, -21.49497413635254, -20.235212326049805, -18.97545051574707, -17.715686798095703, -16.45592498779297, -15.196163177490234, -13.9364013671875, -12.67663860321045, -11.416875839233398, -10.157114028930664, -8.89735221862793, -7.637589454650879, -6.377826690673828, -5.118064880371094, -3.858302593231201, -2.5985403060913086, -1.338778018951416, -0.07901573181152344, 1.1807465553283691, 2.4405088424682617, 3.7002716064453125, 4.960033416748047, 6.2197957038879395, 7.479557991027832, 8.739320755004883, 9.999082565307617, 11.258844375610352, 12.518607139587402, 13.778369903564453, 15.038131713867188, 16.297893524169922, 17.557655334472656, 18.817419052124023, 20.077180862426758, 21.336942672729492, 22.59670639038086, 23.856468200683594, 25.116230010986328, 26.375991821289062, 27.635753631591797, 28.895517349243164, 30.1552791595459, 31.415040969848633, 32.6748046875, 33.934566497802734, 35.19432830810547, 36.4540901184082, 37.71385192871094, 38.97361373901367, 40.233375549316406, 41.493141174316406, 42.75290298461914, 44.012664794921875, 45.27242660522461]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 6.0, 4.0, 9.0, 1.0, 5.0, 18.0, 19.0, 22.0, 16.0, 29.0, 26.0, 29.0, 27.0, 40.0, 56.0, 40.0, 45.0, 48.0, 62.0, 50.0, 48.0, 38.0, 50.0, 37.0, 32.0, 34.0, 35.0, 42.0, 25.0, 29.0, 12.0, 17.0, 16.0, 13.0, 6.0, 6.0, 2.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.51171875, -3.387451171875, -3.26318359375, -3.138916015625, -3.0146484375, -2.890380859375, -2.76611328125, -2.641845703125, -2.517578125, -2.393310546875, -2.26904296875, -2.144775390625, -2.0205078125, -1.896240234375, -1.77197265625, -1.647705078125, -1.5234375, -1.399169921875, -1.27490234375, -1.150634765625, -1.0263671875, -0.902099609375, -0.77783203125, -0.653564453125, -0.529296875, -0.405029296875, -0.28076171875, -0.156494140625, -0.0322265625, 0.092041015625, 0.21630859375, 0.340576171875, 0.46484375, 0.589111328125, 0.71337890625, 0.837646484375, 0.9619140625, 1.086181640625, 1.21044921875, 1.334716796875, 1.458984375, 1.583251953125, 1.70751953125, 1.831787109375, 1.9560546875, 2.080322265625, 2.20458984375, 2.328857421875, 2.453125, 2.577392578125, 2.70166015625, 2.825927734375, 2.9501953125, 3.074462890625, 3.19873046875, 3.322998046875, 3.447265625, 3.571533203125, 3.69580078125, 3.820068359375, 3.9443359375, 4.068603515625, 4.19287109375, 4.317138671875, 4.44140625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 3.0, 6.0, 11.0, 12.0, 16.0, 20.0, 22.0, 30.0, 39.0, 54.0, 61.0, 81.0, 134.0, 242.0, 573.0, 1928.0, 15012.0, 292064.0, 3627507.0, 239261.0, 13975.0, 1951.0, 525.0, 253.0, 137.0, 73.0, 59.0, 53.0, 45.0, 31.0, 30.0, 22.0, 11.0, 7.0, 9.0, 9.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.046875, -14.478515625, -13.91015625, -13.341796875, -12.7734375, -12.205078125, -11.63671875, -11.068359375, -10.5, -9.931640625, -9.36328125, -8.794921875, -8.2265625, -7.658203125, -7.08984375, -6.521484375, -5.953125, -5.384765625, -4.81640625, -4.248046875, -3.6796875, -3.111328125, -2.54296875, -1.974609375, -1.40625, -0.837890625, -0.26953125, 0.298828125, 0.8671875, 1.435546875, 2.00390625, 2.572265625, 3.140625, 3.708984375, 4.27734375, 4.845703125, 5.4140625, 5.982421875, 6.55078125, 7.119140625, 7.6875, 8.255859375, 8.82421875, 9.392578125, 9.9609375, 10.529296875, 11.09765625, 11.666015625, 12.234375, 12.802734375, 13.37109375, 13.939453125, 14.5078125, 15.076171875, 15.64453125, 16.212890625, 16.78125, 17.349609375, 17.91796875, 18.486328125, 19.0546875, 19.623046875, 20.19140625, 20.759765625, 21.328125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 8.0, 23.0, 22.0, 32.0, 36.0, 70.0, 82.0, 114.0, 186.0, 269.0, 403.0, 495.0, 552.0, 507.0, 343.0, 293.0, 193.0, 126.0, 90.0, 67.0, 51.0, 32.0, 23.0, 20.0, 7.0, 10.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.421875, -14.01513671875, -13.6083984375, -13.20166015625, -12.794921875, -12.38818359375, -11.9814453125, -11.57470703125, -11.16796875, -10.76123046875, -10.3544921875, -9.94775390625, -9.541015625, -9.13427734375, -8.7275390625, -8.32080078125, -7.9140625, -7.50732421875, -7.1005859375, -6.69384765625, -6.287109375, -5.88037109375, -5.4736328125, -5.06689453125, -4.66015625, -4.25341796875, -3.8466796875, -3.43994140625, -3.033203125, -2.62646484375, -2.2197265625, -1.81298828125, -1.40625, -0.99951171875, -0.5927734375, -0.18603515625, 0.220703125, 0.62744140625, 1.0341796875, 1.44091796875, 1.84765625, 2.25439453125, 2.6611328125, 3.06787109375, 3.474609375, 3.88134765625, 4.2880859375, 4.69482421875, 5.1015625, 5.50830078125, 5.9150390625, 6.32177734375, 6.728515625, 7.13525390625, 7.5419921875, 7.94873046875, 8.35546875, 8.76220703125, 9.1689453125, 9.57568359375, 9.982421875, 10.38916015625, 10.7958984375, 11.20263671875, 11.609375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 7.0, 8.0, 11.0, 21.0, 26.0, 64.0, 105.0, 180.0, 369.0, 968.0, 3964.0, 53357.0, 3016119.0, 1090779.0, 24403.0, 2527.0, 712.0, 291.0, 147.0, 83.0, 43.0, 34.0, 20.0, 14.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.25, -38.09130859375, -36.9326171875, -35.77392578125, -34.615234375, -33.45654296875, -32.2978515625, -31.13916015625, -29.98046875, -28.82177734375, -27.6630859375, -26.50439453125, -25.345703125, -24.18701171875, -23.0283203125, -21.86962890625, -20.7109375, -19.55224609375, -18.3935546875, -17.23486328125, -16.076171875, -14.91748046875, -13.7587890625, -12.60009765625, -11.44140625, -10.28271484375, -9.1240234375, -7.96533203125, -6.806640625, -5.64794921875, -4.4892578125, -3.33056640625, -2.171875, -1.01318359375, 0.1455078125, 1.30419921875, 2.462890625, 3.62158203125, 4.7802734375, 5.93896484375, 7.09765625, 8.25634765625, 9.4150390625, 10.57373046875, 11.732421875, 12.89111328125, 14.0498046875, 15.20849609375, 16.3671875, 17.52587890625, 18.6845703125, 19.84326171875, 21.001953125, 22.16064453125, 23.3193359375, 24.47802734375, 25.63671875, 26.79541015625, 27.9541015625, 29.11279296875, 30.271484375, 31.43017578125, 32.5888671875, 33.74755859375, 34.90625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 29.0, 84.0, 177.0, 277.0, 253.0, 131.0, 44.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.88306427001953, -69.1788558959961, -65.47463989257812, -61.77043151855469, -58.06622314453125, -54.36201477050781, -50.65780258178711, -46.953590393066406, -43.24938201904297, -39.54517364501953, -35.84096145629883, -32.136749267578125, -28.432540893554688, -24.728330612182617, -21.024120330810547, -17.319910049438477, -13.615699768066406, -9.911489486694336, -6.207279205322266, -2.5030689239501953, 1.201141357421875, 4.905351638793945, 8.609561920166016, 12.313772201538086, 16.017982482910156, 19.722192764282227, 23.426403045654297, 27.130613327026367, 30.834823608398438, 34.539031982421875, 38.24324417114258, 41.94745635986328, 45.65167236328125, 49.35588073730469, 53.06009292602539, 56.764305114746094, 60.46851348876953, 64.17272186279297, 67.87693786621094, 71.58114624023438, 75.28535461425781, 78.98956298828125, 82.69377136230469, 86.39798736572266, 90.1021957397461, 93.80640411376953, 97.5106201171875, 101.21482849121094, 104.91903686523438, 108.62324523925781, 112.32745361328125, 116.03166961669922, 119.73587799072266, 123.4400863647461, 127.14430236816406, 130.8485107421875, 134.55271911621094, 138.25692749023438, 141.9611358642578, 145.66534423828125, 149.36956787109375, 153.0737762451172, 156.77798461914062, 160.48219299316406, 164.1864013671875]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 4.0, 5.0, 5.0, 8.0, 8.0, 15.0, 10.0, 16.0, 24.0, 20.0, 16.0, 23.0, 27.0, 18.0, 30.0, 31.0, 30.0, 40.0, 29.0, 40.0, 47.0, 36.0, 36.0, 34.0, 31.0, 41.0, 32.0, 29.0, 34.0, 32.0, 31.0, 30.0, 26.0, 19.0, 17.0, 17.0, 19.0, 12.0, 12.0, 9.0, 10.0, 9.0, 8.0, 3.0, 4.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-33.657432556152344, -32.625389099121094, -31.593341827392578, -30.561296463012695, -29.529251098632812, -28.49720573425293, -27.465160369873047, -26.433116912841797, -25.40106964111328, -24.3690242767334, -23.336978912353516, -22.304933547973633, -21.27288818359375, -20.240842819213867, -19.208797454833984, -18.176753997802734, -17.14470863342285, -16.11266326904297, -15.080617904663086, -14.048572540283203, -13.01652717590332, -11.984481811523438, -10.952437400817871, -9.920392036437988, -8.888346672058105, -7.856301307678223, -6.82425594329834, -5.792211055755615, -4.760165691375732, -3.7281203269958496, -2.696075439453125, -1.6640300750732422, -0.6319847106933594, 0.4000605344772339, 1.4321057796478271, 2.464150905609131, 3.4961962699890137, 4.5282416343688965, 5.560286521911621, 6.592331886291504, 7.624377250671387, 8.65642261505127, 9.688467979431152, 10.720512390136719, 11.752557754516602, 12.784603118896484, 13.816648483276367, 14.84869384765625, 15.880739212036133, 16.912784576416016, 17.9448299407959, 18.97687530517578, 20.008920669555664, 21.040966033935547, 22.073009490966797, 23.105056762695312, 24.137100219726562, 25.169145584106445, 26.201190948486328, 27.23323631286621, 28.265281677246094, 29.297327041625977, 30.32937240600586, 31.36141586303711, 32.393463134765625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 2.0, 4.0, 5.0, 9.0, 10.0, 8.0, 12.0, 27.0, 35.0, 27.0, 34.0, 35.0, 43.0, 42.0, 32.0, 49.0, 64.0, 48.0, 55.0, 42.0, 50.0, 41.0, 48.0, 35.0, 47.0, 32.0, 36.0, 18.0, 15.0, 21.0, 23.0, 13.0, 7.0, 9.0, 4.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.642578125, -3.513580322265625, -3.38458251953125, -3.255584716796875, -3.1265869140625, -2.997589111328125, -2.86859130859375, -2.739593505859375, -2.610595703125, -2.481597900390625, -2.35260009765625, -2.223602294921875, -2.0946044921875, -1.965606689453125, -1.83660888671875, -1.707611083984375, -1.57861328125, -1.449615478515625, -1.32061767578125, -1.191619873046875, -1.0626220703125, -0.933624267578125, -0.80462646484375, -0.675628662109375, -0.546630859375, -0.417633056640625, -0.28863525390625, -0.159637451171875, -0.0306396484375, 0.098358154296875, 0.22735595703125, 0.356353759765625, 0.4853515625, 0.614349365234375, 0.74334716796875, 0.872344970703125, 1.0013427734375, 1.130340576171875, 1.25933837890625, 1.388336181640625, 1.517333984375, 1.646331787109375, 1.77532958984375, 1.904327392578125, 2.0333251953125, 2.162322998046875, 2.29132080078125, 2.420318603515625, 2.54931640625, 2.678314208984375, 2.80731201171875, 2.936309814453125, 3.0653076171875, 3.194305419921875, 3.32330322265625, 3.452301025390625, 3.581298828125, 3.710296630859375, 3.83929443359375, 3.968292236328125, 4.0972900390625, 4.226287841796875, 4.35528564453125, 4.484283447265625, 4.61328125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 10.0, 15.0, 23.0, 19.0, 31.0, 45.0, 62.0, 96.0, 156.0, 195.0, 313.0, 448.0, 765.0, 1173.0, 1847.0, 2981.0, 4901.0, 7999.0, 13628.0, 23369.0, 41707.0, 76844.0, 164586.0, 323256.0, 189435.0, 85726.0, 45653.0, 25544.0, 14954.0, 8780.0, 5244.0, 3096.0, 1990.0, 1281.0, 817.0, 538.0, 354.0, 216.0, 141.0, 101.0, 61.0, 65.0, 23.0, 14.0, 23.0, 11.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1650390625, -0.15981292724609375, -0.1545867919921875, -0.14936065673828125, -0.144134521484375, -0.13890838623046875, -0.1336822509765625, -0.12845611572265625, -0.12322998046875, -0.11800384521484375, -0.1127777099609375, -0.10755157470703125, -0.102325439453125, -0.09709930419921875, -0.0918731689453125, -0.08664703369140625, -0.0814208984375, -0.07619476318359375, -0.0709686279296875, -0.06574249267578125, -0.060516357421875, -0.05529022216796875, -0.0500640869140625, -0.04483795166015625, -0.03961181640625, -0.03438568115234375, -0.0291595458984375, -0.02393341064453125, -0.018707275390625, -0.01348114013671875, -0.0082550048828125, -0.00302886962890625, 0.002197265625, 0.00742340087890625, 0.0126495361328125, 0.01787567138671875, 0.023101806640625, 0.02832794189453125, 0.0335540771484375, 0.03878021240234375, 0.04400634765625, 0.04923248291015625, 0.0544586181640625, 0.05968475341796875, 0.064910888671875, 0.07013702392578125, 0.0753631591796875, 0.08058929443359375, 0.0858154296875, 0.09104156494140625, 0.0962677001953125, 0.10149383544921875, 0.106719970703125, 0.11194610595703125, 0.1171722412109375, 0.12239837646484375, 0.12762451171875, 0.13285064697265625, 0.1380767822265625, 0.14330291748046875, 0.148529052734375, 0.15375518798828125, 0.1589813232421875, 0.16420745849609375, 0.16943359375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 11.0, 12.0, 16.0, 12.0, 9.0, 25.0, 20.0, 31.0, 31.0, 30.0, 29.0, 39.0, 35.0, 36.0, 49.0, 32.0, 49.0, 1075.0, 48.0, 41.0, 37.0, 43.0, 42.0, 35.0, 31.0, 28.0, 38.0, 32.0, 16.0, 14.0, 17.0, 11.0, 7.0, 10.0, 8.0, 5.0, 7.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.576171875, -2.4969482421875, -2.417724609375, -2.3385009765625, -2.25927734375, -2.1800537109375, -2.100830078125, -2.0216064453125, -1.9423828125, -1.8631591796875, -1.783935546875, -1.7047119140625, -1.62548828125, -1.5462646484375, -1.467041015625, -1.3878173828125, -1.30859375, -1.2293701171875, -1.150146484375, -1.0709228515625, -0.99169921875, -0.9124755859375, -0.833251953125, -0.7540283203125, -0.6748046875, -0.5955810546875, -0.516357421875, -0.4371337890625, -0.35791015625, -0.2786865234375, -0.199462890625, -0.1202392578125, -0.041015625, 0.0382080078125, 0.117431640625, 0.1966552734375, 0.27587890625, 0.3551025390625, 0.434326171875, 0.5135498046875, 0.5927734375, 0.6719970703125, 0.751220703125, 0.8304443359375, 0.90966796875, 0.9888916015625, 1.068115234375, 1.1473388671875, 1.2265625, 1.3057861328125, 1.385009765625, 1.4642333984375, 1.54345703125, 1.6226806640625, 1.701904296875, 1.7811279296875, 1.8603515625, 1.9395751953125, 2.018798828125, 2.0980224609375, 2.17724609375, 2.2564697265625, 2.335693359375, 2.4149169921875, 2.494140625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 11.0, 16.0, 25.0, 32.0, 50.0, 69.0, 126.0, 184.0, 269.0, 426.0, 594.0, 992.0, 1487.0, 2308.0, 3740.0, 5824.0, 9324.0, 15558.0, 25828.0, 44531.0, 80669.0, 172852.0, 1364610.0, 174849.0, 81141.0, 44376.0, 26178.0, 15621.0, 9266.0, 5797.0, 3707.0, 2346.0, 1496.0, 984.0, 598.0, 420.0, 274.0, 167.0, 111.0, 88.0, 60.0, 41.0, 27.0, 15.0, 10.0, 12.0, 7.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.151611328125, -0.14679908752441406, -0.14198684692382812, -0.1371746063232422, -0.13236236572265625, -0.1275501251220703, -0.12273788452148438, -0.11792564392089844, -0.1131134033203125, -0.10830116271972656, -0.10348892211914062, -0.09867668151855469, -0.09386444091796875, -0.08905220031738281, -0.08423995971679688, -0.07942771911621094, -0.074615478515625, -0.06980323791503906, -0.06499099731445312, -0.06017875671386719, -0.05536651611328125, -0.05055427551269531, -0.045742034912109375, -0.04092979431152344, -0.0361175537109375, -0.03130531311035156, -0.026493072509765625, -0.021680831909179688, -0.01686859130859375, -0.012056350708007812, -0.007244110107421875, -0.0024318695068359375, 0.00238037109375, 0.0071926116943359375, 0.012004852294921875, 0.016817092895507812, 0.02162933349609375, 0.026441574096679688, 0.031253814697265625, 0.03606605529785156, 0.0408782958984375, 0.04569053649902344, 0.050502777099609375, 0.05531501770019531, 0.06012725830078125, 0.06493949890136719, 0.06975173950195312, 0.07456398010253906, 0.079376220703125, 0.08418846130371094, 0.08900070190429688, 0.09381294250488281, 0.09862518310546875, 0.10343742370605469, 0.10824966430664062, 0.11306190490722656, 0.1178741455078125, 0.12268638610839844, 0.12749862670898438, 0.1323108673095703, 0.13712310791015625, 0.1419353485107422, 0.14674758911132812, 0.15155982971191406, 0.1563720703125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 8.0, 6.0, 9.0, 13.0, 8.0, 24.0, 18.0, 18.0, 16.0, 26.0, 28.0, 20.0, 35.0, 27.0, 36.0, 52.0, 39.0, 45.0, 46.0, 32.0, 44.0, 47.0, 51.0, 44.0, 34.0, 36.0, 25.0, 28.0, 29.0, 27.0, 18.0, 13.0, 15.0, 14.0, 13.0, 7.0, 6.0, 3.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.6748905181884766e-05, -1.6219913959503174e-05, -1.5690922737121582e-05, -1.516193151473999e-05, -1.4632940292358398e-05, -1.4103949069976807e-05, -1.3574957847595215e-05, -1.3045966625213623e-05, -1.2516975402832031e-05, -1.198798418045044e-05, -1.1458992958068848e-05, -1.0930001735687256e-05, -1.0401010513305664e-05, -9.872019290924072e-06, -9.34302806854248e-06, -8.814036846160889e-06, -8.285045623779297e-06, -7.756054401397705e-06, -7.227063179016113e-06, -6.6980719566345215e-06, -6.16908073425293e-06, -5.640089511871338e-06, -5.111098289489746e-06, -4.582107067108154e-06, -4.0531158447265625e-06, -3.5241246223449707e-06, -2.995133399963379e-06, -2.466142177581787e-06, -1.9371509552001953e-06, -1.4081597328186035e-06, -8.791685104370117e-07, -3.501772880554199e-07, 1.7881393432617188e-07, 7.078051567077637e-07, 1.2367963790893555e-06, 1.7657876014709473e-06, 2.294778823852539e-06, 2.823770046234131e-06, 3.3527612686157227e-06, 3.8817524909973145e-06, 4.410743713378906e-06, 4.939734935760498e-06, 5.46872615814209e-06, 5.997717380523682e-06, 6.5267086029052734e-06, 7.055699825286865e-06, 7.584691047668457e-06, 8.113682270050049e-06, 8.64267349243164e-06, 9.171664714813232e-06, 9.700655937194824e-06, 1.0229647159576416e-05, 1.0758638381958008e-05, 1.12876296043396e-05, 1.1816620826721191e-05, 1.2345612049102783e-05, 1.2874603271484375e-05, 1.3403594493865967e-05, 1.3932585716247559e-05, 1.446157693862915e-05, 1.4990568161010742e-05, 1.5519559383392334e-05, 1.6048550605773926e-05, 1.6577541828155518e-05, 1.710653305053711e-05]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 2.0, 6.0, 7.0, 11.0, 8.0, 21.0, 17.0, 18.0, 38.0, 49.0, 53.0, 67.0, 87.0, 117.0, 136.0, 185.0, 293.0, 521.0, 1748.0, 436534.0, 604772.0, 2204.0, 540.0, 270.0, 181.0, 163.0, 95.0, 60.0, 60.0, 52.0, 56.0, 30.0, 27.0, 30.0, 18.0, 15.0, 16.0, 9.0, 9.0, 14.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00034689903259277344, -0.0003357231616973877, -0.00032454729080200195, -0.0003133714199066162, -0.00030219554901123047, -0.0002910196781158447, -0.000279843807220459, -0.00026866793632507324, -0.0002574920654296875, -0.00024631619453430176, -0.00023514032363891602, -0.00022396445274353027, -0.00021278858184814453, -0.0002016127109527588, -0.00019043684005737305, -0.0001792609691619873, -0.00016808509826660156, -0.00015690922737121582, -0.00014573335647583008, -0.00013455748558044434, -0.0001233816146850586, -0.00011220574378967285, -0.00010102987289428711, -8.985400199890137e-05, -7.867813110351562e-05, -6.750226020812988e-05, -5.632638931274414e-05, -4.51505184173584e-05, -3.3974647521972656e-05, -2.2798776626586914e-05, -1.1622905731201172e-05, -4.470348358154297e-07, 1.0728836059570312e-05, 2.1904706954956055e-05, 3.30805778503418e-05, 4.425644874572754e-05, 5.543231964111328e-05, 6.660819053649902e-05, 7.778406143188477e-05, 8.895993232727051e-05, 0.00010013580322265625, 0.00011131167411804199, 0.00012248754501342773, 0.00013366341590881348, 0.00014483928680419922, 0.00015601515769958496, 0.0001671910285949707, 0.00017836689949035645, 0.0001895427703857422, 0.00020071864128112793, 0.00021189451217651367, 0.00022307038307189941, 0.00023424625396728516, 0.0002454221248626709, 0.00025659799575805664, 0.0002677738666534424, 0.0002789497375488281, 0.00029012560844421387, 0.0003013014793395996, 0.00031247735023498535, 0.0003236532211303711, 0.00033482909202575684, 0.0003460049629211426, 0.0003571808338165283, 0.00036835670471191406]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 10.0, 37.0, 118.0, 200.0, 254.0, 219.0, 105.0, 43.0, 20.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.800529495696537e-05, -4.7034693125169724e-05, -4.6064091293374076e-05, -4.5093493099557236e-05, -4.412289126776159e-05, -4.315228943596594e-05, -4.218168760417029e-05, -4.1211085772374645e-05, -4.0240483940579e-05, -3.926988210878335e-05, -3.82992802769877e-05, -3.732868208317086e-05, -3.635808025137521e-05, -3.5387478419579566e-05, -3.441687658778392e-05, -3.344627475598827e-05, -3.247567656217143e-05, -3.150507473037578e-05, -3.0534472898580134e-05, -2.956387288577389e-05, -2.8593272872967646e-05, -2.7622671041171998e-05, -2.665206920937635e-05, -2.5681467377580702e-05, -2.4710867364774458e-05, -2.374026553297881e-05, -2.2769665520172566e-05, -2.179906368837692e-05, -2.082846185658127e-05, -1.9857861843775027e-05, -1.888726001197938e-05, -1.7916659999173135e-05, -1.6946058167377487e-05, -1.597545633558184e-05, -1.5004856322775595e-05, -1.4034254490979947e-05, -1.3063653568679001e-05, -1.2093052646378055e-05, -1.1122450814582407e-05, -1.0151849892281462e-05, -9.181249879475217e-06, -8.210648957174271e-06, -7.2400475801259745e-06, -6.269446203077678e-06, -5.298845280776732e-06, -4.328244358475786e-06, -3.357642981427489e-06, -2.387041604379192e-06, -1.416440682078246e-06, -4.458395324036246e-07, 5.247616172709968e-07, 1.4953627669456182e-06, 2.4659639166202396e-06, 3.4365648389211856e-06, 4.4071662159694824e-06, 5.377767593017779e-06, 6.348368515318725e-06, 7.318969437619671e-06, 8.289571269415319e-06, 9.260172191716265e-06, 1.0230773114017211e-05, 1.1201374036318157e-05, 1.2171974958619103e-05, 1.314257679041475e-05, 1.4113177712715697e-05]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 10.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 8.0, 19.0, 12.0, 15.0, 13.0, 17.0, 21.0, 26.0, 30.0, 23.0, 41.0, 32.0, 39.0, 30.0, 22.0, 38.0, 30.0, 30.0, 51.0, 32.0, 33.0, 33.0, 35.0, 30.0, 32.0, 32.0, 23.0, 26.0, 21.0, 22.0, 18.0, 19.0, 23.0, 15.0, 17.0, 11.0, 9.0, 7.0, 7.0, 5.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0], "bins": [-1.0728836059570312e-05, -1.0409392416477203e-05, -1.0089948773384094e-05, -9.770505130290985e-06, -9.451061487197876e-06, -9.131617844104767e-06, -8.812174201011658e-06, -8.492730557918549e-06, -8.17328691482544e-06, -7.85384327173233e-06, -7.534399628639221e-06, -7.214955985546112e-06, -6.895512342453003e-06, -6.576068699359894e-06, -6.256625056266785e-06, -5.9371814131736755e-06, -5.617737770080566e-06, -5.298294126987457e-06, -4.978850483894348e-06, -4.659406840801239e-06, -4.33996319770813e-06, -4.020519554615021e-06, -3.7010759115219116e-06, -3.3816322684288025e-06, -3.0621886253356934e-06, -2.7427449822425842e-06, -2.423301339149475e-06, -2.103857696056366e-06, -1.7844140529632568e-06, -1.4649704098701477e-06, -1.1455267667770386e-06, -8.260831236839294e-07, -5.066394805908203e-07, -1.8719583749771118e-07, 1.3224780559539795e-07, 4.516914486885071e-07, 7.711350917816162e-07, 1.0905787348747253e-06, 1.4100223779678345e-06, 1.7294660210609436e-06, 2.0489096641540527e-06, 2.368353307247162e-06, 2.687796950340271e-06, 3.00724059343338e-06, 3.3266842365264893e-06, 3.6461278796195984e-06, 3.9655715227127075e-06, 4.285015165805817e-06, 4.604458808898926e-06, 4.923902451992035e-06, 5.243346095085144e-06, 5.562789738178253e-06, 5.882233381271362e-06, 6.2016770243644714e-06, 6.5211206674575806e-06, 6.84056431055069e-06, 7.160007953643799e-06, 7.479451596736908e-06, 7.798895239830017e-06, 8.118338882923126e-06, 8.437782526016235e-06, 8.757226169109344e-06, 9.076669812202454e-06, 9.396113455295563e-06, 9.715557098388672e-06]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 2.0, 4.0, 5.0, 9.0, 10.0, 8.0, 12.0, 27.0, 35.0, 27.0, 34.0, 35.0, 43.0, 42.0, 32.0, 49.0, 64.0, 48.0, 55.0, 42.0, 50.0, 41.0, 48.0, 35.0, 47.0, 32.0, 36.0, 18.0, 15.0, 21.0, 23.0, 13.0, 7.0, 9.0, 4.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.642578125, -3.513580322265625, -3.38458251953125, -3.255584716796875, -3.1265869140625, -2.997589111328125, -2.86859130859375, -2.739593505859375, -2.610595703125, -2.481597900390625, -2.35260009765625, -2.223602294921875, -2.0946044921875, -1.965606689453125, -1.83660888671875, -1.707611083984375, -1.57861328125, -1.449615478515625, -1.32061767578125, -1.191619873046875, -1.0626220703125, -0.933624267578125, -0.80462646484375, -0.675628662109375, -0.546630859375, -0.417633056640625, -0.28863525390625, -0.159637451171875, -0.0306396484375, 0.098358154296875, 0.22735595703125, 0.356353759765625, 0.4853515625, 0.614349365234375, 0.74334716796875, 0.872344970703125, 1.0013427734375, 1.130340576171875, 1.25933837890625, 1.388336181640625, 1.517333984375, 1.646331787109375, 1.77532958984375, 1.904327392578125, 2.0333251953125, 2.162322998046875, 2.29132080078125, 2.420318603515625, 2.54931640625, 2.678314208984375, 2.80731201171875, 2.936309814453125, 3.0653076171875, 3.194305419921875, 3.32330322265625, 3.452301025390625, 3.581298828125, 3.710296630859375, 3.83929443359375, 3.968292236328125, 4.0972900390625, 4.226287841796875, 4.35528564453125, 4.484283447265625, 4.61328125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 10.0, 10.0, 14.0, 18.0, 28.0, 41.0, 71.0, 85.0, 110.0, 172.0, 250.0, 401.0, 641.0, 1086.0, 1751.0, 2986.0, 5247.0, 9595.0, 17802.0, 36214.0, 85877.0, 256285.0, 404635.0, 125258.0, 49238.0, 22961.0, 11961.0, 6507.0, 3628.0, 2133.0, 1261.0, 778.0, 485.0, 307.0, 209.0, 151.0, 97.0, 65.0, 51.0, 33.0, 21.0, 18.0, 20.0, 9.0, 7.0, 6.0, 3.0, 5.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.44140625, -2.36053466796875, -2.2796630859375, -2.19879150390625, -2.117919921875, -2.03704833984375, -1.9561767578125, -1.87530517578125, -1.79443359375, -1.71356201171875, -1.6326904296875, -1.55181884765625, -1.470947265625, -1.39007568359375, -1.3092041015625, -1.22833251953125, -1.1474609375, -1.06658935546875, -0.9857177734375, -0.90484619140625, -0.823974609375, -0.74310302734375, -0.6622314453125, -0.58135986328125, -0.50048828125, -0.41961669921875, -0.3387451171875, -0.25787353515625, -0.177001953125, -0.09613037109375, -0.0152587890625, 0.06561279296875, 0.146484375, 0.22735595703125, 0.3082275390625, 0.38909912109375, 0.469970703125, 0.55084228515625, 0.6317138671875, 0.71258544921875, 0.79345703125, 0.87432861328125, 0.9552001953125, 1.03607177734375, 1.116943359375, 1.19781494140625, 1.2786865234375, 1.35955810546875, 1.4404296875, 1.52130126953125, 1.6021728515625, 1.68304443359375, 1.763916015625, 1.84478759765625, 1.9256591796875, 2.00653076171875, 2.08740234375, 2.16827392578125, 2.2491455078125, 2.33001708984375, 2.410888671875, 2.49176025390625, 2.5726318359375, 2.65350341796875, 2.734375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 5.0, 13.0, 6.0, 14.0, 14.0, 15.0, 15.0, 17.0, 22.0, 24.0, 24.0, 26.0, 24.0, 22.0, 37.0, 36.0, 50.0, 66.0, 89.0, 305.0, 1569.0, 138.0, 70.0, 42.0, 46.0, 36.0, 40.0, 34.0, 27.0, 35.0, 27.0, 14.0, 24.0, 21.0, 12.0, 11.0, 12.0, 11.0, 7.0, 7.0, 2.0, 8.0, 6.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-11.4375, -11.0819091796875, -10.726318359375, -10.3707275390625, -10.01513671875, -9.6595458984375, -9.303955078125, -8.9483642578125, -8.5927734375, -8.2371826171875, -7.881591796875, -7.5260009765625, -7.17041015625, -6.8148193359375, -6.459228515625, -6.1036376953125, -5.748046875, -5.3924560546875, -5.036865234375, -4.6812744140625, -4.32568359375, -3.9700927734375, -3.614501953125, -3.2589111328125, -2.9033203125, -2.5477294921875, -2.192138671875, -1.8365478515625, -1.48095703125, -1.1253662109375, -0.769775390625, -0.4141845703125, -0.05859375, 0.2969970703125, 0.652587890625, 1.0081787109375, 1.36376953125, 1.7193603515625, 2.074951171875, 2.4305419921875, 2.7861328125, 3.1417236328125, 3.497314453125, 3.8529052734375, 4.20849609375, 4.5640869140625, 4.919677734375, 5.2752685546875, 5.630859375, 5.9864501953125, 6.342041015625, 6.6976318359375, 7.05322265625, 7.4088134765625, 7.764404296875, 8.1199951171875, 8.4755859375, 8.8311767578125, 9.186767578125, 9.5423583984375, 9.89794921875, 10.2535400390625, 10.609130859375, 10.9647216796875, 11.3203125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 11.0, 10.0, 13.0, 10.0, 15.0, 24.0, 23.0, 28.0, 36.0, 49.0, 57.0, 65.0, 126.0, 195.0, 341.0, 850.0, 3553.0, 41262.0, 2915134.0, 173920.0, 7350.0, 1370.0, 472.0, 234.0, 135.0, 81.0, 61.0, 43.0, 29.0, 37.0, 19.0, 24.0, 17.0, 21.0, 13.0, 15.0, 7.0, 10.0, 6.0, 2.0, 6.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.625, -19.005615234375, -18.38623046875, -17.766845703125, -17.1474609375, -16.528076171875, -15.90869140625, -15.289306640625, -14.669921875, -14.050537109375, -13.43115234375, -12.811767578125, -12.1923828125, -11.572998046875, -10.95361328125, -10.334228515625, -9.71484375, -9.095458984375, -8.47607421875, -7.856689453125, -7.2373046875, -6.617919921875, -5.99853515625, -5.379150390625, -4.759765625, -4.140380859375, -3.52099609375, -2.901611328125, -2.2822265625, -1.662841796875, -1.04345703125, -0.424072265625, 0.1953125, 0.814697265625, 1.43408203125, 2.053466796875, 2.6728515625, 3.292236328125, 3.91162109375, 4.531005859375, 5.150390625, 5.769775390625, 6.38916015625, 7.008544921875, 7.6279296875, 8.247314453125, 8.86669921875, 9.486083984375, 10.10546875, 10.724853515625, 11.34423828125, 11.963623046875, 12.5830078125, 13.202392578125, 13.82177734375, 14.441162109375, 15.060546875, 15.679931640625, 16.29931640625, 16.918701171875, 17.5380859375, 18.157470703125, 18.77685546875, 19.396240234375, 20.015625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [2.0, 50.0, 876.0, 92.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.466377258300781, -7.657550811767578, -2.848724365234375, 1.9601020812988281, 6.768928527832031, 11.577754974365234, 16.386581420898438, 21.19540786743164, 26.004234313964844, 30.813060760498047, 35.62188720703125, 40.43071365356445, 45.239540100097656, 50.04836654663086, 54.85719299316406, 59.666019439697266, 64.47484588623047, 69.28367614746094, 74.09249877929688, 78.90132141113281, 83.71015167236328, 88.51898193359375, 93.32780456542969, 98.13662719726562, 102.9454574584961, 107.75428771972656, 112.5631103515625, 117.37193298339844, 122.1807632446289, 126.98959350585938, 131.7984161376953, 136.60723876953125, 141.41607666015625, 146.2248992919922, 151.03372192382812, 155.84255981445312, 160.65138244628906, 165.460205078125, 170.26904296875, 175.07786560058594, 179.88668823242188, 184.6955108642578, 189.50433349609375, 194.31317138671875, 199.1219940185547, 203.93081665039062, 208.73965454101562, 213.54847717285156, 218.3572998046875, 223.16612243652344, 227.97494506835938, 232.78378295898438, 237.5926055908203, 242.40142822265625, 247.21026611328125, 252.0190887451172, 256.8279113769531, 261.6367492675781, 266.445556640625, 271.25439453125, 276.063232421875, 280.8720397949219, 285.6808776855469, 290.48968505859375, 295.29852294921875]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 6.0, 4.0, 6.0, 4.0, 6.0, 8.0, 14.0, 14.0, 23.0, 22.0, 24.0, 22.0, 23.0, 17.0, 24.0, 35.0, 41.0, 39.0, 37.0, 47.0, 35.0, 38.0, 27.0, 38.0, 36.0, 40.0, 47.0, 44.0, 35.0, 38.0, 31.0, 18.0, 24.0, 29.0, 19.0, 17.0, 10.0, 6.0, 19.0, 10.0, 6.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-39.55100631713867, -38.2352294921875, -36.91945266723633, -35.603675842285156, -34.287899017333984, -32.97212219238281, -31.656347274780273, -30.3405704498291, -29.02479362487793, -27.709016799926758, -26.393239974975586, -25.077463150024414, -23.761688232421875, -22.445911407470703, -21.13013458251953, -19.81435775756836, -18.498580932617188, -17.182804107666016, -15.867027282714844, -14.551251411437988, -13.235474586486816, -11.919697761535645, -10.603921890258789, -9.288145065307617, -7.972368240356445, -6.656591415405273, -5.34081506729126, -4.025038719177246, -2.709261894226074, -1.3934850692749023, -0.07770872116088867, 1.238067626953125, 2.5538482666015625, 3.8696248531341553, 5.185401439666748, 6.501177787780762, 7.816954612731934, 9.132731437683105, 10.448507308959961, 11.764284133911133, 13.080060958862305, 14.395837783813477, 15.711614608764648, 17.02739143371582, 18.34316635131836, 19.65894317626953, 20.974720001220703, 22.290496826171875, 23.606273651123047, 24.92205047607422, 26.23782730102539, 27.553604125976562, 28.869380950927734, 30.185157775878906, 31.500932693481445, 32.81671142578125, 34.132484436035156, 35.44826126098633, 36.7640380859375, 38.07981491088867, 39.395591735839844, 40.711368560791016, 42.02714538574219, 43.342918395996094, 44.65869903564453]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 8.0, 7.0, 9.0, 9.0, 21.0, 28.0, 23.0, 34.0, 33.0, 32.0, 40.0, 42.0, 47.0, 46.0, 52.0, 51.0, 50.0, 64.0, 43.0, 38.0, 42.0, 42.0, 36.0, 36.0, 39.0, 18.0, 16.0, 16.0, 22.0, 11.0, 9.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7890625, -3.6541748046875, -3.519287109375, -3.3843994140625, -3.24951171875, -3.1146240234375, -2.979736328125, -2.8448486328125, -2.7099609375, -2.5750732421875, -2.440185546875, -2.3052978515625, -2.17041015625, -2.0355224609375, -1.900634765625, -1.7657470703125, -1.630859375, -1.4959716796875, -1.361083984375, -1.2261962890625, -1.09130859375, -0.9564208984375, -0.821533203125, -0.6866455078125, -0.5517578125, -0.4168701171875, -0.281982421875, -0.1470947265625, -0.01220703125, 0.1226806640625, 0.257568359375, 0.3924560546875, 0.52734375, 0.6622314453125, 0.797119140625, 0.9320068359375, 1.06689453125, 1.2017822265625, 1.336669921875, 1.4715576171875, 1.6064453125, 1.7413330078125, 1.876220703125, 2.0111083984375, 2.14599609375, 2.2808837890625, 2.415771484375, 2.5506591796875, 2.685546875, 2.8204345703125, 2.955322265625, 3.0902099609375, 3.22509765625, 3.3599853515625, 3.494873046875, 3.6297607421875, 3.7646484375, 3.8995361328125, 4.034423828125, 4.1693115234375, 4.30419921875, 4.4390869140625, 4.573974609375, 4.7088623046875, 4.84375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 16.0, 14.0, 14.0, 20.0, 37.0, 33.0, 52.0, 62.0, 112.0, 176.0, 430.0, 2167.0, 26105.0, 1175035.0, 2924974.0, 59764.0, 3972.0, 643.0, 224.0, 111.0, 66.0, 64.0, 42.0, 27.0, 22.0, 18.0, 10.0, 11.0, 18.0, 9.0, 6.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.4375, -18.770263671875, -18.10302734375, -17.435791015625, -16.7685546875, -16.101318359375, -15.43408203125, -14.766845703125, -14.099609375, -13.432373046875, -12.76513671875, -12.097900390625, -11.4306640625, -10.763427734375, -10.09619140625, -9.428955078125, -8.76171875, -8.094482421875, -7.42724609375, -6.760009765625, -6.0927734375, -5.425537109375, -4.75830078125, -4.091064453125, -3.423828125, -2.756591796875, -2.08935546875, -1.422119140625, -0.7548828125, -0.087646484375, 0.57958984375, 1.246826171875, 1.9140625, 2.581298828125, 3.24853515625, 3.915771484375, 4.5830078125, 5.250244140625, 5.91748046875, 6.584716796875, 7.251953125, 7.919189453125, 8.58642578125, 9.253662109375, 9.9208984375, 10.588134765625, 11.25537109375, 11.922607421875, 12.58984375, 13.257080078125, 13.92431640625, 14.591552734375, 15.2587890625, 15.926025390625, 16.59326171875, 17.260498046875, 17.927734375, 18.594970703125, 19.26220703125, 19.929443359375, 20.5966796875, 21.263916015625, 21.93115234375, 22.598388671875, 23.265625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 16.0, 13.0, 18.0, 21.0, 45.0, 62.0, 125.0, 148.0, 193.0, 282.0, 369.0, 511.0, 597.0, 515.0, 346.0, 259.0, 183.0, 115.0, 97.0, 52.0, 36.0, 23.0, 15.0, 10.0, 4.0, 6.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2578125, -14.8597412109375, -14.461669921875, -14.0635986328125, -13.66552734375, -13.2674560546875, -12.869384765625, -12.4713134765625, -12.0732421875, -11.6751708984375, -11.277099609375, -10.8790283203125, -10.48095703125, -10.0828857421875, -9.684814453125, -9.2867431640625, -8.888671875, -8.4906005859375, -8.092529296875, -7.6944580078125, -7.29638671875, -6.8983154296875, -6.500244140625, -6.1021728515625, -5.7041015625, -5.3060302734375, -4.907958984375, -4.5098876953125, -4.11181640625, -3.7137451171875, -3.315673828125, -2.9176025390625, -2.51953125, -2.1214599609375, -1.723388671875, -1.3253173828125, -0.92724609375, -0.5291748046875, -0.131103515625, 0.2669677734375, 0.6650390625, 1.0631103515625, 1.461181640625, 1.8592529296875, 2.25732421875, 2.6553955078125, 3.053466796875, 3.4515380859375, 3.849609375, 4.2476806640625, 4.645751953125, 5.0438232421875, 5.44189453125, 5.8399658203125, 6.238037109375, 6.6361083984375, 7.0341796875, 7.4322509765625, 7.830322265625, 8.2283935546875, 8.62646484375, 9.0245361328125, 9.422607421875, 9.8206787109375, 10.21875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 11.0, 6.0, 12.0, 16.0, 24.0, 49.0, 95.0, 113.0, 200.0, 274.0, 612.0, 2426.0, 25384.0, 800149.0, 3269726.0, 87364.0, 5637.0, 1061.0, 435.0, 259.0, 175.0, 92.0, 73.0, 30.0, 19.0, 12.0, 12.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-33.65625, -32.57763671875, -31.4990234375, -30.42041015625, -29.341796875, -28.26318359375, -27.1845703125, -26.10595703125, -25.02734375, -23.94873046875, -22.8701171875, -21.79150390625, -20.712890625, -19.63427734375, -18.5556640625, -17.47705078125, -16.3984375, -15.31982421875, -14.2412109375, -13.16259765625, -12.083984375, -11.00537109375, -9.9267578125, -8.84814453125, -7.76953125, -6.69091796875, -5.6123046875, -4.53369140625, -3.455078125, -2.37646484375, -1.2978515625, -0.21923828125, 0.859375, 1.93798828125, 3.0166015625, 4.09521484375, 5.173828125, 6.25244140625, 7.3310546875, 8.40966796875, 9.48828125, 10.56689453125, 11.6455078125, 12.72412109375, 13.802734375, 14.88134765625, 15.9599609375, 17.03857421875, 18.1171875, 19.19580078125, 20.2744140625, 21.35302734375, 22.431640625, 23.51025390625, 24.5888671875, 25.66748046875, 26.74609375, 27.82470703125, 28.9033203125, 29.98193359375, 31.060546875, 32.13916015625, 33.2177734375, 34.29638671875, 35.375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 18.0, 76.0, 207.0, 334.0, 258.0, 94.0, 20.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.193058013916016, -27.36686134338379, -22.540664672851562, -17.71446990966797, -12.888273239135742, -8.062076568603516, -3.235881805419922, 1.5903167724609375, 6.416511535644531, 11.242708206176758, 16.068904876708984, 20.895099639892578, 25.721296310424805, 30.54749298095703, 35.373687744140625, 40.199886322021484, 45.02608108520508, 49.85227584838867, 54.67847442626953, 59.504669189453125, 64.33086395263672, 69.15705871582031, 73.98326110839844, 78.80945587158203, 83.63565063476562, 88.46184539794922, 93.28804016113281, 98.11424255371094, 102.94043731689453, 107.76663208007812, 112.59282684326172, 117.41902160644531, 122.24522399902344, 127.07141876220703, 131.89761352539062, 136.72381591796875, 141.5500030517578, 146.37620544433594, 151.202392578125, 156.02859497070312, 160.85479736328125, 165.68099975585938, 170.50718688964844, 175.33338928222656, 180.15957641601562, 184.98577880859375, 189.81198120117188, 194.63816833496094, 199.46435546875, 204.29055786132812, 209.1167449951172, 213.9429473876953, 218.76913452148438, 223.5953369140625, 228.42153930664062, 233.2477264404297, 238.0739288330078, 242.90013122558594, 247.726318359375, 252.55252075195312, 257.37872314453125, 262.20489501953125, 267.0310974121094, 271.8572998046875, 276.6835021972656]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 8.0, 5.0, 9.0, 8.0, 12.0, 12.0, 15.0, 21.0, 25.0, 14.0, 29.0, 25.0, 31.0, 34.0, 40.0, 40.0, 50.0, 47.0, 32.0, 54.0, 32.0, 43.0, 36.0, 44.0, 36.0, 32.0, 28.0, 34.0, 24.0, 30.0, 25.0, 28.0, 17.0, 15.0, 11.0, 8.0, 9.0, 11.0, 9.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-39.5534782409668, -38.45800018310547, -37.36252212524414, -36.26704406738281, -35.171566009521484, -34.076087951660156, -32.980613708496094, -31.885133743286133, -30.789657592773438, -29.69417953491211, -28.59870147705078, -27.503223419189453, -26.407747268676758, -25.31226921081543, -24.2167911529541, -23.121313095092773, -22.025835037231445, -20.930356979370117, -19.83487892150879, -18.739402770996094, -17.643924713134766, -16.548446655273438, -15.45296859741211, -14.357490539550781, -13.26201343536377, -12.166535377502441, -11.07105827331543, -9.975580215454102, -8.880102157592773, -7.784625053405762, -6.689146995544434, -5.593669414520264, -4.498191833496094, -3.402714252471924, -2.307236433029175, -1.2117586135864258, -0.11628103256225586, 0.9791965484619141, 2.074674606323242, 3.170152187347412, 4.265629768371582, 5.361107349395752, 6.456584930419922, 7.55206298828125, 8.647541046142578, 9.74301815032959, 10.838496208190918, 11.93397331237793, 13.029451370239258, 14.124929428100586, 15.220406532287598, 16.31588363647461, 17.411361694335938, 18.506839752197266, 19.602317810058594, 20.697795867919922, 21.79327392578125, 22.888751983642578, 23.984230041503906, 25.079708099365234, 26.17518424987793, 27.270662307739258, 28.366140365600586, 29.461618423461914, 30.55709457397461]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 10.0, 13.0, 14.0, 21.0, 18.0, 31.0, 24.0, 25.0, 42.0, 38.0, 39.0, 38.0, 46.0, 58.0, 47.0, 44.0, 49.0, 45.0, 48.0, 59.0, 41.0, 38.0, 35.0, 25.0, 24.0, 23.0, 12.0, 19.0, 14.0, 13.0, 19.0, 8.0, 2.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.990234375, -3.850128173828125, -3.71002197265625, -3.569915771484375, -3.4298095703125, -3.289703369140625, -3.14959716796875, -3.009490966796875, -2.869384765625, -2.729278564453125, -2.58917236328125, -2.449066162109375, -2.3089599609375, -2.168853759765625, -2.02874755859375, -1.888641357421875, -1.74853515625, -1.608428955078125, -1.46832275390625, -1.328216552734375, -1.1881103515625, -1.048004150390625, -0.90789794921875, -0.767791748046875, -0.627685546875, -0.487579345703125, -0.34747314453125, -0.207366943359375, -0.0672607421875, 0.072845458984375, 0.21295166015625, 0.353057861328125, 0.4931640625, 0.633270263671875, 0.77337646484375, 0.913482666015625, 1.0535888671875, 1.193695068359375, 1.33380126953125, 1.473907470703125, 1.614013671875, 1.754119873046875, 1.89422607421875, 2.034332275390625, 2.1744384765625, 2.314544677734375, 2.45465087890625, 2.594757080078125, 2.73486328125, 2.874969482421875, 3.01507568359375, 3.155181884765625, 3.2952880859375, 3.435394287109375, 3.57550048828125, 3.715606689453125, 3.855712890625, 3.995819091796875, 4.13592529296875, 4.276031494140625, 4.4161376953125, 4.556243896484375, 4.69635009765625, 4.836456298828125, 4.9765625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 9.0, 12.0, 14.0, 22.0, 19.0, 38.0, 42.0, 66.0, 92.0, 168.0, 237.0, 327.0, 545.0, 791.0, 1244.0, 1978.0, 3238.0, 5158.0, 8337.0, 13361.0, 21904.0, 36629.0, 64206.0, 124624.0, 267932.0, 242421.0, 110389.0, 57621.0, 33523.0, 20574.0, 12413.0, 7589.0, 4799.0, 2980.0, 1906.0, 1121.0, 737.0, 506.0, 303.0, 203.0, 142.0, 106.0, 78.0, 44.0, 34.0, 17.0, 20.0, 13.0, 6.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1658935546875, -0.16069602966308594, -0.15549850463867188, -0.1503009796142578, -0.14510345458984375, -0.1399059295654297, -0.13470840454101562, -0.12951087951660156, -0.1243133544921875, -0.11911582946777344, -0.11391830444335938, -0.10872077941894531, -0.10352325439453125, -0.09832572937011719, -0.09312820434570312, -0.08793067932128906, -0.082733154296875, -0.07753562927246094, -0.07233810424804688, -0.06714057922363281, -0.06194305419921875, -0.05674552917480469, -0.051548004150390625, -0.04635047912597656, -0.0411529541015625, -0.03595542907714844, -0.030757904052734375, -0.025560379028320312, -0.02036285400390625, -0.015165328979492188, -0.009967803955078125, -0.0047702789306640625, 0.00042724609375, 0.0056247711181640625, 0.010822296142578125, 0.016019821166992188, 0.02121734619140625, 0.026414871215820312, 0.031612396240234375, 0.03680992126464844, 0.0420074462890625, 0.04720497131347656, 0.052402496337890625, 0.05760002136230469, 0.06279754638671875, 0.06799507141113281, 0.07319259643554688, 0.07839012145996094, 0.083587646484375, 0.08878517150878906, 0.09398269653320312, 0.09918022155761719, 0.10437774658203125, 0.10957527160644531, 0.11477279663085938, 0.11997032165527344, 0.1251678466796875, 0.13036537170410156, 0.13556289672851562, 0.1407604217529297, 0.14595794677734375, 0.1511554718017578, 0.15635299682617188, 0.16155052185058594, 0.166748046875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 10.0, 6.0, 8.0, 8.0, 16.0, 19.0, 18.0, 13.0, 20.0, 29.0, 35.0, 40.0, 43.0, 37.0, 52.0, 47.0, 49.0, 1068.0, 50.0, 46.0, 31.0, 41.0, 37.0, 29.0, 34.0, 28.0, 35.0, 35.0, 30.0, 13.0, 28.0, 17.0, 9.0, 10.0, 7.0, 7.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.443359375, -2.3590087890625, -2.274658203125, -2.1903076171875, -2.10595703125, -2.0216064453125, -1.937255859375, -1.8529052734375, -1.7685546875, -1.6842041015625, -1.599853515625, -1.5155029296875, -1.43115234375, -1.3468017578125, -1.262451171875, -1.1781005859375, -1.09375, -1.0093994140625, -0.925048828125, -0.8406982421875, -0.75634765625, -0.6719970703125, -0.587646484375, -0.5032958984375, -0.4189453125, -0.3345947265625, -0.250244140625, -0.1658935546875, -0.08154296875, 0.0028076171875, 0.087158203125, 0.1715087890625, 0.255859375, 0.3402099609375, 0.424560546875, 0.5089111328125, 0.59326171875, 0.6776123046875, 0.761962890625, 0.8463134765625, 0.9306640625, 1.0150146484375, 1.099365234375, 1.1837158203125, 1.26806640625, 1.3524169921875, 1.436767578125, 1.5211181640625, 1.60546875, 1.6898193359375, 1.774169921875, 1.8585205078125, 1.94287109375, 2.0272216796875, 2.111572265625, 2.1959228515625, 2.2802734375, 2.3646240234375, 2.448974609375, 2.5333251953125, 2.61767578125, 2.7020263671875, 2.786376953125, 2.8707275390625, 2.955078125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 10.0, 10.0, 12.0, 23.0, 37.0, 35.0, 48.0, 94.0, 140.0, 196.0, 290.0, 406.0, 612.0, 987.0, 1419.0, 2188.0, 3344.0, 5470.0, 8784.0, 13887.0, 23714.0, 40505.0, 72774.0, 150522.0, 1353916.0, 203260.0, 91197.0, 49339.0, 28356.0, 16900.0, 10464.0, 6513.0, 4109.0, 2574.0, 1704.0, 1092.0, 731.0, 473.0, 312.0, 227.0, 140.0, 114.0, 70.0, 43.0, 33.0, 18.0, 17.0, 8.0, 8.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.160400390625, -0.1553363800048828, -0.15027236938476562, -0.14520835876464844, -0.14014434814453125, -0.13508033752441406, -0.13001632690429688, -0.12495231628417969, -0.1198883056640625, -0.11482429504394531, -0.10976028442382812, -0.10469627380371094, -0.09963226318359375, -0.09456825256347656, -0.08950424194335938, -0.08444023132324219, -0.079376220703125, -0.07431221008300781, -0.06924819946289062, -0.06418418884277344, -0.05912017822265625, -0.05405616760253906, -0.048992156982421875, -0.04392814636230469, -0.0388641357421875, -0.03380012512207031, -0.028736114501953125, -0.023672103881835938, -0.01860809326171875, -0.013544082641601562, -0.008480072021484375, -0.0034160614013671875, 0.00164794921875, 0.0067119598388671875, 0.011775970458984375, 0.016839981079101562, 0.02190399169921875, 0.026968002319335938, 0.032032012939453125, 0.03709602355957031, 0.0421600341796875, 0.04722404479980469, 0.052288055419921875, 0.05735206604003906, 0.06241607666015625, 0.06748008728027344, 0.07254409790039062, 0.07760810852050781, 0.082672119140625, 0.08773612976074219, 0.09280014038085938, 0.09786415100097656, 0.10292816162109375, 0.10799217224121094, 0.11305618286132812, 0.11812019348144531, 0.1231842041015625, 0.1282482147216797, 0.13331222534179688, 0.13837623596191406, 0.14344024658203125, 0.14850425720214844, 0.15356826782226562, 0.1586322784423828, 0.1636962890625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 6.0, 6.0, 8.0, 6.0, 15.0, 16.0, 19.0, 27.0, 30.0, 33.0, 34.0, 32.0, 42.0, 48.0, 48.0, 58.0, 52.0, 61.0, 51.0, 53.0, 43.0, 37.0, 51.0, 32.0, 41.0, 27.0, 24.0, 18.0, 19.0, 15.0, 11.0, 6.0, 7.0, 6.0, 5.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.562999725341797e-05, -2.493150532245636e-05, -2.423301339149475e-05, -2.3534521460533142e-05, -2.2836029529571533e-05, -2.2137537598609924e-05, -2.1439045667648315e-05, -2.0740553736686707e-05, -2.0042061805725098e-05, -1.934356987476349e-05, -1.864507794380188e-05, -1.794658601284027e-05, -1.7248094081878662e-05, -1.6549602150917053e-05, -1.5851110219955444e-05, -1.5152618288993835e-05, -1.4454126358032227e-05, -1.3755634427070618e-05, -1.3057142496109009e-05, -1.23586505651474e-05, -1.1660158634185791e-05, -1.0961666703224182e-05, -1.0263174772262573e-05, -9.564682841300964e-06, -8.866190910339355e-06, -8.167698979377747e-06, -7.469207048416138e-06, -6.770715117454529e-06, -6.07222318649292e-06, -5.373731255531311e-06, -4.675239324569702e-06, -3.976747393608093e-06, -3.2782554626464844e-06, -2.5797635316848755e-06, -1.8812716007232666e-06, -1.1827796697616577e-06, -4.842877388000488e-07, 2.1420419216156006e-07, 9.126961231231689e-07, 1.6111880540847778e-06, 2.3096799850463867e-06, 3.0081719160079956e-06, 3.7066638469696045e-06, 4.405155777931213e-06, 5.103647708892822e-06, 5.802139639854431e-06, 6.50063157081604e-06, 7.199123501777649e-06, 7.897615432739258e-06, 8.596107363700867e-06, 9.294599294662476e-06, 9.993091225624084e-06, 1.0691583156585693e-05, 1.1390075087547302e-05, 1.2088567018508911e-05, 1.278705894947052e-05, 1.3485550880432129e-05, 1.4184042811393738e-05, 1.4882534742355347e-05, 1.5581026673316956e-05, 1.6279518604278564e-05, 1.6978010535240173e-05, 1.7676502466201782e-05, 1.837499439716339e-05, 1.9073486328125e-05]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 6.0, 4.0, 8.0, 5.0, 4.0, 17.0, 9.0, 21.0, 24.0, 31.0, 47.0, 82.0, 123.0, 156.0, 260.0, 432.0, 943.0, 99004.0, 942782.0, 3031.0, 566.0, 316.0, 195.0, 129.0, 93.0, 76.0, 46.0, 29.0, 31.0, 25.0, 17.0, 14.0, 5.0, 8.0, 3.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0004944801330566406, -0.0004791431128978729, -0.0004638060927391052, -0.0004484690725803375, -0.0004331320524215698, -0.0004177950322628021, -0.0004024580121040344, -0.0003871209919452667, -0.000371783971786499, -0.0003564469516277313, -0.0003411099314689636, -0.0003257729113101959, -0.0003104358911514282, -0.0002950988709926605, -0.0002797618508338928, -0.0002644248306751251, -0.0002490878105163574, -0.00023375079035758972, -0.00021841377019882202, -0.00020307675004005432, -0.00018773972988128662, -0.00017240270972251892, -0.00015706568956375122, -0.00014172866940498352, -0.00012639164924621582, -0.00011105462908744812, -9.571760892868042e-05, -8.038058876991272e-05, -6.504356861114502e-05, -4.970654845237732e-05, -3.436952829360962e-05, -1.903250813484192e-05, -3.6954879760742188e-06, 1.1641532182693481e-05, 2.697855234146118e-05, 4.231557250022888e-05, 5.765259265899658e-05, 7.298961281776428e-05, 8.832663297653198e-05, 0.00010366365313529968, 0.00011900067329406738, 0.00013433769345283508, 0.00014967471361160278, 0.00016501173377037048, 0.00018034875392913818, 0.00019568577408790588, 0.00021102279424667358, 0.00022635981440544128, 0.00024169683456420898, 0.0002570338547229767, 0.0002723708748817444, 0.0002877078950405121, 0.0003030449151992798, 0.0003183819353580475, 0.0003337189555168152, 0.0003490559756755829, 0.0003643929958343506, 0.0003797300159931183, 0.000395067036151886, 0.0004104040563106537, 0.0004257410764694214, 0.0004410780966281891, 0.0004564151167869568, 0.0004717521369457245, 0.0004870891571044922]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 12.0, 29.0, 53.0, 89.0, 176.0, 213.0, 158.0, 137.0, 73.0, 35.0, 20.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.359965194249526e-05, -3.27078414557036e-05, -3.1816030968911946e-05, -3.092422048212029e-05, -3.0032409995328635e-05, -2.914059950853698e-05, -2.8248789021745324e-05, -2.735697853495367e-05, -2.6465168048162013e-05, -2.5573357561370358e-05, -2.4681547074578702e-05, -2.3789736587787047e-05, -2.289792610099539e-05, -2.2006115614203736e-05, -2.111430512741208e-05, -2.0222494640620425e-05, -1.933068415382877e-05, -1.8438873667037115e-05, -1.754706318024546e-05, -1.6655252693453804e-05, -1.5763442206662148e-05, -1.4871631719870493e-05, -1.3979821233078837e-05, -1.3088010746287182e-05, -1.2196200259495527e-05, -1.1304389772703871e-05, -1.0412579285912216e-05, -9.52076879912056e-06, -8.628958312328905e-06, -7.73714782553725e-06, -6.845337338745594e-06, -5.953526851953939e-06, -5.061718184151687e-06, -4.169907697360031e-06, -3.278097210568376e-06, -2.3862867237767205e-06, -1.494476236985065e-06, -6.026657501934096e-07, 2.891447365982458e-07, 1.1809552233899012e-06, 2.0727657101815566e-06, 2.964576196973212e-06, 3.8563866837648675e-06, 4.748197170556523e-06, 5.640007657348178e-06, 6.531818144139834e-06, 7.423628630931489e-06, 8.315439117723145e-06, 9.2072496045148e-06, 1.0099060091306455e-05, 1.0990870578098111e-05, 1.1882681064889766e-05, 1.2774491551681422e-05, 1.3666302038473077e-05, 1.4558112525264733e-05, 1.5449923012056388e-05, 1.6341733498848043e-05, 1.72335439856397e-05, 1.8125354472431354e-05, 1.901716495922301e-05, 1.9908975446014665e-05, 2.080078593280632e-05, 2.1692596419597976e-05, 2.258440690638963e-05, 2.3476217393181287e-05]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 7.0, 12.0, 20.0, 11.0, 25.0, 18.0, 23.0, 23.0, 33.0, 46.0, 32.0, 46.0, 43.0, 51.0, 47.0, 52.0, 43.0, 52.0, 42.0, 45.0, 36.0, 32.0, 29.0, 33.0, 23.0, 39.0, 18.0, 25.0, 26.0, 10.0, 13.0, 8.0, 7.0, 6.0, 7.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.4841556549072266e-05, -1.442059874534607e-05, -1.3999640941619873e-05, -1.3578683137893677e-05, -1.315772533416748e-05, -1.2736767530441284e-05, -1.2315809726715088e-05, -1.1894851922988892e-05, -1.1473894119262695e-05, -1.1052936315536499e-05, -1.0631978511810303e-05, -1.0211020708084106e-05, -9.79006290435791e-06, -9.369105100631714e-06, -8.948147296905518e-06, -8.527189493179321e-06, -8.106231689453125e-06, -7.685273885726929e-06, -7.264316082000732e-06, -6.843358278274536e-06, -6.42240047454834e-06, -6.0014426708221436e-06, -5.580484867095947e-06, -5.159527063369751e-06, -4.738569259643555e-06, -4.317611455917358e-06, -3.896653652191162e-06, -3.475695848464966e-06, -3.0547380447387695e-06, -2.6337802410125732e-06, -2.212822437286377e-06, -1.7918646335601807e-06, -1.3709068298339844e-06, -9.499490261077881e-07, -5.289912223815918e-07, -1.0803341865539551e-07, 3.129243850708008e-07, 7.338821887969971e-07, 1.1548399925231934e-06, 1.5757977962493896e-06, 1.996755599975586e-06, 2.4177134037017822e-06, 2.8386712074279785e-06, 3.259629011154175e-06, 3.680586814880371e-06, 4.101544618606567e-06, 4.522502422332764e-06, 4.94346022605896e-06, 5.364418029785156e-06, 5.7853758335113525e-06, 6.206333637237549e-06, 6.627291440963745e-06, 7.048249244689941e-06, 7.469207048416138e-06, 7.890164852142334e-06, 8.31112265586853e-06, 8.732080459594727e-06, 9.153038263320923e-06, 9.573996067047119e-06, 9.994953870773315e-06, 1.0415911674499512e-05, 1.0836869478225708e-05, 1.1257827281951904e-05, 1.16787850856781e-05, 1.2099742889404297e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 10.0, 13.0, 14.0, 21.0, 18.0, 31.0, 24.0, 25.0, 42.0, 38.0, 39.0, 38.0, 46.0, 58.0, 47.0, 44.0, 49.0, 45.0, 48.0, 59.0, 41.0, 38.0, 35.0, 25.0, 24.0, 23.0, 12.0, 19.0, 14.0, 13.0, 19.0, 8.0, 2.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.990234375, -3.850128173828125, -3.71002197265625, -3.569915771484375, -3.4298095703125, -3.289703369140625, -3.14959716796875, -3.009490966796875, -2.869384765625, -2.729278564453125, -2.58917236328125, -2.449066162109375, -2.3089599609375, -2.168853759765625, -2.02874755859375, -1.888641357421875, -1.74853515625, -1.608428955078125, -1.46832275390625, -1.328216552734375, -1.1881103515625, -1.048004150390625, -0.90789794921875, -0.767791748046875, -0.627685546875, -0.487579345703125, -0.34747314453125, -0.207366943359375, -0.0672607421875, 0.072845458984375, 0.21295166015625, 0.353057861328125, 0.4931640625, 0.633270263671875, 0.77337646484375, 0.913482666015625, 1.0535888671875, 1.193695068359375, 1.33380126953125, 1.473907470703125, 1.614013671875, 1.754119873046875, 1.89422607421875, 2.034332275390625, 2.1744384765625, 2.314544677734375, 2.45465087890625, 2.594757080078125, 2.73486328125, 2.874969482421875, 3.01507568359375, 3.155181884765625, 3.2952880859375, 3.435394287109375, 3.57550048828125, 3.715606689453125, 3.855712890625, 3.995819091796875, 4.13592529296875, 4.276031494140625, 4.4161376953125, 4.556243896484375, 4.69635009765625, 4.836456298828125, 4.9765625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 7.0, 6.0, 2.0, 14.0, 18.0, 22.0, 45.0, 52.0, 76.0, 136.0, 178.0, 371.0, 605.0, 1138.0, 2193.0, 4432.0, 9314.0, 24067.0, 89357.0, 531173.0, 298691.0, 54886.0, 17231.0, 7106.0, 3513.0, 1712.0, 897.0, 511.0, 267.0, 165.0, 134.0, 79.0, 45.0, 38.0, 25.0, 11.0, 11.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.59375, -3.4691162109375, -3.344482421875, -3.2198486328125, -3.09521484375, -2.9705810546875, -2.845947265625, -2.7213134765625, -2.5966796875, -2.4720458984375, -2.347412109375, -2.2227783203125, -2.09814453125, -1.9735107421875, -1.848876953125, -1.7242431640625, -1.599609375, -1.4749755859375, -1.350341796875, -1.2257080078125, -1.10107421875, -0.9764404296875, -0.851806640625, -0.7271728515625, -0.6025390625, -0.4779052734375, -0.353271484375, -0.2286376953125, -0.10400390625, 0.0206298828125, 0.145263671875, 0.2698974609375, 0.39453125, 0.5191650390625, 0.643798828125, 0.7684326171875, 0.89306640625, 1.0177001953125, 1.142333984375, 1.2669677734375, 1.3916015625, 1.5162353515625, 1.640869140625, 1.7655029296875, 1.89013671875, 2.0147705078125, 2.139404296875, 2.2640380859375, 2.388671875, 2.5133056640625, 2.637939453125, 2.7625732421875, 2.88720703125, 3.0118408203125, 3.136474609375, 3.2611083984375, 3.3857421875, 3.5103759765625, 3.635009765625, 3.7596435546875, 3.88427734375, 4.0089111328125, 4.133544921875, 4.2581787109375, 4.3828125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 3.0, 5.0, 5.0, 5.0, 11.0, 9.0, 9.0, 10.0, 12.0, 14.0, 13.0, 31.0, 15.0, 39.0, 31.0, 34.0, 33.0, 34.0, 41.0, 66.0, 60.0, 163.0, 1761.0, 157.0, 62.0, 49.0, 35.0, 49.0, 34.0, 34.0, 32.0, 21.0, 24.0, 20.0, 24.0, 20.0, 14.0, 18.0, 11.0, 10.0, 6.0, 5.0, 5.0, 5.0, 1.0, 5.0, 0.0, 2.0, 0.0, 4.0], "bins": [-14.3203125, -13.927978515625, -13.53564453125, -13.143310546875, -12.7509765625, -12.358642578125, -11.96630859375, -11.573974609375, -11.181640625, -10.789306640625, -10.39697265625, -10.004638671875, -9.6123046875, -9.219970703125, -8.82763671875, -8.435302734375, -8.04296875, -7.650634765625, -7.25830078125, -6.865966796875, -6.4736328125, -6.081298828125, -5.68896484375, -5.296630859375, -4.904296875, -4.511962890625, -4.11962890625, -3.727294921875, -3.3349609375, -2.942626953125, -2.55029296875, -2.157958984375, -1.765625, -1.373291015625, -0.98095703125, -0.588623046875, -0.1962890625, 0.196044921875, 0.58837890625, 0.980712890625, 1.373046875, 1.765380859375, 2.15771484375, 2.550048828125, 2.9423828125, 3.334716796875, 3.72705078125, 4.119384765625, 4.51171875, 4.904052734375, 5.29638671875, 5.688720703125, 6.0810546875, 6.473388671875, 6.86572265625, 7.258056640625, 7.650390625, 8.042724609375, 8.43505859375, 8.827392578125, 9.2197265625, 9.612060546875, 10.00439453125, 10.396728515625, 10.7890625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 5.0, 9.0, 12.0, 12.0, 19.0, 24.0, 35.0, 33.0, 35.0, 54.0, 77.0, 143.0, 226.0, 471.0, 1231.0, 7796.0, 1411537.0, 1713681.0, 7884.0, 1249.0, 471.0, 193.0, 142.0, 93.0, 61.0, 43.0, 44.0, 22.0, 17.0, 14.0, 9.0, 14.0, 8.0, 9.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.636474609375, -22.89794921875, -22.159423828125, -21.4208984375, -20.682373046875, -19.94384765625, -19.205322265625, -18.466796875, -17.728271484375, -16.98974609375, -16.251220703125, -15.5126953125, -14.774169921875, -14.03564453125, -13.297119140625, -12.55859375, -11.820068359375, -11.08154296875, -10.343017578125, -9.6044921875, -8.865966796875, -8.12744140625, -7.388916015625, -6.650390625, -5.911865234375, -5.17333984375, -4.434814453125, -3.6962890625, -2.957763671875, -2.21923828125, -1.480712890625, -0.7421875, -0.003662109375, 0.73486328125, 1.473388671875, 2.2119140625, 2.950439453125, 3.68896484375, 4.427490234375, 5.166015625, 5.904541015625, 6.64306640625, 7.381591796875, 8.1201171875, 8.858642578125, 9.59716796875, 10.335693359375, 11.07421875, 11.812744140625, 12.55126953125, 13.289794921875, 14.0283203125, 14.766845703125, 15.50537109375, 16.243896484375, 16.982421875, 17.720947265625, 18.45947265625, 19.197998046875, 19.9365234375, 20.675048828125, 21.41357421875, 22.152099609375, 22.890625]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 9.0, 19.0, 42.0, 90.0, 192.0, 247.0, 205.0, 132.0, 48.0, 18.0, 10.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.6290340423584, -21.80978775024414, -20.990543365478516, -20.171297073364258, -19.35205078125, -18.532806396484375, -17.713560104370117, -16.89431381225586, -16.075069427490234, -15.255824089050293, -14.436578750610352, -13.617332458496094, -12.798087120056152, -11.978841781616211, -11.159595489501953, -10.340350151062012, -9.52110481262207, -8.701859474182129, -7.882613658905029, -7.06336784362793, -6.244122505187988, -5.424877166748047, -4.605631351470947, -3.7863855361938477, -2.9671401977539062, -2.1478946208953857, -1.3286490440368652, -0.5094034671783447, 0.3098421096801758, 1.1290874481201172, 1.9483332633972168, 2.7675790786743164, 3.586824417114258, 4.406069755554199, 5.225315570831299, 6.044561386108398, 6.86380672454834, 7.683052062988281, 8.502298355102539, 9.32154369354248, 10.140789031982422, 10.960034370422363, 11.779279708862305, 12.598526000976562, 13.417771339416504, 14.237016677856445, 15.056262969970703, 15.875508308410645, 16.694753646850586, 17.513999938964844, 18.33324432373047, 19.152490615844727, 19.971736907958984, 20.79098129272461, 21.610227584838867, 22.429473876953125, 23.24871826171875, 24.067964553833008, 24.887208938598633, 25.70645523071289, 26.525699615478516, 27.344945907592773, 28.16419219970703, 28.983436584472656, 29.802682876586914]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 9.0, 12.0, 10.0, 5.0, 8.0, 4.0, 7.0, 22.0, 16.0, 33.0, 38.0, 26.0, 31.0, 41.0, 41.0, 35.0, 39.0, 37.0, 44.0, 42.0, 48.0, 47.0, 48.0, 52.0, 41.0, 34.0, 42.0, 26.0, 26.0, 28.0, 16.0, 18.0, 16.0, 12.0, 15.0, 8.0, 10.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.84524917602539, -44.43391036987305, -43.0225715637207, -41.61123275756836, -40.19989013671875, -38.788551330566406, -37.37721252441406, -35.96587371826172, -34.554534912109375, -33.14319610595703, -31.731857299804688, -30.32051658630371, -28.909177780151367, -27.497838973999023, -26.086498260498047, -24.675159454345703, -23.26382064819336, -21.852481842041016, -20.441143035888672, -19.029802322387695, -17.61846351623535, -16.207124710083008, -14.795784950256348, -13.384445190429688, -11.973106384277344, -10.561767578125, -9.15042781829834, -7.739088535308838, -6.327749252319336, -4.916409969329834, -3.505070686340332, -2.093730926513672, -0.6823883056640625, 0.7289509773254395, 2.1402902603149414, 3.5516295433044434, 4.962968826293945, 6.374308109283447, 7.785647392272949, 9.19698715209961, 10.608325958251953, 12.019664764404297, 13.431004524230957, 14.842344284057617, 16.25368309020996, 17.665021896362305, 19.07636260986328, 20.487701416015625, 21.89904022216797, 23.310379028320312, 24.721717834472656, 26.133058547973633, 27.544397354125977, 28.95573616027832, 30.367076873779297, 31.77841567993164, 33.189754486083984, 34.60109329223633, 36.01243209838867, 37.423770904541016, 38.835113525390625, 40.24645233154297, 41.65779113769531, 43.069129943847656, 44.48046875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 2.0, 3.0, 10.0, 10.0, 16.0, 22.0, 20.0, 26.0, 30.0, 38.0, 31.0, 36.0, 44.0, 34.0, 51.0, 48.0, 51.0, 51.0, 49.0, 50.0, 48.0, 52.0, 34.0, 48.0, 25.0, 24.0, 28.0, 18.0, 20.0, 15.0, 23.0, 8.0, 15.0, 5.0, 0.0, 6.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.892578125, -3.75, -3.607421875, -3.46484375, -3.322265625, -3.1796875, -3.037109375, -2.89453125, -2.751953125, -2.609375, -2.466796875, -2.32421875, -2.181640625, -2.0390625, -1.896484375, -1.75390625, -1.611328125, -1.46875, -1.326171875, -1.18359375, -1.041015625, -0.8984375, -0.755859375, -0.61328125, -0.470703125, -0.328125, -0.185546875, -0.04296875, 0.099609375, 0.2421875, 0.384765625, 0.52734375, 0.669921875, 0.8125, 0.955078125, 1.09765625, 1.240234375, 1.3828125, 1.525390625, 1.66796875, 1.810546875, 1.953125, 2.095703125, 2.23828125, 2.380859375, 2.5234375, 2.666015625, 2.80859375, 2.951171875, 3.09375, 3.236328125, 3.37890625, 3.521484375, 3.6640625, 3.806640625, 3.94921875, 4.091796875, 4.234375, 4.376953125, 4.51953125, 4.662109375, 4.8046875, 4.947265625, 5.08984375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 4.0, 8.0, 5.0, 13.0, 12.0, 12.0, 22.0, 27.0, 48.0, 65.0, 110.0, 170.0, 350.0, 841.0, 2213.0, 7878.0, 31786.0, 166443.0, 1577867.0, 2110746.0, 239598.0, 40934.0, 10057.0, 3056.0, 1003.0, 415.0, 212.0, 118.0, 83.0, 37.0, 44.0, 29.0, 25.0, 10.0, 9.0, 6.0, 8.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.703125, -8.3818359375, -8.060546875, -7.7392578125, -7.41796875, -7.0966796875, -6.775390625, -6.4541015625, -6.1328125, -5.8115234375, -5.490234375, -5.1689453125, -4.84765625, -4.5263671875, -4.205078125, -3.8837890625, -3.5625, -3.2412109375, -2.919921875, -2.5986328125, -2.27734375, -1.9560546875, -1.634765625, -1.3134765625, -0.9921875, -0.6708984375, -0.349609375, -0.0283203125, 0.29296875, 0.6142578125, 0.935546875, 1.2568359375, 1.578125, 1.8994140625, 2.220703125, 2.5419921875, 2.86328125, 3.1845703125, 3.505859375, 3.8271484375, 4.1484375, 4.4697265625, 4.791015625, 5.1123046875, 5.43359375, 5.7548828125, 6.076171875, 6.3974609375, 6.71875, 7.0400390625, 7.361328125, 7.6826171875, 8.00390625, 8.3251953125, 8.646484375, 8.9677734375, 9.2890625, 9.6103515625, 9.931640625, 10.2529296875, 10.57421875, 10.8955078125, 11.216796875, 11.5380859375, 11.859375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 3.0, 8.0, 12.0, 18.0, 24.0, 45.0, 62.0, 110.0, 147.0, 229.0, 321.0, 511.0, 595.0, 608.0, 446.0, 319.0, 212.0, 158.0, 84.0, 54.0, 30.0, 22.0, 16.0, 13.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2578125, -12.813720703125, -12.36962890625, -11.925537109375, -11.4814453125, -11.037353515625, -10.59326171875, -10.149169921875, -9.705078125, -9.260986328125, -8.81689453125, -8.372802734375, -7.9287109375, -7.484619140625, -7.04052734375, -6.596435546875, -6.15234375, -5.708251953125, -5.26416015625, -4.820068359375, -4.3759765625, -3.931884765625, -3.48779296875, -3.043701171875, -2.599609375, -2.155517578125, -1.71142578125, -1.267333984375, -0.8232421875, -0.379150390625, 0.06494140625, 0.509033203125, 0.953125, 1.397216796875, 1.84130859375, 2.285400390625, 2.7294921875, 3.173583984375, 3.61767578125, 4.061767578125, 4.505859375, 4.949951171875, 5.39404296875, 5.838134765625, 6.2822265625, 6.726318359375, 7.17041015625, 7.614501953125, 8.05859375, 8.502685546875, 8.94677734375, 9.390869140625, 9.8349609375, 10.279052734375, 10.72314453125, 11.167236328125, 11.611328125, 12.055419921875, 12.49951171875, 12.943603515625, 13.3876953125, 13.831787109375, 14.27587890625, 14.719970703125, 15.1640625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 16.0, 17.0, 18.0, 42.0, 73.0, 115.0, 211.0, 461.0, 1233.0, 5778.0, 71149.0, 3105620.0, 976140.0, 28414.0, 3287.0, 908.0, 361.0, 160.0, 125.0, 35.0, 34.0, 18.0, 22.0, 16.0, 7.0, 4.0, 3.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.703125, -23.621826171875, -22.54052734375, -21.459228515625, -20.3779296875, -19.296630859375, -18.21533203125, -17.134033203125, -16.052734375, -14.971435546875, -13.89013671875, -12.808837890625, -11.7275390625, -10.646240234375, -9.56494140625, -8.483642578125, -7.40234375, -6.321044921875, -5.23974609375, -4.158447265625, -3.0771484375, -1.995849609375, -0.91455078125, 0.166748046875, 1.248046875, 2.329345703125, 3.41064453125, 4.491943359375, 5.5732421875, 6.654541015625, 7.73583984375, 8.817138671875, 9.8984375, 10.979736328125, 12.06103515625, 13.142333984375, 14.2236328125, 15.304931640625, 16.38623046875, 17.467529296875, 18.548828125, 19.630126953125, 20.71142578125, 21.792724609375, 22.8740234375, 23.955322265625, 25.03662109375, 26.117919921875, 27.19921875, 28.280517578125, 29.36181640625, 30.443115234375, 31.5244140625, 32.605712890625, 33.68701171875, 34.768310546875, 35.849609375, 36.930908203125, 38.01220703125, 39.093505859375, 40.1748046875, 41.256103515625, 42.33740234375, 43.418701171875, 44.5]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 4.0, 20.0, 47.0, 86.0, 132.0, 178.0, 171.0, 164.0, 99.0, 51.0, 36.0, 8.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.54182052612305, -60.80144500732422, -58.061065673828125, -55.3206901550293, -52.58031463623047, -49.839935302734375, -47.09955978393555, -44.35918426513672, -41.618804931640625, -38.8784294128418, -36.1380500793457, -33.397674560546875, -30.657297134399414, -27.916919708251953, -25.176544189453125, -22.436166763305664, -19.695789337158203, -16.955411911010742, -14.215035438537598, -11.474658966064453, -8.734281539916992, -5.993904113769531, -3.253528594970703, -0.5131511688232422, 2.2272262573242188, 4.9676032066345215, 7.707980155944824, 10.448356628417969, 13.18873405456543, 15.92911148071289, 18.66948699951172, 21.40986442565918, 24.150245666503906, 26.890623092651367, 29.631000518798828, 32.371376037597656, 35.11175537109375, 37.85213088989258, 40.592506408691406, 43.3328857421875, 46.07326126098633, 48.813636779785156, 51.55401611328125, 54.29439163208008, 57.034767150878906, 59.775146484375, 62.51552200317383, 65.25589752197266, 67.99627685546875, 70.73665618896484, 73.4770278930664, 76.2174072265625, 78.9577865600586, 81.69816589355469, 84.43853759765625, 87.17891693115234, 89.91929626464844, 92.65967559814453, 95.4000473022461, 98.14042663574219, 100.88080596923828, 103.62118530273438, 106.36155700683594, 109.10193634033203, 111.8423080444336]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 11.0, 14.0, 11.0, 16.0, 16.0, 18.0, 21.0, 27.0, 28.0, 31.0, 37.0, 33.0, 42.0, 41.0, 46.0, 36.0, 41.0, 58.0, 49.0, 37.0, 47.0, 36.0, 44.0, 28.0, 28.0, 26.0, 31.0, 22.0, 17.0, 17.0, 15.0, 18.0, 13.0, 7.0, 6.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-44.178733825683594, -42.95210647583008, -41.72548294067383, -40.49885559082031, -39.27223205566406, -38.04560470581055, -36.8189811706543, -35.59235382080078, -34.36573028564453, -33.139102935791016, -31.912479400634766, -30.685853958129883, -29.459228515625, -28.232601165771484, -27.0059757232666, -25.77935028076172, -24.552722930908203, -23.32609748840332, -22.099472045898438, -20.872846603393555, -19.646221160888672, -18.419593811035156, -17.192968368530273, -15.96634292602539, -14.739717483520508, -13.513092041015625, -12.286466598510742, -11.059840202331543, -9.83321475982666, -8.606589317321777, -7.379963397979736, -6.153337478637695, -4.926708221435547, -3.700082540512085, -2.473456859588623, -1.2468311786651611, -0.02020549774169922, 1.2064199447631836, 2.4330458641052246, 3.6596717834472656, 4.886297225952148, 6.112922668457031, 7.339548587799072, 8.566174507141113, 9.792799949645996, 11.019425392150879, 12.246051788330078, 13.472677230834961, 14.699302673339844, 15.925928115844727, 17.15255355834961, 18.379179000854492, 19.605804443359375, 20.83243179321289, 22.059057235717773, 23.285682678222656, 24.51230812072754, 25.738933563232422, 26.965559005737305, 28.192184448242188, 29.418811798095703, 30.645435333251953, 31.87206268310547, 33.09868621826172, 34.325313568115234]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 3.0, 7.0, 9.0, 14.0, 19.0, 16.0, 13.0, 36.0, 28.0, 38.0, 41.0, 47.0, 44.0, 43.0, 64.0, 54.0, 45.0, 52.0, 52.0, 45.0, 42.0, 42.0, 35.0, 34.0, 32.0, 26.0, 23.0, 26.0, 17.0, 15.0, 17.0, 9.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.81640625, -4.6595458984375, -4.502685546875, -4.3458251953125, -4.18896484375, -4.0321044921875, -3.875244140625, -3.7183837890625, -3.5615234375, -3.4046630859375, -3.247802734375, -3.0909423828125, -2.93408203125, -2.7772216796875, -2.620361328125, -2.4635009765625, -2.306640625, -2.1497802734375, -1.992919921875, -1.8360595703125, -1.67919921875, -1.5223388671875, -1.365478515625, -1.2086181640625, -1.0517578125, -0.8948974609375, -0.738037109375, -0.5811767578125, -0.42431640625, -0.2674560546875, -0.110595703125, 0.0462646484375, 0.203125, 0.3599853515625, 0.516845703125, 0.6737060546875, 0.83056640625, 0.9874267578125, 1.144287109375, 1.3011474609375, 1.4580078125, 1.6148681640625, 1.771728515625, 1.9285888671875, 2.08544921875, 2.2423095703125, 2.399169921875, 2.5560302734375, 2.712890625, 2.8697509765625, 3.026611328125, 3.1834716796875, 3.34033203125, 3.4971923828125, 3.654052734375, 3.8109130859375, 3.9677734375, 4.1246337890625, 4.281494140625, 4.4383544921875, 4.59521484375, 4.7520751953125, 4.908935546875, 5.0657958984375, 5.22265625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 7.0, 4.0, 12.0, 14.0, 14.0, 33.0, 50.0, 48.0, 92.0, 133.0, 191.0, 301.0, 468.0, 758.0, 1273.0, 2178.0, 3899.0, 6771.0, 11807.0, 20980.0, 37532.0, 71589.0, 158628.0, 335750.0, 206217.0, 87886.0, 44764.0, 24610.0, 13778.0, 7833.0, 4462.0, 2598.0, 1469.0, 888.0, 528.0, 338.0, 219.0, 133.0, 89.0, 64.0, 37.0, 29.0, 33.0, 15.0, 16.0, 2.0, 7.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.2086181640625, -0.2022266387939453, -0.19583511352539062, -0.18944358825683594, -0.18305206298828125, -0.17666053771972656, -0.17026901245117188, -0.1638774871826172, -0.1574859619140625, -0.1510944366455078, -0.14470291137695312, -0.13831138610839844, -0.13191986083984375, -0.12552833557128906, -0.11913681030273438, -0.11274528503417969, -0.106353759765625, -0.09996223449707031, -0.09357070922851562, -0.08717918395996094, -0.08078765869140625, -0.07439613342285156, -0.06800460815429688, -0.06161308288574219, -0.0552215576171875, -0.04883003234863281, -0.042438507080078125, -0.03604698181152344, -0.02965545654296875, -0.023263931274414062, -0.016872406005859375, -0.010480880737304688, -0.00408935546875, 0.0023021697998046875, 0.008693695068359375, 0.015085220336914062, 0.02147674560546875, 0.027868270874023438, 0.034259796142578125, 0.04065132141113281, 0.0470428466796875, 0.05343437194824219, 0.059825897216796875, 0.06621742248535156, 0.07260894775390625, 0.07900047302246094, 0.08539199829101562, 0.09178352355957031, 0.098175048828125, 0.10456657409667969, 0.11095809936523438, 0.11734962463378906, 0.12374114990234375, 0.13013267517089844, 0.13652420043945312, 0.1429157257080078, 0.1493072509765625, 0.1556987762451172, 0.16209030151367188, 0.16848182678222656, 0.17487335205078125, 0.18126487731933594, 0.18765640258789062, 0.1940479278564453, 0.200439453125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 5.0, 3.0, 14.0, 11.0, 11.0, 10.0, 28.0, 17.0, 20.0, 31.0, 27.0, 30.0, 28.0, 29.0, 48.0, 29.0, 34.0, 33.0, 35.0, 48.0, 1061.0, 32.0, 35.0, 30.0, 38.0, 38.0, 32.0, 30.0, 25.0, 25.0, 30.0, 16.0, 18.0, 18.0, 8.0, 16.0, 13.0, 10.0, 6.0, 3.0, 12.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.30078125, -2.2281494140625, -2.155517578125, -2.0828857421875, -2.01025390625, -1.9376220703125, -1.864990234375, -1.7923583984375, -1.7197265625, -1.6470947265625, -1.574462890625, -1.5018310546875, -1.42919921875, -1.3565673828125, -1.283935546875, -1.2113037109375, -1.138671875, -1.0660400390625, -0.993408203125, -0.9207763671875, -0.84814453125, -0.7755126953125, -0.702880859375, -0.6302490234375, -0.5576171875, -0.4849853515625, -0.412353515625, -0.3397216796875, -0.26708984375, -0.1944580078125, -0.121826171875, -0.0491943359375, 0.0234375, 0.0960693359375, 0.168701171875, 0.2413330078125, 0.31396484375, 0.3865966796875, 0.459228515625, 0.5318603515625, 0.6044921875, 0.6771240234375, 0.749755859375, 0.8223876953125, 0.89501953125, 0.9676513671875, 1.040283203125, 1.1129150390625, 1.185546875, 1.2581787109375, 1.330810546875, 1.4034423828125, 1.47607421875, 1.5487060546875, 1.621337890625, 1.6939697265625, 1.7666015625, 1.8392333984375, 1.911865234375, 1.9844970703125, 2.05712890625, 2.1297607421875, 2.202392578125, 2.2750244140625, 2.34765625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 11.0, 9.0, 17.0, 24.0, 34.0, 57.0, 92.0, 121.0, 158.0, 251.0, 349.0, 514.0, 756.0, 1055.0, 1557.0, 2271.0, 3223.0, 4823.0, 7264.0, 11231.0, 17046.0, 26855.0, 43554.0, 74041.0, 142686.0, 1308004.0, 200762.0, 99982.0, 55150.0, 33670.0, 21020.0, 13367.0, 8893.0, 5857.0, 3822.0, 2657.0, 1795.0, 1275.0, 849.0, 605.0, 478.0, 296.0, 191.0, 142.0, 82.0, 66.0, 50.0, 46.0, 30.0, 11.0, 17.0, 10.0, 9.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.1478271484375, -0.1433124542236328, -0.13879776000976562, -0.13428306579589844, -0.12976837158203125, -0.12525367736816406, -0.12073898315429688, -0.11622428894042969, -0.1117095947265625, -0.10719490051269531, -0.10268020629882812, -0.09816551208496094, -0.09365081787109375, -0.08913612365722656, -0.08462142944335938, -0.08010673522949219, -0.075592041015625, -0.07107734680175781, -0.06656265258789062, -0.06204795837402344, -0.05753326416015625, -0.05301856994628906, -0.048503875732421875, -0.04398918151855469, -0.0394744873046875, -0.03495979309082031, -0.030445098876953125, -0.025930404663085938, -0.02141571044921875, -0.016901016235351562, -0.012386322021484375, -0.007871627807617188, -0.00335693359375, 0.0011577606201171875, 0.005672454833984375, 0.010187149047851562, 0.01470184326171875, 0.019216537475585938, 0.023731231689453125, 0.028245925903320312, 0.0327606201171875, 0.03727531433105469, 0.041790008544921875, 0.04630470275878906, 0.05081939697265625, 0.05533409118652344, 0.059848785400390625, 0.06436347961425781, 0.068878173828125, 0.07339286804199219, 0.07790756225585938, 0.08242225646972656, 0.08693695068359375, 0.09145164489746094, 0.09596633911132812, 0.10048103332519531, 0.1049957275390625, 0.10951042175292969, 0.11402511596679688, 0.11853981018066406, 0.12305450439453125, 0.12756919860839844, 0.13208389282226562, 0.1365985870361328, 0.14111328125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 3.0, 7.0, 11.0, 14.0, 10.0, 14.0, 25.0, 27.0, 37.0, 37.0, 52.0, 59.0, 54.0, 51.0, 67.0, 58.0, 65.0, 51.0, 69.0, 43.0, 34.0, 33.0, 25.0, 16.0, 25.0, 24.0, 18.0, 17.0, 8.0, 6.0, 6.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7120113372802734e-05, -2.624746412038803e-05, -2.5374814867973328e-05, -2.4502165615558624e-05, -2.362951636314392e-05, -2.2756867110729218e-05, -2.1884217858314514e-05, -2.101156860589981e-05, -2.0138919353485107e-05, -1.9266270101070404e-05, -1.83936208486557e-05, -1.7520971596240997e-05, -1.6648322343826294e-05, -1.577567309141159e-05, -1.4903023838996887e-05, -1.4030374586582184e-05, -1.315772533416748e-05, -1.2285076081752777e-05, -1.1412426829338074e-05, -1.053977757692337e-05, -9.667128324508667e-06, -8.794479072093964e-06, -7.92182981967926e-06, -7.049180567264557e-06, -6.1765313148498535e-06, -5.30388206243515e-06, -4.431232810020447e-06, -3.5585835576057434e-06, -2.68593430519104e-06, -1.8132850527763367e-06, -9.406358003616333e-07, -6.798654794692993e-08, 8.046627044677734e-07, 1.6773119568824768e-06, 2.54996120929718e-06, 3.4226104617118835e-06, 4.295259714126587e-06, 5.16790896654129e-06, 6.040558218955994e-06, 6.913207471370697e-06, 7.7858567237854e-06, 8.658505976200104e-06, 9.531155228614807e-06, 1.040380448102951e-05, 1.1276453733444214e-05, 1.2149102985858917e-05, 1.302175223827362e-05, 1.3894401490688324e-05, 1.4767050743103027e-05, 1.563969999551773e-05, 1.6512349247932434e-05, 1.7384998500347137e-05, 1.825764775276184e-05, 1.9130297005176544e-05, 2.0002946257591248e-05, 2.087559551000595e-05, 2.1748244762420654e-05, 2.2620894014835358e-05, 2.349354326725006e-05, 2.4366192519664764e-05, 2.5238841772079468e-05, 2.611149102449417e-05, 2.6984140276908875e-05, 2.7856789529323578e-05, 2.872943878173828e-05]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 4.0, 15.0, 13.0, 12.0, 14.0, 16.0, 26.0, 40.0, 46.0, 88.0, 112.0, 148.0, 314.0, 632.0, 4498.0, 1015618.0, 25181.0, 770.0, 375.0, 190.0, 141.0, 88.0, 58.0, 43.0, 25.0, 20.0, 21.0, 16.0, 6.0, 2.0, 6.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005731582641601562, -0.0005544424057006836, -0.0005357265472412109, -0.0005170106887817383, -0.0004982948303222656, -0.00047957897186279297, -0.0004608631134033203, -0.00044214725494384766, -0.000423431396484375, -0.00040471553802490234, -0.0003859996795654297, -0.00036728382110595703, -0.0003485679626464844, -0.0003298521041870117, -0.00031113624572753906, -0.0002924203872680664, -0.00027370452880859375, -0.0002549886703491211, -0.00023627281188964844, -0.00021755695343017578, -0.00019884109497070312, -0.00018012523651123047, -0.0001614093780517578, -0.00014269351959228516, -0.0001239776611328125, -0.00010526180267333984, -8.654594421386719e-05, -6.783008575439453e-05, -4.9114227294921875e-05, -3.039836883544922e-05, -1.1682510375976562e-05, 7.033348083496094e-06, 2.574920654296875e-05, 4.4465065002441406e-05, 6.318092346191406e-05, 8.189678192138672e-05, 0.00010061264038085938, 0.00011932849884033203, 0.0001380443572998047, 0.00015676021575927734, 0.00017547607421875, 0.00019419193267822266, 0.0002129077911376953, 0.00023162364959716797, 0.0002503395080566406, 0.0002690553665161133, 0.00028777122497558594, 0.0003064870834350586, 0.00032520294189453125, 0.0003439188003540039, 0.00036263465881347656, 0.0003813505172729492, 0.0004000663757324219, 0.00041878223419189453, 0.0004374980926513672, 0.00045621395111083984, 0.0004749298095703125, 0.0004936456680297852, 0.0005123615264892578, 0.0005310773849487305, 0.0005497932434082031, 0.0005685091018676758, 0.0005872249603271484, 0.0006059408187866211, 0.0006246566772460938]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 10.0, 15.0, 31.0, 69.0, 121.0, 175.0, 184.0, 143.0, 130.0, 70.0, 40.0, 15.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.898307896743063e-06, -7.960656148497947e-06, -7.023004855000181e-06, -6.085353561502416e-06, -5.147701813257299e-06, -4.210050065012183e-06, -3.2723987715144176e-06, -2.334747478016652e-06, -1.3970957297715358e-06, -4.5944420890009496e-07, 4.782073119713459e-07, 1.4158588328427868e-06, 2.3535103537142277e-06, 3.291162101959344e-06, 4.2288133954571094e-06, 5.166464688954875e-06, 6.104116437199991e-06, 7.0417681854451075e-06, 7.979419024195522e-06, 8.917070772440638e-06, 9.854722520685755e-06, 1.0792374268930871e-05, 1.1730026017175987e-05, 1.2667676855926402e-05, 1.3605328604171518e-05, 1.4542980352416635e-05, 1.548063119116705e-05, 1.6418283848906867e-05, 1.7355934687657282e-05, 1.82935873453971e-05, 1.9231238184147514e-05, 2.016888902289793e-05, 2.1106541680637747e-05, 2.204419251938816e-05, 2.298184517712798e-05, 2.3919496015878394e-05, 2.4857148673618212e-05, 2.5794799512368627e-05, 2.673245035111904e-05, 2.767010300885886e-05, 2.8607753847609274e-05, 2.954540468635969e-05, 3.0483057344099507e-05, 3.1420710001839325e-05, 3.2358359021600336e-05, 3.3296011679340154e-05, 3.423366433707997e-05, 3.517131335684098e-05, 3.61089660145808e-05, 3.704661867232062e-05, 3.798426769208163e-05, 3.892192034982145e-05, 3.9859573007561266e-05, 4.0797225665301085e-05, 4.1734874685062096e-05, 4.2672527342801914e-05, 4.3610176362562925e-05, 4.454782902030274e-05, 4.5485478040063754e-05, 4.642313069780357e-05, 4.736078335554339e-05, 4.82984323753044e-05, 4.923608503304422e-05, 5.017373769078404e-05, 5.1111390348523855e-05]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 2.0, 9.0, 6.0, 10.0, 5.0, 10.0, 9.0, 11.0, 15.0, 15.0, 30.0, 25.0, 23.0, 19.0, 19.0, 27.0, 30.0, 31.0, 35.0, 40.0, 38.0, 42.0, 49.0, 34.0, 38.0, 36.0, 42.0, 40.0, 30.0, 31.0, 27.0, 31.0, 26.0, 18.0, 19.0, 25.0, 14.0, 16.0, 11.0, 15.0, 5.0, 6.0, 12.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.2934207916259766e-05, -1.254398375749588e-05, -1.2153759598731995e-05, -1.1763535439968109e-05, -1.1373311281204224e-05, -1.0983087122440338e-05, -1.0592862963676453e-05, -1.0202638804912567e-05, -9.812414646148682e-06, -9.422190487384796e-06, -9.03196632862091e-06, -8.641742169857025e-06, -8.25151801109314e-06, -7.861293852329254e-06, -7.471069693565369e-06, -7.080845534801483e-06, -6.690621376037598e-06, -6.300397217273712e-06, -5.910173058509827e-06, -5.519948899745941e-06, -5.129724740982056e-06, -4.73950058221817e-06, -4.349276423454285e-06, -3.959052264690399e-06, -3.5688281059265137e-06, -3.178603947162628e-06, -2.7883797883987427e-06, -2.398155629634857e-06, -2.0079314708709717e-06, -1.6177073121070862e-06, -1.2274831533432007e-06, -8.372589945793152e-07, -4.470348358154297e-07, -5.681067705154419e-08, 3.334134817123413e-07, 7.236376404762268e-07, 1.1138617992401123e-06, 1.5040859580039978e-06, 1.8943101167678833e-06, 2.284534275531769e-06, 2.6747584342956543e-06, 3.06498259305954e-06, 3.4552067518234253e-06, 3.845430910587311e-06, 4.235655069351196e-06, 4.625879228115082e-06, 5.016103386878967e-06, 5.406327545642853e-06, 5.796551704406738e-06, 6.186775863170624e-06, 6.577000021934509e-06, 6.967224180698395e-06, 7.35744833946228e-06, 7.747672498226166e-06, 8.137896656990051e-06, 8.528120815753937e-06, 8.918344974517822e-06, 9.308569133281708e-06, 9.698793292045593e-06, 1.0089017450809479e-05, 1.0479241609573364e-05, 1.086946576833725e-05, 1.1259689927101135e-05, 1.164991408586502e-05, 1.2040138244628906e-05]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 3.0, 7.0, 9.0, 14.0, 19.0, 16.0, 13.0, 36.0, 28.0, 38.0, 41.0, 47.0, 44.0, 43.0, 64.0, 54.0, 45.0, 52.0, 52.0, 45.0, 42.0, 42.0, 35.0, 34.0, 32.0, 26.0, 23.0, 26.0, 17.0, 15.0, 17.0, 9.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.81640625, -4.6595458984375, -4.502685546875, -4.3458251953125, -4.18896484375, -4.0321044921875, -3.875244140625, -3.7183837890625, -3.5615234375, -3.4046630859375, -3.247802734375, -3.0909423828125, -2.93408203125, -2.7772216796875, -2.620361328125, -2.4635009765625, -2.306640625, -2.1497802734375, -1.992919921875, -1.8360595703125, -1.67919921875, -1.5223388671875, -1.365478515625, -1.2086181640625, -1.0517578125, -0.8948974609375, -0.738037109375, -0.5811767578125, -0.42431640625, -0.2674560546875, -0.110595703125, 0.0462646484375, 0.203125, 0.3599853515625, 0.516845703125, 0.6737060546875, 0.83056640625, 0.9874267578125, 1.144287109375, 1.3011474609375, 1.4580078125, 1.6148681640625, 1.771728515625, 1.9285888671875, 2.08544921875, 2.2423095703125, 2.399169921875, 2.5560302734375, 2.712890625, 2.8697509765625, 3.026611328125, 3.1834716796875, 3.34033203125, 3.4971923828125, 3.654052734375, 3.8109130859375, 3.9677734375, 4.1246337890625, 4.281494140625, 4.4383544921875, 4.59521484375, 4.7520751953125, 4.908935546875, 5.0657958984375, 5.22265625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 12.0, 16.0, 24.0, 37.0, 57.0, 78.0, 148.0, 181.0, 254.0, 351.0, 567.0, 850.0, 1285.0, 2056.0, 3783.0, 7391.0, 16391.0, 44132.0, 144231.0, 498899.0, 222676.0, 62314.0, 22146.0, 9313.0, 4551.0, 2509.0, 1430.0, 925.0, 581.0, 416.0, 326.0, 180.0, 145.0, 109.0, 67.0, 43.0, 23.0, 18.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.650390625, -2.563934326171875, -2.47747802734375, -2.391021728515625, -2.3045654296875, -2.218109130859375, -2.13165283203125, -2.045196533203125, -1.958740234375, -1.872283935546875, -1.78582763671875, -1.699371337890625, -1.6129150390625, -1.526458740234375, -1.44000244140625, -1.353546142578125, -1.26708984375, -1.180633544921875, -1.09417724609375, -1.007720947265625, -0.9212646484375, -0.834808349609375, -0.74835205078125, -0.661895751953125, -0.575439453125, -0.488983154296875, -0.40252685546875, -0.316070556640625, -0.2296142578125, -0.143157958984375, -0.05670166015625, 0.029754638671875, 0.1162109375, 0.202667236328125, 0.28912353515625, 0.375579833984375, 0.4620361328125, 0.548492431640625, 0.63494873046875, 0.721405029296875, 0.807861328125, 0.894317626953125, 0.98077392578125, 1.067230224609375, 1.1536865234375, 1.240142822265625, 1.32659912109375, 1.413055419921875, 1.49951171875, 1.585968017578125, 1.67242431640625, 1.758880615234375, 1.8453369140625, 1.931793212890625, 2.01824951171875, 2.104705810546875, 2.191162109375, 2.277618408203125, 2.36407470703125, 2.450531005859375, 2.5369873046875, 2.623443603515625, 2.70989990234375, 2.796356201171875, 2.8828125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 0.0, 2.0, 7.0, 8.0, 9.0, 16.0, 17.0, 25.0, 17.0, 26.0, 29.0, 25.0, 37.0, 33.0, 40.0, 31.0, 51.0, 50.0, 63.0, 308.0, 1715.0, 93.0, 67.0, 51.0, 55.0, 38.0, 44.0, 36.0, 24.0, 16.0, 24.0, 14.0, 14.0, 14.0, 7.0, 9.0, 13.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.1953125, -12.6900634765625, -12.184814453125, -11.6795654296875, -11.17431640625, -10.6690673828125, -10.163818359375, -9.6585693359375, -9.1533203125, -8.6480712890625, -8.142822265625, -7.6375732421875, -7.13232421875, -6.6270751953125, -6.121826171875, -5.6165771484375, -5.111328125, -4.6060791015625, -4.100830078125, -3.5955810546875, -3.09033203125, -2.5850830078125, -2.079833984375, -1.5745849609375, -1.0693359375, -0.5640869140625, -0.058837890625, 0.4464111328125, 0.95166015625, 1.4569091796875, 1.962158203125, 2.4674072265625, 2.97265625, 3.4779052734375, 3.983154296875, 4.4884033203125, 4.99365234375, 5.4989013671875, 6.004150390625, 6.5093994140625, 7.0146484375, 7.5198974609375, 8.025146484375, 8.5303955078125, 9.03564453125, 9.5408935546875, 10.046142578125, 10.5513916015625, 11.056640625, 11.5618896484375, 12.067138671875, 12.5723876953125, 13.07763671875, 13.5828857421875, 14.088134765625, 14.5933837890625, 15.0986328125, 15.6038818359375, 16.109130859375, 16.6143798828125, 17.11962890625, 17.6248779296875, 18.130126953125, 18.6353759765625, 19.140625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 8.0, 10.0, 9.0, 9.0, 10.0, 21.0, 18.0, 19.0, 23.0, 36.0, 37.0, 67.0, 86.0, 120.0, 208.0, 350.0, 983.0, 4066.0, 54539.0, 3047492.0, 32719.0, 3056.0, 767.0, 347.0, 190.0, 120.0, 82.0, 63.0, 42.0, 43.0, 44.0, 21.0, 17.0, 22.0, 16.0, 12.0, 8.0, 5.0, 6.0, 3.0, 0.0, 5.0, 5.0, 1.0, 0.0, 1.0], "bins": [-29.09375, -28.31640625, -27.5390625, -26.76171875, -25.984375, -25.20703125, -24.4296875, -23.65234375, -22.875, -22.09765625, -21.3203125, -20.54296875, -19.765625, -18.98828125, -18.2109375, -17.43359375, -16.65625, -15.87890625, -15.1015625, -14.32421875, -13.546875, -12.76953125, -11.9921875, -11.21484375, -10.4375, -9.66015625, -8.8828125, -8.10546875, -7.328125, -6.55078125, -5.7734375, -4.99609375, -4.21875, -3.44140625, -2.6640625, -1.88671875, -1.109375, -0.33203125, 0.4453125, 1.22265625, 2.0, 2.77734375, 3.5546875, 4.33203125, 5.109375, 5.88671875, 6.6640625, 7.44140625, 8.21875, 8.99609375, 9.7734375, 10.55078125, 11.328125, 12.10546875, 12.8828125, 13.66015625, 14.4375, 15.21484375, 15.9921875, 16.76953125, 17.546875, 18.32421875, 19.1015625, 19.87890625, 20.65625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 72.0, 518.0, 375.0, 42.0, 4.0, 1.0], "bins": [-183.222900390625, -180.16116333007812, -177.09942626953125, -174.03768920898438, -170.9759521484375, -167.91421508789062, -164.85247802734375, -161.79074096679688, -158.72900390625, -155.66726684570312, -152.60552978515625, -149.54379272460938, -146.4820556640625, -143.42031860351562, -140.35858154296875, -137.29684448242188, -134.23512268066406, -131.1733856201172, -128.1116485595703, -125.04991149902344, -121.98817443847656, -118.92644500732422, -115.86470794677734, -112.80297088623047, -109.7412338256836, -106.67949676513672, -103.61775970458984, -100.55602264404297, -97.49429321289062, -94.43255615234375, -91.37081909179688, -88.30908203125, -85.24734497070312, -82.18560791015625, -79.12387084960938, -76.0621337890625, -73.00039672851562, -69.93866729736328, -66.8769302368164, -63.81519317626953, -60.753456115722656, -57.69171905517578, -54.629981994628906, -51.5682487487793, -48.50651168823242, -45.44477462768555, -42.38304138183594, -39.32130432128906, -36.25956726074219, -33.19783020019531, -30.13609504699707, -27.074359893798828, -24.012622833251953, -20.950885772705078, -17.889150619506836, -14.827415466308594, -11.765679359436035, -8.703943252563477, -5.642207145690918, -2.5804710388183594, 0.4812650680541992, 3.543001174926758, 6.604737281799316, 9.666472434997559, 12.728209495544434]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 0.0, 5.0, 5.0, 2.0, 8.0, 8.0, 12.0, 13.0, 14.0, 17.0, 14.0, 22.0, 16.0, 25.0, 26.0, 26.0, 31.0, 31.0, 35.0, 35.0, 36.0, 34.0, 32.0, 42.0, 37.0, 49.0, 28.0, 41.0, 30.0, 29.0, 33.0, 33.0, 28.0, 33.0, 24.0, 23.0, 20.0, 25.0, 16.0, 15.0, 9.0, 8.0, 8.0, 9.0, 6.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.56866455078125, -45.13760757446289, -43.70655059814453, -42.27549362182617, -40.84443664550781, -39.41337585449219, -37.98231887817383, -36.55126190185547, -35.12020492553711, -33.68914794921875, -32.25809097290039, -30.8270320892334, -29.39597511291504, -27.96491813659668, -26.533859252929688, -25.102802276611328, -23.67174530029297, -22.24068832397461, -20.80963134765625, -19.378572463989258, -17.9475154876709, -16.51645851135254, -15.085400581359863, -13.654342651367188, -12.223285675048828, -10.792228698730469, -9.361170768737793, -7.930113315582275, -6.499055862426758, -5.06799840927124, -3.6369409561157227, -2.205883026123047, -0.7748222351074219, 0.6562352180480957, 2.0872926712036133, 3.518350124359131, 4.949407577514648, 6.380465030670166, 7.811522483825684, 9.24258041381836, 10.673637390136719, 12.104694366455078, 13.535752296447754, 14.96681022644043, 16.39786720275879, 17.82892417907715, 19.25998306274414, 20.6910400390625, 22.12209701538086, 23.55315399169922, 24.984210968017578, 26.41526985168457, 27.84632682800293, 29.27738380432129, 30.70844268798828, 32.13949966430664, 33.570556640625, 35.00161361694336, 36.43267059326172, 37.86372756958008, 39.29478454589844, 40.72584533691406, 42.15690231323242, 43.58795928955078, 45.01901626586914]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 6.0, 7.0, 6.0, 8.0, 16.0, 19.0, 20.0, 15.0, 25.0, 31.0, 43.0, 39.0, 37.0, 44.0, 61.0, 52.0, 43.0, 57.0, 49.0, 50.0, 36.0, 40.0, 45.0, 33.0, 36.0, 37.0, 20.0, 25.0, 23.0, 13.0, 18.0, 13.0, 15.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.76171875, -4.60638427734375, -4.4510498046875, -4.29571533203125, -4.140380859375, -3.98504638671875, -3.8297119140625, -3.67437744140625, -3.51904296875, -3.36370849609375, -3.2083740234375, -3.05303955078125, -2.897705078125, -2.74237060546875, -2.5870361328125, -2.43170166015625, -2.2763671875, -2.12103271484375, -1.9656982421875, -1.81036376953125, -1.655029296875, -1.49969482421875, -1.3443603515625, -1.18902587890625, -1.03369140625, -0.87835693359375, -0.7230224609375, -0.56768798828125, -0.412353515625, -0.25701904296875, -0.1016845703125, 0.05364990234375, 0.208984375, 0.36431884765625, 0.5196533203125, 0.67498779296875, 0.830322265625, 0.98565673828125, 1.1409912109375, 1.29632568359375, 1.45166015625, 1.60699462890625, 1.7623291015625, 1.91766357421875, 2.072998046875, 2.22833251953125, 2.3836669921875, 2.53900146484375, 2.6943359375, 2.84967041015625, 3.0050048828125, 3.16033935546875, 3.315673828125, 3.47100830078125, 3.6263427734375, 3.78167724609375, 3.93701171875, 4.09234619140625, 4.2476806640625, 4.40301513671875, 4.558349609375, 4.71368408203125, 4.8690185546875, 5.02435302734375, 5.1796875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 0.0, 3.0, 5.0, 8.0, 7.0, 9.0, 8.0, 15.0, 22.0, 20.0, 34.0, 38.0, 44.0, 87.0, 171.0, 475.0, 1730.0, 8597.0, 58477.0, 769120.0, 3035275.0, 283496.0, 29732.0, 5018.0, 1108.0, 337.0, 141.0, 103.0, 42.0, 29.0, 31.0, 19.0, 10.0, 19.0, 16.0, 5.0, 6.0, 7.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.006103515625, -11.56689453125, -11.127685546875, -10.6884765625, -10.249267578125, -9.81005859375, -9.370849609375, -8.931640625, -8.492431640625, -8.05322265625, -7.614013671875, -7.1748046875, -6.735595703125, -6.29638671875, -5.857177734375, -5.41796875, -4.978759765625, -4.53955078125, -4.100341796875, -3.6611328125, -3.221923828125, -2.78271484375, -2.343505859375, -1.904296875, -1.465087890625, -1.02587890625, -0.586669921875, -0.1474609375, 0.291748046875, 0.73095703125, 1.170166015625, 1.609375, 2.048583984375, 2.48779296875, 2.927001953125, 3.3662109375, 3.805419921875, 4.24462890625, 4.683837890625, 5.123046875, 5.562255859375, 6.00146484375, 6.440673828125, 6.8798828125, 7.319091796875, 7.75830078125, 8.197509765625, 8.63671875, 9.075927734375, 9.51513671875, 9.954345703125, 10.3935546875, 10.832763671875, 11.27197265625, 11.711181640625, 12.150390625, 12.589599609375, 13.02880859375, 13.468017578125, 13.9072265625, 14.346435546875, 14.78564453125, 15.224853515625, 15.6640625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 6.0, 6.0, 5.0, 13.0, 19.0, 15.0, 20.0, 44.0, 60.0, 98.0, 141.0, 238.0, 322.0, 497.0, 663.0, 632.0, 469.0, 280.0, 194.0, 134.0, 74.0, 59.0, 33.0, 25.0, 14.0, 12.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.765625, -19.292724609375, -18.81982421875, -18.346923828125, -17.8740234375, -17.401123046875, -16.92822265625, -16.455322265625, -15.982421875, -15.509521484375, -15.03662109375, -14.563720703125, -14.0908203125, -13.617919921875, -13.14501953125, -12.672119140625, -12.19921875, -11.726318359375, -11.25341796875, -10.780517578125, -10.3076171875, -9.834716796875, -9.36181640625, -8.888916015625, -8.416015625, -7.943115234375, -7.47021484375, -6.997314453125, -6.5244140625, -6.051513671875, -5.57861328125, -5.105712890625, -4.6328125, -4.159912109375, -3.68701171875, -3.214111328125, -2.7412109375, -2.268310546875, -1.79541015625, -1.322509765625, -0.849609375, -0.376708984375, 0.09619140625, 0.569091796875, 1.0419921875, 1.514892578125, 1.98779296875, 2.460693359375, 2.93359375, 3.406494140625, 3.87939453125, 4.352294921875, 4.8251953125, 5.298095703125, 5.77099609375, 6.243896484375, 6.716796875, 7.189697265625, 7.66259765625, 8.135498046875, 8.6083984375, 9.081298828125, 9.55419921875, 10.027099609375, 10.5]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 8.0, 8.0, 19.0, 23.0, 35.0, 56.0, 95.0, 125.0, 224.0, 429.0, 1299.0, 10021.0, 266267.0, 3738418.0, 167887.0, 7268.0, 1106.0, 414.0, 188.0, 135.0, 88.0, 59.0, 46.0, 23.0, 11.0, 12.0, 5.0, 10.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.46875, -31.3271484375, -30.185546875, -29.0439453125, -27.90234375, -26.7607421875, -25.619140625, -24.4775390625, -23.3359375, -22.1943359375, -21.052734375, -19.9111328125, -18.76953125, -17.6279296875, -16.486328125, -15.3447265625, -14.203125, -13.0615234375, -11.919921875, -10.7783203125, -9.63671875, -8.4951171875, -7.353515625, -6.2119140625, -5.0703125, -3.9287109375, -2.787109375, -1.6455078125, -0.50390625, 0.6376953125, 1.779296875, 2.9208984375, 4.0625, 5.2041015625, 6.345703125, 7.4873046875, 8.62890625, 9.7705078125, 10.912109375, 12.0537109375, 13.1953125, 14.3369140625, 15.478515625, 16.6201171875, 17.76171875, 18.9033203125, 20.044921875, 21.1865234375, 22.328125, 23.4697265625, 24.611328125, 25.7529296875, 26.89453125, 28.0361328125, 29.177734375, 30.3193359375, 31.4609375, 32.6025390625, 33.744140625, 34.8857421875, 36.02734375, 37.1689453125, 38.310546875, 39.4521484375, 40.59375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 16.0, 17.0, 56.0, 78.0, 116.0, 164.0, 172.0, 152.0, 92.0, 65.0, 37.0, 24.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.080894470214844, -56.57168197631836, -54.06247329711914, -51.553260803222656, -49.04405212402344, -46.53483963012695, -44.02562713623047, -41.51641845703125, -39.007205963134766, -36.49799346923828, -33.98878479003906, -31.479572296142578, -28.970361709594727, -26.461151123046875, -23.95193862915039, -21.44272804260254, -18.933517456054688, -16.424306869506836, -13.915095329284668, -11.4058837890625, -8.896673202514648, -6.387462615966797, -3.878251075744629, -1.369039535522461, 1.1401710510253906, 3.6493821144104004, 6.15859317779541, 8.667804718017578, 11.17701530456543, 13.686225891113281, 16.195438385009766, 18.704648971557617, 21.213851928710938, 23.72306251525879, 26.23227310180664, 28.741485595703125, 31.250696182250977, 33.75990676879883, 36.26911926269531, 38.77832794189453, 41.287540435791016, 43.7967529296875, 46.30596160888672, 48.8151741027832, 51.32438659667969, 53.833595275878906, 56.34280776977539, 58.852020263671875, 61.361228942871094, 63.87044143676758, 66.37965393066406, 68.88886260986328, 71.3980712890625, 73.90728759765625, 76.41649627685547, 78.92570495605469, 81.43492126464844, 83.94412994384766, 86.4533462524414, 88.96255493164062, 91.47176361083984, 93.98097229003906, 96.49018859863281, 98.99939727783203, 101.50860595703125]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 3.0, 9.0, 11.0, 15.0, 14.0, 20.0, 24.0, 27.0, 28.0, 24.0, 23.0, 34.0, 44.0, 42.0, 59.0, 44.0, 47.0, 58.0, 55.0, 42.0, 48.0, 37.0, 32.0, 35.0, 34.0, 35.0, 29.0, 21.0, 23.0, 16.0, 14.0, 14.0, 10.0, 12.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.61665344238281, -44.21318817138672, -42.809722900390625, -41.4062614440918, -40.0027961730957, -38.59933090209961, -37.19586944580078, -35.79240417480469, -34.388938903808594, -32.9854736328125, -31.58201026916504, -30.178546905517578, -28.775081634521484, -27.37161636352539, -25.96815299987793, -24.56468963623047, -23.161224365234375, -21.75775909423828, -20.35429573059082, -18.95083236694336, -17.547367095947266, -16.143901824951172, -14.740438461303711, -13.336974143981934, -11.933509826660156, -10.530045509338379, -9.126581192016602, -7.723116874694824, -6.319652557373047, -4.9161882400512695, -3.512723922729492, -2.109259605407715, -0.7057991027832031, 0.6976652145385742, 2.1011295318603516, 3.504593849182129, 4.908058166503906, 6.311522483825684, 7.714986801147461, 9.118451118469238, 10.521915435791016, 11.925379753112793, 13.32884407043457, 14.732308387756348, 16.135772705078125, 17.53923797607422, 18.94270133972168, 20.34616470336914, 21.749629974365234, 23.153095245361328, 24.55655860900879, 25.96002197265625, 27.363487243652344, 28.766952514648438, 30.1704158782959, 31.57387924194336, 32.97734451293945, 34.38080978393555, 35.784271240234375, 37.18773651123047, 38.59120178222656, 39.994667053222656, 41.39813232421875, 42.80159378051758, 44.20505905151367]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 8.0, 12.0, 8.0, 21.0, 22.0, 27.0, 36.0, 35.0, 42.0, 41.0, 53.0, 62.0, 58.0, 37.0, 51.0, 48.0, 51.0, 56.0, 37.0, 49.0, 42.0, 30.0, 23.0, 28.0, 26.0, 17.0, 18.0, 13.0, 13.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.4921875, -5.3238525390625, -5.155517578125, -4.9871826171875, -4.81884765625, -4.6505126953125, -4.482177734375, -4.3138427734375, -4.1455078125, -3.9771728515625, -3.808837890625, -3.6405029296875, -3.47216796875, -3.3038330078125, -3.135498046875, -2.9671630859375, -2.798828125, -2.6304931640625, -2.462158203125, -2.2938232421875, -2.12548828125, -1.9571533203125, -1.788818359375, -1.6204833984375, -1.4521484375, -1.2838134765625, -1.115478515625, -0.9471435546875, -0.77880859375, -0.6104736328125, -0.442138671875, -0.2738037109375, -0.10546875, 0.0628662109375, 0.231201171875, 0.3995361328125, 0.56787109375, 0.7362060546875, 0.904541015625, 1.0728759765625, 1.2412109375, 1.4095458984375, 1.577880859375, 1.7462158203125, 1.91455078125, 2.0828857421875, 2.251220703125, 2.4195556640625, 2.587890625, 2.7562255859375, 2.924560546875, 3.0928955078125, 3.26123046875, 3.4295654296875, 3.597900390625, 3.7662353515625, 3.9345703125, 4.1029052734375, 4.271240234375, 4.4395751953125, 4.60791015625, 4.7762451171875, 4.944580078125, 5.1129150390625, 5.28125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 12.0, 11.0, 15.0, 29.0, 43.0, 50.0, 99.0, 132.0, 208.0, 359.0, 577.0, 993.0, 1739.0, 2970.0, 5202.0, 9240.0, 16680.0, 31913.0, 65194.0, 154710.0, 350806.0, 228452.0, 89394.0, 41410.0, 21192.0, 11597.0, 6605.0, 3664.0, 2187.0, 1179.0, 697.0, 435.0, 265.0, 174.0, 104.0, 68.0, 44.0, 45.0, 17.0, 13.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2381591796875, -0.23087501525878906, -0.22359085083007812, -0.2163066864013672, -0.20902252197265625, -0.2017383575439453, -0.19445419311523438, -0.18717002868652344, -0.1798858642578125, -0.17260169982910156, -0.16531753540039062, -0.1580333709716797, -0.15074920654296875, -0.1434650421142578, -0.13618087768554688, -0.12889671325683594, -0.121612548828125, -0.11432838439941406, -0.10704421997070312, -0.09976005554199219, -0.09247589111328125, -0.08519172668457031, -0.07790756225585938, -0.07062339782714844, -0.0633392333984375, -0.05605506896972656, -0.048770904541015625, -0.04148674011230469, -0.03420257568359375, -0.026918411254882812, -0.019634246826171875, -0.012350082397460938, -0.00506591796875, 0.0022182464599609375, 0.009502410888671875, 0.016786575317382812, 0.02407073974609375, 0.03135490417480469, 0.038639068603515625, 0.04592323303222656, 0.0532073974609375, 0.06049156188964844, 0.06777572631835938, 0.07505989074707031, 0.08234405517578125, 0.08962821960449219, 0.09691238403320312, 0.10419654846191406, 0.111480712890625, 0.11876487731933594, 0.12604904174804688, 0.1333332061767578, 0.14061737060546875, 0.1479015350341797, 0.15518569946289062, 0.16246986389160156, 0.1697540283203125, 0.17703819274902344, 0.18432235717773438, 0.1916065216064453, 0.19889068603515625, 0.2061748504638672, 0.21345901489257812, 0.22074317932128906, 0.22802734375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 4.0, 3.0, 9.0, 9.0, 20.0, 8.0, 10.0, 16.0, 15.0, 20.0, 29.0, 27.0, 23.0, 37.0, 40.0, 46.0, 42.0, 36.0, 44.0, 1070.0, 44.0, 43.0, 38.0, 40.0, 46.0, 30.0, 40.0, 34.0, 26.0, 34.0, 25.0, 19.0, 23.0, 18.0, 12.0, 14.0, 8.0, 8.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6328125, -2.542938232421875, -2.45306396484375, -2.363189697265625, -2.2733154296875, -2.183441162109375, -2.09356689453125, -2.003692626953125, -1.913818359375, -1.823944091796875, -1.73406982421875, -1.644195556640625, -1.5543212890625, -1.464447021484375, -1.37457275390625, -1.284698486328125, -1.19482421875, -1.104949951171875, -1.01507568359375, -0.925201416015625, -0.8353271484375, -0.745452880859375, -0.65557861328125, -0.565704345703125, -0.475830078125, -0.385955810546875, -0.29608154296875, -0.206207275390625, -0.1163330078125, -0.026458740234375, 0.06341552734375, 0.153289794921875, 0.2431640625, 0.333038330078125, 0.42291259765625, 0.512786865234375, 0.6026611328125, 0.692535400390625, 0.78240966796875, 0.872283935546875, 0.962158203125, 1.052032470703125, 1.14190673828125, 1.231781005859375, 1.3216552734375, 1.411529541015625, 1.50140380859375, 1.591278076171875, 1.68115234375, 1.771026611328125, 1.86090087890625, 1.950775146484375, 2.0406494140625, 2.130523681640625, 2.22039794921875, 2.310272216796875, 2.400146484375, 2.490020751953125, 2.57989501953125, 2.669769287109375, 2.7596435546875, 2.849517822265625, 2.93939208984375, 3.029266357421875, 3.119140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 15.0, 13.0, 30.0, 29.0, 61.0, 88.0, 138.0, 169.0, 310.0, 484.0, 783.0, 1175.0, 1809.0, 3022.0, 4615.0, 7605.0, 12146.0, 20316.0, 34360.0, 61439.0, 122395.0, 1315023.0, 252141.0, 115318.0, 58419.0, 33289.0, 19851.0, 12004.0, 7317.0, 4729.0, 2865.0, 1899.0, 1196.0, 754.0, 461.0, 309.0, 199.0, 132.0, 70.0, 52.0, 31.0, 27.0, 16.0, 13.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.177978515625, -0.1724090576171875, -0.166839599609375, -0.1612701416015625, -0.15570068359375, -0.1501312255859375, -0.144561767578125, -0.1389923095703125, -0.1334228515625, -0.1278533935546875, -0.122283935546875, -0.1167144775390625, -0.11114501953125, -0.1055755615234375, -0.100006103515625, -0.0944366455078125, -0.0888671875, -0.0832977294921875, -0.077728271484375, -0.0721588134765625, -0.06658935546875, -0.0610198974609375, -0.055450439453125, -0.0498809814453125, -0.0443115234375, -0.0387420654296875, -0.033172607421875, -0.0276031494140625, -0.02203369140625, -0.0164642333984375, -0.010894775390625, -0.0053253173828125, 0.000244140625, 0.0058135986328125, 0.011383056640625, 0.0169525146484375, 0.02252197265625, 0.0280914306640625, 0.033660888671875, 0.0392303466796875, 0.0447998046875, 0.0503692626953125, 0.055938720703125, 0.0615081787109375, 0.06707763671875, 0.0726470947265625, 0.078216552734375, 0.0837860107421875, 0.08935546875, 0.0949249267578125, 0.100494384765625, 0.1060638427734375, 0.11163330078125, 0.1172027587890625, 0.122772216796875, 0.1283416748046875, 0.1339111328125, 0.1394805908203125, 0.145050048828125, 0.1506195068359375, 0.15618896484375, 0.1617584228515625, 0.167327880859375, 0.1728973388671875, 0.178466796875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 8.0, 10.0, 10.0, 9.0, 7.0, 17.0, 16.0, 31.0, 36.0, 36.0, 30.0, 38.0, 49.0, 60.0, 64.0, 69.0, 58.0, 48.0, 50.0, 53.0, 46.0, 34.0, 34.0, 36.0, 26.0, 24.0, 20.0, 16.0, 11.0, 13.0, 11.0, 9.0, 8.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6345252990722656e-05, -2.544466406106949e-05, -2.454407513141632e-05, -2.3643486201763153e-05, -2.2742897272109985e-05, -2.1842308342456818e-05, -2.094171941280365e-05, -2.0041130483150482e-05, -1.9140541553497314e-05, -1.8239952623844147e-05, -1.733936369419098e-05, -1.643877476453781e-05, -1.5538185834884644e-05, -1.4637596905231476e-05, -1.3737007975578308e-05, -1.283641904592514e-05, -1.1935830116271973e-05, -1.1035241186618805e-05, -1.0134652256965637e-05, -9.23406332731247e-06, -8.333474397659302e-06, -7.432885468006134e-06, -6.532296538352966e-06, -5.631707608699799e-06, -4.731118679046631e-06, -3.830529749393463e-06, -2.9299408197402954e-06, -2.0293518900871277e-06, -1.12876296043396e-06, -2.2817403078079224e-07, 6.724148988723755e-07, 1.5730038285255432e-06, 2.473592758178711e-06, 3.3741816878318787e-06, 4.274770617485046e-06, 5.175359547138214e-06, 6.075948476791382e-06, 6.9765374064445496e-06, 7.877126336097717e-06, 8.777715265750885e-06, 9.678304195404053e-06, 1.057889312505722e-05, 1.1479482054710388e-05, 1.2380070984363556e-05, 1.3280659914016724e-05, 1.4181248843669891e-05, 1.5081837773323059e-05, 1.5982426702976227e-05, 1.6883015632629395e-05, 1.7783604562282562e-05, 1.868419349193573e-05, 1.9584782421588898e-05, 2.0485371351242065e-05, 2.1385960280895233e-05, 2.22865492105484e-05, 2.318713814020157e-05, 2.4087727069854736e-05, 2.4988315999507904e-05, 2.5888904929161072e-05, 2.678949385881424e-05, 2.7690082788467407e-05, 2.8590671718120575e-05, 2.9491260647773743e-05, 3.039184957742691e-05, 3.129243850708008e-05]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 9.0, 12.0, 19.0, 26.0, 26.0, 36.0, 39.0, 63.0, 109.0, 165.0, 253.0, 478.0, 1626.0, 533470.0, 509344.0, 1579.0, 494.0, 254.0, 159.0, 127.0, 59.0, 56.0, 38.0, 19.0, 17.0, 16.0, 9.0, 15.0, 7.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006456375122070312, -0.0006266459822654724, -0.0006076544523239136, -0.0005886629223823547, -0.0005696713924407959, -0.0005506798624992371, -0.0005316883325576782, -0.0005126968026161194, -0.0004937052726745605, -0.0004747137427330017, -0.00045572221279144287, -0.00043673068284988403, -0.0004177391529083252, -0.00039874762296676636, -0.0003797560930252075, -0.0003607645630836487, -0.00034177303314208984, -0.000322781503200531, -0.00030378997325897217, -0.00028479844331741333, -0.0002658069133758545, -0.00024681538343429565, -0.00022782385349273682, -0.00020883232355117798, -0.00018984079360961914, -0.0001708492636680603, -0.00015185773372650146, -0.00013286620378494263, -0.00011387467384338379, -9.488314390182495e-05, -7.589161396026611e-05, -5.6900084018707275e-05, -3.790855407714844e-05, -1.89170241355896e-05, 7.450580596923828e-08, 1.9066035747528076e-05, 3.8057565689086914e-05, 5.704909563064575e-05, 7.604062557220459e-05, 9.503215551376343e-05, 0.00011402368545532227, 0.0001330152153968811, 0.00015200674533843994, 0.00017099827527999878, 0.00018998980522155762, 0.00020898133516311646, 0.0002279728651046753, 0.00024696439504623413, 0.00026595592498779297, 0.0002849474549293518, 0.00030393898487091064, 0.0003229305148124695, 0.0003419220447540283, 0.00036091357469558716, 0.000379905104637146, 0.00039889663457870483, 0.00041788816452026367, 0.0004368796944618225, 0.00045587122440338135, 0.0004748627543449402, 0.000493854284286499, 0.0005128458142280579, 0.0005318373441696167, 0.0005508288741111755, 0.0005698204040527344]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 118.0, 614.0, 262.0, 19.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002219722227891907, -0.0002178354625357315, -0.00021369870228227228, -0.00020956194202881306, -0.00020542518177535385, -0.00020128843607380986, -0.00019715167582035065, -0.00019301491556689143, -0.00018887815531343222, -0.000184741395059973, -0.00018060463480651379, -0.00017646787455305457, -0.00017233111429959536, -0.00016819435404613614, -0.00016405759379267693, -0.00015992084809113294, -0.0001557840732857585, -0.00015164731303229928, -0.00014751055277884007, -0.00014337379252538085, -0.00013923703227192163, -0.00013510027201846242, -0.0001309635117650032, -0.00012682676606345922, -0.00012269000581, -0.00011855324555654079, -0.00011441648530308157, -0.00011027972504962236, -0.00010614297207212076, -0.00010200621181866154, -9.786945156520233e-05, -9.373269131174311e-05, -8.959592378232628e-05, -8.545916352886707e-05, -8.132240327540785e-05, -7.718564302194864e-05, -7.304889004444703e-05, -6.891212979098782e-05, -6.47753695375286e-05, -6.063860928406939e-05, -5.650185630656779e-05, -5.236509605310857e-05, -4.8228339437628165e-05, -4.409157918416895e-05, -3.995482256868854e-05, -3.5818062315229326e-05, -3.168130206177011e-05, -2.75445436273003e-05, -2.3407785192830488e-05, -1.9271026758360676e-05, -1.5134267414396163e-05, -1.099750807043165e-05, -6.860749635961838e-06, -2.7239912014920264e-06, 1.4127690519671887e-06, 5.549527486437e-06, 9.686285920906812e-06, 1.3823044355376624e-05, 1.7959802789846435e-05, 2.209656304330565e-05, 2.6233321477775462e-05, 3.0370079912245274e-05, 3.450684016570449e-05, 3.8643600419163704e-05, 4.278035703464411e-05]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 2.0, 6.0, 5.0, 6.0, 6.0, 12.0, 13.0, 15.0, 14.0, 17.0, 21.0, 19.0, 20.0, 22.0, 31.0, 33.0, 34.0, 37.0, 45.0, 48.0, 47.0, 30.0, 51.0, 39.0, 34.0, 38.0, 54.0, 34.0, 33.0, 37.0, 33.0, 23.0, 23.0, 23.0, 14.0, 11.0, 11.0, 14.0, 11.0, 6.0, 10.0, 9.0, 4.0, 1.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.4960765838623047e-05, -1.4493241906166077e-05, -1.4025717973709106e-05, -1.3558194041252136e-05, -1.3090670108795166e-05, -1.2623146176338196e-05, -1.2155622243881226e-05, -1.1688098311424255e-05, -1.1220574378967285e-05, -1.0753050446510315e-05, -1.0285526514053345e-05, -9.818002581596375e-06, -9.350478649139404e-06, -8.882954716682434e-06, -8.415430784225464e-06, -7.947906851768494e-06, -7.4803829193115234e-06, -7.012858986854553e-06, -6.545335054397583e-06, -6.077811121940613e-06, -5.610287189483643e-06, -5.142763257026672e-06, -4.675239324569702e-06, -4.207715392112732e-06, -3.7401914596557617e-06, -3.2726675271987915e-06, -2.8051435947418213e-06, -2.337619662284851e-06, -1.8700957298278809e-06, -1.4025717973709106e-06, -9.350478649139404e-07, -4.675239324569702e-07, 0.0, 4.675239324569702e-07, 9.350478649139404e-07, 1.4025717973709106e-06, 1.8700957298278809e-06, 2.337619662284851e-06, 2.8051435947418213e-06, 3.2726675271987915e-06, 3.7401914596557617e-06, 4.207715392112732e-06, 4.675239324569702e-06, 5.142763257026672e-06, 5.610287189483643e-06, 6.077811121940613e-06, 6.545335054397583e-06, 7.012858986854553e-06, 7.4803829193115234e-06, 7.947906851768494e-06, 8.415430784225464e-06, 8.882954716682434e-06, 9.350478649139404e-06, 9.818002581596375e-06, 1.0285526514053345e-05, 1.0753050446510315e-05, 1.1220574378967285e-05, 1.1688098311424255e-05, 1.2155622243881226e-05, 1.2623146176338196e-05, 1.3090670108795166e-05, 1.3558194041252136e-05, 1.4025717973709106e-05, 1.4493241906166077e-05, 1.4960765838623047e-05]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 8.0, 12.0, 8.0, 21.0, 22.0, 27.0, 36.0, 35.0, 42.0, 41.0, 53.0, 62.0, 58.0, 37.0, 51.0, 48.0, 51.0, 56.0, 37.0, 49.0, 42.0, 30.0, 23.0, 28.0, 26.0, 17.0, 18.0, 13.0, 13.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.4921875, -5.3238525390625, -5.155517578125, -4.9871826171875, -4.81884765625, -4.6505126953125, -4.482177734375, -4.3138427734375, -4.1455078125, -3.9771728515625, -3.808837890625, -3.6405029296875, -3.47216796875, -3.3038330078125, -3.135498046875, -2.9671630859375, -2.798828125, -2.6304931640625, -2.462158203125, -2.2938232421875, -2.12548828125, -1.9571533203125, -1.788818359375, -1.6204833984375, -1.4521484375, -1.2838134765625, -1.115478515625, -0.9471435546875, -0.77880859375, -0.6104736328125, -0.442138671875, -0.2738037109375, -0.10546875, 0.0628662109375, 0.231201171875, 0.3995361328125, 0.56787109375, 0.7362060546875, 0.904541015625, 1.0728759765625, 1.2412109375, 1.4095458984375, 1.577880859375, 1.7462158203125, 1.91455078125, 2.0828857421875, 2.251220703125, 2.4195556640625, 2.587890625, 2.7562255859375, 2.924560546875, 3.0928955078125, 3.26123046875, 3.4295654296875, 3.597900390625, 3.7662353515625, 3.9345703125, 4.1029052734375, 4.271240234375, 4.4395751953125, 4.60791015625, 4.7762451171875, 4.944580078125, 5.1129150390625, 5.28125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 3.0, 5.0, 7.0, 8.0, 15.0, 14.0, 21.0, 21.0, 37.0, 51.0, 101.0, 99.0, 184.0, 268.0, 410.0, 640.0, 1149.0, 2016.0, 3444.0, 6195.0, 12370.0, 27644.0, 81760.0, 376214.0, 395355.0, 84875.0, 28128.0, 12468.0, 6440.0, 3570.0, 2004.0, 1189.0, 673.0, 386.0, 273.0, 161.0, 108.0, 82.0, 56.0, 34.0, 24.0, 14.0, 9.0, 6.0, 6.0, 8.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.958984375, -3.831329345703125, -3.70367431640625, -3.576019287109375, -3.4483642578125, -3.320709228515625, -3.19305419921875, -3.065399169921875, -2.937744140625, -2.810089111328125, -2.68243408203125, -2.554779052734375, -2.4271240234375, -2.299468994140625, -2.17181396484375, -2.044158935546875, -1.91650390625, -1.788848876953125, -1.66119384765625, -1.533538818359375, -1.4058837890625, -1.278228759765625, -1.15057373046875, -1.022918701171875, -0.895263671875, -0.767608642578125, -0.63995361328125, -0.512298583984375, -0.3846435546875, -0.256988525390625, -0.12933349609375, -0.001678466796875, 0.1259765625, 0.253631591796875, 0.38128662109375, 0.508941650390625, 0.6365966796875, 0.764251708984375, 0.89190673828125, 1.019561767578125, 1.147216796875, 1.274871826171875, 1.40252685546875, 1.530181884765625, 1.6578369140625, 1.785491943359375, 1.91314697265625, 2.040802001953125, 2.16845703125, 2.296112060546875, 2.42376708984375, 2.551422119140625, 2.6790771484375, 2.806732177734375, 2.93438720703125, 3.062042236328125, 3.189697265625, 3.317352294921875, 3.44500732421875, 3.572662353515625, 3.7003173828125, 3.827972412109375, 3.95562744140625, 4.083282470703125, 4.2109375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 6.0, 4.0, 8.0, 14.0, 3.0, 12.0, 12.0, 11.0, 17.0, 19.0, 16.0, 21.0, 34.0, 25.0, 26.0, 52.0, 41.0, 50.0, 49.0, 113.0, 375.0, 1559.0, 130.0, 45.0, 46.0, 39.0, 44.0, 29.0, 33.0, 22.0, 32.0, 24.0, 27.0, 16.0, 16.0, 12.0, 16.0, 14.0, 5.0, 7.0, 5.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.03125, -14.56298828125, -14.0947265625, -13.62646484375, -13.158203125, -12.68994140625, -12.2216796875, -11.75341796875, -11.28515625, -10.81689453125, -10.3486328125, -9.88037109375, -9.412109375, -8.94384765625, -8.4755859375, -8.00732421875, -7.5390625, -7.07080078125, -6.6025390625, -6.13427734375, -5.666015625, -5.19775390625, -4.7294921875, -4.26123046875, -3.79296875, -3.32470703125, -2.8564453125, -2.38818359375, -1.919921875, -1.45166015625, -0.9833984375, -0.51513671875, -0.046875, 0.42138671875, 0.8896484375, 1.35791015625, 1.826171875, 2.29443359375, 2.7626953125, 3.23095703125, 3.69921875, 4.16748046875, 4.6357421875, 5.10400390625, 5.572265625, 6.04052734375, 6.5087890625, 6.97705078125, 7.4453125, 7.91357421875, 8.3818359375, 8.85009765625, 9.318359375, 9.78662109375, 10.2548828125, 10.72314453125, 11.19140625, 11.65966796875, 12.1279296875, 12.59619140625, 13.064453125, 13.53271484375, 14.0009765625, 14.46923828125, 14.9375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 9.0, 7.0, 12.0, 22.0, 23.0, 25.0, 40.0, 50.0, 61.0, 78.0, 117.0, 195.0, 340.0, 786.0, 4473.0, 361506.0, 2767146.0, 8699.0, 1034.0, 390.0, 207.0, 119.0, 91.0, 55.0, 45.0, 34.0, 27.0, 26.0, 17.0, 9.0, 15.0, 8.0, 3.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-39.09375, -38.068115234375, -37.04248046875, -36.016845703125, -34.9912109375, -33.965576171875, -32.93994140625, -31.914306640625, -30.888671875, -29.863037109375, -28.83740234375, -27.811767578125, -26.7861328125, -25.760498046875, -24.73486328125, -23.709228515625, -22.68359375, -21.657958984375, -20.63232421875, -19.606689453125, -18.5810546875, -17.555419921875, -16.52978515625, -15.504150390625, -14.478515625, -13.452880859375, -12.42724609375, -11.401611328125, -10.3759765625, -9.350341796875, -8.32470703125, -7.299072265625, -6.2734375, -5.247802734375, -4.22216796875, -3.196533203125, -2.1708984375, -1.145263671875, -0.11962890625, 0.906005859375, 1.931640625, 2.957275390625, 3.98291015625, 5.008544921875, 6.0341796875, 7.059814453125, 8.08544921875, 9.111083984375, 10.13671875, 11.162353515625, 12.18798828125, 13.213623046875, 14.2392578125, 15.264892578125, 16.29052734375, 17.316162109375, 18.341796875, 19.367431640625, 20.39306640625, 21.418701171875, 22.4443359375, 23.469970703125, 24.49560546875, 25.521240234375, 26.546875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 722.0, 295.0, 0.0, 2.0], "bins": [-546.7039184570312, -537.720703125, -528.7374877929688, -519.7542114257812, -510.77099609375, -501.78778076171875, -492.8045654296875, -483.8213195800781, -474.8381042480469, -465.8548889160156, -456.87164306640625, -447.888427734375, -438.90521240234375, -429.9219665527344, -420.9387512207031, -411.95550537109375, -402.9722900390625, -393.98907470703125, -385.0058288574219, -376.0226135253906, -367.03936767578125, -358.05615234375, -349.07293701171875, -340.0896911621094, -331.1064758300781, -322.1232604980469, -313.1400146484375, -304.15679931640625, -295.173583984375, -286.1903381347656, -277.2071228027344, -268.223876953125, -259.24066162109375, -250.25743103027344, -241.27420043945312, -232.29098510742188, -223.30775451660156, -214.32452392578125, -205.34130859375, -196.3580780029297, -187.3748321533203, -178.3916015625, -169.40838623046875, -160.42515563964844, -151.44192504882812, -142.4586944580078, -133.4754638671875, -124.49224853515625, -115.50901794433594, -106.52578735351562, -97.54256439208984, -88.55934143066406, -79.57611083984375, -70.59288024902344, -61.609657287597656, -52.62643051147461, -43.64320373535156, -34.659976959228516, -25.67675018310547, -16.693523406982422, -7.710296630859375, 1.2729301452636719, 10.256156921386719, 19.239383697509766, 28.222610473632812]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 5.0, 8.0, 7.0, 5.0, 5.0, 14.0, 7.0, 17.0, 14.0, 25.0, 28.0, 18.0, 20.0, 17.0, 33.0, 32.0, 35.0, 42.0, 34.0, 38.0, 36.0, 49.0, 34.0, 37.0, 33.0, 33.0, 38.0, 33.0, 26.0, 36.0, 25.0, 28.0, 25.0, 30.0, 27.0, 18.0, 12.0, 15.0, 8.0, 8.0, 9.0, 7.0, 13.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.51777648925781, -42.08256912231445, -40.64736557006836, -39.212158203125, -37.776954650878906, -36.34174728393555, -34.90653991699219, -33.471336364746094, -32.0361328125, -30.600927352905273, -29.165721893310547, -27.730514526367188, -26.295310974121094, -24.860103607177734, -23.424898147583008, -21.98969268798828, -20.554485321044922, -19.119279861450195, -17.68407440185547, -16.24886703491211, -14.8136625289917, -13.378457069396973, -11.94325065612793, -10.508045196533203, -9.072839736938477, -7.63763427734375, -6.202428340911865, -4.7672224044799805, -3.332016944885254, -1.8968114852905273, -0.4616050720214844, 0.9736003875732422, 2.4088096618652344, 3.84401535987854, 5.279221057891846, 6.7144269943237305, 8.149632453918457, 9.584837913513184, 11.020044326782227, 12.455249786376953, 13.89045524597168, 15.325660705566406, 16.760866165161133, 18.19607162475586, 19.63127899169922, 21.066482543945312, 22.501689910888672, 23.9368953704834, 25.372100830078125, 26.80730628967285, 28.242511749267578, 29.677719116210938, 31.11292266845703, 32.54813003540039, 33.98333740234375, 35.418540954589844, 36.85374450683594, 38.2889518737793, 39.72415542602539, 41.15936279296875, 42.594566345214844, 44.0297737121582, 45.46498107910156, 46.900184631347656, 48.335391998291016]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 5.0, 6.0, 9.0, 8.0, 13.0, 10.0, 23.0, 28.0, 35.0, 34.0, 42.0, 41.0, 50.0, 46.0, 54.0, 48.0, 49.0, 43.0, 47.0, 58.0, 46.0, 48.0, 29.0, 35.0, 32.0, 27.0, 23.0, 25.0, 18.0, 13.0, 16.0, 14.0, 7.0, 8.0, 6.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.3828125, -5.2152099609375, -5.047607421875, -4.8800048828125, -4.71240234375, -4.5447998046875, -4.377197265625, -4.2095947265625, -4.0419921875, -3.8743896484375, -3.706787109375, -3.5391845703125, -3.37158203125, -3.2039794921875, -3.036376953125, -2.8687744140625, -2.701171875, -2.5335693359375, -2.365966796875, -2.1983642578125, -2.03076171875, -1.8631591796875, -1.695556640625, -1.5279541015625, -1.3603515625, -1.1927490234375, -1.025146484375, -0.8575439453125, -0.68994140625, -0.5223388671875, -0.354736328125, -0.1871337890625, -0.01953125, 0.1480712890625, 0.315673828125, 0.4832763671875, 0.65087890625, 0.8184814453125, 0.986083984375, 1.1536865234375, 1.3212890625, 1.4888916015625, 1.656494140625, 1.8240966796875, 1.99169921875, 2.1593017578125, 2.326904296875, 2.4945068359375, 2.662109375, 2.8297119140625, 2.997314453125, 3.1649169921875, 3.33251953125, 3.5001220703125, 3.667724609375, 3.8353271484375, 4.0029296875, 4.1705322265625, 4.338134765625, 4.5057373046875, 4.67333984375, 4.8409423828125, 5.008544921875, 5.1761474609375, 5.34375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 4.0, 12.0, 15.0, 18.0, 27.0, 29.0, 56.0, 78.0, 108.0, 178.0, 306.0, 563.0, 995.0, 2074.0, 4243.0, 9201.0, 22044.0, 57583.0, 181195.0, 774331.0, 1875407.0, 936210.0, 216984.0, 66860.0, 25597.0, 10617.0, 4795.0, 2184.0, 1082.0, 574.0, 335.0, 190.0, 127.0, 85.0, 43.0, 41.0, 26.0, 22.0, 11.0, 5.0, 7.0, 7.0, 5.0, 6.0, 1.0, 6.0, 0.0, 0.0, 1.0], "bins": [-7.609375, -7.39544677734375, -7.1815185546875, -6.96759033203125, -6.753662109375, -6.53973388671875, -6.3258056640625, -6.11187744140625, -5.89794921875, -5.68402099609375, -5.4700927734375, -5.25616455078125, -5.042236328125, -4.82830810546875, -4.6143798828125, -4.40045166015625, -4.1865234375, -3.97259521484375, -3.7586669921875, -3.54473876953125, -3.330810546875, -3.11688232421875, -2.9029541015625, -2.68902587890625, -2.47509765625, -2.26116943359375, -2.0472412109375, -1.83331298828125, -1.619384765625, -1.40545654296875, -1.1915283203125, -0.97760009765625, -0.763671875, -0.54974365234375, -0.3358154296875, -0.12188720703125, 0.092041015625, 0.30596923828125, 0.5198974609375, 0.73382568359375, 0.94775390625, 1.16168212890625, 1.3756103515625, 1.58953857421875, 1.803466796875, 2.01739501953125, 2.2313232421875, 2.44525146484375, 2.6591796875, 2.87310791015625, 3.0870361328125, 3.30096435546875, 3.514892578125, 3.72882080078125, 3.9427490234375, 4.15667724609375, 4.37060546875, 4.58453369140625, 4.7984619140625, 5.01239013671875, 5.226318359375, 5.44024658203125, 5.6541748046875, 5.86810302734375, 6.08203125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 8.0, 6.0, 11.0, 11.0, 13.0, 18.0, 19.0, 34.0, 52.0, 64.0, 93.0, 136.0, 155.0, 225.0, 316.0, 409.0, 495.0, 454.0, 412.0, 299.0, 227.0, 166.0, 141.0, 78.0, 66.0, 44.0, 30.0, 23.0, 19.0, 13.0, 12.0, 9.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.2890625, -12.9383544921875, -12.587646484375, -12.2369384765625, -11.88623046875, -11.5355224609375, -11.184814453125, -10.8341064453125, -10.4833984375, -10.1326904296875, -9.781982421875, -9.4312744140625, -9.08056640625, -8.7298583984375, -8.379150390625, -8.0284423828125, -7.677734375, -7.3270263671875, -6.976318359375, -6.6256103515625, -6.27490234375, -5.9241943359375, -5.573486328125, -5.2227783203125, -4.8720703125, -4.5213623046875, -4.170654296875, -3.8199462890625, -3.46923828125, -3.1185302734375, -2.767822265625, -2.4171142578125, -2.06640625, -1.7156982421875, -1.364990234375, -1.0142822265625, -0.66357421875, -0.3128662109375, 0.037841796875, 0.3885498046875, 0.7392578125, 1.0899658203125, 1.440673828125, 1.7913818359375, 2.14208984375, 2.4927978515625, 2.843505859375, 3.1942138671875, 3.544921875, 3.8956298828125, 4.246337890625, 4.5970458984375, 4.94775390625, 5.2984619140625, 5.649169921875, 5.9998779296875, 6.3505859375, 6.7012939453125, 7.052001953125, 7.4027099609375, 7.75341796875, 8.1041259765625, 8.454833984375, 8.8055419921875, 9.15625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 9.0, 14.0, 30.0, 43.0, 44.0, 93.0, 153.0, 329.0, 908.0, 4980.0, 72350.0, 3110685.0, 973524.0, 27344.0, 2577.0, 593.0, 240.0, 142.0, 77.0, 47.0, 30.0, 20.0, 13.0, 15.0, 7.0, 7.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.53125, -30.43798828125, -29.3447265625, -28.25146484375, -27.158203125, -26.06494140625, -24.9716796875, -23.87841796875, -22.78515625, -21.69189453125, -20.5986328125, -19.50537109375, -18.412109375, -17.31884765625, -16.2255859375, -15.13232421875, -14.0390625, -12.94580078125, -11.8525390625, -10.75927734375, -9.666015625, -8.57275390625, -7.4794921875, -6.38623046875, -5.29296875, -4.19970703125, -3.1064453125, -2.01318359375, -0.919921875, 0.17333984375, 1.2666015625, 2.35986328125, 3.453125, 4.54638671875, 5.6396484375, 6.73291015625, 7.826171875, 8.91943359375, 10.0126953125, 11.10595703125, 12.19921875, 13.29248046875, 14.3857421875, 15.47900390625, 16.572265625, 17.66552734375, 18.7587890625, 19.85205078125, 20.9453125, 22.03857421875, 23.1318359375, 24.22509765625, 25.318359375, 26.41162109375, 27.5048828125, 28.59814453125, 29.69140625, 30.78466796875, 31.8779296875, 32.97119140625, 34.064453125, 35.15771484375, 36.2509765625, 37.34423828125, 38.4375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 14.0, 35.0, 52.0, 94.0, 132.0, 154.0, 154.0, 145.0, 98.0, 63.0, 40.0, 12.0, 9.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-134.74916076660156, -132.1248779296875, -129.50059509277344, -126.87630462646484, -124.25201416015625, -121.62773132324219, -119.0034408569336, -116.37915802001953, -113.75486755371094, -111.13058471679688, -108.50629425048828, -105.88201141357422, -103.25772094726562, -100.63343811035156, -98.00914764404297, -95.3848648071289, -92.76057434082031, -90.13629150390625, -87.51200103759766, -84.8877182006836, -82.263427734375, -79.63914489746094, -77.01485443115234, -74.39057159423828, -71.76628875732422, -69.14200592041016, -66.51771545410156, -63.893428802490234, -61.269142150878906, -58.64485549926758, -56.02056884765625, -53.39628601074219, -50.77199935913086, -48.14771270751953, -45.5234260559082, -42.899139404296875, -40.27485275268555, -37.65056610107422, -35.026283264160156, -32.40199279785156, -29.777708053588867, -27.15342140197754, -24.52913475036621, -21.904850006103516, -19.280563354492188, -16.65627670288086, -14.031990051269531, -11.407703399658203, -8.783416748046875, -6.159130096435547, -3.534843921661377, -0.910557746887207, 1.713728904724121, 4.338015556335449, 6.962301254272461, 9.586587905883789, 12.210874557495117, 14.835161209106445, 17.459447860717773, 20.08373260498047, 22.708019256591797, 25.332305908203125, 27.956592559814453, 30.58087921142578, 33.20516586303711]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 0.0, 5.0, 7.0, 4.0, 9.0, 7.0, 16.0, 5.0, 14.0, 18.0, 13.0, 16.0, 20.0, 30.0, 30.0, 28.0, 32.0, 23.0, 33.0, 26.0, 39.0, 35.0, 33.0, 42.0, 38.0, 45.0, 38.0, 41.0, 34.0, 32.0, 36.0, 21.0, 38.0, 19.0, 25.0, 24.0, 17.0, 19.0, 10.0, 16.0, 12.0, 12.0, 3.0, 8.0, 8.0, 5.0, 6.0, 4.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-32.325130462646484, -31.310733795166016, -30.296337127685547, -29.28194236755371, -28.267545700073242, -27.253149032592773, -26.238754272460938, -25.22435760498047, -24.2099609375, -23.19556427001953, -22.181167602539062, -21.166772842407227, -20.152376174926758, -19.13797950744629, -18.123584747314453, -17.109188079833984, -16.094791412353516, -15.080394744873047, -14.065999031066895, -13.051603317260742, -12.037206649780273, -11.022809982299805, -10.008414268493652, -8.9940185546875, -7.979621887207031, -6.965225696563721, -5.95082950592041, -4.9364333152771, -3.922037124633789, -2.9076409339904785, -1.893244743347168, -0.8788485527038574, 0.1355438232421875, 1.149940013885498, 2.1643362045288086, 3.178732395172119, 4.19312858581543, 5.20752477645874, 6.221920967102051, 7.236317157745361, 8.250713348388672, 9.26511001586914, 10.279505729675293, 11.293901443481445, 12.308298110961914, 13.322694778442383, 14.337090492248535, 15.351486206054688, 16.365882873535156, 17.380279541015625, 18.394676208496094, 19.40907096862793, 20.4234676361084, 21.437864303588867, 22.452259063720703, 23.466655731201172, 24.48105239868164, 25.49544906616211, 26.509845733642578, 27.524240493774414, 28.538637161254883, 29.55303382873535, 30.567428588867188, 31.581825256347656, 32.596221923828125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 7.0, 7.0, 9.0, 13.0, 15.0, 16.0, 17.0, 20.0, 31.0, 38.0, 34.0, 47.0, 45.0, 46.0, 49.0, 50.0, 43.0, 44.0, 42.0, 61.0, 59.0, 31.0, 41.0, 44.0, 30.0, 24.0, 27.0, 15.0, 18.0, 17.0, 15.0, 11.0, 13.0, 5.0, 8.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.94140625, -5.77215576171875, -5.6029052734375, -5.43365478515625, -5.264404296875, -5.09515380859375, -4.9259033203125, -4.75665283203125, -4.58740234375, -4.41815185546875, -4.2489013671875, -4.07965087890625, -3.910400390625, -3.74114990234375, -3.5718994140625, -3.40264892578125, -3.2333984375, -3.06414794921875, -2.8948974609375, -2.72564697265625, -2.556396484375, -2.38714599609375, -2.2178955078125, -2.04864501953125, -1.87939453125, -1.71014404296875, -1.5408935546875, -1.37164306640625, -1.202392578125, -1.03314208984375, -0.8638916015625, -0.69464111328125, -0.525390625, -0.35614013671875, -0.1868896484375, -0.01763916015625, 0.151611328125, 0.32086181640625, 0.4901123046875, 0.65936279296875, 0.82861328125, 0.99786376953125, 1.1671142578125, 1.33636474609375, 1.505615234375, 1.67486572265625, 1.8441162109375, 2.01336669921875, 2.1826171875, 2.35186767578125, 2.5211181640625, 2.69036865234375, 2.859619140625, 3.02886962890625, 3.1981201171875, 3.36737060546875, 3.53662109375, 3.70587158203125, 3.8751220703125, 4.04437255859375, 4.213623046875, 4.38287353515625, 4.5521240234375, 4.72137451171875, 4.890625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 10.0, 16.0, 17.0, 29.0, 36.0, 82.0, 98.0, 149.0, 240.0, 399.0, 631.0, 1037.0, 1810.0, 2999.0, 5369.0, 9216.0, 16238.0, 29433.0, 58183.0, 130000.0, 305725.0, 266602.0, 109484.0, 50556.0, 26090.0, 14160.0, 8287.0, 4812.0, 2820.0, 1532.0, 962.0, 570.0, 341.0, 225.0, 143.0, 83.0, 49.0, 41.0, 30.0, 15.0, 13.0, 7.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2215576171875, -0.21414756774902344, -0.20673751831054688, -0.1993274688720703, -0.19191741943359375, -0.1845073699951172, -0.17709732055664062, -0.16968727111816406, -0.1622772216796875, -0.15486717224121094, -0.14745712280273438, -0.1400470733642578, -0.13263702392578125, -0.1252269744873047, -0.11781692504882812, -0.11040687561035156, -0.102996826171875, -0.09558677673339844, -0.08817672729492188, -0.08076667785644531, -0.07335662841796875, -0.06594657897949219, -0.058536529541015625, -0.05112648010253906, -0.0437164306640625, -0.03630638122558594, -0.028896331787109375, -0.021486282348632812, -0.01407623291015625, -0.0066661834716796875, 0.000743865966796875, 0.008153915405273438, 0.01556396484375, 0.022974014282226562, 0.030384063720703125, 0.03779411315917969, 0.04520416259765625, 0.05261421203613281, 0.060024261474609375, 0.06743431091308594, 0.0748443603515625, 0.08225440979003906, 0.08966445922851562, 0.09707450866699219, 0.10448455810546875, 0.11189460754394531, 0.11930465698242188, 0.12671470642089844, 0.134124755859375, 0.14153480529785156, 0.14894485473632812, 0.1563549041748047, 0.16376495361328125, 0.1711750030517578, 0.17858505249023438, 0.18599510192871094, 0.1934051513671875, 0.20081520080566406, 0.20822525024414062, 0.2156352996826172, 0.22304534912109375, 0.2304553985595703, 0.23786544799804688, 0.24527549743652344, 0.252685546875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 10.0, 7.0, 9.0, 12.0, 17.0, 20.0, 16.0, 11.0, 26.0, 26.0, 19.0, 22.0, 30.0, 31.0, 35.0, 38.0, 33.0, 38.0, 40.0, 50.0, 1065.0, 33.0, 43.0, 40.0, 23.0, 37.0, 28.0, 35.0, 26.0, 19.0, 24.0, 22.0, 18.0, 14.0, 15.0, 21.0, 12.0, 11.0, 9.0, 3.0, 6.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.90625, -2.821319580078125, -2.73638916015625, -2.651458740234375, -2.5665283203125, -2.481597900390625, -2.39666748046875, -2.311737060546875, -2.226806640625, -2.141876220703125, -2.05694580078125, -1.972015380859375, -1.8870849609375, -1.802154541015625, -1.71722412109375, -1.632293701171875, -1.54736328125, -1.462432861328125, -1.37750244140625, -1.292572021484375, -1.2076416015625, -1.122711181640625, -1.03778076171875, -0.952850341796875, -0.867919921875, -0.782989501953125, -0.69805908203125, -0.613128662109375, -0.5281982421875, -0.443267822265625, -0.35833740234375, -0.273406982421875, -0.1884765625, -0.103546142578125, -0.01861572265625, 0.066314697265625, 0.1512451171875, 0.236175537109375, 0.32110595703125, 0.406036376953125, 0.490966796875, 0.575897216796875, 0.66082763671875, 0.745758056640625, 0.8306884765625, 0.915618896484375, 1.00054931640625, 1.085479736328125, 1.17041015625, 1.255340576171875, 1.34027099609375, 1.425201416015625, 1.5101318359375, 1.595062255859375, 1.67999267578125, 1.764923095703125, 1.849853515625, 1.934783935546875, 2.01971435546875, 2.104644775390625, 2.1895751953125, 2.274505615234375, 2.35943603515625, 2.444366455078125, 2.529296875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 12.0, 13.0, 20.0, 38.0, 64.0, 79.0, 107.0, 129.0, 232.0, 337.0, 538.0, 721.0, 1116.0, 1582.0, 2368.0, 3528.0, 5259.0, 8238.0, 12165.0, 18990.0, 29834.0, 48575.0, 85599.0, 176021.0, 1331768.0, 162747.0, 79589.0, 45744.0, 28478.0, 18228.0, 11547.0, 7794.0, 5076.0, 3497.0, 2264.0, 1605.0, 996.0, 747.0, 477.0, 323.0, 224.0, 143.0, 100.0, 66.0, 55.0, 38.0, 23.0, 11.0, 13.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1661376953125, -0.16085433959960938, -0.15557098388671875, -0.15028762817382812, -0.1450042724609375, -0.13972091674804688, -0.13443756103515625, -0.12915420532226562, -0.123870849609375, -0.11858749389648438, -0.11330413818359375, -0.10802078247070312, -0.1027374267578125, -0.09745407104492188, -0.09217071533203125, -0.08688735961914062, -0.08160400390625, -0.07632064819335938, -0.07103729248046875, -0.06575393676757812, -0.0604705810546875, -0.055187225341796875, -0.04990386962890625, -0.044620513916015625, -0.039337158203125, -0.034053802490234375, -0.02877044677734375, -0.023487091064453125, -0.0182037353515625, -0.012920379638671875, -0.00763702392578125, -0.002353668212890625, 0.0029296875, 0.008213043212890625, 0.01349639892578125, 0.018779754638671875, 0.0240631103515625, 0.029346466064453125, 0.03462982177734375, 0.039913177490234375, 0.045196533203125, 0.050479888916015625, 0.05576324462890625, 0.061046600341796875, 0.0663299560546875, 0.07161331176757812, 0.07689666748046875, 0.08218002319335938, 0.08746337890625, 0.09274673461914062, 0.09803009033203125, 0.10331344604492188, 0.1085968017578125, 0.11388015747070312, 0.11916351318359375, 0.12444686889648438, 0.129730224609375, 0.13501358032226562, 0.14029693603515625, 0.14558029174804688, 0.1508636474609375, 0.15614700317382812, 0.16143035888671875, 0.16671371459960938, 0.1719970703125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 12.0, 12.0, 17.0, 23.0, 22.0, 26.0, 26.0, 42.0, 42.0, 53.0, 46.0, 49.0, 56.0, 53.0, 52.0, 54.0, 63.0, 44.0, 44.0, 42.0, 30.0, 36.0, 24.0, 29.0, 22.0, 16.0, 10.0, 6.0, 5.0, 8.0, 5.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2709369659423828e-05, -2.1954067051410675e-05, -2.1198764443397522e-05, -2.044346183538437e-05, -1.9688159227371216e-05, -1.8932856619358063e-05, -1.817755401134491e-05, -1.7422251403331757e-05, -1.6666948795318604e-05, -1.591164618730545e-05, -1.5156343579292297e-05, -1.4401040971279144e-05, -1.3645738363265991e-05, -1.2890435755252838e-05, -1.2135133147239685e-05, -1.1379830539226532e-05, -1.0624527931213379e-05, -9.869225323200226e-06, -9.113922715187073e-06, -8.35862010717392e-06, -7.603317499160767e-06, -6.8480148911476135e-06, -6.0927122831344604e-06, -5.337409675121307e-06, -4.582107067108154e-06, -3.826804459095001e-06, -3.071501851081848e-06, -2.316199243068695e-06, -1.560896635055542e-06, -8.055940270423889e-07, -5.029141902923584e-08, 7.050111889839172e-07, 1.4603137969970703e-06, 2.2156164050102234e-06, 2.9709190130233765e-06, 3.7262216210365295e-06, 4.481524229049683e-06, 5.236826837062836e-06, 5.992129445075989e-06, 6.747432053089142e-06, 7.502734661102295e-06, 8.258037269115448e-06, 9.013339877128601e-06, 9.768642485141754e-06, 1.0523945093154907e-05, 1.127924770116806e-05, 1.2034550309181213e-05, 1.2789852917194366e-05, 1.354515552520752e-05, 1.4300458133220673e-05, 1.5055760741233826e-05, 1.581106334924698e-05, 1.6566365957260132e-05, 1.7321668565273285e-05, 1.8076971173286438e-05, 1.883227378129959e-05, 1.9587576389312744e-05, 2.0342878997325897e-05, 2.109818160533905e-05, 2.1853484213352203e-05, 2.2608786821365356e-05, 2.336408942937851e-05, 2.4119392037391663e-05, 2.4874694645404816e-05, 2.562999725341797e-05]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 9.0, 7.0, 9.0, 6.0, 14.0, 15.0, 26.0, 25.0, 55.0, 71.0, 99.0, 168.0, 292.0, 534.0, 1576.0, 198635.0, 840444.0, 4874.0, 703.0, 351.0, 203.0, 124.0, 83.0, 66.0, 43.0, 29.0, 26.0, 16.0, 7.0, 11.0, 3.0, 9.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00046539306640625, -0.0004499778151512146, -0.0004345625638961792, -0.0004191473126411438, -0.0004037320613861084, -0.000388316810131073, -0.0003729015588760376, -0.0003574863076210022, -0.0003420710563659668, -0.0003266558051109314, -0.000311240553855896, -0.0002958253026008606, -0.0002804100513458252, -0.0002649948000907898, -0.0002495795488357544, -0.000234164297580719, -0.0002187490463256836, -0.0002033337950706482, -0.0001879185438156128, -0.0001725032925605774, -0.000157088041305542, -0.0001416727900505066, -0.0001262575387954712, -0.00011084228754043579, -9.542703628540039e-05, -8.001178503036499e-05, -6.459653377532959e-05, -4.918128252029419e-05, -3.376603126525879e-05, -1.835078001022339e-05, -2.9355287551879883e-06, 1.2479722499847412e-05, 2.7894973754882812e-05, 4.331022500991821e-05, 5.872547626495361e-05, 7.414072751998901e-05, 8.955597877502441e-05, 0.00010497123003005981, 0.00012038648128509521, 0.00013580173254013062, 0.00015121698379516602, 0.00016663223505020142, 0.00018204748630523682, 0.00019746273756027222, 0.00021287798881530762, 0.00022829324007034302, 0.00024370849132537842, 0.0002591237425804138, 0.0002745389938354492, 0.0002899542450904846, 0.00030536949634552, 0.0003207847476005554, 0.0003361999988555908, 0.0003516152501106262, 0.0003670305013656616, 0.000382445752620697, 0.0003978610038757324, 0.0004132762551307678, 0.0004286915063858032, 0.0004441067576408386, 0.000459522008895874, 0.0004749372601509094, 0.0004903525114059448, 0.0005057677626609802, 0.0005211830139160156]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 14.0, 31.0, 33.0, 52.0, 85.0, 101.0, 110.0, 132.0, 117.0, 102.0, 89.0, 54.0, 37.0, 17.0, 14.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7822463380289264e-05, -2.7118641810375266e-05, -2.6414820240461268e-05, -2.571099867054727e-05, -2.5007178919622675e-05, -2.4303357349708676e-05, -2.3599535779794678e-05, -2.289571420988068e-05, -2.219189263996668e-05, -2.1488071070052683e-05, -2.0784249500138685e-05, -2.0080427930224687e-05, -1.937660636031069e-05, -1.8672786609386094e-05, -1.7968965039472096e-05, -1.7265143469558097e-05, -1.65613218996441e-05, -1.58575003297301e-05, -1.5153678759816103e-05, -1.4449858099396806e-05, -1.3746036529482808e-05, -1.304221495956881e-05, -1.2338394299149513e-05, -1.1634572729235515e-05, -1.0930751159321517e-05, -1.0226929589407519e-05, -9.52310801949352e-06, -8.819287359074224e-06, -8.115465789160226e-06, -7.411644219246227e-06, -6.70782310407958e-06, -6.0040019889129326e-06, -5.300180418998934e-06, -4.596358849084936e-06, -3.892537733918289e-06, -3.188716391377966e-06, -2.484895048837643e-06, -1.7810737062973203e-06, -1.0772523637569975e-06, -3.7343124859035015e-07, 3.303903213236481e-07, 1.034211663863971e-06, 1.7380330064042937e-06, 2.4418543489446165e-06, 3.1456756914849393e-06, 3.8494972613989376e-06, 4.553318376565585e-06, 5.257139491732232e-06, 5.9609610616462305e-06, 6.664782631560229e-06, 7.368603746726876e-06, 8.072424861893523e-06, 8.776246431807522e-06, 9.48006800172152e-06, 1.0183888662140816e-05, 1.0887710232054815e-05, 1.1591531801968813e-05, 1.2295353371882811e-05, 1.299917494179681e-05, 1.3702995602216106e-05, 1.4406817172130104e-05, 1.5110638742044102e-05, 1.58144594024634e-05, 1.6518280972377397e-05, 1.7222102542291395e-05]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0, 5.0, 10.0, 3.0, 11.0, 15.0, 15.0, 12.0, 11.0, 23.0, 27.0, 22.0, 23.0, 44.0, 30.0, 37.0, 54.0, 38.0, 38.0, 42.0, 43.0, 37.0, 42.0, 39.0, 33.0, 46.0, 34.0, 45.0, 38.0, 33.0, 29.0, 18.0, 23.0, 22.0, 10.0, 11.0, 5.0, 10.0, 10.0, 5.0, 6.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2159347534179688e-05, -1.1750496923923492e-05, -1.1341646313667297e-05, -1.0932795703411102e-05, -1.0523945093154907e-05, -1.0115094482898712e-05, -9.706243872642517e-06, -9.297393262386322e-06, -8.888542652130127e-06, -8.479692041873932e-06, -8.070841431617737e-06, -7.661990821361542e-06, -7.253140211105347e-06, -6.844289600849152e-06, -6.4354389905929565e-06, -6.0265883803367615e-06, -5.617737770080566e-06, -5.208887159824371e-06, -4.800036549568176e-06, -4.391185939311981e-06, -3.982335329055786e-06, -3.573484718799591e-06, -3.164634108543396e-06, -2.755783498287201e-06, -2.346932888031006e-06, -1.938082277774811e-06, -1.5292316675186157e-06, -1.1203810572624207e-06, -7.115304470062256e-07, -3.026798367500305e-07, 1.0617077350616455e-07, 5.150213837623596e-07, 9.238719940185547e-07, 1.3327226042747498e-06, 1.7415732145309448e-06, 2.15042382478714e-06, 2.559274435043335e-06, 2.96812504529953e-06, 3.376975655555725e-06, 3.78582626581192e-06, 4.194676876068115e-06, 4.60352748632431e-06, 5.012378096580505e-06, 5.4212287068367004e-06, 5.8300793170928955e-06, 6.2389299273490906e-06, 6.647780537605286e-06, 7.056631147861481e-06, 7.465481758117676e-06, 7.874332368373871e-06, 8.283182978630066e-06, 8.692033588886261e-06, 9.100884199142456e-06, 9.509734809398651e-06, 9.918585419654846e-06, 1.0327436029911041e-05, 1.0736286640167236e-05, 1.1145137250423431e-05, 1.1553987860679626e-05, 1.1962838470935822e-05, 1.2371689081192017e-05, 1.2780539691448212e-05, 1.3189390301704407e-05, 1.3598240911960602e-05, 1.4007091522216797e-05]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 7.0, 7.0, 9.0, 13.0, 15.0, 16.0, 17.0, 20.0, 31.0, 38.0, 34.0, 47.0, 45.0, 46.0, 49.0, 50.0, 43.0, 44.0, 42.0, 61.0, 59.0, 31.0, 41.0, 44.0, 30.0, 24.0, 27.0, 15.0, 18.0, 17.0, 15.0, 11.0, 13.0, 5.0, 8.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.94140625, -5.77215576171875, -5.6029052734375, -5.43365478515625, -5.264404296875, -5.09515380859375, -4.9259033203125, -4.75665283203125, -4.58740234375, -4.41815185546875, -4.2489013671875, -4.07965087890625, -3.910400390625, -3.74114990234375, -3.5718994140625, -3.40264892578125, -3.2333984375, -3.06414794921875, -2.8948974609375, -2.72564697265625, -2.556396484375, -2.38714599609375, -2.2178955078125, -2.04864501953125, -1.87939453125, -1.71014404296875, -1.5408935546875, -1.37164306640625, -1.202392578125, -1.03314208984375, -0.8638916015625, -0.69464111328125, -0.525390625, -0.35614013671875, -0.1868896484375, -0.01763916015625, 0.151611328125, 0.32086181640625, 0.4901123046875, 0.65936279296875, 0.82861328125, 0.99786376953125, 1.1671142578125, 1.33636474609375, 1.505615234375, 1.67486572265625, 1.8441162109375, 2.01336669921875, 2.1826171875, 2.35186767578125, 2.5211181640625, 2.69036865234375, 2.859619140625, 3.02886962890625, 3.1981201171875, 3.36737060546875, 3.53662109375, 3.70587158203125, 3.8751220703125, 4.04437255859375, 4.213623046875, 4.38287353515625, 4.5521240234375, 4.72137451171875, 4.890625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 4.0, 9.0, 10.0, 13.0, 32.0, 27.0, 49.0, 56.0, 84.0, 163.0, 211.0, 313.0, 526.0, 865.0, 1209.0, 2031.0, 3387.0, 5469.0, 9312.0, 17165.0, 37075.0, 105421.0, 435916.0, 290456.0, 75054.0, 28982.0, 14316.0, 7957.0, 4693.0, 2788.0, 1733.0, 1129.0, 739.0, 454.0, 286.0, 204.0, 136.0, 84.0, 67.0, 43.0, 24.0, 16.0, 14.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.81640625, -3.70367431640625, -3.5909423828125, -3.47821044921875, -3.365478515625, -3.25274658203125, -3.1400146484375, -3.02728271484375, -2.91455078125, -2.80181884765625, -2.6890869140625, -2.57635498046875, -2.463623046875, -2.35089111328125, -2.2381591796875, -2.12542724609375, -2.0126953125, -1.89996337890625, -1.7872314453125, -1.67449951171875, -1.561767578125, -1.44903564453125, -1.3363037109375, -1.22357177734375, -1.11083984375, -0.99810791015625, -0.8853759765625, -0.77264404296875, -0.659912109375, -0.54718017578125, -0.4344482421875, -0.32171630859375, -0.208984375, -0.09625244140625, 0.0164794921875, 0.12921142578125, 0.241943359375, 0.35467529296875, 0.4674072265625, 0.58013916015625, 0.69287109375, 0.80560302734375, 0.9183349609375, 1.03106689453125, 1.143798828125, 1.25653076171875, 1.3692626953125, 1.48199462890625, 1.5947265625, 1.70745849609375, 1.8201904296875, 1.93292236328125, 2.045654296875, 2.15838623046875, 2.2711181640625, 2.38385009765625, 2.49658203125, 2.60931396484375, 2.7220458984375, 2.83477783203125, 2.947509765625, 3.06024169921875, 3.1729736328125, 3.28570556640625, 3.3984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 6.0, 8.0, 9.0, 11.0, 14.0, 14.0, 13.0, 23.0, 19.0, 21.0, 25.0, 25.0, 24.0, 31.0, 40.0, 29.0, 39.0, 66.0, 56.0, 142.0, 1661.0, 230.0, 78.0, 55.0, 49.0, 37.0, 40.0, 47.0, 32.0, 27.0, 25.0, 22.0, 13.0, 19.0, 15.0, 14.0, 12.0, 18.0, 6.0, 6.0, 8.0, 5.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.421875, -14.9345703125, -14.447265625, -13.9599609375, -13.47265625, -12.9853515625, -12.498046875, -12.0107421875, -11.5234375, -11.0361328125, -10.548828125, -10.0615234375, -9.57421875, -9.0869140625, -8.599609375, -8.1123046875, -7.625, -7.1376953125, -6.650390625, -6.1630859375, -5.67578125, -5.1884765625, -4.701171875, -4.2138671875, -3.7265625, -3.2392578125, -2.751953125, -2.2646484375, -1.77734375, -1.2900390625, -0.802734375, -0.3154296875, 0.171875, 0.6591796875, 1.146484375, 1.6337890625, 2.12109375, 2.6083984375, 3.095703125, 3.5830078125, 4.0703125, 4.5576171875, 5.044921875, 5.5322265625, 6.01953125, 6.5068359375, 6.994140625, 7.4814453125, 7.96875, 8.4560546875, 8.943359375, 9.4306640625, 9.91796875, 10.4052734375, 10.892578125, 11.3798828125, 11.8671875, 12.3544921875, 12.841796875, 13.3291015625, 13.81640625, 14.3037109375, 14.791015625, 15.2783203125, 15.765625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 3.0, 4.0, 4.0, 10.0, 8.0, 9.0, 24.0, 25.0, 24.0, 29.0, 35.0, 42.0, 75.0, 121.0, 161.0, 207.0, 351.0, 1230.0, 10123.0, 2820041.0, 305973.0, 5306.0, 863.0, 313.0, 183.0, 140.0, 101.0, 67.0, 48.0, 40.0, 35.0, 22.0, 20.0, 19.0, 15.0, 10.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-44.875, -43.658203125, -42.44140625, -41.224609375, -40.0078125, -38.791015625, -37.57421875, -36.357421875, -35.140625, -33.923828125, -32.70703125, -31.490234375, -30.2734375, -29.056640625, -27.83984375, -26.623046875, -25.40625, -24.189453125, -22.97265625, -21.755859375, -20.5390625, -19.322265625, -18.10546875, -16.888671875, -15.671875, -14.455078125, -13.23828125, -12.021484375, -10.8046875, -9.587890625, -8.37109375, -7.154296875, -5.9375, -4.720703125, -3.50390625, -2.287109375, -1.0703125, 0.146484375, 1.36328125, 2.580078125, 3.796875, 5.013671875, 6.23046875, 7.447265625, 8.6640625, 9.880859375, 11.09765625, 12.314453125, 13.53125, 14.748046875, 15.96484375, 17.181640625, 18.3984375, 19.615234375, 20.83203125, 22.048828125, 23.265625, 24.482421875, 25.69921875, 26.916015625, 28.1328125, 29.349609375, 30.56640625, 31.783203125, 33.0]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [5.0, 64.0, 722.0, 222.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.988240242004395, -8.909732818603516, -3.8312253952026367, 1.2472820281982422, 6.325789451599121, 11.404295921325684, 16.482803344726562, 21.56131362915039, 26.639820098876953, 31.718326568603516, 36.796836853027344, 41.875343322753906, 46.95384979248047, 52.03235626220703, 57.110862731933594, 62.18937301635742, 67.26787567138672, 72.34638214111328, 77.42488861083984, 82.5033950805664, 87.5819091796875, 92.66041564941406, 97.73892211914062, 102.81742858886719, 107.89593505859375, 112.97444152832031, 118.05294799804688, 123.13145446777344, 128.2099609375, 133.28846740722656, 138.36697387695312, 143.44549560546875, 148.52398681640625, 153.6024932861328, 158.68099975585938, 163.75950622558594, 168.8380126953125, 173.91651916503906, 178.99502563476562, 184.07354736328125, 189.15203857421875, 194.2305450439453, 199.30905151367188, 204.38755798339844, 209.466064453125, 214.54457092285156, 219.62307739257812, 224.70159912109375, 229.7801055908203, 234.85861206054688, 239.93711853027344, 245.015625, 250.09413146972656, 255.17263793945312, 260.25115966796875, 265.32965087890625, 270.4081726074219, 275.4866943359375, 280.565185546875, 285.6437072753906, 290.7221984863281, 295.80072021484375, 300.87921142578125, 305.9577331542969, 311.0362243652344]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 4.0, 12.0, 13.0, 14.0, 12.0, 15.0, 18.0, 14.0, 17.0, 21.0, 11.0, 35.0, 29.0, 29.0, 34.0, 31.0, 40.0, 39.0, 33.0, 27.0, 40.0, 35.0, 34.0, 29.0, 38.0, 30.0, 39.0, 33.0, 30.0, 26.0, 28.0, 27.0, 19.0, 27.0, 21.0, 12.0, 11.0, 18.0, 10.0, 9.0, 5.0, 4.0, 7.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.42393112182617, -35.20858383178711, -33.99323272705078, -32.77788543701172, -31.56253433227539, -30.347187042236328, -29.131837844848633, -27.916488647460938, -26.701139450073242, -25.485790252685547, -24.27044105529785, -23.055091857910156, -21.839744567871094, -20.624393463134766, -19.409046173095703, -18.193696975708008, -16.978347778320312, -15.762998580932617, -14.547649383544922, -13.332301139831543, -12.116951942443848, -10.901602745056152, -9.686254501342773, -8.470905303955078, -7.255556106567383, -6.0402069091796875, -4.82485818862915, -3.609509229660034, -2.394160270690918, -1.1788110733032227, 0.03653764724731445, 1.2518863677978516, 2.4672317504882812, 3.6825807094573975, 4.897929668426514, 6.113278388977051, 7.328627586364746, 8.543976783752441, 9.75932502746582, 10.974674224853516, 12.190023422241211, 13.405372619628906, 14.620721817016602, 15.83607006072998, 17.05141830444336, 18.266769409179688, 19.48211669921875, 20.697465896606445, 21.91281509399414, 23.128164291381836, 24.34351348876953, 25.558862686157227, 26.774211883544922, 27.989559173583984, 29.20490837097168, 30.420257568359375, 31.63560676574707, 32.850955963134766, 34.06630325317383, 35.281654357910156, 36.49700164794922, 37.71235275268555, 38.92770004272461, 40.14305114746094, 41.3583984375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 12.0, 11.0, 8.0, 11.0, 16.0, 13.0, 17.0, 24.0, 30.0, 33.0, 39.0, 48.0, 49.0, 43.0, 51.0, 45.0, 40.0, 45.0, 41.0, 59.0, 49.0, 39.0, 45.0, 30.0, 33.0, 34.0, 18.0, 16.0, 11.0, 21.0, 21.0, 10.0, 13.0, 4.0, 3.0, 10.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.14453125, -5.97357177734375, -5.8026123046875, -5.63165283203125, -5.460693359375, -5.28973388671875, -5.1187744140625, -4.94781494140625, -4.77685546875, -4.60589599609375, -4.4349365234375, -4.26397705078125, -4.093017578125, -3.92205810546875, -3.7510986328125, -3.58013916015625, -3.4091796875, -3.23822021484375, -3.0672607421875, -2.89630126953125, -2.725341796875, -2.55438232421875, -2.3834228515625, -2.21246337890625, -2.04150390625, -1.87054443359375, -1.6995849609375, -1.52862548828125, -1.357666015625, -1.18670654296875, -1.0157470703125, -0.84478759765625, -0.673828125, -0.50286865234375, -0.3319091796875, -0.16094970703125, 0.010009765625, 0.18096923828125, 0.3519287109375, 0.52288818359375, 0.69384765625, 0.86480712890625, 1.0357666015625, 1.20672607421875, 1.377685546875, 1.54864501953125, 1.7196044921875, 1.89056396484375, 2.0615234375, 2.23248291015625, 2.4034423828125, 2.57440185546875, 2.745361328125, 2.91632080078125, 3.0872802734375, 3.25823974609375, 3.42919921875, 3.60015869140625, 3.7711181640625, 3.94207763671875, 4.113037109375, 4.28399658203125, 4.4549560546875, 4.62591552734375, 4.796875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 4.0, 16.0, 10.0, 20.0, 14.0, 28.0, 42.0, 48.0, 44.0, 95.0, 119.0, 273.0, 684.0, 3368.0, 40555.0, 2022028.0, 2080252.0, 42009.0, 3329.0, 640.0, 228.0, 99.0, 84.0, 58.0, 43.0, 46.0, 28.0, 26.0, 12.0, 16.0, 10.0, 14.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-24.578125, -23.8759765625, -23.173828125, -22.4716796875, -21.76953125, -21.0673828125, -20.365234375, -19.6630859375, -18.9609375, -18.2587890625, -17.556640625, -16.8544921875, -16.15234375, -15.4501953125, -14.748046875, -14.0458984375, -13.34375, -12.6416015625, -11.939453125, -11.2373046875, -10.53515625, -9.8330078125, -9.130859375, -8.4287109375, -7.7265625, -7.0244140625, -6.322265625, -5.6201171875, -4.91796875, -4.2158203125, -3.513671875, -2.8115234375, -2.109375, -1.4072265625, -0.705078125, -0.0029296875, 0.69921875, 1.4013671875, 2.103515625, 2.8056640625, 3.5078125, 4.2099609375, 4.912109375, 5.6142578125, 6.31640625, 7.0185546875, 7.720703125, 8.4228515625, 9.125, 9.8271484375, 10.529296875, 11.2314453125, 11.93359375, 12.6357421875, 13.337890625, 14.0400390625, 14.7421875, 15.4443359375, 16.146484375, 16.8486328125, 17.55078125, 18.2529296875, 18.955078125, 19.6572265625, 20.359375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 13.0, 10.0, 22.0, 44.0, 51.0, 81.0, 148.0, 185.0, 337.0, 507.0, 680.0, 673.0, 470.0, 306.0, 192.0, 113.0, 86.0, 63.0, 33.0, 21.0, 10.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.546875, -17.0438232421875, -16.540771484375, -16.0377197265625, -15.53466796875, -15.0316162109375, -14.528564453125, -14.0255126953125, -13.5224609375, -13.0194091796875, -12.516357421875, -12.0133056640625, -11.51025390625, -11.0072021484375, -10.504150390625, -10.0010986328125, -9.498046875, -8.9949951171875, -8.491943359375, -7.9888916015625, -7.48583984375, -6.9827880859375, -6.479736328125, -5.9766845703125, -5.4736328125, -4.9705810546875, -4.467529296875, -3.9644775390625, -3.46142578125, -2.9583740234375, -2.455322265625, -1.9522705078125, -1.44921875, -0.9461669921875, -0.443115234375, 0.0599365234375, 0.56298828125, 1.0660400390625, 1.569091796875, 2.0721435546875, 2.5751953125, 3.0782470703125, 3.581298828125, 4.0843505859375, 4.58740234375, 5.0904541015625, 5.593505859375, 6.0965576171875, 6.599609375, 7.1026611328125, 7.605712890625, 8.1087646484375, 8.61181640625, 9.1148681640625, 9.617919921875, 10.1209716796875, 10.6240234375, 11.1270751953125, 11.630126953125, 12.1331787109375, 12.63623046875, 13.1392822265625, 13.642333984375, 14.1453857421875, 14.6484375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 5.0, 9.0, 13.0, 18.0, 18.0, 42.0, 50.0, 89.0, 138.0, 219.0, 450.0, 1153.0, 5671.0, 166824.0, 3856268.0, 155782.0, 5394.0, 1107.0, 403.0, 229.0, 141.0, 85.0, 73.0, 36.0, 27.0, 17.0, 8.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.75, -39.4560546875, -38.162109375, -36.8681640625, -35.57421875, -34.2802734375, -32.986328125, -31.6923828125, -30.3984375, -29.1044921875, -27.810546875, -26.5166015625, -25.22265625, -23.9287109375, -22.634765625, -21.3408203125, -20.046875, -18.7529296875, -17.458984375, -16.1650390625, -14.87109375, -13.5771484375, -12.283203125, -10.9892578125, -9.6953125, -8.4013671875, -7.107421875, -5.8134765625, -4.51953125, -3.2255859375, -1.931640625, -0.6376953125, 0.65625, 1.9501953125, 3.244140625, 4.5380859375, 5.83203125, 7.1259765625, 8.419921875, 9.7138671875, 11.0078125, 12.3017578125, 13.595703125, 14.8896484375, 16.18359375, 17.4775390625, 18.771484375, 20.0654296875, 21.359375, 22.6533203125, 23.947265625, 25.2412109375, 26.53515625, 27.8291015625, 29.123046875, 30.4169921875, 31.7109375, 33.0048828125, 34.298828125, 35.5927734375, 36.88671875, 38.1806640625, 39.474609375, 40.7685546875, 42.0625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 11.0, 24.0, 66.0, 170.0, 203.0, 223.0, 179.0, 84.0, 41.0, 10.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.06033325195312, -123.2231216430664, -119.38591766357422, -115.5487060546875, -111.71149444580078, -107.87428283691406, -104.03707885742188, -100.19986724853516, -96.36265563964844, -92.52544403076172, -88.68824005126953, -84.85102844238281, -81.0138168334961, -77.17660522460938, -73.33940124511719, -69.50218963623047, -65.66498565673828, -61.82777786254883, -57.99056625366211, -54.153358459472656, -50.31614685058594, -46.478939056396484, -42.64173126220703, -38.80451965332031, -34.96731185913086, -31.130102157592773, -27.292892456054688, -23.455684661865234, -19.61847496032715, -15.781265258789062, -11.94405746459961, -8.106847763061523, -4.269630432128906, -0.4324212074279785, 3.404788017272949, 7.241996765136719, 11.079206466674805, 14.91641616821289, 18.753623962402344, 22.59083366394043, 26.428043365478516, 30.2652530670166, 34.10246276855469, 37.93967056274414, 41.776878356933594, 45.61408996582031, 49.451297760009766, 53.28850555419922, 57.12571716308594, 60.96292495727539, 64.80013275146484, 68.63734436035156, 72.47455596923828, 76.311767578125, 80.14897155761719, 83.9861831665039, 87.82339477539062, 91.66060638427734, 95.49781036376953, 99.33502197265625, 103.17223358154297, 107.00944519042969, 110.84664916992188, 114.6838607788086, 118.52106475830078]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 6.0, 8.0, 11.0, 8.0, 15.0, 14.0, 22.0, 21.0, 29.0, 35.0, 29.0, 45.0, 48.0, 42.0, 46.0, 39.0, 47.0, 53.0, 46.0, 42.0, 55.0, 42.0, 43.0, 35.0, 31.0, 32.0, 31.0, 27.0, 15.0, 17.0, 14.0, 9.0, 12.0, 10.0, 6.0, 11.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.070892333984375, -36.733882904052734, -35.396873474121094, -34.05986022949219, -32.72285079956055, -31.385841369628906, -30.048830032348633, -28.71181869506836, -27.37480926513672, -26.037799835205078, -24.700788497924805, -23.36377716064453, -22.02676773071289, -20.68975830078125, -19.352746963500977, -18.015735626220703, -16.678726196289062, -15.341715812683105, -14.004705429077148, -12.667695045471191, -11.330684661865234, -9.993674278259277, -8.65666389465332, -7.319653511047363, -5.982643127441406, -4.645632743835449, -3.308622360229492, -1.9716119766235352, -0.6346015930175781, 0.7024087905883789, 2.039419174194336, 3.376429557800293, 4.71343994140625, 6.050450325012207, 7.387460708618164, 8.724471092224121, 10.061481475830078, 11.398491859436035, 12.735502243041992, 14.07251262664795, 15.409523010253906, 16.746532440185547, 18.08354377746582, 19.420555114746094, 20.757564544677734, 22.094573974609375, 23.43158531188965, 24.768596649169922, 26.105606079101562, 27.442615509033203, 28.779626846313477, 30.11663818359375, 31.45364761352539, 32.79065704345703, 34.12767028808594, 35.46467971801758, 36.80168914794922, 38.13869857788086, 39.4757080078125, 40.812721252441406, 42.14973068237305, 43.48674011230469, 44.823753356933594, 46.160762786865234, 47.497772216796875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 8.0, 6.0, 11.0, 6.0, 15.0, 14.0, 22.0, 22.0, 21.0, 31.0, 31.0, 43.0, 43.0, 23.0, 43.0, 36.0, 40.0, 42.0, 48.0, 42.0, 55.0, 49.0, 40.0, 46.0, 31.0, 33.0, 29.0, 28.0, 22.0, 15.0, 21.0, 14.0, 14.0, 8.0, 8.0, 6.0, 11.0, 3.0, 9.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-5.796875, -5.6334228515625, -5.469970703125, -5.3065185546875, -5.14306640625, -4.9796142578125, -4.816162109375, -4.6527099609375, -4.4892578125, -4.3258056640625, -4.162353515625, -3.9989013671875, -3.83544921875, -3.6719970703125, -3.508544921875, -3.3450927734375, -3.181640625, -3.0181884765625, -2.854736328125, -2.6912841796875, -2.52783203125, -2.3643798828125, -2.200927734375, -2.0374755859375, -1.8740234375, -1.7105712890625, -1.547119140625, -1.3836669921875, -1.22021484375, -1.0567626953125, -0.893310546875, -0.7298583984375, -0.56640625, -0.4029541015625, -0.239501953125, -0.0760498046875, 0.08740234375, 0.2508544921875, 0.414306640625, 0.5777587890625, 0.7412109375, 0.9046630859375, 1.068115234375, 1.2315673828125, 1.39501953125, 1.5584716796875, 1.721923828125, 1.8853759765625, 2.048828125, 2.2122802734375, 2.375732421875, 2.5391845703125, 2.70263671875, 2.8660888671875, 3.029541015625, 3.1929931640625, 3.3564453125, 3.5198974609375, 3.683349609375, 3.8468017578125, 4.01025390625, 4.1737060546875, 4.337158203125, 4.5006103515625, 4.6640625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 10.0, 12.0, 15.0, 22.0, 46.0, 64.0, 81.0, 156.0, 203.0, 340.0, 513.0, 809.0, 1207.0, 1954.0, 3286.0, 5193.0, 8569.0, 14702.0, 25120.0, 44315.0, 84111.0, 185730.0, 322838.0, 170060.0, 78354.0, 41864.0, 23555.0, 13938.0, 8202.0, 5016.0, 3022.0, 1906.0, 1169.0, 770.0, 492.0, 303.0, 208.0, 131.0, 100.0, 57.0, 33.0, 29.0, 18.0, 13.0, 8.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2156982421875, -0.20861434936523438, -0.20153045654296875, -0.19444656372070312, -0.1873626708984375, -0.18027877807617188, -0.17319488525390625, -0.16611099243164062, -0.159027099609375, -0.15194320678710938, -0.14485931396484375, -0.13777542114257812, -0.1306915283203125, -0.12360763549804688, -0.11652374267578125, -0.10943984985351562, -0.10235595703125, -0.09527206420898438, -0.08818817138671875, -0.08110427856445312, -0.0740203857421875, -0.06693649291992188, -0.05985260009765625, -0.052768707275390625, -0.045684814453125, -0.038600921630859375, -0.03151702880859375, -0.024433135986328125, -0.0173492431640625, -0.010265350341796875, -0.00318145751953125, 0.003902435302734375, 0.010986328125, 0.018070220947265625, 0.02515411376953125, 0.032238006591796875, 0.0393218994140625, 0.046405792236328125, 0.05348968505859375, 0.060573577880859375, 0.067657470703125, 0.07474136352539062, 0.08182525634765625, 0.08890914916992188, 0.0959930419921875, 0.10307693481445312, 0.11016082763671875, 0.11724472045898438, 0.12432861328125, 0.13141250610351562, 0.13849639892578125, 0.14558029174804688, 0.1526641845703125, 0.15974807739257812, 0.16683197021484375, 0.17391586303710938, 0.180999755859375, 0.18808364868164062, 0.19516754150390625, 0.20225143432617188, 0.2093353271484375, 0.21641921997070312, 0.22350311279296875, 0.23058700561523438, 0.2376708984375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 4.0, 3.0, 5.0, 13.0, 8.0, 14.0, 13.0, 18.0, 18.0, 17.0, 19.0, 29.0, 40.0, 40.0, 41.0, 34.0, 47.0, 42.0, 48.0, 42.0, 1074.0, 44.0, 49.0, 38.0, 45.0, 41.0, 34.0, 23.0, 26.0, 25.0, 20.0, 15.0, 22.0, 16.0, 3.0, 13.0, 4.0, 11.0, 6.0, 6.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3203125, -3.21392822265625, -3.1075439453125, -3.00115966796875, -2.894775390625, -2.78839111328125, -2.6820068359375, -2.57562255859375, -2.46923828125, -2.36285400390625, -2.2564697265625, -2.15008544921875, -2.043701171875, -1.93731689453125, -1.8309326171875, -1.72454833984375, -1.6181640625, -1.51177978515625, -1.4053955078125, -1.29901123046875, -1.192626953125, -1.08624267578125, -0.9798583984375, -0.87347412109375, -0.76708984375, -0.66070556640625, -0.5543212890625, -0.44793701171875, -0.341552734375, -0.23516845703125, -0.1287841796875, -0.02239990234375, 0.083984375, 0.19036865234375, 0.2967529296875, 0.40313720703125, 0.509521484375, 0.61590576171875, 0.7222900390625, 0.82867431640625, 0.93505859375, 1.04144287109375, 1.1478271484375, 1.25421142578125, 1.360595703125, 1.46697998046875, 1.5733642578125, 1.67974853515625, 1.7861328125, 1.89251708984375, 1.9989013671875, 2.10528564453125, 2.211669921875, 2.31805419921875, 2.4244384765625, 2.53082275390625, 2.63720703125, 2.74359130859375, 2.8499755859375, 2.95635986328125, 3.062744140625, 3.16912841796875, 3.2755126953125, 3.38189697265625, 3.48828125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 4.0, 8.0, 9.0, 13.0, 21.0, 15.0, 24.0, 39.0, 77.0, 96.0, 102.0, 184.0, 235.0, 334.0, 540.0, 762.0, 1042.0, 1508.0, 2228.0, 3377.0, 5069.0, 7691.0, 11774.0, 18757.0, 30857.0, 52208.0, 99382.0, 213991.0, 1330799.0, 141356.0, 69519.0, 39080.0, 23338.0, 14824.0, 9222.0, 5906.0, 4049.0, 2805.0, 1852.0, 1274.0, 845.0, 592.0, 357.0, 317.0, 197.0, 131.0, 111.0, 63.0, 60.0, 32.0, 27.0, 10.0, 5.0, 7.0, 1.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.187744140625, -0.1817340850830078, -0.17572402954101562, -0.16971397399902344, -0.16370391845703125, -0.15769386291503906, -0.15168380737304688, -0.1456737518310547, -0.1396636962890625, -0.1336536407470703, -0.12764358520507812, -0.12163352966308594, -0.11562347412109375, -0.10961341857910156, -0.10360336303710938, -0.09759330749511719, -0.091583251953125, -0.08557319641113281, -0.07956314086914062, -0.07355308532714844, -0.06754302978515625, -0.06153297424316406, -0.055522918701171875, -0.04951286315917969, -0.0435028076171875, -0.03749275207519531, -0.031482696533203125, -0.025472640991210938, -0.01946258544921875, -0.013452529907226562, -0.007442474365234375, -0.0014324188232421875, 0.00457763671875, 0.010587692260742188, 0.016597747802734375, 0.022607803344726562, 0.02861785888671875, 0.03462791442871094, 0.040637969970703125, 0.04664802551269531, 0.0526580810546875, 0.05866813659667969, 0.06467819213867188, 0.07068824768066406, 0.07669830322265625, 0.08270835876464844, 0.08871841430664062, 0.09472846984863281, 0.100738525390625, 0.10674858093261719, 0.11275863647460938, 0.11876869201660156, 0.12477874755859375, 0.13078880310058594, 0.13679885864257812, 0.1428089141845703, 0.1488189697265625, 0.1548290252685547, 0.16083908081054688, 0.16684913635253906, 0.17285919189453125, 0.17886924743652344, 0.18487930297851562, 0.1908893585205078, 0.1968994140625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 3.0, 10.0, 9.0, 12.0, 17.0, 15.0, 24.0, 23.0, 29.0, 28.0, 33.0, 47.0, 53.0, 48.0, 60.0, 52.0, 49.0, 54.0, 43.0, 38.0, 37.0, 49.0, 42.0, 38.0, 28.0, 29.0, 31.0, 20.0, 19.0, 6.0, 7.0, 7.0, 8.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-3.159046173095703e-05, -3.067776560783386e-05, -2.9765069484710693e-05, -2.8852373361587524e-05, -2.7939677238464355e-05, -2.7026981115341187e-05, -2.6114284992218018e-05, -2.520158886909485e-05, -2.428889274597168e-05, -2.337619662284851e-05, -2.2463500499725342e-05, -2.1550804376602173e-05, -2.0638108253479004e-05, -1.9725412130355835e-05, -1.8812716007232666e-05, -1.7900019884109497e-05, -1.6987323760986328e-05, -1.607462763786316e-05, -1.516193151473999e-05, -1.4249235391616821e-05, -1.3336539268493652e-05, -1.2423843145370483e-05, -1.1511147022247314e-05, -1.0598450899124146e-05, -9.685754776000977e-06, -8.773058652877808e-06, -7.860362529754639e-06, -6.94766640663147e-06, -6.034970283508301e-06, -5.122274160385132e-06, -4.209578037261963e-06, -3.296881914138794e-06, -2.384185791015625e-06, -1.471489667892456e-06, -5.587935447692871e-07, 3.5390257835388184e-07, 1.2665987014770508e-06, 2.1792948246002197e-06, 3.0919909477233887e-06, 4.004687070846558e-06, 4.9173831939697266e-06, 5.8300793170928955e-06, 6.7427754402160645e-06, 7.655471563339233e-06, 8.568167686462402e-06, 9.480863809585571e-06, 1.039355993270874e-05, 1.130625605583191e-05, 1.2218952178955078e-05, 1.3131648302078247e-05, 1.4044344425201416e-05, 1.4957040548324585e-05, 1.5869736671447754e-05, 1.6782432794570923e-05, 1.7695128917694092e-05, 1.860782504081726e-05, 1.952052116394043e-05, 2.04332172870636e-05, 2.1345913410186768e-05, 2.2258609533309937e-05, 2.3171305656433105e-05, 2.4084001779556274e-05, 2.4996697902679443e-05, 2.5909394025802612e-05, 2.682209014892578e-05]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 7.0, 7.0, 4.0, 7.0, 8.0, 6.0, 19.0, 26.0, 20.0, 40.0, 52.0, 55.0, 81.0, 117.0, 202.0, 329.0, 626.0, 2771.0, 468035.0, 571227.0, 3267.0, 686.0, 339.0, 175.0, 116.0, 84.0, 44.0, 39.0, 31.0, 24.0, 29.0, 21.0, 6.0, 12.0, 6.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00051116943359375, -0.000494144856929779, -0.0004771202802658081, -0.00046009570360183716, -0.0004430711269378662, -0.00042604655027389526, -0.0004090219736099243, -0.00039199739694595337, -0.0003749728202819824, -0.0003579482436180115, -0.00034092366695404053, -0.0003238990902900696, -0.00030687451362609863, -0.0002898499369621277, -0.00027282536029815674, -0.0002558007836341858, -0.00023877620697021484, -0.0002217516303062439, -0.00020472705364227295, -0.000187702476978302, -0.00017067790031433105, -0.0001536533236503601, -0.00013662874698638916, -0.00011960417032241821, -0.00010257959365844727, -8.555501699447632e-05, -6.853044033050537e-05, -5.1505863666534424e-05, -3.4481287002563477e-05, -1.745671033859253e-05, -4.3213367462158203e-07, 1.6592442989349365e-05, 3.361701965332031e-05, 5.064159631729126e-05, 6.766617298126221e-05, 8.469074964523315e-05, 0.0001017153263092041, 0.00011873990297317505, 0.000135764479637146, 0.00015278905630111694, 0.0001698136329650879, 0.00018683820962905884, 0.00020386278629302979, 0.00022088736295700073, 0.00023791193962097168, 0.0002549365162849426, 0.0002719610929489136, 0.0002889856696128845, 0.00030601024627685547, 0.0003230348229408264, 0.00034005939960479736, 0.0003570839762687683, 0.00037410855293273926, 0.0003911331295967102, 0.00040815770626068115, 0.0004251822829246521, 0.00044220685958862305, 0.000459231436252594, 0.00047625601291656494, 0.0004932805895805359, 0.0005103051662445068, 0.0005273297429084778, 0.0005443543195724487, 0.0005613788962364197, 0.0005784034729003906]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 11.0, 146.0, 479.0, 317.0, 63.0, 2.0, 2.0], "bins": [-0.00021927875059191138, -0.00021561012545134872, -0.00021194148575887084, -0.0002082728606183082, -0.00020460423547774553, -0.00020093561033718288, -0.000197266970644705, -0.00019359834550414234, -0.0001899297203635797, -0.00018626109522301704, -0.00018259245553053916, -0.0001789238303899765, -0.00017525520524941385, -0.0001715865801088512, -0.0001679179404163733, -0.00016424931527581066, -0.00016058067558333278, -0.00015691205044277012, -0.00015324341075029224, -0.0001495747856097296, -0.00014590616046916693, -0.00014223752077668905, -0.0001385688956361264, -0.00013490027049556375, -0.0001312316453550011, -0.00012756302021443844, -0.00012389438052196056, -0.0001202257553813979, -0.00011655713024083525, -0.00011288849782431498, -0.00010921986540779471, -0.00010555124026723206, -0.00010188260785071179, -9.821397543419152e-05, -9.454535029362887e-05, -9.08767178771086e-05, -8.720809273654595e-05, -8.353946032002568e-05, -7.987083517946303e-05, -7.620220276294276e-05, -7.25335703464225e-05, -6.886493792990223e-05, -6.519631278933957e-05, -6.15276803728193e-05, -5.7859051594277844e-05, -5.419042281573638e-05, -5.052179403719492e-05, -4.685316525865346e-05, -4.3184532842133194e-05, -3.9515904063591734e-05, -3.584727528505027e-05, -3.2178642868530005e-05, -2.8510014089988545e-05, -2.4841385311447084e-05, -2.1172756532905623e-05, -1.750412593537476e-05, -1.3835498975822702e-05, -1.016686928778654e-05, -6.498240054497728e-06, -2.8296108212089166e-06, 8.390188668272458e-07, 4.507648554863408e-06, 8.176277333404869e-06, 1.1844907930935733e-05, 1.5513536709477194e-05]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 0.0, 4.0, 2.0, 4.0, 6.0, 7.0, 10.0, 14.0, 20.0, 14.0, 11.0, 15.0, 15.0, 26.0, 29.0, 38.0, 26.0, 22.0, 29.0, 37.0, 25.0, 35.0, 44.0, 28.0, 29.0, 42.0, 38.0, 38.0, 40.0, 37.0, 35.0, 33.0, 26.0, 34.0, 18.0, 28.0, 15.0, 20.0, 22.0, 12.0, 18.0, 12.0, 11.0, 4.0, 6.0, 4.0, 6.0, 3.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5020370483398438e-05, -1.4560297131538391e-05, -1.4100223779678345e-05, -1.3640150427818298e-05, -1.3180077075958252e-05, -1.2720003724098206e-05, -1.225993037223816e-05, -1.1799857020378113e-05, -1.1339783668518066e-05, -1.087971031665802e-05, -1.0419636964797974e-05, -9.959563612937927e-06, -9.499490261077881e-06, -9.039416909217834e-06, -8.579343557357788e-06, -8.119270205497742e-06, -7.659196853637695e-06, -7.199123501777649e-06, -6.7390501499176025e-06, -6.278976798057556e-06, -5.81890344619751e-06, -5.358830094337463e-06, -4.898756742477417e-06, -4.438683390617371e-06, -3.978610038757324e-06, -3.518536686897278e-06, -3.0584633350372314e-06, -2.598389983177185e-06, -2.1383166313171387e-06, -1.6782432794570923e-06, -1.218169927597046e-06, -7.580965757369995e-07, -2.980232238769531e-07, 1.6205012798309326e-07, 6.221234798431396e-07, 1.082196831703186e-06, 1.5422701835632324e-06, 2.002343535423279e-06, 2.462416887283325e-06, 2.9224902391433716e-06, 3.382563591003418e-06, 3.842636942863464e-06, 4.302710294723511e-06, 4.762783646583557e-06, 5.2228569984436035e-06, 5.68293035030365e-06, 6.143003702163696e-06, 6.603077054023743e-06, 7.063150405883789e-06, 7.5232237577438354e-06, 7.983297109603882e-06, 8.443370461463928e-06, 8.903443813323975e-06, 9.363517165184021e-06, 9.823590517044067e-06, 1.0283663868904114e-05, 1.074373722076416e-05, 1.1203810572624207e-05, 1.1663883924484253e-05, 1.21239572763443e-05, 1.2584030628204346e-05, 1.3044103980064392e-05, 1.3504177331924438e-05, 1.3964250683784485e-05, 1.4424324035644531e-05]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 8.0, 6.0, 11.0, 6.0, 15.0, 14.0, 22.0, 22.0, 21.0, 31.0, 31.0, 43.0, 43.0, 23.0, 43.0, 36.0, 40.0, 42.0, 48.0, 42.0, 55.0, 49.0, 40.0, 46.0, 31.0, 33.0, 29.0, 28.0, 22.0, 15.0, 21.0, 14.0, 14.0, 8.0, 8.0, 6.0, 11.0, 3.0, 9.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-5.796875, -5.6334228515625, -5.469970703125, -5.3065185546875, -5.14306640625, -4.9796142578125, -4.816162109375, -4.6527099609375, -4.4892578125, -4.3258056640625, -4.162353515625, -3.9989013671875, -3.83544921875, -3.6719970703125, -3.508544921875, -3.3450927734375, -3.181640625, -3.0181884765625, -2.854736328125, -2.6912841796875, -2.52783203125, -2.3643798828125, -2.200927734375, -2.0374755859375, -1.8740234375, -1.7105712890625, -1.547119140625, -1.3836669921875, -1.22021484375, -1.0567626953125, -0.893310546875, -0.7298583984375, -0.56640625, -0.4029541015625, -0.239501953125, -0.0760498046875, 0.08740234375, 0.2508544921875, 0.414306640625, 0.5777587890625, 0.7412109375, 0.9046630859375, 1.068115234375, 1.2315673828125, 1.39501953125, 1.5584716796875, 1.721923828125, 1.8853759765625, 2.048828125, 2.2122802734375, 2.375732421875, 2.5391845703125, 2.70263671875, 2.8660888671875, 3.029541015625, 3.1929931640625, 3.3564453125, 3.5198974609375, 3.683349609375, 3.8468017578125, 4.01025390625, 4.1737060546875, 4.337158203125, 4.5006103515625, 4.6640625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 9.0, 3.0, 4.0, 2.0, 8.0, 6.0, 17.0, 16.0, 30.0, 34.0, 50.0, 79.0, 91.0, 141.0, 226.0, 321.0, 453.0, 698.0, 1047.0, 1777.0, 2944.0, 5244.0, 9386.0, 17744.0, 35012.0, 77758.0, 261967.0, 435124.0, 104825.0, 44689.0, 21788.0, 11467.0, 6277.0, 3551.0, 2113.0, 1220.0, 776.0, 527.0, 349.0, 226.0, 162.0, 124.0, 80.0, 56.0, 45.0, 35.0, 24.0, 19.0, 8.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.8046875, -3.67852783203125, -3.5523681640625, -3.42620849609375, -3.300048828125, -3.17388916015625, -3.0477294921875, -2.92156982421875, -2.79541015625, -2.66925048828125, -2.5430908203125, -2.41693115234375, -2.290771484375, -2.16461181640625, -2.0384521484375, -1.91229248046875, -1.7861328125, -1.65997314453125, -1.5338134765625, -1.40765380859375, -1.281494140625, -1.15533447265625, -1.0291748046875, -0.90301513671875, -0.77685546875, -0.65069580078125, -0.5245361328125, -0.39837646484375, -0.272216796875, -0.14605712890625, -0.0198974609375, 0.10626220703125, 0.232421875, 0.35858154296875, 0.4847412109375, 0.61090087890625, 0.737060546875, 0.86322021484375, 0.9893798828125, 1.11553955078125, 1.24169921875, 1.36785888671875, 1.4940185546875, 1.62017822265625, 1.746337890625, 1.87249755859375, 1.9986572265625, 2.12481689453125, 2.2509765625, 2.37713623046875, 2.5032958984375, 2.62945556640625, 2.755615234375, 2.88177490234375, 3.0079345703125, 3.13409423828125, 3.26025390625, 3.38641357421875, 3.5125732421875, 3.63873291015625, 3.764892578125, 3.89105224609375, 4.0172119140625, 4.14337158203125, 4.26953125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 6.0, 10.0, 10.0, 13.0, 13.0, 14.0, 13.0, 24.0, 36.0, 48.0, 55.0, 47.0, 52.0, 85.0, 98.0, 369.0, 1640.0, 120.0, 62.0, 61.0, 53.0, 36.0, 35.0, 33.0, 25.0, 19.0, 15.0, 16.0, 13.0, 9.0, 9.0, 4.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.609375, -24.812744140625, -24.01611328125, -23.219482421875, -22.4228515625, -21.626220703125, -20.82958984375, -20.032958984375, -19.236328125, -18.439697265625, -17.64306640625, -16.846435546875, -16.0498046875, -15.253173828125, -14.45654296875, -13.659912109375, -12.86328125, -12.066650390625, -11.27001953125, -10.473388671875, -9.6767578125, -8.880126953125, -8.08349609375, -7.286865234375, -6.490234375, -5.693603515625, -4.89697265625, -4.100341796875, -3.3037109375, -2.507080078125, -1.71044921875, -0.913818359375, -0.1171875, 0.679443359375, 1.47607421875, 2.272705078125, 3.0693359375, 3.865966796875, 4.66259765625, 5.459228515625, 6.255859375, 7.052490234375, 7.84912109375, 8.645751953125, 9.4423828125, 10.239013671875, 11.03564453125, 11.832275390625, 12.62890625, 13.425537109375, 14.22216796875, 15.018798828125, 15.8154296875, 16.612060546875, 17.40869140625, 18.205322265625, 19.001953125, 19.798583984375, 20.59521484375, 21.391845703125, 22.1884765625, 22.985107421875, 23.78173828125, 24.578369140625, 25.375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 11.0, 11.0, 18.0, 33.0, 37.0, 42.0, 66.0, 110.0, 181.0, 325.0, 982.0, 13539.0, 3106864.0, 21353.0, 1131.0, 372.0, 209.0, 136.0, 91.0, 60.0, 26.0, 34.0, 20.0, 12.0, 9.0, 9.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.25, -62.27587890625, -60.3017578125, -58.32763671875, -56.353515625, -54.37939453125, -52.4052734375, -50.43115234375, -48.45703125, -46.48291015625, -44.5087890625, -42.53466796875, -40.560546875, -38.58642578125, -36.6123046875, -34.63818359375, -32.6640625, -30.68994140625, -28.7158203125, -26.74169921875, -24.767578125, -22.79345703125, -20.8193359375, -18.84521484375, -16.87109375, -14.89697265625, -12.9228515625, -10.94873046875, -8.974609375, -7.00048828125, -5.0263671875, -3.05224609375, -1.078125, 0.89599609375, 2.8701171875, 4.84423828125, 6.818359375, 8.79248046875, 10.7666015625, 12.74072265625, 14.71484375, 16.68896484375, 18.6630859375, 20.63720703125, 22.611328125, 24.58544921875, 26.5595703125, 28.53369140625, 30.5078125, 32.48193359375, 34.4560546875, 36.43017578125, 38.404296875, 40.37841796875, 42.3525390625, 44.32666015625, 46.30078125, 48.27490234375, 50.2490234375, 52.22314453125, 54.197265625, 56.17138671875, 58.1455078125, 60.11962890625, 62.09375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 7.0, 153.0, 714.0, 141.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.471294403076172, -13.944808006286621, -8.41832160949707, -2.891834259033203, 2.6346511840820312, 8.161136627197266, 13.687625885009766, 19.214111328125, 24.740596771240234, 30.26708221435547, 35.79357147216797, 41.3200569152832, 46.84654235839844, 52.37302780151367, 57.89951705932617, 63.426002502441406, 68.95248413085938, 74.47897338867188, 80.00545501708984, 85.53194427490234, 91.05842590332031, 96.58491516113281, 102.11140441894531, 107.63789367675781, 113.16438293457031, 118.69087219238281, 124.21735382080078, 129.74383544921875, 135.27032470703125, 140.79681396484375, 146.32330322265625, 151.84979248046875, 157.37628173828125, 162.90277099609375, 168.42926025390625, 173.95574951171875, 179.4822235107422, 185.0087127685547, 190.5352020263672, 196.0616912841797, 201.58816528320312, 207.11465454101562, 212.64114379882812, 218.16763305664062, 223.69410705566406, 229.22059631347656, 234.74708557128906, 240.27357482910156, 245.80006408691406, 251.32655334472656, 256.85302734375, 262.3795166015625, 267.906005859375, 273.4324951171875, 278.958984375, 284.4854736328125, 290.011962890625, 295.5384521484375, 301.06494140625, 306.5914306640625, 312.117919921875, 317.6444091796875, 323.1708984375, 328.6973571777344, 334.2238464355469]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 6.0, 4.0, 8.0, 12.0, 11.0, 12.0, 11.0, 21.0, 19.0, 21.0, 23.0, 24.0, 38.0, 23.0, 42.0, 42.0, 40.0, 44.0, 50.0, 34.0, 42.0, 37.0, 35.0, 53.0, 33.0, 28.0, 40.0, 36.0, 27.0, 35.0, 16.0, 21.0, 17.0, 14.0, 18.0, 15.0, 5.0, 14.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.028987884521484, -51.3138427734375, -49.59869384765625, -47.883548736572266, -46.16840362548828, -44.45325469970703, -42.73810958862305, -41.02296447753906, -39.30781555175781, -37.59267044067383, -35.87752151489258, -34.162376403808594, -32.44723129272461, -30.732084274291992, -29.016937255859375, -27.30179214477539, -25.586647033691406, -23.87150001525879, -22.156354904174805, -20.441207885742188, -18.726062774658203, -17.010915756225586, -15.295768737792969, -13.580622673034668, -11.865476608276367, -10.150330543518066, -8.435184478759766, -6.720037460327148, -5.004891395568848, -3.289745330810547, -1.5745983123779297, 0.1405477523803711, 1.8556900024414062, 3.570836305618286, 5.285982608795166, 7.001129150390625, 8.716275215148926, 10.431421279907227, 12.146568298339844, 13.861714363098145, 15.576860427856445, 17.292007446289062, 19.007152557373047, 20.722299575805664, 22.43744659423828, 24.152591705322266, 25.867738723754883, 27.5828857421875, 29.298030853271484, 31.0131778717041, 32.72832489013672, 34.4434700012207, 36.15861511230469, 37.87376403808594, 39.58890914916992, 41.304054260253906, 43.019203186035156, 44.73434829711914, 46.44949722290039, 48.164642333984375, 49.87978744506836, 51.594932556152344, 53.310081481933594, 55.02522659301758, 56.74037170410156]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 10.0, 6.0, 10.0, 15.0, 17.0, 18.0, 26.0, 25.0, 27.0, 32.0, 37.0, 37.0, 33.0, 45.0, 29.0, 45.0, 36.0, 42.0, 46.0, 49.0, 44.0, 45.0, 45.0, 36.0, 31.0, 40.0, 19.0, 20.0, 25.0, 13.0, 18.0, 12.0, 7.0, 13.0, 8.0, 6.0, 7.0, 3.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.0859375, -5.91436767578125, -5.7427978515625, -5.57122802734375, -5.399658203125, -5.22808837890625, -5.0565185546875, -4.88494873046875, -4.71337890625, -4.54180908203125, -4.3702392578125, -4.19866943359375, -4.027099609375, -3.85552978515625, -3.6839599609375, -3.51239013671875, -3.3408203125, -3.16925048828125, -2.9976806640625, -2.82611083984375, -2.654541015625, -2.48297119140625, -2.3114013671875, -2.13983154296875, -1.96826171875, -1.79669189453125, -1.6251220703125, -1.45355224609375, -1.281982421875, -1.11041259765625, -0.9388427734375, -0.76727294921875, -0.595703125, -0.42413330078125, -0.2525634765625, -0.08099365234375, 0.090576171875, 0.26214599609375, 0.4337158203125, 0.60528564453125, 0.77685546875, 0.94842529296875, 1.1199951171875, 1.29156494140625, 1.463134765625, 1.63470458984375, 1.8062744140625, 1.97784423828125, 2.1494140625, 2.32098388671875, 2.4925537109375, 2.66412353515625, 2.835693359375, 3.00726318359375, 3.1788330078125, 3.35040283203125, 3.52197265625, 3.69354248046875, 3.8651123046875, 4.03668212890625, 4.208251953125, 4.37982177734375, 4.5513916015625, 4.72296142578125, 4.89453125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 5.0, 8.0, 11.0, 9.0, 19.0, 21.0, 20.0, 37.0, 51.0, 82.0, 126.0, 190.0, 320.0, 560.0, 1132.0, 2141.0, 4834.0, 11246.0, 28795.0, 91660.0, 395569.0, 1421596.0, 1577791.0, 488091.0, 112486.0, 34071.0, 12814.0, 5397.0, 2439.0, 1230.0, 642.0, 334.0, 160.0, 115.0, 67.0, 43.0, 29.0, 39.0, 24.0, 13.0, 24.0, 12.0, 9.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0], "bins": [-8.4375, -8.20989990234375, -7.9822998046875, -7.75469970703125, -7.527099609375, -7.29949951171875, -7.0718994140625, -6.84429931640625, -6.61669921875, -6.38909912109375, -6.1614990234375, -5.93389892578125, -5.706298828125, -5.47869873046875, -5.2510986328125, -5.02349853515625, -4.7958984375, -4.56829833984375, -4.3406982421875, -4.11309814453125, -3.885498046875, -3.65789794921875, -3.4302978515625, -3.20269775390625, -2.97509765625, -2.74749755859375, -2.5198974609375, -2.29229736328125, -2.064697265625, -1.83709716796875, -1.6094970703125, -1.38189697265625, -1.154296875, -0.92669677734375, -0.6990966796875, -0.47149658203125, -0.243896484375, -0.01629638671875, 0.2113037109375, 0.43890380859375, 0.66650390625, 0.89410400390625, 1.1217041015625, 1.34930419921875, 1.576904296875, 1.80450439453125, 2.0321044921875, 2.25970458984375, 2.4873046875, 2.71490478515625, 2.9425048828125, 3.17010498046875, 3.397705078125, 3.62530517578125, 3.8529052734375, 4.08050537109375, 4.30810546875, 4.53570556640625, 4.7633056640625, 4.99090576171875, 5.218505859375, 5.44610595703125, 5.6737060546875, 5.90130615234375, 6.12890625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 8.0, 11.0, 7.0, 20.0, 19.0, 28.0, 41.0, 57.0, 75.0, 132.0, 156.0, 267.0, 424.0, 535.0, 615.0, 514.0, 388.0, 244.0, 170.0, 139.0, 73.0, 46.0, 33.0, 17.0, 13.0, 16.0, 9.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.515625, -10.065185546875, -9.61474609375, -9.164306640625, -8.7138671875, -8.263427734375, -7.81298828125, -7.362548828125, -6.912109375, -6.461669921875, -6.01123046875, -5.560791015625, -5.1103515625, -4.659912109375, -4.20947265625, -3.759033203125, -3.30859375, -2.858154296875, -2.40771484375, -1.957275390625, -1.5068359375, -1.056396484375, -0.60595703125, -0.155517578125, 0.294921875, 0.745361328125, 1.19580078125, 1.646240234375, 2.0966796875, 2.547119140625, 2.99755859375, 3.447998046875, 3.8984375, 4.348876953125, 4.79931640625, 5.249755859375, 5.7001953125, 6.150634765625, 6.60107421875, 7.051513671875, 7.501953125, 7.952392578125, 8.40283203125, 8.853271484375, 9.3037109375, 9.754150390625, 10.20458984375, 10.655029296875, 11.10546875, 11.555908203125, 12.00634765625, 12.456787109375, 12.9072265625, 13.357666015625, 13.80810546875, 14.258544921875, 14.708984375, 15.159423828125, 15.60986328125, 16.060302734375, 16.5107421875, 16.961181640625, 17.41162109375, 17.862060546875, 18.3125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 10.0, 10.0, 12.0, 32.0, 26.0, 61.0, 49.0, 91.0, 152.0, 251.0, 466.0, 1280.0, 7365.0, 135699.0, 3533820.0, 493768.0, 17666.0, 1923.0, 657.0, 346.0, 182.0, 123.0, 76.0, 60.0, 33.0, 34.0, 24.0, 14.0, 8.0, 13.0, 8.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-36.96875, -35.960693359375, -34.95263671875, -33.944580078125, -32.9365234375, -31.928466796875, -30.92041015625, -29.912353515625, -28.904296875, -27.896240234375, -26.88818359375, -25.880126953125, -24.8720703125, -23.864013671875, -22.85595703125, -21.847900390625, -20.83984375, -19.831787109375, -18.82373046875, -17.815673828125, -16.8076171875, -15.799560546875, -14.79150390625, -13.783447265625, -12.775390625, -11.767333984375, -10.75927734375, -9.751220703125, -8.7431640625, -7.735107421875, -6.72705078125, -5.718994140625, -4.7109375, -3.702880859375, -2.69482421875, -1.686767578125, -0.6787109375, 0.329345703125, 1.33740234375, 2.345458984375, 3.353515625, 4.361572265625, 5.36962890625, 6.377685546875, 7.3857421875, 8.393798828125, 9.40185546875, 10.409912109375, 11.41796875, 12.426025390625, 13.43408203125, 14.442138671875, 15.4501953125, 16.458251953125, 17.46630859375, 18.474365234375, 19.482421875, 20.490478515625, 21.49853515625, 22.506591796875, 23.5146484375, 24.522705078125, 25.53076171875, 26.538818359375, 27.546875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 3.0, 29.0, 36.0, 69.0, 91.0, 129.0, 152.0, 151.0, 126.0, 86.0, 55.0, 34.0, 17.0, 14.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-107.76737976074219, -105.6114730834961, -103.45556640625, -101.29966735839844, -99.14376068115234, -96.98785400390625, -94.83195495605469, -92.6760482788086, -90.5201416015625, -88.3642349243164, -86.20832824707031, -84.05242919921875, -81.89652252197266, -79.74061584472656, -77.584716796875, -75.4288101196289, -73.27290344238281, -71.11699676513672, -68.96109008789062, -66.80519104003906, -64.64928436279297, -62.493377685546875, -60.33747482299805, -58.18157196044922, -56.025665283203125, -53.86975860595703, -51.7138557434082, -49.557952880859375, -47.40204620361328, -45.24613952636719, -43.09023666381836, -40.93433380126953, -38.77843475341797, -36.622528076171875, -34.46662521362305, -32.31072235107422, -30.154815673828125, -27.998910903930664, -25.843006134033203, -23.687101364135742, -21.53119659423828, -19.37529182434082, -17.21938705444336, -15.063482284545898, -12.907577514648438, -10.751672744750977, -8.595767974853516, -6.439863204956055, -4.283958435058594, -2.128053665161133, 0.027851104736328125, 2.183755874633789, 4.33966064453125, 6.495565414428711, 8.651470184326172, 10.807374954223633, 12.963279724121094, 15.119184494018555, 17.275089263916016, 19.430994033813477, 21.586898803710938, 23.7428035736084, 25.89870834350586, 28.05461311340332, 30.21051788330078]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 7.0, 3.0, 12.0, 10.0, 19.0, 19.0, 24.0, 25.0, 22.0, 31.0, 32.0, 40.0, 39.0, 49.0, 47.0, 38.0, 51.0, 39.0, 49.0, 47.0, 38.0, 38.0, 44.0, 39.0, 36.0, 32.0, 36.0, 23.0, 29.0, 9.0, 9.0, 16.0, 9.0, 12.0, 7.0, 6.0, 1.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.13395690917969, -39.87421798706055, -38.61448287963867, -37.35474395751953, -36.095008850097656, -34.835269927978516, -33.57553482055664, -32.3157958984375, -31.056058883666992, -29.796321868896484, -28.536584854125977, -27.27684783935547, -26.017108917236328, -24.757373809814453, -23.497634887695312, -22.237897872924805, -20.978160858154297, -19.71842384338379, -18.45868682861328, -17.198949813842773, -15.93921184539795, -14.679474830627441, -13.419736862182617, -12.15999984741211, -10.900262832641602, -9.640525817871094, -8.380788803100586, -7.121050834655762, -5.861313819885254, -4.601576805114746, -3.34183931350708, -2.082101821899414, -0.8223648071289062, 0.43737244606018066, 1.6971096992492676, 2.9568469524383545, 4.216584205627441, 5.476321220397949, 6.736058712005615, 7.995796203613281, 9.255533218383789, 10.515270233154297, 11.775007247924805, 13.034745216369629, 14.294482231140137, 15.554219245910645, 16.81395721435547, 18.073694229125977, 19.333431243896484, 20.593168258666992, 21.8529052734375, 23.112642288208008, 24.372379302978516, 25.632118225097656, 26.891855239868164, 28.151592254638672, 29.41132926940918, 30.671066284179688, 31.930803298950195, 33.1905403137207, 34.450279235839844, 35.71001434326172, 36.96975326538086, 38.2294921875, 39.489227294921875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 5.0, 11.0, 12.0, 3.0, 14.0, 7.0, 15.0, 12.0, 22.0, 17.0, 29.0, 37.0, 25.0, 36.0, 49.0, 41.0, 51.0, 36.0, 40.0, 45.0, 41.0, 49.0, 49.0, 45.0, 43.0, 38.0, 35.0, 28.0, 18.0, 24.0, 18.0, 22.0, 21.0, 14.0, 13.0, 3.0, 7.0, 7.0, 2.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-6.33984375, -6.16644287109375, -5.9930419921875, -5.81964111328125, -5.646240234375, -5.47283935546875, -5.2994384765625, -5.12603759765625, -4.95263671875, -4.77923583984375, -4.6058349609375, -4.43243408203125, -4.259033203125, -4.08563232421875, -3.9122314453125, -3.73883056640625, -3.5654296875, -3.39202880859375, -3.2186279296875, -3.04522705078125, -2.871826171875, -2.69842529296875, -2.5250244140625, -2.35162353515625, -2.17822265625, -2.00482177734375, -1.8314208984375, -1.65802001953125, -1.484619140625, -1.31121826171875, -1.1378173828125, -0.96441650390625, -0.791015625, -0.61761474609375, -0.4442138671875, -0.27081298828125, -0.097412109375, 0.07598876953125, 0.2493896484375, 0.42279052734375, 0.59619140625, 0.76959228515625, 0.9429931640625, 1.11639404296875, 1.289794921875, 1.46319580078125, 1.6365966796875, 1.80999755859375, 1.9833984375, 2.15679931640625, 2.3302001953125, 2.50360107421875, 2.677001953125, 2.85040283203125, 3.0238037109375, 3.19720458984375, 3.37060546875, 3.54400634765625, 3.7174072265625, 3.89080810546875, 4.064208984375, 4.23760986328125, 4.4110107421875, 4.58441162109375, 4.7578125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 9.0, 9.0, 18.0, 20.0, 34.0, 50.0, 80.0, 115.0, 159.0, 304.0, 384.0, 572.0, 991.0, 1509.0, 2176.0, 3456.0, 5376.0, 8644.0, 14225.0, 23771.0, 42648.0, 83204.0, 182447.0, 314970.0, 178387.0, 81435.0, 42226.0, 23551.0, 14087.0, 8503.0, 5360.0, 3515.0, 2144.0, 1468.0, 887.0, 630.0, 425.0, 284.0, 170.0, 104.0, 76.0, 45.0, 32.0, 18.0, 17.0, 14.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2396240234375, -0.23224830627441406, -0.22487258911132812, -0.2174968719482422, -0.21012115478515625, -0.2027454376220703, -0.19536972045898438, -0.18799400329589844, -0.1806182861328125, -0.17324256896972656, -0.16586685180664062, -0.1584911346435547, -0.15111541748046875, -0.1437397003173828, -0.13636398315429688, -0.12898826599121094, -0.121612548828125, -0.11423683166503906, -0.10686111450195312, -0.09948539733886719, -0.09210968017578125, -0.08473396301269531, -0.07735824584960938, -0.06998252868652344, -0.0626068115234375, -0.05523109436035156, -0.047855377197265625, -0.04047966003417969, -0.03310394287109375, -0.025728225708007812, -0.018352508544921875, -0.010976791381835938, -0.00360107421875, 0.0037746429443359375, 0.011150360107421875, 0.018526077270507812, 0.02590179443359375, 0.03327751159667969, 0.040653228759765625, 0.04802894592285156, 0.0554046630859375, 0.06278038024902344, 0.07015609741210938, 0.07753181457519531, 0.08490753173828125, 0.09228324890136719, 0.09965896606445312, 0.10703468322753906, 0.114410400390625, 0.12178611755371094, 0.12916183471679688, 0.1365375518798828, 0.14391326904296875, 0.1512889862060547, 0.15866470336914062, 0.16604042053222656, 0.1734161376953125, 0.18079185485839844, 0.18816757202148438, 0.1955432891845703, 0.20291900634765625, 0.2102947235107422, 0.21767044067382812, 0.22504615783691406, 0.232421875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 5.0, 3.0, 8.0, 7.0, 18.0, 10.0, 13.0, 19.0, 23.0, 21.0, 33.0, 19.0, 31.0, 30.0, 22.0, 30.0, 39.0, 30.0, 36.0, 49.0, 25.0, 1063.0, 49.0, 39.0, 37.0, 35.0, 39.0, 31.0, 29.0, 29.0, 24.0, 27.0, 24.0, 24.0, 15.0, 21.0, 8.0, 9.0, 10.0, 6.0, 6.0, 7.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-3.689453125, -3.589996337890625, -3.49053955078125, -3.391082763671875, -3.2916259765625, -3.192169189453125, -3.09271240234375, -2.993255615234375, -2.893798828125, -2.794342041015625, -2.69488525390625, -2.595428466796875, -2.4959716796875, -2.396514892578125, -2.29705810546875, -2.197601318359375, -2.09814453125, -1.998687744140625, -1.89923095703125, -1.799774169921875, -1.7003173828125, -1.600860595703125, -1.50140380859375, -1.401947021484375, -1.302490234375, -1.203033447265625, -1.10357666015625, -1.004119873046875, -0.9046630859375, -0.805206298828125, -0.70574951171875, -0.606292724609375, -0.5068359375, -0.407379150390625, -0.30792236328125, -0.208465576171875, -0.1090087890625, -0.009552001953125, 0.08990478515625, 0.189361572265625, 0.288818359375, 0.388275146484375, 0.48773193359375, 0.587188720703125, 0.6866455078125, 0.786102294921875, 0.88555908203125, 0.985015869140625, 1.08447265625, 1.183929443359375, 1.28338623046875, 1.382843017578125, 1.4822998046875, 1.581756591796875, 1.68121337890625, 1.780670166015625, 1.880126953125, 1.979583740234375, 2.07904052734375, 2.178497314453125, 2.2779541015625, 2.377410888671875, 2.47686767578125, 2.576324462890625, 2.67578125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 13.0, 7.0, 15.0, 22.0, 31.0, 33.0, 51.0, 59.0, 92.0, 123.0, 181.0, 282.0, 408.0, 582.0, 845.0, 1233.0, 1774.0, 2815.0, 4236.0, 6794.0, 10353.0, 16535.0, 27232.0, 44799.0, 79611.0, 165489.0, 1342262.0, 180468.0, 85793.0, 47983.0, 28440.0, 17684.0, 10946.0, 6795.0, 4440.0, 2902.0, 1969.0, 1276.0, 796.0, 545.0, 374.0, 285.0, 184.0, 124.0, 87.0, 62.0, 34.0, 29.0, 10.0, 17.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2115478515625, -0.2050495147705078, -0.19855117797851562, -0.19205284118652344, -0.18555450439453125, -0.17905616760253906, -0.17255783081054688, -0.1660594940185547, -0.1595611572265625, -0.1530628204345703, -0.14656448364257812, -0.14006614685058594, -0.13356781005859375, -0.12706947326660156, -0.12057113647460938, -0.11407279968261719, -0.107574462890625, -0.10107612609863281, -0.09457778930664062, -0.08807945251464844, -0.08158111572265625, -0.07508277893066406, -0.06858444213867188, -0.06208610534667969, -0.0555877685546875, -0.04908943176269531, -0.042591094970703125, -0.03609275817871094, -0.02959442138671875, -0.023096084594726562, -0.016597747802734375, -0.010099411010742188, -0.00360107421875, 0.0028972625732421875, 0.009395599365234375, 0.015893936157226562, 0.02239227294921875, 0.028890609741210938, 0.035388946533203125, 0.04188728332519531, 0.0483856201171875, 0.05488395690917969, 0.061382293701171875, 0.06788063049316406, 0.07437896728515625, 0.08087730407714844, 0.08737564086914062, 0.09387397766113281, 0.100372314453125, 0.10687065124511719, 0.11336898803710938, 0.11986732482910156, 0.12636566162109375, 0.13286399841308594, 0.13936233520507812, 0.1458606719970703, 0.1523590087890625, 0.1588573455810547, 0.16535568237304688, 0.17185401916503906, 0.17835235595703125, 0.18485069274902344, 0.19134902954101562, 0.1978473663330078, 0.204345703125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 12.0, 11.0, 5.0, 15.0, 15.0, 14.0, 32.0, 30.0, 41.0, 49.0, 51.0, 58.0, 72.0, 80.0, 70.0, 57.0, 65.0, 53.0, 36.0, 42.0, 50.0, 22.0, 27.0, 19.0, 18.0, 14.0, 17.0, 5.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2007694244384766e-05, -3.0973926186561584e-05, -2.9940158128738403e-05, -2.8906390070915222e-05, -2.787262201309204e-05, -2.683885395526886e-05, -2.580508589744568e-05, -2.4771317839622498e-05, -2.3737549781799316e-05, -2.2703781723976135e-05, -2.1670013666152954e-05, -2.0636245608329773e-05, -1.9602477550506592e-05, -1.856870949268341e-05, -1.753494143486023e-05, -1.650117337703705e-05, -1.5467405319213867e-05, -1.4433637261390686e-05, -1.3399869203567505e-05, -1.2366101145744324e-05, -1.1332333087921143e-05, -1.0298565030097961e-05, -9.26479697227478e-06, -8.231028914451599e-06, -7.197260856628418e-06, -6.163492798805237e-06, -5.129724740982056e-06, -4.0959566831588745e-06, -3.0621886253356934e-06, -2.028420567512512e-06, -9.94652509689331e-07, 3.91155481338501e-08, 1.0728836059570312e-06, 2.1066516637802124e-06, 3.1404197216033936e-06, 4.174187779426575e-06, 5.207955837249756e-06, 6.241723895072937e-06, 7.275491952896118e-06, 8.3092600107193e-06, 9.34302806854248e-06, 1.0376796126365662e-05, 1.1410564184188843e-05, 1.2444332242012024e-05, 1.3478100299835205e-05, 1.4511868357658386e-05, 1.5545636415481567e-05, 1.657940447330475e-05, 1.761317253112793e-05, 1.864694058895111e-05, 1.9680708646774292e-05, 2.0714476704597473e-05, 2.1748244762420654e-05, 2.2782012820243835e-05, 2.3815780878067017e-05, 2.4849548935890198e-05, 2.588331699371338e-05, 2.691708505153656e-05, 2.795085310935974e-05, 2.8984621167182922e-05, 3.0018389225006104e-05, 3.1052157282829285e-05, 3.2085925340652466e-05, 3.311969339847565e-05, 3.415346145629883e-05]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 12.0, 7.0, 9.0, 8.0, 15.0, 22.0, 25.0, 24.0, 51.0, 57.0, 97.0, 114.0, 294.0, 791.0, 16070.0, 1021145.0, 8394.0, 736.0, 269.0, 132.0, 79.0, 61.0, 36.0, 19.0, 19.0, 11.0, 11.0, 12.0, 10.0, 11.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0006737709045410156, -0.0006523504853248596, -0.0006309300661087036, -0.0006095096468925476, -0.0005880892276763916, -0.0005666688084602356, -0.0005452483892440796, -0.0005238279700279236, -0.0005024075508117676, -0.00048098713159561157, -0.00045956671237945557, -0.00043814629316329956, -0.00041672587394714355, -0.00039530545473098755, -0.00037388503551483154, -0.00035246461629867554, -0.00033104419708251953, -0.0003096237778663635, -0.0002882033586502075, -0.0002667829394340515, -0.0002453625202178955, -0.0002239421010017395, -0.0002025216817855835, -0.0001811012625694275, -0.00015968084335327148, -0.00013826042413711548, -0.00011684000492095947, -9.541958570480347e-05, -7.399916648864746e-05, -5.2578747272491455e-05, -3.115832805633545e-05, -9.737908840179443e-06, 1.1682510375976562e-05, 3.310292959213257e-05, 5.4523348808288574e-05, 7.594376802444458e-05, 9.736418724060059e-05, 0.00011878460645675659, 0.0001402050256729126, 0.0001616254448890686, 0.0001830458641052246, 0.00020446628332138062, 0.00022588670253753662, 0.0002473071217536926, 0.00026872754096984863, 0.00029014796018600464, 0.00031156837940216064, 0.00033298879861831665, 0.00035440921783447266, 0.00037582963705062866, 0.00039725005626678467, 0.0004186704754829407, 0.0004400908946990967, 0.0004615113139152527, 0.0004829317331314087, 0.0005043521523475647, 0.0005257725715637207, 0.0005471929907798767, 0.0005686134099960327, 0.0005900338292121887, 0.0006114542484283447, 0.0006328746676445007, 0.0006542950868606567, 0.0006757155060768127, 0.0006971359252929688]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 14.0, 22.0, 33.0, 40.0, 65.0, 123.0, 129.0, 147.0, 132.0, 104.0, 89.0, 42.0, 24.0, 20.0, 5.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9572413293644786e-05, -1.873641122074332e-05, -1.7900409147841856e-05, -1.706440707494039e-05, -1.6228405002038926e-05, -1.5392404748126864e-05, -1.45564026752254e-05, -1.3720400602323934e-05, -1.288439852942247e-05, -1.2048396456521004e-05, -1.121239438361954e-05, -1.0376393220212776e-05, -9.540391147311311e-06, -8.704389074409846e-06, -7.868387911003083e-06, -7.032385838101618e-06, -6.196383765200153e-06, -5.360381692298688e-06, -4.524380074144574e-06, -3.6883782286167843e-06, -2.8523763830889948e-06, -2.0163743101875298e-06, -1.1803726920334157e-06, -3.4437107387930155e-07, 4.916309990221635e-07, 1.327632844549953e-06, 2.1636346900777426e-06, 2.999636535605532e-06, 3.835638381133322e-06, 4.671640454034787e-06, 5.507642072188901e-06, 6.343643690343015e-06, 7.17964576324448e-06, 8.015647836145945e-06, 8.85164990904741e-06, 9.687651072454173e-06, 1.0523653145355638e-05, 1.1359655218257103e-05, 1.2195656381663866e-05, 1.3031658454565331e-05, 1.3867660527466796e-05, 1.4703662600368261e-05, 1.5539664673269726e-05, 1.637566674617119e-05, 1.7211667000083253e-05, 1.804767089197412e-05, 1.8883671145886183e-05, 1.9719673218787648e-05, 2.0555675291689113e-05, 2.1391677364590578e-05, 2.2227679437492043e-05, 2.3063681510393508e-05, 2.3899683583294973e-05, 2.4735683837207034e-05, 2.55716859101085e-05, 2.6407687983009964e-05, 2.724369005591143e-05, 2.8079692128812894e-05, 2.891569420171436e-05, 2.9751696274615824e-05, 3.0587696528527886e-05, 3.1423700420418754e-05, 3.2259700674330816e-05, 3.3095704566221684e-05, 3.3931704820133746e-05]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 4.0, 4.0, 7.0, 14.0, 9.0, 13.0, 25.0, 21.0, 25.0, 33.0, 20.0, 33.0, 35.0, 37.0, 44.0, 35.0, 43.0, 43.0, 39.0, 47.0, 41.0, 38.0, 45.0, 37.0, 41.0, 38.0, 30.0, 31.0, 34.0, 26.0, 15.0, 13.0, 23.0, 10.0, 11.0, 7.0, 4.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0], "bins": [-1.895427703857422e-05, -1.8458813428878784e-05, -1.796334981918335e-05, -1.7467886209487915e-05, -1.697242259979248e-05, -1.6476958990097046e-05, -1.598149538040161e-05, -1.5486031770706177e-05, -1.4990568161010742e-05, -1.4495104551315308e-05, -1.3999640941619873e-05, -1.3504177331924438e-05, -1.3008713722229004e-05, -1.251325011253357e-05, -1.2017786502838135e-05, -1.15223228931427e-05, -1.1026859283447266e-05, -1.0531395673751831e-05, -1.0035932064056396e-05, -9.540468454360962e-06, -9.045004844665527e-06, -8.549541234970093e-06, -8.054077625274658e-06, -7.558614015579224e-06, -7.063150405883789e-06, -6.5676867961883545e-06, -6.07222318649292e-06, -5.576759576797485e-06, -5.081295967102051e-06, -4.585832357406616e-06, -4.090368747711182e-06, -3.594905138015747e-06, -3.0994415283203125e-06, -2.603977918624878e-06, -2.1085143089294434e-06, -1.6130506992340088e-06, -1.1175870895385742e-06, -6.221234798431396e-07, -1.2665987014770508e-07, 3.688037395477295e-07, 8.642673492431641e-07, 1.3597309589385986e-06, 1.8551945686340332e-06, 2.3506581783294678e-06, 2.8461217880249023e-06, 3.341585397720337e-06, 3.8370490074157715e-06, 4.332512617111206e-06, 4.827976226806641e-06, 5.323439836502075e-06, 5.81890344619751e-06, 6.314367055892944e-06, 6.809830665588379e-06, 7.3052942752838135e-06, 7.800757884979248e-06, 8.296221494674683e-06, 8.791685104370117e-06, 9.287148714065552e-06, 9.782612323760986e-06, 1.0278075933456421e-05, 1.0773539543151855e-05, 1.126900315284729e-05, 1.1764466762542725e-05, 1.225993037223816e-05, 1.2755393981933594e-05]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 5.0, 11.0, 12.0, 3.0, 14.0, 7.0, 15.0, 12.0, 22.0, 17.0, 29.0, 37.0, 25.0, 36.0, 49.0, 41.0, 51.0, 36.0, 40.0, 45.0, 41.0, 49.0, 49.0, 45.0, 43.0, 38.0, 35.0, 28.0, 18.0, 24.0, 18.0, 22.0, 21.0, 14.0, 13.0, 3.0, 7.0, 7.0, 2.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-6.33984375, -6.16644287109375, -5.9930419921875, -5.81964111328125, -5.646240234375, -5.47283935546875, -5.2994384765625, -5.12603759765625, -4.95263671875, -4.77923583984375, -4.6058349609375, -4.43243408203125, -4.259033203125, -4.08563232421875, -3.9122314453125, -3.73883056640625, -3.5654296875, -3.39202880859375, -3.2186279296875, -3.04522705078125, -2.871826171875, -2.69842529296875, -2.5250244140625, -2.35162353515625, -2.17822265625, -2.00482177734375, -1.8314208984375, -1.65802001953125, -1.484619140625, -1.31121826171875, -1.1378173828125, -0.96441650390625, -0.791015625, -0.61761474609375, -0.4442138671875, -0.27081298828125, -0.097412109375, 0.07598876953125, 0.2493896484375, 0.42279052734375, 0.59619140625, 0.76959228515625, 0.9429931640625, 1.11639404296875, 1.289794921875, 1.46319580078125, 1.6365966796875, 1.80999755859375, 1.9833984375, 2.15679931640625, 2.3302001953125, 2.50360107421875, 2.677001953125, 2.85040283203125, 3.0238037109375, 3.19720458984375, 3.37060546875, 3.54400634765625, 3.7174072265625, 3.89080810546875, 4.064208984375, 4.23760986328125, 4.4110107421875, 4.58441162109375, 4.7578125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 8.0, 12.0, 21.0, 28.0, 32.0, 70.0, 94.0, 139.0, 262.0, 386.0, 639.0, 1051.0, 1850.0, 3368.0, 6279.0, 12358.0, 26234.0, 63755.0, 211430.0, 493521.0, 137237.0, 47411.0, 20714.0, 9747.0, 5135.0, 2834.0, 1539.0, 929.0, 568.0, 337.0, 196.0, 131.0, 88.0, 61.0, 25.0, 25.0, 12.0, 8.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.916015625, -3.782562255859375, -3.64910888671875, -3.515655517578125, -3.3822021484375, -3.248748779296875, -3.11529541015625, -2.981842041015625, -2.848388671875, -2.714935302734375, -2.58148193359375, -2.448028564453125, -2.3145751953125, -2.181121826171875, -2.04766845703125, -1.914215087890625, -1.78076171875, -1.647308349609375, -1.51385498046875, -1.380401611328125, -1.2469482421875, -1.113494873046875, -0.98004150390625, -0.846588134765625, -0.713134765625, -0.579681396484375, -0.44622802734375, -0.312774658203125, -0.1793212890625, -0.045867919921875, 0.08758544921875, 0.221038818359375, 0.3544921875, 0.487945556640625, 0.62139892578125, 0.754852294921875, 0.8883056640625, 1.021759033203125, 1.15521240234375, 1.288665771484375, 1.422119140625, 1.555572509765625, 1.68902587890625, 1.822479248046875, 1.9559326171875, 2.089385986328125, 2.22283935546875, 2.356292724609375, 2.48974609375, 2.623199462890625, 2.75665283203125, 2.890106201171875, 3.0235595703125, 3.157012939453125, 3.29046630859375, 3.423919677734375, 3.557373046875, 3.690826416015625, 3.82427978515625, 3.957733154296875, 4.0911865234375, 4.224639892578125, 4.35809326171875, 4.491546630859375, 4.625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 3.0, 4.0, 5.0, 7.0, 9.0, 17.0, 7.0, 19.0, 18.0, 39.0, 23.0, 32.0, 44.0, 39.0, 52.0, 76.0, 114.0, 1594.0, 391.0, 108.0, 65.0, 66.0, 42.0, 42.0, 39.0, 37.0, 27.0, 20.0, 19.0, 15.0, 13.0, 13.0, 14.0, 7.0, 4.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.8125, -23.089599609375, -22.36669921875, -21.643798828125, -20.9208984375, -20.197998046875, -19.47509765625, -18.752197265625, -18.029296875, -17.306396484375, -16.58349609375, -15.860595703125, -15.1376953125, -14.414794921875, -13.69189453125, -12.968994140625, -12.24609375, -11.523193359375, -10.80029296875, -10.077392578125, -9.3544921875, -8.631591796875, -7.90869140625, -7.185791015625, -6.462890625, -5.739990234375, -5.01708984375, -4.294189453125, -3.5712890625, -2.848388671875, -2.12548828125, -1.402587890625, -0.6796875, 0.043212890625, 0.76611328125, 1.489013671875, 2.2119140625, 2.934814453125, 3.65771484375, 4.380615234375, 5.103515625, 5.826416015625, 6.54931640625, 7.272216796875, 7.9951171875, 8.718017578125, 9.44091796875, 10.163818359375, 10.88671875, 11.609619140625, 12.33251953125, 13.055419921875, 13.7783203125, 14.501220703125, 15.22412109375, 15.947021484375, 16.669921875, 17.392822265625, 18.11572265625, 18.838623046875, 19.5615234375, 20.284423828125, 21.00732421875, 21.730224609375, 22.453125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 4.0, 13.0, 8.0, 12.0, 25.0, 17.0, 49.0, 47.0, 79.0, 105.0, 169.0, 253.0, 536.0, 2373.0, 836099.0, 2302188.0, 2510.0, 475.0, 271.0, 152.0, 86.0, 75.0, 56.0, 29.0, 20.0, 16.0, 9.0, 6.0, 14.0, 7.0, 3.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-84.0, -81.84716796875, -79.6943359375, -77.54150390625, -75.388671875, -73.23583984375, -71.0830078125, -68.93017578125, -66.77734375, -64.62451171875, -62.4716796875, -60.31884765625, -58.166015625, -56.01318359375, -53.8603515625, -51.70751953125, -49.5546875, -47.40185546875, -45.2490234375, -43.09619140625, -40.943359375, -38.79052734375, -36.6376953125, -34.48486328125, -32.33203125, -30.17919921875, -28.0263671875, -25.87353515625, -23.720703125, -21.56787109375, -19.4150390625, -17.26220703125, -15.109375, -12.95654296875, -10.8037109375, -8.65087890625, -6.498046875, -4.34521484375, -2.1923828125, -0.03955078125, 2.11328125, 4.26611328125, 6.4189453125, 8.57177734375, 10.724609375, 12.87744140625, 15.0302734375, 17.18310546875, 19.3359375, 21.48876953125, 23.6416015625, 25.79443359375, 27.947265625, 30.10009765625, 32.2529296875, 34.40576171875, 36.55859375, 38.71142578125, 40.8642578125, 43.01708984375, 45.169921875, 47.32275390625, 49.4755859375, 51.62841796875, 53.78125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 33.0, 119.0, 283.0, 318.0, 179.0, 57.0, 16.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.58555221557617, -31.2160701751709, -28.846588134765625, -26.477108001708984, -24.107624053955078, -21.738143920898438, -19.368661880493164, -16.99917984008789, -14.629697799682617, -12.260215759277344, -9.89073371887207, -7.521252632141113, -5.15177059173584, -2.7822885513305664, -0.4128074645996094, 1.956674575805664, 4.3261566162109375, 6.695638656616211, 9.065120697021484, 11.434601783752441, 13.804083824157715, 16.173564910888672, 18.543046951293945, 20.91252899169922, 23.282011032104492, 25.651493072509766, 28.02097511291504, 30.390457153320312, 32.75993728637695, 35.12942123413086, 37.4989013671875, 39.868385314941406, 42.23786926269531, 44.60734939575195, 46.97683334350586, 49.3463134765625, 51.715797424316406, 54.08527755737305, 56.45475769042969, 58.824241638183594, 61.1937255859375, 63.56320571899414, 65.93268585205078, 68.30216979980469, 70.6716537475586, 73.0411376953125, 75.41061401367188, 77.78009796142578, 80.14958190917969, 82.5190658569336, 84.88854217529297, 87.25802612304688, 89.62751007080078, 91.99699401855469, 94.36647033691406, 96.73595428466797, 99.10543060302734, 101.47491455078125, 103.84439086914062, 106.21387481689453, 108.58335876464844, 110.95284271240234, 113.32231903076172, 115.69180297851562, 118.06128692626953]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 7.0, 5.0, 11.0, 9.0, 9.0, 11.0, 20.0, 19.0, 10.0, 19.0, 9.0, 23.0, 29.0, 28.0, 31.0, 31.0, 31.0, 44.0, 33.0, 42.0, 41.0, 32.0, 37.0, 39.0, 44.0, 29.0, 39.0, 20.0, 46.0, 32.0, 30.0, 23.0, 16.0, 28.0, 16.0, 16.0, 18.0, 10.0, 5.0, 16.0, 12.0, 3.0, 3.0, 4.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-47.413238525390625, -45.88478469848633, -44.3563346862793, -42.827880859375, -41.29943084716797, -39.77097702026367, -38.242523193359375, -36.714073181152344, -35.18561935424805, -33.65716552734375, -32.12871551513672, -30.600261688232422, -29.071809768676758, -27.543357849121094, -26.014904022216797, -24.486452102661133, -22.95800018310547, -21.429548263549805, -19.90109634399414, -18.372642517089844, -16.84419059753418, -15.315738677978516, -13.787285804748535, -12.258832931518555, -10.73038101196289, -9.201929092407227, -7.673476219177246, -6.145023822784424, -4.616571426391602, -3.0881190299987793, -1.559666633605957, -0.031213760375976562, 1.4972343444824219, 3.025686740875244, 4.554139137268066, 6.082591533660889, 7.611043930053711, 9.139495849609375, 10.667948722839355, 12.196401596069336, 13.724853515625, 15.253305435180664, 16.781757354736328, 18.310211181640625, 19.83866310119629, 21.367115020751953, 22.89556884765625, 24.424020767211914, 25.952472686767578, 27.480924606323242, 29.009376525878906, 30.537830352783203, 32.0662841796875, 33.59473419189453, 35.12318801879883, 36.651641845703125, 38.180091857910156, 39.70854568481445, 41.236995697021484, 42.76544952392578, 44.29389953613281, 45.82235336303711, 47.350807189941406, 48.87925720214844, 50.407711029052734]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 9.0, 4.0, 10.0, 11.0, 12.0, 18.0, 14.0, 28.0, 38.0, 28.0, 23.0, 25.0, 44.0, 42.0, 47.0, 55.0, 50.0, 44.0, 43.0, 42.0, 37.0, 46.0, 51.0, 43.0, 35.0, 21.0, 26.0, 27.0, 19.0, 22.0, 15.0, 16.0, 4.0, 10.0, 7.0, 5.0, 8.0, 8.0, 0.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.89453125, -6.70672607421875, -6.5189208984375, -6.33111572265625, -6.143310546875, -5.95550537109375, -5.7677001953125, -5.57989501953125, -5.39208984375, -5.20428466796875, -5.0164794921875, -4.82867431640625, -4.640869140625, -4.45306396484375, -4.2652587890625, -4.07745361328125, -3.8896484375, -3.70184326171875, -3.5140380859375, -3.32623291015625, -3.138427734375, -2.95062255859375, -2.7628173828125, -2.57501220703125, -2.38720703125, -2.19940185546875, -2.0115966796875, -1.82379150390625, -1.635986328125, -1.44818115234375, -1.2603759765625, -1.07257080078125, -0.884765625, -0.69696044921875, -0.5091552734375, -0.32135009765625, -0.133544921875, 0.05426025390625, 0.2420654296875, 0.42987060546875, 0.61767578125, 0.80548095703125, 0.9932861328125, 1.18109130859375, 1.368896484375, 1.55670166015625, 1.7445068359375, 1.93231201171875, 2.1201171875, 2.30792236328125, 2.4957275390625, 2.68353271484375, 2.871337890625, 3.05914306640625, 3.2469482421875, 3.43475341796875, 3.62255859375, 3.81036376953125, 3.9981689453125, 4.18597412109375, 4.373779296875, 4.56158447265625, 4.7493896484375, 4.93719482421875, 5.125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 7.0, 5.0, 4.0, 5.0, 8.0, 8.0, 11.0, 6.0, 19.0, 21.0, 25.0, 31.0, 31.0, 38.0, 56.0, 110.0, 227.0, 680.0, 2808.0, 23934.0, 638609.0, 3327900.0, 185968.0, 11110.0, 1725.0, 450.0, 159.0, 89.0, 45.0, 32.0, 26.0, 21.0, 15.0, 21.0, 16.0, 15.0, 10.0, 10.0, 7.0, 9.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.15625, -22.5009765625, -21.845703125, -21.1904296875, -20.53515625, -19.8798828125, -19.224609375, -18.5693359375, -17.9140625, -17.2587890625, -16.603515625, -15.9482421875, -15.29296875, -14.6376953125, -13.982421875, -13.3271484375, -12.671875, -12.0166015625, -11.361328125, -10.7060546875, -10.05078125, -9.3955078125, -8.740234375, -8.0849609375, -7.4296875, -6.7744140625, -6.119140625, -5.4638671875, -4.80859375, -4.1533203125, -3.498046875, -2.8427734375, -2.1875, -1.5322265625, -0.876953125, -0.2216796875, 0.43359375, 1.0888671875, 1.744140625, 2.3994140625, 3.0546875, 3.7099609375, 4.365234375, 5.0205078125, 5.67578125, 6.3310546875, 6.986328125, 7.6416015625, 8.296875, 8.9521484375, 9.607421875, 10.2626953125, 10.91796875, 11.5732421875, 12.228515625, 12.8837890625, 13.5390625, 14.1943359375, 14.849609375, 15.5048828125, 16.16015625, 16.8154296875, 17.470703125, 18.1259765625, 18.78125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 7.0, 4.0, 9.0, 10.0, 12.0, 20.0, 29.0, 45.0, 61.0, 89.0, 120.0, 189.0, 281.0, 457.0, 594.0, 684.0, 490.0, 334.0, 199.0, 162.0, 96.0, 56.0, 35.0, 31.0, 16.0, 16.0, 7.0, 9.0, 6.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-19.1875, -18.7318115234375, -18.276123046875, -17.8204345703125, -17.36474609375, -16.9090576171875, -16.453369140625, -15.9976806640625, -15.5419921875, -15.0863037109375, -14.630615234375, -14.1749267578125, -13.71923828125, -13.2635498046875, -12.807861328125, -12.3521728515625, -11.896484375, -11.4407958984375, -10.985107421875, -10.5294189453125, -10.07373046875, -9.6180419921875, -9.162353515625, -8.7066650390625, -8.2509765625, -7.7952880859375, -7.339599609375, -6.8839111328125, -6.42822265625, -5.9725341796875, -5.516845703125, -5.0611572265625, -4.60546875, -4.1497802734375, -3.694091796875, -3.2384033203125, -2.78271484375, -2.3270263671875, -1.871337890625, -1.4156494140625, -0.9599609375, -0.5042724609375, -0.048583984375, 0.4071044921875, 0.86279296875, 1.3184814453125, 1.774169921875, 2.2298583984375, 2.685546875, 3.1412353515625, 3.596923828125, 4.0526123046875, 4.50830078125, 4.9639892578125, 5.419677734375, 5.8753662109375, 6.3310546875, 6.7867431640625, 7.242431640625, 7.6981201171875, 8.15380859375, 8.6094970703125, 9.065185546875, 9.5208740234375, 9.9765625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 8.0, 1.0, 10.0, 5.0, 9.0, 20.0, 19.0, 23.0, 31.0, 52.0, 64.0, 98.0, 125.0, 182.0, 368.0, 784.0, 3199.0, 35231.0, 1799880.0, 2306570.0, 42239.0, 3493.0, 848.0, 337.0, 190.0, 143.0, 90.0, 80.0, 45.0, 37.0, 27.0, 12.0, 17.0, 17.0, 9.0, 9.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.234375, -25.186279296875, -24.13818359375, -23.090087890625, -22.0419921875, -20.993896484375, -19.94580078125, -18.897705078125, -17.849609375, -16.801513671875, -15.75341796875, -14.705322265625, -13.6572265625, -12.609130859375, -11.56103515625, -10.512939453125, -9.46484375, -8.416748046875, -7.36865234375, -6.320556640625, -5.2724609375, -4.224365234375, -3.17626953125, -2.128173828125, -1.080078125, -0.031982421875, 1.01611328125, 2.064208984375, 3.1123046875, 4.160400390625, 5.20849609375, 6.256591796875, 7.3046875, 8.352783203125, 9.40087890625, 10.448974609375, 11.4970703125, 12.545166015625, 13.59326171875, 14.641357421875, 15.689453125, 16.737548828125, 17.78564453125, 18.833740234375, 19.8818359375, 20.929931640625, 21.97802734375, 23.026123046875, 24.07421875, 25.122314453125, 26.17041015625, 27.218505859375, 28.2666015625, 29.314697265625, 30.36279296875, 31.410888671875, 32.458984375, 33.507080078125, 34.55517578125, 35.603271484375, 36.6513671875, 37.699462890625, 38.74755859375, 39.795654296875, 40.84375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 12.0, 30.0, 71.0, 132.0, 199.0, 210.0, 172.0, 100.0, 49.0, 25.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.96991729736328, -70.81488800048828, -67.65986633300781, -64.50483703613281, -61.34980773925781, -58.19478225708008, -55.039756774902344, -51.884727478027344, -48.72970199584961, -45.574676513671875, -42.419647216796875, -39.26462173461914, -36.109596252441406, -32.954566955566406, -29.799541473388672, -26.644514083862305, -23.489486694335938, -20.33445930480957, -17.179431915283203, -14.024406433105469, -10.869379043579102, -7.714351654052734, -4.559326171875, -1.4042987823486328, 1.7507286071777344, 4.905755519866943, 8.060782432556152, 11.215808868408203, 14.37083625793457, 17.525863647460938, 20.680889129638672, 23.83591651916504, 26.990936279296875, 30.145963668823242, 33.30099105834961, 36.456016540527344, 39.611045837402344, 42.76607131958008, 45.92109680175781, 49.07612609863281, 52.23115158081055, 55.38617706298828, 58.54120635986328, 61.696231842041016, 64.85125732421875, 68.00628662109375, 71.16131591796875, 74.31633758544922, 77.47136688232422, 80.62639617919922, 83.78141784667969, 86.93644714355469, 90.09147644042969, 93.24650573730469, 96.40152740478516, 99.55655670166016, 102.71157836914062, 105.86660766601562, 109.0216293334961, 112.1766586303711, 115.3316879272461, 118.48670959472656, 121.64173889160156, 124.79676818847656, 127.95179748535156]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 5.0, 12.0, 10.0, 17.0, 8.0, 14.0, 14.0, 16.0, 21.0, 21.0, 27.0, 26.0, 27.0, 32.0, 46.0, 30.0, 35.0, 40.0, 38.0, 38.0, 44.0, 36.0, 31.0, 31.0, 36.0, 38.0, 29.0, 29.0, 24.0, 33.0, 28.0, 22.0, 16.0, 21.0, 24.0, 18.0, 9.0, 12.0, 12.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.168731689453125, -32.07419204711914, -30.979650497436523, -29.885108947753906, -28.790569305419922, -27.696027755737305, -26.601486206054688, -25.506946563720703, -24.412405014038086, -23.31786346435547, -22.223323822021484, -21.128782272338867, -20.03424072265625, -18.939701080322266, -17.84515953063965, -16.75061798095703, -15.656078338623047, -14.561537742614746, -13.466997146606445, -12.372455596923828, -11.277915000915527, -10.183374404907227, -9.08883285522461, -7.994292259216309, -6.899751663208008, -5.805211067199707, -4.710669994354248, -3.616129159927368, -2.5215883255004883, -1.4270477294921875, -0.3325066566467285, 0.7620344161987305, 1.8565711975097656, 2.9511120319366455, 4.045652866363525, 5.140193939208984, 6.234734535217285, 7.329275131225586, 8.423816680908203, 9.518357276916504, 10.612897872924805, 11.707438468933105, 12.801979064941406, 13.896520614624023, 14.991061210632324, 16.085601806640625, 17.180143356323242, 18.27468490600586, 19.369224548339844, 20.46376609802246, 21.558305740356445, 22.652847290039062, 23.747386932373047, 24.841928482055664, 25.93647003173828, 27.031009674072266, 28.125551223754883, 29.2200927734375, 30.314632415771484, 31.4091739654541, 32.50371551513672, 33.5982551574707, 34.69279479980469, 35.78733825683594, 36.88187789916992]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 3.0, 11.0, 14.0, 12.0, 20.0, 27.0, 27.0, 27.0, 43.0, 40.0, 44.0, 57.0, 53.0, 59.0, 59.0, 71.0, 58.0, 65.0, 37.0, 66.0, 44.0, 29.0, 29.0, 28.0, 22.0, 12.0, 8.0, 10.0, 7.0, 7.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.171875, -9.92822265625, -9.6845703125, -9.44091796875, -9.197265625, -8.95361328125, -8.7099609375, -8.46630859375, -8.22265625, -7.97900390625, -7.7353515625, -7.49169921875, -7.248046875, -7.00439453125, -6.7607421875, -6.51708984375, -6.2734375, -6.02978515625, -5.7861328125, -5.54248046875, -5.298828125, -5.05517578125, -4.8115234375, -4.56787109375, -4.32421875, -4.08056640625, -3.8369140625, -3.59326171875, -3.349609375, -3.10595703125, -2.8623046875, -2.61865234375, -2.375, -2.13134765625, -1.8876953125, -1.64404296875, -1.400390625, -1.15673828125, -0.9130859375, -0.66943359375, -0.42578125, -0.18212890625, 0.0615234375, 0.30517578125, 0.548828125, 0.79248046875, 1.0361328125, 1.27978515625, 1.5234375, 1.76708984375, 2.0107421875, 2.25439453125, 2.498046875, 2.74169921875, 2.9853515625, 3.22900390625, 3.47265625, 3.71630859375, 3.9599609375, 4.20361328125, 4.447265625, 4.69091796875, 4.9345703125, 5.17822265625, 5.421875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 5.0, 10.0, 4.0, 10.0, 5.0, 19.0, 13.0, 22.0, 38.0, 50.0, 71.0, 124.0, 233.0, 397.0, 712.0, 1286.0, 2591.0, 4982.0, 9984.0, 20347.0, 43751.0, 108768.0, 353052.0, 322607.0, 99874.0, 41307.0, 19114.0, 9214.0, 4777.0, 2421.0, 1254.0, 659.0, 341.0, 209.0, 132.0, 56.0, 34.0, 21.0, 21.0, 10.0, 11.0, 6.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.36767578125, -0.356170654296875, -0.34466552734375, -0.333160400390625, -0.3216552734375, -0.310150146484375, -0.29864501953125, -0.287139892578125, -0.275634765625, -0.264129638671875, -0.25262451171875, -0.241119384765625, -0.2296142578125, -0.218109130859375, -0.20660400390625, -0.195098876953125, -0.18359375, -0.172088623046875, -0.16058349609375, -0.149078369140625, -0.1375732421875, -0.126068115234375, -0.11456298828125, -0.103057861328125, -0.091552734375, -0.080047607421875, -0.06854248046875, -0.057037353515625, -0.0455322265625, -0.034027099609375, -0.02252197265625, -0.011016845703125, 0.00048828125, 0.011993408203125, 0.02349853515625, 0.035003662109375, 0.0465087890625, 0.058013916015625, 0.06951904296875, 0.081024169921875, 0.092529296875, 0.104034423828125, 0.11553955078125, 0.127044677734375, 0.1385498046875, 0.150054931640625, 0.16156005859375, 0.173065185546875, 0.1845703125, 0.196075439453125, 0.20758056640625, 0.219085693359375, 0.2305908203125, 0.242095947265625, 0.25360107421875, 0.265106201171875, 0.276611328125, 0.288116455078125, 0.29962158203125, 0.311126708984375, 0.3226318359375, 0.334136962890625, 0.34564208984375, 0.357147216796875, 0.36865234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 9.0, 8.0, 8.0, 14.0, 5.0, 9.0, 13.0, 17.0, 16.0, 18.0, 21.0, 23.0, 41.0, 42.0, 31.0, 35.0, 33.0, 36.0, 38.0, 45.0, 23.0, 1066.0, 37.0, 35.0, 42.0, 35.0, 34.0, 32.0, 26.0, 24.0, 27.0, 26.0, 24.0, 31.0, 18.0, 22.0, 11.0, 13.0, 7.0, 10.0, 4.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.376953125, -3.266326904296875, -3.15570068359375, -3.045074462890625, -2.9344482421875, -2.823822021484375, -2.71319580078125, -2.602569580078125, -2.491943359375, -2.381317138671875, -2.27069091796875, -2.160064697265625, -2.0494384765625, -1.938812255859375, -1.82818603515625, -1.717559814453125, -1.60693359375, -1.496307373046875, -1.38568115234375, -1.275054931640625, -1.1644287109375, -1.053802490234375, -0.94317626953125, -0.832550048828125, -0.721923828125, -0.611297607421875, -0.50067138671875, -0.390045166015625, -0.2794189453125, -0.168792724609375, -0.05816650390625, 0.052459716796875, 0.1630859375, 0.273712158203125, 0.38433837890625, 0.494964599609375, 0.6055908203125, 0.716217041015625, 0.82684326171875, 0.937469482421875, 1.048095703125, 1.158721923828125, 1.26934814453125, 1.379974365234375, 1.4906005859375, 1.601226806640625, 1.71185302734375, 1.822479248046875, 1.93310546875, 2.043731689453125, 2.15435791015625, 2.264984130859375, 2.3756103515625, 2.486236572265625, 2.59686279296875, 2.707489013671875, 2.818115234375, 2.928741455078125, 3.03936767578125, 3.149993896484375, 3.2606201171875, 3.371246337890625, 3.48187255859375, 3.592498779296875, 3.703125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 14.0, 10.0, 21.0, 25.0, 41.0, 74.0, 106.0, 142.0, 189.0, 275.0, 396.0, 620.0, 888.0, 1307.0, 1965.0, 2912.0, 4273.0, 6203.0, 9580.0, 14892.0, 23264.0, 35946.0, 59008.0, 104505.0, 207442.0, 1300688.0, 131454.0, 70678.0, 42740.0, 26744.0, 17320.0, 11200.0, 7214.0, 4833.0, 3339.0, 2190.0, 1491.0, 1049.0, 688.0, 460.0, 297.0, 216.0, 132.0, 87.0, 69.0, 51.0, 32.0, 23.0, 10.0, 5.0, 4.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.198486328125, -0.19211959838867188, -0.18575286865234375, -0.17938613891601562, -0.1730194091796875, -0.16665267944335938, -0.16028594970703125, -0.15391921997070312, -0.147552490234375, -0.14118576049804688, -0.13481903076171875, -0.12845230102539062, -0.1220855712890625, -0.11571884155273438, -0.10935211181640625, -0.10298538208007812, -0.09661865234375, -0.09025192260742188, -0.08388519287109375, -0.07751846313476562, -0.0711517333984375, -0.06478500366210938, -0.05841827392578125, -0.052051544189453125, -0.045684814453125, -0.039318084716796875, -0.03295135498046875, -0.026584625244140625, -0.0202178955078125, -0.013851165771484375, -0.00748443603515625, -0.001117706298828125, 0.0052490234375, 0.011615753173828125, 0.01798248291015625, 0.024349212646484375, 0.0307159423828125, 0.037082672119140625, 0.04344940185546875, 0.049816131591796875, 0.056182861328125, 0.06254959106445312, 0.06891632080078125, 0.07528305053710938, 0.0816497802734375, 0.08801651000976562, 0.09438323974609375, 0.10074996948242188, 0.10711669921875, 0.11348342895507812, 0.11985015869140625, 0.12621688842773438, 0.1325836181640625, 0.13895034790039062, 0.14531707763671875, 0.15168380737304688, 0.158050537109375, 0.16441726684570312, 0.17078399658203125, 0.17715072631835938, 0.1835174560546875, 0.18988418579101562, 0.19625091552734375, 0.20261764526367188, 0.208984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 9.0, 6.0, 8.0, 12.0, 28.0, 36.0, 33.0, 59.0, 51.0, 63.0, 89.0, 96.0, 82.0, 78.0, 59.0, 68.0, 55.0, 39.0, 29.0, 31.0, 20.0, 14.0, 6.0, 8.0, 6.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.814697265625e-05, -3.660563379526138e-05, -3.5064294934272766e-05, -3.352295607328415e-05, -3.198161721229553e-05, -3.0440278351306915e-05, -2.88989394903183e-05, -2.735760062932968e-05, -2.5816261768341064e-05, -2.4274922907352448e-05, -2.273358404636383e-05, -2.1192245185375214e-05, -1.9650906324386597e-05, -1.810956746339798e-05, -1.6568228602409363e-05, -1.5026889741420746e-05, -1.3485550880432129e-05, -1.1944212019443512e-05, -1.0402873158454895e-05, -8.861534297466278e-06, -7.320195436477661e-06, -5.778856575489044e-06, -4.237517714500427e-06, -2.6961788535118103e-06, -1.1548399925231934e-06, 3.864988684654236e-07, 1.9278377294540405e-06, 3.4691765904426575e-06, 5.010515451431274e-06, 6.551854312419891e-06, 8.093193173408508e-06, 9.634532034397125e-06, 1.1175870895385742e-05, 1.2717209756374359e-05, 1.4258548617362976e-05, 1.5799887478351593e-05, 1.734122633934021e-05, 1.8882565200328827e-05, 2.0423904061317444e-05, 2.196524292230606e-05, 2.3506581783294678e-05, 2.5047920644283295e-05, 2.658925950527191e-05, 2.813059836626053e-05, 2.9671937227249146e-05, 3.121327608823776e-05, 3.275461494922638e-05, 3.4295953810214996e-05, 3.583729267120361e-05, 3.737863153219223e-05, 3.891997039318085e-05, 4.0461309254169464e-05, 4.200264811515808e-05, 4.35439869761467e-05, 4.5085325837135315e-05, 4.662666469812393e-05, 4.816800355911255e-05, 4.9709342420101166e-05, 5.125068128108978e-05, 5.27920201420784e-05, 5.4333359003067017e-05, 5.5874697864055634e-05, 5.741603672504425e-05, 5.895737558603287e-05, 6.0498714447021484e-05]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 10.0, 7.0, 8.0, 12.0, 14.0, 32.0, 45.0, 57.0, 88.0, 138.0, 234.0, 719.0, 67622.0, 977232.0, 1584.0, 338.0, 137.0, 87.0, 56.0, 41.0, 31.0, 20.0, 10.0, 8.0, 6.0, 10.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012044906616210938, -0.0011721178889274597, -0.0011397451162338257, -0.0011073723435401917, -0.0010749995708465576, -0.0010426267981529236, -0.0010102540254592896, -0.0009778812527656555, -0.0009455084800720215, -0.0009131357073783875, -0.0008807629346847534, -0.0008483901619911194, -0.0008160173892974854, -0.0007836446166038513, -0.0007512718439102173, -0.0007188990712165833, -0.0006865262985229492, -0.0006541535258293152, -0.0006217807531356812, -0.0005894079804420471, -0.0005570352077484131, -0.000524662435054779, -0.000492289662361145, -0.000459916889667511, -0.00042754411697387695, -0.0003951713442802429, -0.0003627985715866089, -0.00033042579889297485, -0.0002980530261993408, -0.0002656802535057068, -0.00023330748081207275, -0.00020093470811843872, -0.0001685619354248047, -0.00013618916273117065, -0.00010381639003753662, -7.144361734390259e-05, -3.9070844650268555e-05, -6.6980719566345215e-06, 2.5674700736999512e-05, 5.8047473430633545e-05, 9.042024612426758e-05, 0.0001227930188179016, 0.00015516579151153564, 0.00018753856420516968, 0.0002199113368988037, 0.00025228410959243774, 0.0002846568822860718, 0.0003170296549797058, 0.00034940242767333984, 0.0003817752003669739, 0.0004141479730606079, 0.00044652074575424194, 0.000478893518447876, 0.00051126629114151, 0.000543639063835144, 0.0005760118365287781, 0.0006083846092224121, 0.0006407573819160461, 0.0006731301546096802, 0.0007055029273033142, 0.0007378756999969482, 0.0007702484726905823, 0.0008026212453842163, 0.0008349940180778503, 0.0008673667907714844]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 17.0, 207.0, 512.0, 251.0, 27.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.802412407414522e-05, -1.4086487681197468e-05, -1.0148851288249716e-05, -6.211214895301964e-06, -2.273578502354212e-06, 1.6640569810988382e-06, 5.601694283541292e-06, 9.539331585983746e-06, 1.3476967069436796e-05, 1.741460437187925e-05, 2.13522398553323e-05, 2.528987533878535e-05, 2.9227512641227804e-05, 3.316514630569145e-05, 3.710278542712331e-05, 4.1040424548555166e-05, 4.497805639402941e-05, 4.891569187748246e-05, 5.285332736093551e-05, 5.6790966482367367e-05, 6.072860196582042e-05, 6.466623744927347e-05, 6.860387657070532e-05, 7.254151569213718e-05, 7.647914753761142e-05, 8.041678665904328e-05, 8.435441850451753e-05, 8.829205762594938e-05, 9.222968947142363e-05, 9.616732859285548e-05, 0.00010010496771428734, 0.00010404259955976158, 0.00010798023140523583, 0.00011191787052666768, 0.00011585550237214193, 0.00011979314149357378, 0.00012373077333904803, 0.00012766840518452227, 0.00013160605158191174, 0.00013554368342738599, 0.00013948132982477546, 0.0001434189616702497, 0.00014735660806763917, 0.00015129423991311342, 0.00015523187175858766, 0.00015916951815597713, 0.00016310715000145137, 0.00016704478184692562, 0.00017098241369239986, 0.0001749200455378741, 0.00017885769193526357, 0.00018279532378073782, 0.00018673295562621206, 0.00019067060202360153, 0.00019460823386907578, 0.00019854586571455002, 0.00020248349756002426, 0.0002064211294054985, 0.00021035877580288798, 0.00021429640764836222, 0.00021823403949383646, 0.00022217168589122593, 0.00022610931773670018, 0.00023004694958217442, 0.0002339845959795639]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 10.0, 10.0, 5.0, 7.0, 6.0, 10.0, 9.0, 13.0, 12.0, 18.0, 11.0, 18.0, 39.0, 21.0, 33.0, 22.0, 28.0, 45.0, 41.0, 44.0, 35.0, 39.0, 38.0, 33.0, 42.0, 49.0, 44.0, 43.0, 35.0, 30.0, 18.0, 30.0, 34.0, 23.0, 19.0, 16.0, 10.0, 14.0, 15.0, 4.0, 8.0, 5.0, 7.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7583370208740234e-05, -1.70217826962471e-05, -1.6460195183753967e-05, -1.5898607671260834e-05, -1.53370201587677e-05, -1.4775432646274567e-05, -1.4213845133781433e-05, -1.36522576212883e-05, -1.3090670108795166e-05, -1.2529082596302032e-05, -1.1967495083808899e-05, -1.1405907571315765e-05, -1.0844320058822632e-05, -1.0282732546329498e-05, -9.721145033836365e-06, -9.159557521343231e-06, -8.597970008850098e-06, -8.036382496356964e-06, -7.4747949838638306e-06, -6.913207471370697e-06, -6.3516199588775635e-06, -5.79003244638443e-06, -5.228444933891296e-06, -4.666857421398163e-06, -4.105269908905029e-06, -3.5436823964118958e-06, -2.982094883918762e-06, -2.4205073714256287e-06, -1.8589198589324951e-06, -1.2973323464393616e-06, -7.35744833946228e-07, -1.7415732145309448e-07, 3.8743019104003906e-07, 9.490177035331726e-07, 1.5106052160263062e-06, 2.0721927285194397e-06, 2.6337802410125732e-06, 3.1953677535057068e-06, 3.7569552659988403e-06, 4.318542778491974e-06, 4.880130290985107e-06, 5.441717803478241e-06, 6.0033053159713745e-06, 6.564892828464508e-06, 7.126480340957642e-06, 7.688067853450775e-06, 8.249655365943909e-06, 8.811242878437042e-06, 9.372830390930176e-06, 9.93441790342331e-06, 1.0496005415916443e-05, 1.1057592928409576e-05, 1.161918044090271e-05, 1.2180767953395844e-05, 1.2742355465888977e-05, 1.330394297838211e-05, 1.3865530490875244e-05, 1.4427118003368378e-05, 1.4988705515861511e-05, 1.5550293028354645e-05, 1.611188054084778e-05, 1.6673468053340912e-05, 1.7235055565834045e-05, 1.779664307832718e-05, 1.8358230590820312e-05]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 3.0, 11.0, 14.0, 12.0, 20.0, 27.0, 27.0, 27.0, 43.0, 40.0, 44.0, 57.0, 53.0, 59.0, 59.0, 71.0, 58.0, 65.0, 37.0, 66.0, 44.0, 29.0, 29.0, 28.0, 22.0, 12.0, 8.0, 10.0, 7.0, 7.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.171875, -9.92822265625, -9.6845703125, -9.44091796875, -9.197265625, -8.95361328125, -8.7099609375, -8.46630859375, -8.22265625, -7.97900390625, -7.7353515625, -7.49169921875, -7.248046875, -7.00439453125, -6.7607421875, -6.51708984375, -6.2734375, -6.02978515625, -5.7861328125, -5.54248046875, -5.298828125, -5.05517578125, -4.8115234375, -4.56787109375, -4.32421875, -4.08056640625, -3.8369140625, -3.59326171875, -3.349609375, -3.10595703125, -2.8623046875, -2.61865234375, -2.375, -2.13134765625, -1.8876953125, -1.64404296875, -1.400390625, -1.15673828125, -0.9130859375, -0.66943359375, -0.42578125, -0.18212890625, 0.0615234375, 0.30517578125, 0.548828125, 0.79248046875, 1.0361328125, 1.27978515625, 1.5234375, 1.76708984375, 2.0107421875, 2.25439453125, 2.498046875, 2.74169921875, 2.9853515625, 3.22900390625, 3.47265625, 3.71630859375, 3.9599609375, 4.20361328125, 4.447265625, 4.69091796875, 4.9345703125, 5.17822265625, 5.421875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 8.0, 20.0, 47.0, 66.0, 106.0, 237.0, 432.0, 950.0, 2171.0, 4733.0, 11459.0, 30400.0, 96838.0, 541577.0, 263079.0, 60654.0, 20999.0, 8219.0, 3452.0, 1551.0, 756.0, 380.0, 178.0, 101.0, 50.0, 32.0, 26.0, 9.0, 10.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.40234375, -7.1767578125, -6.951171875, -6.7255859375, -6.5, -6.2744140625, -6.048828125, -5.8232421875, -5.59765625, -5.3720703125, -5.146484375, -4.9208984375, -4.6953125, -4.4697265625, -4.244140625, -4.0185546875, -3.79296875, -3.5673828125, -3.341796875, -3.1162109375, -2.890625, -2.6650390625, -2.439453125, -2.2138671875, -1.98828125, -1.7626953125, -1.537109375, -1.3115234375, -1.0859375, -0.8603515625, -0.634765625, -0.4091796875, -0.18359375, 0.0419921875, 0.267578125, 0.4931640625, 0.71875, 0.9443359375, 1.169921875, 1.3955078125, 1.62109375, 1.8466796875, 2.072265625, 2.2978515625, 2.5234375, 2.7490234375, 2.974609375, 3.2001953125, 3.42578125, 3.6513671875, 3.876953125, 4.1025390625, 4.328125, 4.5537109375, 4.779296875, 5.0048828125, 5.23046875, 5.4560546875, 5.681640625, 5.9072265625, 6.1328125, 6.3583984375, 6.583984375, 6.8095703125, 7.03515625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 9.0, 6.0, 5.0, 8.0, 4.0, 11.0, 16.0, 19.0, 20.0, 22.0, 22.0, 29.0, 21.0, 32.0, 37.0, 37.0, 46.0, 45.0, 75.0, 99.0, 210.0, 1642.0, 158.0, 70.0, 57.0, 52.0, 38.0, 29.0, 41.0, 35.0, 28.0, 23.0, 12.0, 22.0, 15.0, 13.0, 10.0, 13.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.390625, -16.81689453125, -16.2431640625, -15.66943359375, -15.095703125, -14.52197265625, -13.9482421875, -13.37451171875, -12.80078125, -12.22705078125, -11.6533203125, -11.07958984375, -10.505859375, -9.93212890625, -9.3583984375, -8.78466796875, -8.2109375, -7.63720703125, -7.0634765625, -6.48974609375, -5.916015625, -5.34228515625, -4.7685546875, -4.19482421875, -3.62109375, -3.04736328125, -2.4736328125, -1.89990234375, -1.326171875, -0.75244140625, -0.1787109375, 0.39501953125, 0.96875, 1.54248046875, 2.1162109375, 2.68994140625, 3.263671875, 3.83740234375, 4.4111328125, 4.98486328125, 5.55859375, 6.13232421875, 6.7060546875, 7.27978515625, 7.853515625, 8.42724609375, 9.0009765625, 9.57470703125, 10.1484375, 10.72216796875, 11.2958984375, 11.86962890625, 12.443359375, 13.01708984375, 13.5908203125, 14.16455078125, 14.73828125, 15.31201171875, 15.8857421875, 16.45947265625, 17.033203125, 17.60693359375, 18.1806640625, 18.75439453125, 19.328125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 1.0, 6.0, 5.0, 21.0, 20.0, 14.0, 23.0, 33.0, 27.0, 43.0, 68.0, 79.0, 97.0, 123.0, 187.0, 291.0, 527.0, 1777.0, 34171.0, 3033022.0, 70900.0, 2450.0, 584.0, 352.0, 216.0, 148.0, 113.0, 74.0, 63.0, 55.0, 42.0, 38.0, 37.0, 28.0, 18.0, 9.0, 11.0, 9.0, 4.0, 6.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.21875, -39.91357421875, -38.6083984375, -37.30322265625, -35.998046875, -34.69287109375, -33.3876953125, -32.08251953125, -30.77734375, -29.47216796875, -28.1669921875, -26.86181640625, -25.556640625, -24.25146484375, -22.9462890625, -21.64111328125, -20.3359375, -19.03076171875, -17.7255859375, -16.42041015625, -15.115234375, -13.81005859375, -12.5048828125, -11.19970703125, -9.89453125, -8.58935546875, -7.2841796875, -5.97900390625, -4.673828125, -3.36865234375, -2.0634765625, -0.75830078125, 0.546875, 1.85205078125, 3.1572265625, 4.46240234375, 5.767578125, 7.07275390625, 8.3779296875, 9.68310546875, 10.98828125, 12.29345703125, 13.5986328125, 14.90380859375, 16.208984375, 17.51416015625, 18.8193359375, 20.12451171875, 21.4296875, 22.73486328125, 24.0400390625, 25.34521484375, 26.650390625, 27.95556640625, 29.2607421875, 30.56591796875, 31.87109375, 33.17626953125, 34.4814453125, 35.78662109375, 37.091796875, 38.39697265625, 39.7021484375, 41.00732421875, 42.3125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [9.0, 682.0, 329.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.87465476989746, -8.509739875793457, 0.8551750183105469, 10.220090866088867, 19.585004806518555, 28.949918746948242, 38.31483459472656, 47.67974853515625, 57.04466247558594, 66.40957641601562, 75.77449035644531, 85.139404296875, 94.50431823730469, 103.86923217773438, 113.2341537475586, 122.59906768798828, 131.9639892578125, 141.3289031982422, 150.69381713867188, 160.05873107910156, 169.42364501953125, 178.78855895996094, 188.15347290039062, 197.51840209960938, 206.88330078125, 216.2482147216797, 225.61312866210938, 234.97804260253906, 244.34295654296875, 253.70787048339844, 263.0727844238281, 272.4377136230469, 281.8026428222656, 291.1675720214844, 300.532470703125, 309.89739990234375, 319.2622985839844, 328.6272277832031, 337.99212646484375, 347.3570556640625, 356.7219543457031, 366.0868835449219, 375.4517822265625, 384.81671142578125, 394.1816101074219, 403.5465393066406, 412.91143798828125, 422.2763671875, 431.64129638671875, 441.0062255859375, 450.3711242675781, 459.7360534667969, 469.1009521484375, 478.46588134765625, 487.8307800292969, 497.1957092285156, 506.56060791015625, 515.925537109375, 525.2904663085938, 534.6553344726562, 544.020263671875, 553.3851928710938, 562.7501220703125, 572.114990234375, 581.4799194335938]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 3.0, 6.0, 9.0, 12.0, 6.0, 11.0, 20.0, 19.0, 16.0, 16.0, 27.0, 31.0, 21.0, 32.0, 30.0, 35.0, 36.0, 40.0, 40.0, 42.0, 23.0, 52.0, 28.0, 32.0, 38.0, 31.0, 42.0, 41.0, 26.0, 27.0, 26.0, 29.0, 24.0, 16.0, 21.0, 10.0, 7.0, 18.0, 7.0, 6.0, 6.0, 6.0, 8.0, 7.0, 1.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.3968620300293, -46.868988037109375, -45.34111022949219, -43.813236236572266, -42.285362243652344, -40.757484436035156, -39.229610443115234, -37.70173645019531, -36.173858642578125, -34.6459846496582, -33.118106842041016, -31.590232849121094, -30.062358856201172, -28.534482955932617, -27.006607055664062, -25.47873306274414, -23.95085906982422, -22.422983169555664, -20.895109176635742, -19.367233276367188, -17.839359283447266, -16.31148338317871, -14.783607482910156, -13.255732536315918, -11.72785758972168, -10.199982643127441, -8.672107696533203, -7.144231796264648, -5.61635684967041, -4.088481903076172, -2.560606002807617, -1.032731056213379, 0.495147705078125, 2.0230228900909424, 3.5508980751037598, 5.078773498535156, 6.6066484451293945, 8.134523391723633, 9.662399291992188, 11.190274238586426, 12.718149185180664, 14.246024131774902, 15.77389907836914, 17.301774978637695, 18.82965087890625, 20.357524871826172, 21.885400772094727, 23.41327667236328, 24.941150665283203, 26.469026565551758, 27.99690055847168, 29.524776458740234, 31.052650451660156, 32.580528259277344, 34.108402252197266, 35.63627624511719, 37.164154052734375, 38.6920280456543, 40.219905853271484, 41.747779846191406, 43.27565383911133, 44.80352783203125, 46.33140563964844, 47.85927963256836, 49.38715362548828]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 6.0, 10.0, 13.0, 20.0, 16.0, 18.0, 24.0, 25.0, 34.0, 48.0, 39.0, 48.0, 51.0, 64.0, 62.0, 52.0, 63.0, 66.0, 44.0, 42.0, 56.0, 42.0, 36.0, 26.0, 20.0, 13.0, 18.0, 14.0, 9.0, 6.0, 8.0, 1.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.40625, -10.15386962890625, -9.9014892578125, -9.64910888671875, -9.396728515625, -9.14434814453125, -8.8919677734375, -8.63958740234375, -8.38720703125, -8.13482666015625, -7.8824462890625, -7.63006591796875, -7.377685546875, -7.12530517578125, -6.8729248046875, -6.62054443359375, -6.3681640625, -6.11578369140625, -5.8634033203125, -5.61102294921875, -5.358642578125, -5.10626220703125, -4.8538818359375, -4.60150146484375, -4.34912109375, -4.09674072265625, -3.8443603515625, -3.59197998046875, -3.339599609375, -3.08721923828125, -2.8348388671875, -2.58245849609375, -2.330078125, -2.07769775390625, -1.8253173828125, -1.57293701171875, -1.320556640625, -1.06817626953125, -0.8157958984375, -0.56341552734375, -0.31103515625, -0.05865478515625, 0.1937255859375, 0.44610595703125, 0.698486328125, 0.95086669921875, 1.2032470703125, 1.45562744140625, 1.7080078125, 1.96038818359375, 2.2127685546875, 2.46514892578125, 2.717529296875, 2.96990966796875, 3.2222900390625, 3.47467041015625, 3.72705078125, 3.97943115234375, 4.2318115234375, 4.48419189453125, 4.736572265625, 4.98895263671875, 5.2413330078125, 5.49371337890625, 5.74609375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 8.0, 14.0, 15.0, 14.0, 15.0, 26.0, 35.0, 40.0, 54.0, 121.0, 326.0, 1253.0, 7487.0, 117938.0, 3241381.0, 798388.0, 23487.0, 2716.0, 541.0, 151.0, 68.0, 42.0, 32.0, 19.0, 32.0, 14.0, 16.0, 16.0, 7.0, 13.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.984375, -28.2548828125, -27.525390625, -26.7958984375, -26.06640625, -25.3369140625, -24.607421875, -23.8779296875, -23.1484375, -22.4189453125, -21.689453125, -20.9599609375, -20.23046875, -19.5009765625, -18.771484375, -18.0419921875, -17.3125, -16.5830078125, -15.853515625, -15.1240234375, -14.39453125, -13.6650390625, -12.935546875, -12.2060546875, -11.4765625, -10.7470703125, -10.017578125, -9.2880859375, -8.55859375, -7.8291015625, -7.099609375, -6.3701171875, -5.640625, -4.9111328125, -4.181640625, -3.4521484375, -2.72265625, -1.9931640625, -1.263671875, -0.5341796875, 0.1953125, 0.9248046875, 1.654296875, 2.3837890625, 3.11328125, 3.8427734375, 4.572265625, 5.3017578125, 6.03125, 6.7607421875, 7.490234375, 8.2197265625, 8.94921875, 9.6787109375, 10.408203125, 11.1376953125, 11.8671875, 12.5966796875, 13.326171875, 14.0556640625, 14.78515625, 15.5146484375, 16.244140625, 16.9736328125, 17.703125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 7.0, 6.0, 10.0, 16.0, 19.0, 29.0, 44.0, 41.0, 62.0, 96.0, 128.0, 176.0, 277.0, 406.0, 531.0, 567.0, 467.0, 339.0, 232.0, 175.0, 128.0, 92.0, 70.0, 45.0, 31.0, 17.0, 18.0, 12.0, 5.0, 6.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.953125, -12.5390625, -12.125, -11.7109375, -11.296875, -10.8828125, -10.46875, -10.0546875, -9.640625, -9.2265625, -8.8125, -8.3984375, -7.984375, -7.5703125, -7.15625, -6.7421875, -6.328125, -5.9140625, -5.5, -5.0859375, -4.671875, -4.2578125, -3.84375, -3.4296875, -3.015625, -2.6015625, -2.1875, -1.7734375, -1.359375, -0.9453125, -0.53125, -0.1171875, 0.296875, 0.7109375, 1.125, 1.5390625, 1.953125, 2.3671875, 2.78125, 3.1953125, 3.609375, 4.0234375, 4.4375, 4.8515625, 5.265625, 5.6796875, 6.09375, 6.5078125, 6.921875, 7.3359375, 7.75, 8.1640625, 8.578125, 8.9921875, 9.40625, 9.8203125, 10.234375, 10.6484375, 11.0625, 11.4765625, 11.890625, 12.3046875, 12.71875, 13.1328125, 13.546875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 1.0, 7.0, 14.0, 7.0, 25.0, 19.0, 24.0, 42.0, 80.0, 99.0, 128.0, 205.0, 290.0, 484.0, 1655.0, 29228.0, 3391681.0, 759309.0, 8833.0, 1006.0, 344.0, 208.0, 160.0, 131.0, 78.0, 62.0, 54.0, 30.0, 21.0, 19.0, 8.0, 10.0, 11.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.0625, -43.64697265625, -42.2314453125, -40.81591796875, -39.400390625, -37.98486328125, -36.5693359375, -35.15380859375, -33.73828125, -32.32275390625, -30.9072265625, -29.49169921875, -28.076171875, -26.66064453125, -25.2451171875, -23.82958984375, -22.4140625, -20.99853515625, -19.5830078125, -18.16748046875, -16.751953125, -15.33642578125, -13.9208984375, -12.50537109375, -11.08984375, -9.67431640625, -8.2587890625, -6.84326171875, -5.427734375, -4.01220703125, -2.5966796875, -1.18115234375, 0.234375, 1.64990234375, 3.0654296875, 4.48095703125, 5.896484375, 7.31201171875, 8.7275390625, 10.14306640625, 11.55859375, 12.97412109375, 14.3896484375, 15.80517578125, 17.220703125, 18.63623046875, 20.0517578125, 21.46728515625, 22.8828125, 24.29833984375, 25.7138671875, 27.12939453125, 28.544921875, 29.96044921875, 31.3759765625, 32.79150390625, 34.20703125, 35.62255859375, 37.0380859375, 38.45361328125, 39.869140625, 41.28466796875, 42.7001953125, 44.11572265625, 45.53125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 15.0, 72.0, 207.0, 310.0, 246.0, 122.0, 31.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.3496322631836, -84.27459716796875, -79.1995620727539, -74.12452697753906, -69.04948425292969, -63.974449157714844, -58.8994140625, -53.82437515258789, -48.74934005737305, -43.6743049621582, -38.599266052246094, -33.52423095703125, -28.449193954467773, -23.374156951904297, -18.299121856689453, -13.224082946777344, -8.1490478515625, -3.0740113258361816, 2.0010251998901367, 7.076061248779297, 12.151098251342773, 17.22613525390625, 22.301170349121094, 27.376209259033203, 32.45124435424805, 37.52627944946289, 42.601318359375, 47.676353454589844, 52.75138854980469, 57.8264274597168, 62.90146255493164, 67.97650146484375, 73.05152893066406, 78.1265640258789, 83.20159912109375, 88.27664184570312, 93.35167694091797, 98.42671203613281, 103.50174713134766, 108.5767822265625, 113.65182495117188, 118.72686004638672, 123.80189514160156, 128.87693786621094, 133.95196533203125, 139.02700805664062, 144.10205078125, 149.1770782470703, 154.25210571289062, 159.3271484375, 164.4021759033203, 169.4772186279297, 174.55224609375, 179.62728881835938, 184.70233154296875, 189.77735900878906, 194.85240173339844, 199.9274444580078, 205.00247192382812, 210.0775146484375, 215.1525421142578, 220.2275848388672, 225.3026123046875, 230.37765502929688, 235.45269775390625]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 7.0, 7.0, 14.0, 10.0, 12.0, 20.0, 16.0, 13.0, 36.0, 27.0, 37.0, 40.0, 44.0, 35.0, 49.0, 45.0, 55.0, 48.0, 37.0, 49.0, 55.0, 45.0, 39.0, 27.0, 27.0, 27.0, 35.0, 28.0, 18.0, 25.0, 15.0, 12.0, 17.0, 8.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.188255310058594, -39.8430290222168, -38.497802734375, -37.1525764465332, -35.807350158691406, -34.46212387084961, -33.11689758300781, -31.771671295166016, -30.42644500732422, -29.081218719482422, -27.735992431640625, -26.390766143798828, -25.04553985595703, -23.700313568115234, -22.355087280273438, -21.00986099243164, -19.664636611938477, -18.31941032409668, -16.974184036254883, -15.628957748413086, -14.283731460571289, -12.938505172729492, -11.593279838562012, -10.248053550720215, -8.902827262878418, -7.557600975036621, -6.212374687194824, -4.8671488761901855, -3.5219225883483887, -2.176696300506592, -0.8314704895019531, 0.5137557983398438, 1.8589820861816406, 3.2042083740234375, 4.549434661865234, 5.894660472869873, 7.23988676071167, 8.585113525390625, 9.930338859558105, 11.275565147399902, 12.6207914352417, 13.966017723083496, 15.311244010925293, 16.656469345092773, 18.00169563293457, 19.346921920776367, 20.692148208618164, 22.03737449645996, 23.382600784301758, 24.727827072143555, 26.07305335998535, 27.41827964782715, 28.763505935668945, 30.108732223510742, 31.453956604003906, 32.7991828918457, 34.1444091796875, 35.4896354675293, 36.834861755371094, 38.18008804321289, 39.52531433105469, 40.870540618896484, 42.21576690673828, 43.56099319458008, 44.906219482421875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 7.0, 5.0, 8.0, 9.0, 11.0, 15.0, 33.0, 32.0, 32.0, 32.0, 37.0, 38.0, 62.0, 52.0, 55.0, 59.0, 53.0, 61.0, 52.0, 48.0, 53.0, 47.0, 40.0, 34.0, 29.0, 34.0, 11.0, 18.0, 13.0, 5.0, 4.0, 12.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.40625, -9.1610107421875, -8.915771484375, -8.6705322265625, -8.42529296875, -8.1800537109375, -7.934814453125, -7.6895751953125, -7.4443359375, -7.1990966796875, -6.953857421875, -6.7086181640625, -6.46337890625, -6.2181396484375, -5.972900390625, -5.7276611328125, -5.482421875, -5.2371826171875, -4.991943359375, -4.7467041015625, -4.50146484375, -4.2562255859375, -4.010986328125, -3.7657470703125, -3.5205078125, -3.2752685546875, -3.030029296875, -2.7847900390625, -2.53955078125, -2.2943115234375, -2.049072265625, -1.8038330078125, -1.55859375, -1.3133544921875, -1.068115234375, -0.8228759765625, -0.57763671875, -0.3323974609375, -0.087158203125, 0.1580810546875, 0.4033203125, 0.6485595703125, 0.893798828125, 1.1390380859375, 1.38427734375, 1.6295166015625, 1.874755859375, 2.1199951171875, 2.365234375, 2.6104736328125, 2.855712890625, 3.1009521484375, 3.34619140625, 3.5914306640625, 3.836669921875, 4.0819091796875, 4.3271484375, 4.5723876953125, 4.817626953125, 5.0628662109375, 5.30810546875, 5.5533447265625, 5.798583984375, 6.0438232421875, 6.2890625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 2.0, 4.0, 7.0, 8.0, 10.0, 9.0, 11.0, 14.0, 38.0, 45.0, 63.0, 120.0, 203.0, 400.0, 641.0, 1262.0, 2171.0, 4166.0, 7808.0, 15409.0, 31581.0, 69278.0, 177777.0, 397575.0, 197561.0, 74082.0, 33881.0, 16415.0, 8371.0, 4383.0, 2253.0, 1279.0, 706.0, 413.0, 252.0, 128.0, 68.0, 57.0, 34.0, 19.0, 14.0, 10.0, 8.0, 8.0, 3.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.375732421875, -0.3651618957519531, -0.35459136962890625, -0.3440208435058594, -0.3334503173828125, -0.3228797912597656, -0.31230926513671875, -0.3017387390136719, -0.291168212890625, -0.2805976867675781, -0.27002716064453125, -0.2594566345214844, -0.2488861083984375, -0.23831558227539062, -0.22774505615234375, -0.21717453002929688, -0.20660400390625, -0.19603347778320312, -0.18546295166015625, -0.17489242553710938, -0.1643218994140625, -0.15375137329101562, -0.14318084716796875, -0.13261032104492188, -0.122039794921875, -0.11146926879882812, -0.10089874267578125, -0.09032821655273438, -0.0797576904296875, -0.06918716430664062, -0.05861663818359375, -0.048046112060546875, -0.0374755859375, -0.026905059814453125, -0.01633453369140625, -0.005764007568359375, 0.0048065185546875, 0.015377044677734375, 0.02594757080078125, 0.036518096923828125, 0.047088623046875, 0.057659149169921875, 0.06822967529296875, 0.07880020141601562, 0.0893707275390625, 0.09994125366210938, 0.11051177978515625, 0.12108230590820312, 0.13165283203125, 0.14222335815429688, 0.15279388427734375, 0.16336441040039062, 0.1739349365234375, 0.18450546264648438, 0.19507598876953125, 0.20564651489257812, 0.216217041015625, 0.22678756713867188, 0.23735809326171875, 0.24792861938476562, 0.2584991455078125, 0.2690696716308594, 0.27964019775390625, 0.2902107238769531, 0.30078125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 4.0, 3.0, 5.0, 2.0, 8.0, 10.0, 12.0, 13.0, 16.0, 24.0, 24.0, 16.0, 28.0, 34.0, 29.0, 44.0, 31.0, 34.0, 31.0, 38.0, 39.0, 38.0, 1066.0, 43.0, 35.0, 39.0, 38.0, 34.0, 24.0, 22.0, 24.0, 33.0, 31.0, 21.0, 25.0, 19.0, 18.0, 13.0, 15.0, 7.0, 8.0, 6.0, 6.0, 1.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.244140625, -3.13385009765625, -3.0235595703125, -2.91326904296875, -2.802978515625, -2.69268798828125, -2.5823974609375, -2.47210693359375, -2.36181640625, -2.25152587890625, -2.1412353515625, -2.03094482421875, -1.920654296875, -1.81036376953125, -1.7000732421875, -1.58978271484375, -1.4794921875, -1.36920166015625, -1.2589111328125, -1.14862060546875, -1.038330078125, -0.92803955078125, -0.8177490234375, -0.70745849609375, -0.59716796875, -0.48687744140625, -0.3765869140625, -0.26629638671875, -0.156005859375, -0.04571533203125, 0.0645751953125, 0.17486572265625, 0.28515625, 0.39544677734375, 0.5057373046875, 0.61602783203125, 0.726318359375, 0.83660888671875, 0.9468994140625, 1.05718994140625, 1.16748046875, 1.27777099609375, 1.3880615234375, 1.49835205078125, 1.608642578125, 1.71893310546875, 1.8292236328125, 1.93951416015625, 2.0498046875, 2.16009521484375, 2.2703857421875, 2.38067626953125, 2.490966796875, 2.60125732421875, 2.7115478515625, 2.82183837890625, 2.93212890625, 3.04241943359375, 3.1527099609375, 3.26300048828125, 3.373291015625, 3.48358154296875, 3.5938720703125, 3.70416259765625, 3.814453125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 8.0, 12.0, 21.0, 34.0, 35.0, 54.0, 105.0, 134.0, 184.0, 248.0, 424.0, 628.0, 932.0, 1335.0, 2047.0, 2936.0, 4522.0, 7106.0, 10986.0, 16992.0, 27157.0, 44480.0, 74609.0, 146875.0, 1325092.0, 193978.0, 93612.0, 52892.0, 32435.0, 20185.0, 12785.0, 8274.0, 5360.0, 3496.0, 2422.0, 1511.0, 1039.0, 706.0, 480.0, 351.0, 216.0, 131.0, 100.0, 70.0, 42.0, 37.0, 25.0, 9.0, 5.0, 3.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.2135009765625, -0.20676231384277344, -0.20002365112304688, -0.1932849884033203, -0.18654632568359375, -0.1798076629638672, -0.17306900024414062, -0.16633033752441406, -0.1595916748046875, -0.15285301208496094, -0.14611434936523438, -0.1393756866455078, -0.13263702392578125, -0.1258983612060547, -0.11915969848632812, -0.11242103576660156, -0.105682373046875, -0.09894371032714844, -0.09220504760742188, -0.08546638488769531, -0.07872772216796875, -0.07198905944824219, -0.06525039672851562, -0.05851173400878906, -0.0517730712890625, -0.04503440856933594, -0.038295745849609375, -0.03155708312988281, -0.02481842041015625, -0.018079757690429688, -0.011341094970703125, -0.0046024322509765625, 0.00213623046875, 0.008874893188476562, 0.015613555908203125, 0.022352218627929688, 0.02909088134765625, 0.03582954406738281, 0.042568206787109375, 0.04930686950683594, 0.0560455322265625, 0.06278419494628906, 0.06952285766601562, 0.07626152038574219, 0.08300018310546875, 0.08973884582519531, 0.09647750854492188, 0.10321617126464844, 0.109954833984375, 0.11669349670410156, 0.12343215942382812, 0.1301708221435547, 0.13690948486328125, 0.1436481475830078, 0.15038681030273438, 0.15712547302246094, 0.1638641357421875, 0.17060279846191406, 0.17734146118164062, 0.1840801239013672, 0.19081878662109375, 0.1975574493408203, 0.20429611206054688, 0.21103477478027344, 0.2177734375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 7.0, 3.0, 5.0, 2.0, 8.0, 10.0, 15.0, 10.0, 13.0, 18.0, 15.0, 21.0, 31.0, 31.0, 35.0, 30.0, 32.0, 33.0, 44.0, 39.0, 49.0, 51.0, 44.0, 40.0, 28.0, 44.0, 37.0, 26.0, 34.0, 38.0, 38.0, 31.0, 28.0, 18.0, 20.0, 9.0, 14.0, 10.0, 3.0, 6.0, 6.0, 3.0, 3.0, 5.0, 6.0, 2.0, 1.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.5331974029541016e-05, -2.4520792067050934e-05, -2.3709610104560852e-05, -2.289842814207077e-05, -2.208724617958069e-05, -2.1276064217090607e-05, -2.0464882254600525e-05, -1.9653700292110443e-05, -1.884251832962036e-05, -1.803133636713028e-05, -1.7220154404640198e-05, -1.6408972442150116e-05, -1.5597790479660034e-05, -1.4786608517169952e-05, -1.397542655467987e-05, -1.3164244592189789e-05, -1.2353062629699707e-05, -1.1541880667209625e-05, -1.0730698704719543e-05, -9.919516742229462e-06, -9.10833477973938e-06, -8.297152817249298e-06, -7.485970854759216e-06, -6.6747888922691345e-06, -5.863606929779053e-06, -5.052424967288971e-06, -4.241243004798889e-06, -3.4300610423088074e-06, -2.6188790798187256e-06, -1.8076971173286438e-06, -9.96515154838562e-07, -1.8533319234848022e-07, 6.258487701416016e-07, 1.4370307326316833e-06, 2.248212695121765e-06, 3.059394657611847e-06, 3.870576620101929e-06, 4.6817585825920105e-06, 5.492940545082092e-06, 6.304122507572174e-06, 7.115304470062256e-06, 7.926486432552338e-06, 8.73766839504242e-06, 9.548850357532501e-06, 1.0360032320022583e-05, 1.1171214282512665e-05, 1.1982396245002747e-05, 1.2793578207492828e-05, 1.360476016998291e-05, 1.4415942132472992e-05, 1.5227124094963074e-05, 1.6038306057453156e-05, 1.6849488019943237e-05, 1.766066998243332e-05, 1.84718519449234e-05, 1.9283033907413483e-05, 2.0094215869903564e-05, 2.0905397832393646e-05, 2.1716579794883728e-05, 2.252776175737381e-05, 2.333894371986389e-05, 2.4150125682353973e-05, 2.4961307644844055e-05, 2.5772489607334137e-05, 2.658367156982422e-05]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 2.0, 8.0, 8.0, 10.0, 10.0, 15.0, 14.0, 21.0, 25.0, 38.0, 27.0, 42.0, 51.0, 72.0, 112.0, 140.0, 267.0, 547.0, 2349.0, 341445.0, 697241.0, 4447.0, 703.0, 276.0, 173.0, 113.0, 69.0, 54.0, 49.0, 36.0, 28.0, 24.0, 18.0, 19.0, 21.0, 15.0, 10.0, 8.0, 5.0, 5.0, 6.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0005507469177246094, -0.0005335882306098938, -0.0005164295434951782, -0.0004992708563804626, -0.00048211216926574707, -0.0004649534821510315, -0.0004477947950363159, -0.00043063610792160034, -0.00041347742080688477, -0.0003963187336921692, -0.0003791600465774536, -0.00036200135946273804, -0.00034484267234802246, -0.0003276839852333069, -0.0003105252981185913, -0.00029336661100387573, -0.00027620792388916016, -0.0002590492367744446, -0.000241890549659729, -0.00022473186254501343, -0.00020757317543029785, -0.00019041448831558228, -0.0001732558012008667, -0.00015609711408615112, -0.00013893842697143555, -0.00012177973985671997, -0.0001046210527420044, -8.746236562728882e-05, -7.030367851257324e-05, -5.3144991397857666e-05, -3.598630428314209e-05, -1.8827617168426514e-05, -1.6689300537109375e-06, 1.548975706100464e-05, 3.2648444175720215e-05, 4.980713129043579e-05, 6.696581840515137e-05, 8.412450551986694e-05, 0.00010128319263458252, 0.0001184418797492981, 0.00013560056686401367, 0.00015275925397872925, 0.00016991794109344482, 0.0001870766282081604, 0.00020423531532287598, 0.00022139400243759155, 0.00023855268955230713, 0.0002557113766670227, 0.0002728700637817383, 0.00029002875089645386, 0.00030718743801116943, 0.000324346125125885, 0.0003415048122406006, 0.00035866349935531616, 0.00037582218647003174, 0.0003929808735847473, 0.0004101395606994629, 0.00042729824781417847, 0.00044445693492889404, 0.0004616156220436096, 0.0004787743091583252, 0.0004959329962730408, 0.0005130916833877563, 0.0005302503705024719, 0.0005474090576171875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 12.0, 65.0, 316.0, 397.0, 184.0, 34.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.766818604664877e-05, -1.4827658560534474e-05, -1.1987131074420176e-05, -9.14660358830588e-06, -6.306076102191582e-06, -3.4655486160772853e-06, -6.250211299629882e-07, 2.2155072656460106e-06, 5.056033842265606e-06, 7.896561328379903e-06, 1.07370888144942e-05, 1.3577616300608497e-05, 1.6418143786722794e-05, 1.925867036334239e-05, 2.2099198758951388e-05, 2.4939727154560387e-05, 2.7780253731179982e-05, 3.062078030779958e-05, 3.346130688441917e-05, 3.6301837099017575e-05, 3.914236367563717e-05, 4.1982890252256766e-05, 4.482342046685517e-05, 4.7663947043474764e-05, 5.050447362009436e-05, 5.3345000196713954e-05, 5.618552677333355e-05, 5.902605698793195e-05, 6.186657992657274e-05, 6.470711377914995e-05, 6.754764035576954e-05, 7.038816693238914e-05, 7.322868623305112e-05, 7.606921280967072e-05, 7.890973938629031e-05, 8.175026596290991e-05, 8.45907925395295e-05, 8.743132639210671e-05, 9.027185296872631e-05, 9.31123795453459e-05, 9.59529061219655e-05, 9.879343269858509e-05, 0.00010163395927520469, 0.00010447448585182428, 0.00010731501970440149, 0.00011015554628102109, 0.00011299607285764068, 0.00011583659943426028, 0.00011867712601087987, 0.00012151765258749947, 0.00012435817916411906, 0.00012719871301669627, 0.00013003923231735826, 0.00013287976616993546, 0.00013572028547059745, 0.00013856081932317466, 0.00014140133862383664, 0.00014424187247641385, 0.00014708239177707583, 0.00014992292562965304, 0.00015276344493031502, 0.00015560397878289223, 0.0001584444980835542, 0.00016128503193613142, 0.00016412556578870863]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 6.0, 4.0, 11.0, 15.0, 17.0, 13.0, 21.0, 16.0, 27.0, 25.0, 22.0, 37.0, 37.0, 44.0, 39.0, 57.0, 37.0, 43.0, 42.0, 53.0, 39.0, 43.0, 36.0, 38.0, 39.0, 32.0, 33.0, 36.0, 24.0, 27.0, 18.0, 11.0, 9.0, 8.0, 5.0, 10.0, 6.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.895427703857422e-05, -1.836474984884262e-05, -1.7775222659111023e-05, -1.7185695469379425e-05, -1.6596168279647827e-05, -1.600664108991623e-05, -1.541711390018463e-05, -1.4827586710453033e-05, -1.4238059520721436e-05, -1.3648532330989838e-05, -1.305900514125824e-05, -1.2469477951526642e-05, -1.1879950761795044e-05, -1.1290423572063446e-05, -1.0700896382331848e-05, -1.011136919260025e-05, -9.521842002868652e-06, -8.932314813137054e-06, -8.342787623405457e-06, -7.753260433673859e-06, -7.163733243942261e-06, -6.574206054210663e-06, -5.984678864479065e-06, -5.395151674747467e-06, -4.805624485015869e-06, -4.216097295284271e-06, -3.6265701055526733e-06, -3.0370429158210754e-06, -2.4475157260894775e-06, -1.8579885363578796e-06, -1.2684613466262817e-06, -6.789341568946838e-07, -8.940696716308594e-08, 5.00120222568512e-07, 1.0896474123001099e-06, 1.6791746020317078e-06, 2.2687017917633057e-06, 2.8582289814949036e-06, 3.4477561712265015e-06, 4.037283360958099e-06, 4.626810550689697e-06, 5.216337740421295e-06, 5.805864930152893e-06, 6.395392119884491e-06, 6.984919309616089e-06, 7.574446499347687e-06, 8.163973689079285e-06, 8.753500878810883e-06, 9.34302806854248e-06, 9.932555258274078e-06, 1.0522082448005676e-05, 1.1111609637737274e-05, 1.1701136827468872e-05, 1.229066401720047e-05, 1.2880191206932068e-05, 1.3469718396663666e-05, 1.4059245586395264e-05, 1.4648772776126862e-05, 1.523829996585846e-05, 1.5827827155590057e-05, 1.6417354345321655e-05, 1.7006881535053253e-05, 1.759640872478485e-05, 1.818593591451645e-05, 1.8775463104248047e-05]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 7.0, 5.0, 8.0, 9.0, 11.0, 15.0, 33.0, 32.0, 32.0, 32.0, 37.0, 38.0, 62.0, 52.0, 55.0, 59.0, 53.0, 61.0, 52.0, 48.0, 53.0, 47.0, 40.0, 34.0, 29.0, 34.0, 11.0, 18.0, 13.0, 5.0, 4.0, 12.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.40625, -9.1610107421875, -8.915771484375, -8.6705322265625, -8.42529296875, -8.1800537109375, -7.934814453125, -7.6895751953125, -7.4443359375, -7.1990966796875, -6.953857421875, -6.7086181640625, -6.46337890625, -6.2181396484375, -5.972900390625, -5.7276611328125, -5.482421875, -5.2371826171875, -4.991943359375, -4.7467041015625, -4.50146484375, -4.2562255859375, -4.010986328125, -3.7657470703125, -3.5205078125, -3.2752685546875, -3.030029296875, -2.7847900390625, -2.53955078125, -2.2943115234375, -2.049072265625, -1.8038330078125, -1.55859375, -1.3133544921875, -1.068115234375, -0.8228759765625, -0.57763671875, -0.3323974609375, -0.087158203125, 0.1580810546875, 0.4033203125, 0.6485595703125, 0.893798828125, 1.1390380859375, 1.38427734375, 1.6295166015625, 1.874755859375, 2.1199951171875, 2.365234375, 2.6104736328125, 2.855712890625, 3.1009521484375, 3.34619140625, 3.5914306640625, 3.836669921875, 4.0819091796875, 4.3271484375, 4.5723876953125, 4.817626953125, 5.0628662109375, 5.30810546875, 5.5533447265625, 5.798583984375, 6.0438232421875, 6.2890625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 12.0, 5.0, 15.0, 21.0, 37.0, 53.0, 108.0, 178.0, 329.0, 568.0, 1041.0, 1835.0, 3261.0, 5804.0, 11518.0, 32076.0, 159399.0, 606161.0, 167584.0, 33158.0, 11840.0, 5952.0, 3344.0, 1879.0, 1083.0, 552.0, 317.0, 159.0, 97.0, 59.0, 43.0, 26.0, 16.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-6.3984375, -6.22320556640625, -6.0479736328125, -5.87274169921875, -5.697509765625, -5.52227783203125, -5.3470458984375, -5.17181396484375, -4.99658203125, -4.82135009765625, -4.6461181640625, -4.47088623046875, -4.295654296875, -4.12042236328125, -3.9451904296875, -3.76995849609375, -3.5947265625, -3.41949462890625, -3.2442626953125, -3.06903076171875, -2.893798828125, -2.71856689453125, -2.5433349609375, -2.36810302734375, -2.19287109375, -2.01763916015625, -1.8424072265625, -1.66717529296875, -1.491943359375, -1.31671142578125, -1.1414794921875, -0.96624755859375, -0.791015625, -0.61578369140625, -0.4405517578125, -0.26531982421875, -0.090087890625, 0.08514404296875, 0.2603759765625, 0.43560791015625, 0.61083984375, 0.78607177734375, 0.9613037109375, 1.13653564453125, 1.311767578125, 1.48699951171875, 1.6622314453125, 1.83746337890625, 2.0126953125, 2.18792724609375, 2.3631591796875, 2.53839111328125, 2.713623046875, 2.88885498046875, 3.0640869140625, 3.23931884765625, 3.41455078125, 3.58978271484375, 3.7650146484375, 3.94024658203125, 4.115478515625, 4.29071044921875, 4.4659423828125, 4.64117431640625, 4.81640625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 8.0, 7.0, 7.0, 9.0, 12.0, 12.0, 11.0, 21.0, 22.0, 33.0, 32.0, 31.0, 31.0, 38.0, 45.0, 40.0, 52.0, 85.0, 105.0, 1586.0, 321.0, 101.0, 61.0, 48.0, 35.0, 40.0, 31.0, 34.0, 17.0, 21.0, 21.0, 19.0, 19.0, 14.0, 10.0, 12.0, 7.0, 11.0, 9.0, 3.0, 3.0, 6.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0], "bins": [-20.140625, -19.579345703125, -19.01806640625, -18.456787109375, -17.8955078125, -17.334228515625, -16.77294921875, -16.211669921875, -15.650390625, -15.089111328125, -14.52783203125, -13.966552734375, -13.4052734375, -12.843994140625, -12.28271484375, -11.721435546875, -11.16015625, -10.598876953125, -10.03759765625, -9.476318359375, -8.9150390625, -8.353759765625, -7.79248046875, -7.231201171875, -6.669921875, -6.108642578125, -5.54736328125, -4.986083984375, -4.4248046875, -3.863525390625, -3.30224609375, -2.740966796875, -2.1796875, -1.618408203125, -1.05712890625, -0.495849609375, 0.0654296875, 0.626708984375, 1.18798828125, 1.749267578125, 2.310546875, 2.871826171875, 3.43310546875, 3.994384765625, 4.5556640625, 5.116943359375, 5.67822265625, 6.239501953125, 6.80078125, 7.362060546875, 7.92333984375, 8.484619140625, 9.0458984375, 9.607177734375, 10.16845703125, 10.729736328125, 11.291015625, 11.852294921875, 12.41357421875, 12.974853515625, 13.5361328125, 14.097412109375, 14.65869140625, 15.219970703125, 15.78125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 5.0, 14.0, 16.0, 14.0, 20.0, 28.0, 31.0, 45.0, 64.0, 80.0, 100.0, 151.0, 212.0, 319.0, 702.0, 7383.0, 3091838.0, 42042.0, 1229.0, 417.0, 291.0, 168.0, 154.0, 113.0, 68.0, 53.0, 40.0, 27.0, 21.0, 20.0, 17.0, 7.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-58.15625, -56.5263671875, -54.896484375, -53.2666015625, -51.63671875, -50.0068359375, -48.376953125, -46.7470703125, -45.1171875, -43.4873046875, -41.857421875, -40.2275390625, -38.59765625, -36.9677734375, -35.337890625, -33.7080078125, -32.078125, -30.4482421875, -28.818359375, -27.1884765625, -25.55859375, -23.9287109375, -22.298828125, -20.6689453125, -19.0390625, -17.4091796875, -15.779296875, -14.1494140625, -12.51953125, -10.8896484375, -9.259765625, -7.6298828125, -6.0, -4.3701171875, -2.740234375, -1.1103515625, 0.51953125, 2.1494140625, 3.779296875, 5.4091796875, 7.0390625, 8.6689453125, 10.298828125, 11.9287109375, 13.55859375, 15.1884765625, 16.818359375, 18.4482421875, 20.078125, 21.7080078125, 23.337890625, 24.9677734375, 26.59765625, 28.2275390625, 29.857421875, 31.4873046875, 33.1171875, 34.7470703125, 36.376953125, 38.0068359375, 39.63671875, 41.2666015625, 42.896484375, 44.5263671875, 46.15625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 20.0, 436.0, 522.0, 37.0, 1.0, 1.0], "bins": [-241.8096923828125, -237.7845001220703, -233.75930786132812, -229.73410034179688, -225.7089080810547, -221.6837158203125, -217.6585235595703, -213.63333129882812, -209.60812377929688, -205.5829315185547, -201.5577392578125, -197.53253173828125, -193.50733947753906, -189.48214721679688, -185.4569549560547, -181.4317626953125, -177.4065704345703, -173.38137817382812, -169.35618591308594, -165.3309783935547, -161.3057861328125, -157.2805938720703, -153.25540161132812, -149.23020935058594, -145.20501708984375, -141.17982482910156, -137.15463256835938, -133.12942504882812, -129.10423278808594, -125.07904052734375, -121.05384826660156, -117.02865600585938, -113.00346374511719, -108.978271484375, -104.95307159423828, -100.9278793334961, -96.90267944335938, -92.87748718261719, -88.852294921875, -84.82710266113281, -80.8019027709961, -76.7767105102539, -72.75151062011719, -68.726318359375, -64.70112609863281, -60.675926208496094, -56.650733947753906, -52.62553787231445, -48.600341796875, -44.57514572143555, -40.549949645996094, -36.524757385253906, -32.49956130981445, -28.474365234375, -24.44917106628418, -20.42397689819336, -16.398780822753906, -12.37358570098877, -8.348390579223633, -4.323195457458496, -0.2980003356933594, 3.7271957397460938, 7.752389907836914, 11.777584075927734, 15.802780151367188]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 5.0, 10.0, 15.0, 18.0, 15.0, 18.0, 23.0, 27.0, 22.0, 25.0, 27.0, 34.0, 30.0, 42.0, 34.0, 49.0, 36.0, 35.0, 59.0, 53.0, 48.0, 47.0, 33.0, 46.0, 37.0, 37.0, 21.0, 19.0, 25.0, 16.0, 18.0, 18.0, 9.0, 13.0, 14.0, 5.0, 5.0, 2.0, 4.0, 5.0, 0.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.71749496459961, -46.90679168701172, -45.09608840942383, -43.28538513183594, -41.47467803955078, -39.66397476196289, -37.853271484375, -36.04256820678711, -34.23186492919922, -32.42116165161133, -30.610456466674805, -28.799753189086914, -26.98904800415039, -25.1783447265625, -23.36764144897461, -21.55693817138672, -19.746231079101562, -17.935527801513672, -16.12482261657715, -14.314119338989258, -12.50341510772705, -10.692710876464844, -8.882007598876953, -7.071303367614746, -5.260599136352539, -3.449895143508911, -1.6391911506652832, 0.17151260375976562, 1.9822168350219727, 3.7929210662841797, 5.60362434387207, 7.414328575134277, 9.225028991699219, 11.035733222961426, 12.846437454223633, 14.657140731811523, 16.467845916748047, 18.278549194335938, 20.089252471923828, 21.89995574951172, 23.710660934448242, 25.521364212036133, 27.332069396972656, 29.142772674560547, 30.953475952148438, 32.764183044433594, 34.57488250732422, 36.385589599609375, 38.196292877197266, 40.006996154785156, 41.81769943237305, 43.62840270996094, 45.439109802246094, 47.249813079833984, 49.060516357421875, 50.871219635009766, 52.681922912597656, 54.49262619018555, 56.30332946777344, 58.114036560058594, 59.924739837646484, 61.735443115234375, 63.546146392822266, 65.35684967041016, 67.16755676269531]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 9.0, 8.0, 13.0, 8.0, 20.0, 32.0, 32.0, 36.0, 30.0, 46.0, 47.0, 66.0, 43.0, 68.0, 43.0, 59.0, 68.0, 50.0, 51.0, 38.0, 51.0, 39.0, 20.0, 43.0, 17.0, 18.0, 10.0, 14.0, 6.0, 8.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.515380859375, -9.25732421875, -8.999267578125, -8.7412109375, -8.483154296875, -8.22509765625, -7.967041015625, -7.708984375, -7.450927734375, -7.19287109375, -6.934814453125, -6.6767578125, -6.418701171875, -6.16064453125, -5.902587890625, -5.64453125, -5.386474609375, -5.12841796875, -4.870361328125, -4.6123046875, -4.354248046875, -4.09619140625, -3.838134765625, -3.580078125, -3.322021484375, -3.06396484375, -2.805908203125, -2.5478515625, -2.289794921875, -2.03173828125, -1.773681640625, -1.515625, -1.257568359375, -0.99951171875, -0.741455078125, -0.4833984375, -0.225341796875, 0.03271484375, 0.290771484375, 0.548828125, 0.806884765625, 1.06494140625, 1.322998046875, 1.5810546875, 1.839111328125, 2.09716796875, 2.355224609375, 2.61328125, 2.871337890625, 3.12939453125, 3.387451171875, 3.6455078125, 3.903564453125, 4.16162109375, 4.419677734375, 4.677734375, 4.935791015625, 5.19384765625, 5.451904296875, 5.7099609375, 5.968017578125, 6.22607421875, 6.484130859375, 6.7421875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 6.0, 15.0, 17.0, 18.0, 32.0, 44.0, 64.0, 112.0, 208.0, 475.0, 1276.0, 4077.0, 17278.0, 110539.0, 1206819.0, 2459458.0, 342768.0, 39206.0, 8227.0, 2217.0, 747.0, 308.0, 124.0, 83.0, 41.0, 29.0, 23.0, 19.0, 11.0, 9.0, 9.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.53125, -14.118896484375, -13.70654296875, -13.294189453125, -12.8818359375, -12.469482421875, -12.05712890625, -11.644775390625, -11.232421875, -10.820068359375, -10.40771484375, -9.995361328125, -9.5830078125, -9.170654296875, -8.75830078125, -8.345947265625, -7.93359375, -7.521240234375, -7.10888671875, -6.696533203125, -6.2841796875, -5.871826171875, -5.45947265625, -5.047119140625, -4.634765625, -4.222412109375, -3.81005859375, -3.397705078125, -2.9853515625, -2.572998046875, -2.16064453125, -1.748291015625, -1.3359375, -0.923583984375, -0.51123046875, -0.098876953125, 0.3134765625, 0.725830078125, 1.13818359375, 1.550537109375, 1.962890625, 2.375244140625, 2.78759765625, 3.199951171875, 3.6123046875, 4.024658203125, 4.43701171875, 4.849365234375, 5.26171875, 5.674072265625, 6.08642578125, 6.498779296875, 6.9111328125, 7.323486328125, 7.73583984375, 8.148193359375, 8.560546875, 8.972900390625, 9.38525390625, 9.797607421875, 10.2099609375, 10.622314453125, 11.03466796875, 11.447021484375, 11.859375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 4.0, 10.0, 6.0, 10.0, 16.0, 18.0, 30.0, 52.0, 51.0, 93.0, 108.0, 160.0, 250.0, 364.0, 533.0, 616.0, 548.0, 365.0, 237.0, 191.0, 122.0, 82.0, 66.0, 39.0, 35.0, 19.0, 18.0, 11.0, 10.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1484375, -9.7342529296875, -9.320068359375, -8.9058837890625, -8.49169921875, -8.0775146484375, -7.663330078125, -7.2491455078125, -6.8349609375, -6.4207763671875, -6.006591796875, -5.5924072265625, -5.17822265625, -4.7640380859375, -4.349853515625, -3.9356689453125, -3.521484375, -3.1072998046875, -2.693115234375, -2.2789306640625, -1.86474609375, -1.4505615234375, -1.036376953125, -0.6221923828125, -0.2080078125, 0.2061767578125, 0.620361328125, 1.0345458984375, 1.44873046875, 1.8629150390625, 2.277099609375, 2.6912841796875, 3.10546875, 3.5196533203125, 3.933837890625, 4.3480224609375, 4.76220703125, 5.1763916015625, 5.590576171875, 6.0047607421875, 6.4189453125, 6.8331298828125, 7.247314453125, 7.6614990234375, 8.07568359375, 8.4898681640625, 8.904052734375, 9.3182373046875, 9.732421875, 10.1466064453125, 10.560791015625, 10.9749755859375, 11.38916015625, 11.8033447265625, 12.217529296875, 12.6317138671875, 13.0458984375, 13.4600830078125, 13.874267578125, 14.2884521484375, 14.70263671875, 15.1168212890625, 15.531005859375, 15.9451904296875, 16.359375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 5.0, 12.0, 12.0, 20.0, 21.0, 42.0, 49.0, 82.0, 106.0, 137.0, 170.0, 321.0, 532.0, 1805.0, 52152.0, 3850849.0, 281818.0, 4368.0, 689.0, 329.0, 225.0, 130.0, 107.0, 83.0, 70.0, 38.0, 34.0, 12.0, 17.0, 17.0, 11.0, 6.0, 2.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.6875, -47.283203125, -45.87890625, -44.474609375, -43.0703125, -41.666015625, -40.26171875, -38.857421875, -37.453125, -36.048828125, -34.64453125, -33.240234375, -31.8359375, -30.431640625, -29.02734375, -27.623046875, -26.21875, -24.814453125, -23.41015625, -22.005859375, -20.6015625, -19.197265625, -17.79296875, -16.388671875, -14.984375, -13.580078125, -12.17578125, -10.771484375, -9.3671875, -7.962890625, -6.55859375, -5.154296875, -3.75, -2.345703125, -0.94140625, 0.462890625, 1.8671875, 3.271484375, 4.67578125, 6.080078125, 7.484375, 8.888671875, 10.29296875, 11.697265625, 13.1015625, 14.505859375, 15.91015625, 17.314453125, 18.71875, 20.123046875, 21.52734375, 22.931640625, 24.3359375, 25.740234375, 27.14453125, 28.548828125, 29.953125, 31.357421875, 32.76171875, 34.166015625, 35.5703125, 36.974609375, 38.37890625, 39.783203125, 41.1875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 21.0, 106.0, 264.0, 336.0, 201.0, 67.0, 12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-231.13645935058594, -226.4445343017578, -221.75259399414062, -217.0606689453125, -212.36874389648438, -207.67681884765625, -202.98487854003906, -198.29295349121094, -193.60101318359375, -188.90908813476562, -184.21714782714844, -179.5252227783203, -174.8332977294922, -170.141357421875, -165.44943237304688, -160.75750732421875, -156.06558227539062, -151.3736572265625, -146.6817169189453, -141.9897918701172, -137.29786682128906, -132.60592651367188, -127.91400146484375, -123.22207641601562, -118.53014373779297, -113.83821105957031, -109.14628601074219, -104.45435333251953, -99.76242065429688, -95.07049560546875, -90.3785629272461, -85.68663024902344, -80.99469757080078, -76.30276489257812, -71.61083984375, -66.91890716552734, -62.22697830200195, -57.53504943847656, -52.843116760253906, -48.151187896728516, -43.459259033203125, -38.767330169677734, -34.075401306152344, -29.383468627929688, -24.691539764404297, -19.999610900878906, -15.307680130004883, -10.61574935913086, -5.923820495605469, -1.2318906784057617, 3.4600391387939453, 8.151968955993652, 12.84389877319336, 17.53582763671875, 22.227758407592773, 26.919689178466797, 31.611618041992188, 36.30354690551758, 40.99547576904297, 45.687408447265625, 50.379337310791016, 55.071266174316406, 59.76319885253906, 64.45512390136719, 69.14705657958984]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 1.0, 7.0, 7.0, 8.0, 6.0, 16.0, 19.0, 11.0, 18.0, 26.0, 15.0, 33.0, 34.0, 35.0, 30.0, 33.0, 37.0, 35.0, 42.0, 40.0, 45.0, 49.0, 39.0, 37.0, 34.0, 41.0, 34.0, 38.0, 28.0, 32.0, 24.0, 21.0, 25.0, 12.0, 13.0, 14.0, 14.0, 11.0, 6.0, 11.0, 7.0, 3.0, 3.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-38.933815002441406, -37.81377029418945, -36.6937255859375, -35.57368469238281, -34.45363998413086, -33.333595275878906, -32.21355438232422, -31.093509674072266, -29.973464965820312, -28.85342025756836, -27.73337745666504, -26.61333465576172, -25.493289947509766, -24.373245239257812, -23.253202438354492, -22.133159637451172, -21.01311492919922, -19.893070220947266, -18.773027420043945, -17.652984619140625, -16.532939910888672, -15.412896156311035, -14.292852401733398, -13.172808647155762, -12.052764892578125, -10.932721138000488, -9.812677383422852, -8.692633628845215, -7.572589874267578, -6.452546119689941, -5.332502365112305, -4.212458610534668, -3.0924148559570312, -1.9723711013793945, -0.8523273468017578, 0.2677164077758789, 1.3877601623535156, 2.5078039169311523, 3.627847671508789, 4.747891426086426, 5.8679351806640625, 6.987978935241699, 8.108022689819336, 9.228066444396973, 10.34811019897461, 11.468153953552246, 12.588197708129883, 13.70824146270752, 14.828285217285156, 15.948328971862793, 17.06837272644043, 18.18841552734375, 19.308460235595703, 20.428504943847656, 21.548547744750977, 22.668590545654297, 23.78863525390625, 24.908679962158203, 26.028722763061523, 27.148765563964844, 28.268810272216797, 29.38885498046875, 30.50889778137207, 31.62894058227539, 32.748985290527344]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 10.0, 14.0, 16.0, 26.0, 35.0, 43.0, 41.0, 47.0, 58.0, 68.0, 59.0, 72.0, 63.0, 61.0, 45.0, 59.0, 46.0, 47.0, 41.0, 38.0, 33.0, 22.0, 18.0, 12.0, 7.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.1796875, -10.90130615234375, -10.6229248046875, -10.34454345703125, -10.066162109375, -9.78778076171875, -9.5093994140625, -9.23101806640625, -8.95263671875, -8.67425537109375, -8.3958740234375, -8.11749267578125, -7.839111328125, -7.56072998046875, -7.2823486328125, -7.00396728515625, -6.7255859375, -6.44720458984375, -6.1688232421875, -5.89044189453125, -5.612060546875, -5.33367919921875, -5.0552978515625, -4.77691650390625, -4.49853515625, -4.22015380859375, -3.9417724609375, -3.66339111328125, -3.385009765625, -3.10662841796875, -2.8282470703125, -2.54986572265625, -2.271484375, -1.99310302734375, -1.7147216796875, -1.43634033203125, -1.157958984375, -0.87957763671875, -0.6011962890625, -0.32281494140625, -0.04443359375, 0.23394775390625, 0.5123291015625, 0.79071044921875, 1.069091796875, 1.34747314453125, 1.6258544921875, 1.90423583984375, 2.1826171875, 2.46099853515625, 2.7393798828125, 3.01776123046875, 3.296142578125, 3.57452392578125, 3.8529052734375, 4.13128662109375, 4.40966796875, 4.68804931640625, 4.9664306640625, 5.24481201171875, 5.523193359375, 5.80157470703125, 6.0799560546875, 6.35833740234375, 6.63671875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 2.0, 5.0, 10.0, 12.0, 7.0, 12.0, 19.0, 21.0, 37.0, 57.0, 90.0, 179.0, 309.0, 611.0, 1281.0, 2747.0, 6351.0, 14976.0, 37343.0, 100932.0, 362903.0, 357747.0, 99254.0, 36999.0, 14885.0, 6381.0, 2829.0, 1222.0, 628.0, 274.0, 158.0, 101.0, 54.0, 37.0, 27.0, 13.0, 16.0, 12.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40087890625, -0.38655853271484375, -0.3722381591796875, -0.35791778564453125, -0.343597412109375, -0.32927703857421875, -0.3149566650390625, -0.30063629150390625, -0.28631591796875, -0.27199554443359375, -0.2576751708984375, -0.24335479736328125, -0.229034423828125, -0.21471405029296875, -0.2003936767578125, -0.18607330322265625, -0.1717529296875, -0.15743255615234375, -0.1431121826171875, -0.12879180908203125, -0.114471435546875, -0.10015106201171875, -0.0858306884765625, -0.07151031494140625, -0.05718994140625, -0.04286956787109375, -0.0285491943359375, -0.01422882080078125, 9.1552734375e-05, 0.01441192626953125, 0.0287322998046875, 0.04305267333984375, 0.057373046875, 0.07169342041015625, 0.0860137939453125, 0.10033416748046875, 0.114654541015625, 0.12897491455078125, 0.1432952880859375, 0.15761566162109375, 0.17193603515625, 0.18625640869140625, 0.2005767822265625, 0.21489715576171875, 0.229217529296875, 0.24353790283203125, 0.2578582763671875, 0.27217864990234375, 0.2864990234375, 0.30081939697265625, 0.3151397705078125, 0.32946014404296875, 0.343780517578125, 0.35810089111328125, 0.3724212646484375, 0.38674163818359375, 0.40106201171875, 0.41538238525390625, 0.4297027587890625, 0.44402313232421875, 0.458343505859375, 0.47266387939453125, 0.4869842529296875, 0.5013046264648438, 0.515625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 7.0, 9.0, 10.0, 7.0, 15.0, 10.0, 13.0, 13.0, 20.0, 16.0, 23.0, 34.0, 34.0, 37.0, 28.0, 37.0, 33.0, 34.0, 38.0, 47.0, 1070.0, 45.0, 58.0, 40.0, 38.0, 29.0, 29.0, 33.0, 29.0, 28.0, 25.0, 11.0, 23.0, 13.0, 17.0, 11.0, 17.0, 9.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.513671875, -3.398651123046875, -3.28363037109375, -3.168609619140625, -3.0535888671875, -2.938568115234375, -2.82354736328125, -2.708526611328125, -2.593505859375, -2.478485107421875, -2.36346435546875, -2.248443603515625, -2.1334228515625, -2.018402099609375, -1.90338134765625, -1.788360595703125, -1.67333984375, -1.558319091796875, -1.44329833984375, -1.328277587890625, -1.2132568359375, -1.098236083984375, -0.98321533203125, -0.868194580078125, -0.753173828125, -0.638153076171875, -0.52313232421875, -0.408111572265625, -0.2930908203125, -0.178070068359375, -0.06304931640625, 0.051971435546875, 0.1669921875, 0.282012939453125, 0.39703369140625, 0.512054443359375, 0.6270751953125, 0.742095947265625, 0.85711669921875, 0.972137451171875, 1.087158203125, 1.202178955078125, 1.31719970703125, 1.432220458984375, 1.5472412109375, 1.662261962890625, 1.77728271484375, 1.892303466796875, 2.00732421875, 2.122344970703125, 2.23736572265625, 2.352386474609375, 2.4674072265625, 2.582427978515625, 2.69744873046875, 2.812469482421875, 2.927490234375, 3.042510986328125, 3.15753173828125, 3.272552490234375, 3.3875732421875, 3.502593994140625, 3.61761474609375, 3.732635498046875, 3.84765625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 12.0, 12.0, 23.0, 38.0, 51.0, 69.0, 100.0, 155.0, 213.0, 319.0, 419.0, 617.0, 917.0, 1275.0, 1873.0, 2791.0, 3951.0, 5760.0, 8460.0, 13141.0, 20342.0, 31750.0, 52659.0, 93792.0, 194823.0, 1322758.0, 145966.0, 73519.0, 43208.0, 26767.0, 16801.0, 11119.0, 7362.0, 5033.0, 3441.0, 2331.0, 1588.0, 1061.0, 812.0, 580.0, 378.0, 265.0, 166.0, 122.0, 100.0, 48.0, 37.0, 29.0, 27.0, 16.0, 10.0, 8.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.2049560546875, -0.1984100341796875, -0.191864013671875, -0.1853179931640625, -0.17877197265625, -0.1722259521484375, -0.165679931640625, -0.1591339111328125, -0.152587890625, -0.1460418701171875, -0.139495849609375, -0.1329498291015625, -0.12640380859375, -0.1198577880859375, -0.113311767578125, -0.1067657470703125, -0.1002197265625, -0.0936737060546875, -0.087127685546875, -0.0805816650390625, -0.07403564453125, -0.0674896240234375, -0.060943603515625, -0.0543975830078125, -0.0478515625, -0.0413055419921875, -0.034759521484375, -0.0282135009765625, -0.02166748046875, -0.0151214599609375, -0.008575439453125, -0.0020294189453125, 0.0045166015625, 0.0110626220703125, 0.017608642578125, 0.0241546630859375, 0.03070068359375, 0.0372467041015625, 0.043792724609375, 0.0503387451171875, 0.056884765625, 0.0634307861328125, 0.069976806640625, 0.0765228271484375, 0.08306884765625, 0.0896148681640625, 0.096160888671875, 0.1027069091796875, 0.1092529296875, 0.1157989501953125, 0.122344970703125, 0.1288909912109375, 0.13543701171875, 0.1419830322265625, 0.148529052734375, 0.1550750732421875, 0.16162109375, 0.1681671142578125, 0.174713134765625, 0.1812591552734375, 0.18780517578125, 0.1943511962890625, 0.200897216796875, 0.2074432373046875, 0.2139892578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 4.0, 5.0, 8.0, 13.0, 13.0, 28.0, 24.0, 20.0, 23.0, 41.0, 40.0, 40.0, 38.0, 55.0, 59.0, 52.0, 60.0, 52.0, 60.0, 48.0, 39.0, 52.0, 35.0, 36.0, 32.0, 21.0, 23.0, 13.0, 13.0, 12.0, 9.0, 6.0, 6.0, 6.0, 5.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4689903259277344e-05, -3.357231616973877e-05, -3.2454729080200195e-05, -3.133714199066162e-05, -3.0219554901123047e-05, -2.9101967811584473e-05, -2.79843807220459e-05, -2.6866793632507324e-05, -2.574920654296875e-05, -2.4631619453430176e-05, -2.35140323638916e-05, -2.2396445274353027e-05, -2.1278858184814453e-05, -2.016127109527588e-05, -1.9043684005737305e-05, -1.792609691619873e-05, -1.6808509826660156e-05, -1.5690922737121582e-05, -1.4573335647583008e-05, -1.3455748558044434e-05, -1.233816146850586e-05, -1.1220574378967285e-05, -1.0102987289428711e-05, -8.985400199890137e-06, -7.867813110351562e-06, -6.750226020812988e-06, -5.632638931274414e-06, -4.51505184173584e-06, -3.3974647521972656e-06, -2.2798776626586914e-06, -1.1622905731201172e-06, -4.470348358154297e-08, 1.0728836059570312e-06, 2.1904706954956055e-06, 3.3080577850341797e-06, 4.425644874572754e-06, 5.543231964111328e-06, 6.660819053649902e-06, 7.778406143188477e-06, 8.89599323272705e-06, 1.0013580322265625e-05, 1.11311674118042e-05, 1.2248754501342773e-05, 1.3366341590881348e-05, 1.4483928680419922e-05, 1.5601515769958496e-05, 1.671910285949707e-05, 1.7836689949035645e-05, 1.895427703857422e-05, 2.0071864128112793e-05, 2.1189451217651367e-05, 2.230703830718994e-05, 2.3424625396728516e-05, 2.454221248626709e-05, 2.5659799575805664e-05, 2.6777386665344238e-05, 2.7894973754882812e-05, 2.9012560844421387e-05, 3.013014793395996e-05, 3.1247735023498535e-05, 3.236532211303711e-05, 3.3482909202575684e-05, 3.460049629211426e-05, 3.571808338165283e-05, 3.6835670471191406e-05]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 10.0, 8.0, 11.0, 10.0, 16.0, 16.0, 24.0, 25.0, 46.0, 49.0, 57.0, 84.0, 107.0, 184.0, 315.0, 979.0, 62339.0, 978841.0, 4074.0, 606.0, 235.0, 117.0, 103.0, 61.0, 44.0, 37.0, 37.0, 32.0, 19.0, 15.0, 13.0, 7.0, 10.0, 5.0, 1.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007543563842773438, -0.0007316991686820984, -0.000709041953086853, -0.0006863847374916077, -0.0006637275218963623, -0.0006410703063011169, -0.0006184130907058716, -0.0005957558751106262, -0.0005730986595153809, -0.0005504414439201355, -0.0005277842283248901, -0.0005051270127296448, -0.0004824697971343994, -0.00045981258153915405, -0.0004371553659439087, -0.00041449815034866333, -0.00039184093475341797, -0.0003691837191581726, -0.00034652650356292725, -0.0003238692879676819, -0.0003012120723724365, -0.00027855485677719116, -0.0002558976411819458, -0.00023324042558670044, -0.00021058320999145508, -0.00018792599439620972, -0.00016526877880096436, -0.000142611563205719, -0.00011995434761047363, -9.729713201522827e-05, -7.463991641998291e-05, -5.198270082473755e-05, -2.9325485229492188e-05, -6.668269634246826e-06, 1.5988945960998535e-05, 3.8646161556243896e-05, 6.130337715148926e-05, 8.396059274673462e-05, 0.00010661780834197998, 0.00012927502393722534, 0.0001519322395324707, 0.00017458945512771606, 0.00019724667072296143, 0.0002199038863182068, 0.00024256110191345215, 0.0002652183175086975, 0.00028787553310394287, 0.00031053274869918823, 0.0003331899642944336, 0.00035584717988967896, 0.0003785043954849243, 0.0004011616110801697, 0.00042381882667541504, 0.0004464760422706604, 0.00046913325786590576, 0.0004917904734611511, 0.0005144476890563965, 0.0005371049046516418, 0.0005597621202468872, 0.0005824193358421326, 0.0006050765514373779, 0.0006277337670326233, 0.0006503909826278687, 0.000673048198223114, 0.0006957054138183594]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 22.0, 97.0, 245.0, 325.0, 240.0, 68.0, 12.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9814271581708454e-05, -1.745940971886739e-05, -1.5104546037036926e-05, -1.2749684174195863e-05, -1.03948214018601e-05, -8.039958629524335e-06, -5.685096766683273e-06, -3.3302330848528072e-06, -9.75371222011745e-07, 1.3794913229503436e-06, 3.734353867912432e-06, 6.089216185500845e-06, 8.44407895783661e-06, 1.0798941730172373e-05, 1.3153803593013436e-05, 1.55086672748439e-05, 1.7863529137684964e-05, 2.0218391000526026e-05, 2.257325468235649e-05, 2.4928116545197554e-05, 2.7282978408038616e-05, 2.9637842089869082e-05, 3.199270577169955e-05, 3.4347569453530014e-05, 3.670242949738167e-05, 3.905729317921214e-05, 4.14121532230638e-05, 4.376701690489426e-05, 4.612188058672473e-05, 4.8476744268555194e-05, 5.083160431240685e-05, 5.318646799423732e-05, 5.554133531404659e-05, 5.789619899587706e-05, 6.0251059039728716e-05, 6.260591908358037e-05, 6.496078276541084e-05, 6.73156464472413e-05, 6.967051012907177e-05, 7.202537381090224e-05, 7.43802374927327e-05, 7.673510117456317e-05, 7.908996485639364e-05, 8.14448285382241e-05, 8.379968494409695e-05, 8.615454862592742e-05, 8.850941230775788e-05, 9.086427598958835e-05, 9.32191323954612e-05, 9.557399607729167e-05, 9.792885975912213e-05, 0.0001002837234409526, 0.00010263857984682545, 0.00010499344352865592, 0.00010734830721048638, 0.00010970317089231685, 0.00011205803457414731, 0.00011441289825597778, 0.00011676776193780825, 0.0001191226183436811, 0.00012147748202551156, 0.00012383234570734203, 0.0001261872093891725, 0.00012854207307100296, 0.00013089693675283343]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 12.0, 8.0, 8.0, 10.0, 12.0, 15.0, 17.0, 18.0, 26.0, 22.0, 31.0, 21.0, 32.0, 39.0, 25.0, 27.0, 33.0, 44.0, 34.0, 42.0, 42.0, 38.0, 32.0, 24.0, 35.0, 37.0, 37.0, 30.0, 24.0, 29.0, 33.0, 23.0, 16.0, 21.0, 17.0, 11.0, 7.0, 10.0, 12.0, 9.0, 7.0, 3.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.728534698486328e-05, -1.6755424439907074e-05, -1.6225501894950867e-05, -1.569557934999466e-05, -1.5165656805038452e-05, -1.4635734260082245e-05, -1.4105811715126038e-05, -1.357588917016983e-05, -1.3045966625213623e-05, -1.2516044080257416e-05, -1.1986121535301208e-05, -1.1456198990345001e-05, -1.0926276445388794e-05, -1.0396353900432587e-05, -9.86643135547638e-06, -9.336508810520172e-06, -8.806586265563965e-06, -8.276663720607758e-06, -7.74674117565155e-06, -7.216818630695343e-06, -6.686896085739136e-06, -6.1569735407829285e-06, -5.627050995826721e-06, -5.097128450870514e-06, -4.567205905914307e-06, -4.037283360958099e-06, -3.507360816001892e-06, -2.977438271045685e-06, -2.4475157260894775e-06, -1.9175931811332703e-06, -1.387670636177063e-06, -8.577480912208557e-07, -3.2782554626464844e-07, 2.0209699869155884e-07, 7.320195436477661e-07, 1.2619420886039734e-06, 1.7918646335601807e-06, 2.321787178516388e-06, 2.8517097234725952e-06, 3.3816322684288025e-06, 3.91155481338501e-06, 4.441477358341217e-06, 4.971399903297424e-06, 5.501322448253632e-06, 6.031244993209839e-06, 6.561167538166046e-06, 7.091090083122253e-06, 7.621012628078461e-06, 8.150935173034668e-06, 8.680857717990875e-06, 9.210780262947083e-06, 9.74070280790329e-06, 1.0270625352859497e-05, 1.0800547897815704e-05, 1.1330470442771912e-05, 1.1860392987728119e-05, 1.2390315532684326e-05, 1.2920238077640533e-05, 1.345016062259674e-05, 1.3980083167552948e-05, 1.4510005712509155e-05, 1.5039928257465363e-05, 1.556985080242157e-05, 1.6099773347377777e-05, 1.6629695892333984e-05]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 10.0, 14.0, 16.0, 26.0, 35.0, 43.0, 41.0, 47.0, 58.0, 68.0, 59.0, 72.0, 63.0, 61.0, 45.0, 59.0, 46.0, 47.0, 41.0, 38.0, 33.0, 22.0, 18.0, 12.0, 7.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.1796875, -10.90130615234375, -10.6229248046875, -10.34454345703125, -10.066162109375, -9.78778076171875, -9.5093994140625, -9.23101806640625, -8.95263671875, -8.67425537109375, -8.3958740234375, -8.11749267578125, -7.839111328125, -7.56072998046875, -7.2823486328125, -7.00396728515625, -6.7255859375, -6.44720458984375, -6.1688232421875, -5.89044189453125, -5.612060546875, -5.33367919921875, -5.0552978515625, -4.77691650390625, -4.49853515625, -4.22015380859375, -3.9417724609375, -3.66339111328125, -3.385009765625, -3.10662841796875, -2.8282470703125, -2.54986572265625, -2.271484375, -1.99310302734375, -1.7147216796875, -1.43634033203125, -1.157958984375, -0.87957763671875, -0.6011962890625, -0.32281494140625, -0.04443359375, 0.23394775390625, 0.5123291015625, 0.79071044921875, 1.069091796875, 1.34747314453125, 1.6258544921875, 1.90423583984375, 2.1826171875, 2.46099853515625, 2.7393798828125, 3.01776123046875, 3.296142578125, 3.57452392578125, 3.8529052734375, 4.13128662109375, 4.40966796875, 4.68804931640625, 4.9664306640625, 5.24481201171875, 5.523193359375, 5.80157470703125, 6.0799560546875, 6.35833740234375, 6.63671875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 7.0, 6.0, 11.0, 25.0, 26.0, 40.0, 60.0, 123.0, 236.0, 509.0, 1209.0, 3028.0, 8628.0, 33925.0, 347079.0, 591494.0, 45598.0, 10440.0, 3609.0, 1334.0, 559.0, 263.0, 139.0, 88.0, 42.0, 28.0, 18.0, 10.0, 6.0, 8.0, 2.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.6640625, -10.39801025390625, -10.1319580078125, -9.86590576171875, -9.599853515625, -9.33380126953125, -9.0677490234375, -8.80169677734375, -8.53564453125, -8.26959228515625, -8.0035400390625, -7.73748779296875, -7.471435546875, -7.20538330078125, -6.9393310546875, -6.67327880859375, -6.4072265625, -6.14117431640625, -5.8751220703125, -5.60906982421875, -5.343017578125, -5.07696533203125, -4.8109130859375, -4.54486083984375, -4.27880859375, -4.01275634765625, -3.7467041015625, -3.48065185546875, -3.214599609375, -2.94854736328125, -2.6824951171875, -2.41644287109375, -2.150390625, -1.88433837890625, -1.6182861328125, -1.35223388671875, -1.086181640625, -0.82012939453125, -0.5540771484375, -0.28802490234375, -0.02197265625, 0.24407958984375, 0.5101318359375, 0.77618408203125, 1.042236328125, 1.30828857421875, 1.5743408203125, 1.84039306640625, 2.1064453125, 2.37249755859375, 2.6385498046875, 2.90460205078125, 3.170654296875, 3.43670654296875, 3.7027587890625, 3.96881103515625, 4.23486328125, 4.50091552734375, 4.7669677734375, 5.03302001953125, 5.299072265625, 5.56512451171875, 5.8311767578125, 6.09722900390625, 6.36328125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 9.0, 9.0, 5.0, 14.0, 20.0, 14.0, 17.0, 25.0, 29.0, 22.0, 29.0, 20.0, 26.0, 34.0, 39.0, 33.0, 44.0, 60.0, 165.0, 1882.0, 99.0, 56.0, 50.0, 43.0, 33.0, 29.0, 39.0, 34.0, 22.0, 26.0, 22.0, 16.0, 9.0, 12.0, 16.0, 8.0, 8.0, 5.0, 6.0, 4.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-18.0625, -17.4677734375, -16.873046875, -16.2783203125, -15.68359375, -15.0888671875, -14.494140625, -13.8994140625, -13.3046875, -12.7099609375, -12.115234375, -11.5205078125, -10.92578125, -10.3310546875, -9.736328125, -9.1416015625, -8.546875, -7.9521484375, -7.357421875, -6.7626953125, -6.16796875, -5.5732421875, -4.978515625, -4.3837890625, -3.7890625, -3.1943359375, -2.599609375, -2.0048828125, -1.41015625, -0.8154296875, -0.220703125, 0.3740234375, 0.96875, 1.5634765625, 2.158203125, 2.7529296875, 3.34765625, 3.9423828125, 4.537109375, 5.1318359375, 5.7265625, 6.3212890625, 6.916015625, 7.5107421875, 8.10546875, 8.7001953125, 9.294921875, 9.8896484375, 10.484375, 11.0791015625, 11.673828125, 12.2685546875, 12.86328125, 13.4580078125, 14.052734375, 14.6474609375, 15.2421875, 15.8369140625, 16.431640625, 17.0263671875, 17.62109375, 18.2158203125, 18.810546875, 19.4052734375, 20.0]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 8.0, 8.0, 10.0, 12.0, 20.0, 13.0, 21.0, 28.0, 34.0, 49.0, 76.0, 86.0, 112.0, 166.0, 215.0, 350.0, 1087.0, 17373.0, 3112633.0, 11292.0, 914.0, 312.0, 179.0, 166.0, 139.0, 79.0, 67.0, 44.0, 47.0, 29.0, 27.0, 18.0, 24.0, 13.0, 9.0, 9.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.25, -41.87451171875, -40.4990234375, -39.12353515625, -37.748046875, -36.37255859375, -34.9970703125, -33.62158203125, -32.24609375, -30.87060546875, -29.4951171875, -28.11962890625, -26.744140625, -25.36865234375, -23.9931640625, -22.61767578125, -21.2421875, -19.86669921875, -18.4912109375, -17.11572265625, -15.740234375, -14.36474609375, -12.9892578125, -11.61376953125, -10.23828125, -8.86279296875, -7.4873046875, -6.11181640625, -4.736328125, -3.36083984375, -1.9853515625, -0.60986328125, 0.765625, 2.14111328125, 3.5166015625, 4.89208984375, 6.267578125, 7.64306640625, 9.0185546875, 10.39404296875, 11.76953125, 13.14501953125, 14.5205078125, 15.89599609375, 17.271484375, 18.64697265625, 20.0224609375, 21.39794921875, 22.7734375, 24.14892578125, 25.5244140625, 26.89990234375, 28.275390625, 29.65087890625, 31.0263671875, 32.40185546875, 33.77734375, 35.15283203125, 36.5283203125, 37.90380859375, 39.279296875, 40.65478515625, 42.0302734375, 43.40576171875, 44.78125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 12.0, 216.0, 615.0, 169.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.60528564453125, -120.17302703857422, -117.74076843261719, -115.30850982666016, -112.87625122070312, -110.4439926147461, -108.01173400878906, -105.57948303222656, -103.147216796875, -100.71495819091797, -98.28269958496094, -95.8504409790039, -93.41818237304688, -90.98592376708984, -88.55366516113281, -86.12141418457031, -83.68915557861328, -81.25689697265625, -78.82463836669922, -76.39237976074219, -73.96012115478516, -71.52786254882812, -69.0956039428711, -66.66334533691406, -64.23109436035156, -61.79883575439453, -59.3665771484375, -56.93431854248047, -54.50205993652344, -52.069801330566406, -49.63754653930664, -47.20528793334961, -44.77302551269531, -42.34076690673828, -39.90850830078125, -37.47624969482422, -35.04399108886719, -32.611732482910156, -30.17947769165039, -27.74721908569336, -25.314960479736328, -22.882701873779297, -20.450443267822266, -18.018186569213867, -15.585927963256836, -13.153669357299805, -10.72141170501709, -8.289154052734375, -5.856895446777344, -3.4246373176574707, -0.9923791885375977, 1.4398789405822754, 3.8721370697021484, 6.30439567565918, 8.736653327941895, 11.16891098022461, 13.60116958618164, 16.033428192138672, 18.465686798095703, 20.8979434967041, 23.330202102661133, 25.762460708618164, 28.194717407226562, 30.626976013183594, 33.059234619140625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 5.0, 2.0, 6.0, 6.0, 12.0, 11.0, 14.0, 15.0, 20.0, 19.0, 33.0, 21.0, 31.0, 42.0, 33.0, 48.0, 39.0, 43.0, 54.0, 46.0, 41.0, 64.0, 51.0, 39.0, 42.0, 37.0, 30.0, 27.0, 32.0, 25.0, 27.0, 20.0, 10.0, 14.0, 11.0, 8.0, 10.0, 7.0, 4.0, 1.0, 5.0, 2.0, 2.0, 3.0], "bins": [-71.02820587158203, -69.24474334716797, -67.46127319335938, -65.67781066894531, -63.894344329833984, -62.110877990722656, -60.32741165161133, -58.5439453125, -56.76047897338867, -54.977012634277344, -53.193546295166016, -51.41007995605469, -49.626617431640625, -47.8431510925293, -46.05968475341797, -44.27621841430664, -42.49275207519531, -40.709285736083984, -38.925819396972656, -37.142356872558594, -35.358890533447266, -33.57542419433594, -31.79195785522461, -30.00849151611328, -28.22502899169922, -26.44156265258789, -24.658098220825195, -22.874631881713867, -21.09116554260254, -19.307701110839844, -17.524234771728516, -15.740768432617188, -13.95730209350586, -12.173836708068848, -10.39037036895752, -8.606904983520508, -6.823439121246338, -5.039973258972168, -3.2565078735351562, -1.4730415344238281, 0.3104238510131836, 2.0938897132873535, 3.8773553371429443, 5.660820960998535, 7.444286823272705, 9.227752685546875, 11.011218070983887, 12.794684410095215, 14.578149795532227, 16.361616134643555, 18.14508056640625, 19.928546905517578, 21.712013244628906, 23.495479583740234, 25.27894401550293, 27.062410354614258, 28.845874786376953, 30.62934112548828, 32.41280746459961, 34.19627380371094, 35.979736328125, 37.76320266723633, 39.546669006347656, 41.330135345458984, 43.11360168457031]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 7.0, 5.0, 8.0, 8.0, 14.0, 18.0, 32.0, 36.0, 33.0, 57.0, 51.0, 61.0, 65.0, 63.0, 65.0, 69.0, 54.0, 59.0, 48.0, 53.0, 34.0, 34.0, 40.0, 31.0, 13.0, 27.0, 9.0, 4.0, 5.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.40625, -11.1197509765625, -10.833251953125, -10.5467529296875, -10.26025390625, -9.9737548828125, -9.687255859375, -9.4007568359375, -9.1142578125, -8.8277587890625, -8.541259765625, -8.2547607421875, -7.96826171875, -7.6817626953125, -7.395263671875, -7.1087646484375, -6.822265625, -6.5357666015625, -6.249267578125, -5.9627685546875, -5.67626953125, -5.3897705078125, -5.103271484375, -4.8167724609375, -4.5302734375, -4.2437744140625, -3.957275390625, -3.6707763671875, -3.38427734375, -3.0977783203125, -2.811279296875, -2.5247802734375, -2.23828125, -1.9517822265625, -1.665283203125, -1.3787841796875, -1.09228515625, -0.8057861328125, -0.519287109375, -0.2327880859375, 0.0537109375, 0.3402099609375, 0.626708984375, 0.9132080078125, 1.19970703125, 1.4862060546875, 1.772705078125, 2.0592041015625, 2.345703125, 2.6322021484375, 2.918701171875, 3.2052001953125, 3.49169921875, 3.7781982421875, 4.064697265625, 4.3511962890625, 4.6376953125, 4.9241943359375, 5.210693359375, 5.4971923828125, 5.78369140625, 6.0701904296875, 6.356689453125, 6.6431884765625, 6.9296875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 8.0, 8.0, 6.0, 18.0, 20.0, 29.0, 49.0, 81.0, 130.0, 213.0, 394.0, 938.0, 3287.0, 20070.0, 304491.0, 3115754.0, 704652.0, 36559.0, 5258.0, 1238.0, 439.0, 238.0, 127.0, 70.0, 72.0, 51.0, 24.0, 20.0, 11.0, 10.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.671875, -20.13671875, -19.6015625, -19.06640625, -18.53125, -17.99609375, -17.4609375, -16.92578125, -16.390625, -15.85546875, -15.3203125, -14.78515625, -14.25, -13.71484375, -13.1796875, -12.64453125, -12.109375, -11.57421875, -11.0390625, -10.50390625, -9.96875, -9.43359375, -8.8984375, -8.36328125, -7.828125, -7.29296875, -6.7578125, -6.22265625, -5.6875, -5.15234375, -4.6171875, -4.08203125, -3.546875, -3.01171875, -2.4765625, -1.94140625, -1.40625, -0.87109375, -0.3359375, 0.19921875, 0.734375, 1.26953125, 1.8046875, 2.33984375, 2.875, 3.41015625, 3.9453125, 4.48046875, 5.015625, 5.55078125, 6.0859375, 6.62109375, 7.15625, 7.69140625, 8.2265625, 8.76171875, 9.296875, 9.83203125, 10.3671875, 10.90234375, 11.4375, 11.97265625, 12.5078125, 13.04296875, 13.578125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 12.0, 14.0, 17.0, 22.0, 33.0, 59.0, 90.0, 84.0, 125.0, 205.0, 257.0, 363.0, 536.0, 572.0, 466.0, 390.0, 236.0, 171.0, 125.0, 92.0, 51.0, 46.0, 17.0, 24.0, 11.0, 11.0, 13.0, 5.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.453125, -9.0802001953125, -8.707275390625, -8.3343505859375, -7.96142578125, -7.5885009765625, -7.215576171875, -6.8426513671875, -6.4697265625, -6.0968017578125, -5.723876953125, -5.3509521484375, -4.97802734375, -4.6051025390625, -4.232177734375, -3.8592529296875, -3.486328125, -3.1134033203125, -2.740478515625, -2.3675537109375, -1.99462890625, -1.6217041015625, -1.248779296875, -0.8758544921875, -0.5029296875, -0.1300048828125, 0.242919921875, 0.6158447265625, 0.98876953125, 1.3616943359375, 1.734619140625, 2.1075439453125, 2.48046875, 2.8533935546875, 3.226318359375, 3.5992431640625, 3.97216796875, 4.3450927734375, 4.718017578125, 5.0909423828125, 5.4638671875, 5.8367919921875, 6.209716796875, 6.5826416015625, 6.95556640625, 7.3284912109375, 7.701416015625, 8.0743408203125, 8.447265625, 8.8201904296875, 9.193115234375, 9.5660400390625, 9.93896484375, 10.3118896484375, 10.684814453125, 11.0577392578125, 11.4306640625, 11.8035888671875, 12.176513671875, 12.5494384765625, 12.92236328125, 13.2952880859375, 13.668212890625, 14.0411376953125, 14.4140625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 6.0, 10.0, 10.0, 10.0, 25.0, 22.0, 48.0, 71.0, 90.0, 146.0, 203.0, 265.0, 532.0, 2271.0, 265120.0, 3908153.0, 15277.0, 804.0, 349.0, 269.0, 188.0, 132.0, 94.0, 54.0, 38.0, 28.0, 25.0, 9.0, 6.0, 8.0, 10.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-66.875, -65.126953125, -63.37890625, -61.630859375, -59.8828125, -58.134765625, -56.38671875, -54.638671875, -52.890625, -51.142578125, -49.39453125, -47.646484375, -45.8984375, -44.150390625, -42.40234375, -40.654296875, -38.90625, -37.158203125, -35.41015625, -33.662109375, -31.9140625, -30.166015625, -28.41796875, -26.669921875, -24.921875, -23.173828125, -21.42578125, -19.677734375, -17.9296875, -16.181640625, -14.43359375, -12.685546875, -10.9375, -9.189453125, -7.44140625, -5.693359375, -3.9453125, -2.197265625, -0.44921875, 1.298828125, 3.046875, 4.794921875, 6.54296875, 8.291015625, 10.0390625, 11.787109375, 13.53515625, 15.283203125, 17.03125, 18.779296875, 20.52734375, 22.275390625, 24.0234375, 25.771484375, 27.51953125, 29.267578125, 31.015625, 32.763671875, 34.51171875, 36.259765625, 38.0078125, 39.755859375, 41.50390625, 43.251953125, 45.0]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 85.0, 568.0, 342.0, 19.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-396.7581787109375, -387.69866943359375, -378.6391906738281, -369.5796813964844, -360.52020263671875, -351.460693359375, -342.4012145996094, -333.3417053222656, -324.2822265625, -315.22271728515625, -306.1632385253906, -297.1037292480469, -288.04425048828125, -278.9847412109375, -269.9252624511719, -260.8657531738281, -251.80625915527344, -242.74676513671875, -233.68727111816406, -224.62777709960938, -215.5682830810547, -206.5087890625, -197.44927978515625, -188.38980102539062, -179.33029174804688, -170.2707977294922, -161.2113037109375, -152.1518096923828, -143.09231567382812, -134.03282165527344, -124.97332000732422, -115.91382598876953, -106.85432434082031, -97.79483032226562, -88.73533630371094, -79.67584228515625, -70.61634826660156, -61.55685043334961, -52.497352600097656, -43.43785858154297, -34.37836456298828, -25.318870544433594, -16.259374618530273, -7.199878692626953, 1.8596153259277344, 10.919109344482422, 19.978607177734375, 29.038101196289062, 38.09759521484375, 47.15708923339844, 56.216583251953125, 65.27607727050781, 74.3355712890625, 83.39506530761719, 92.4545669555664, 101.5140609741211, 110.57355499267578, 119.63304901123047, 128.6925506591797, 137.75204467773438, 146.81153869628906, 155.87103271484375, 164.93052673339844, 173.99002075195312, 183.0495147705078]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 5.0, 8.0, 8.0, 16.0, 20.0, 18.0, 25.0, 19.0, 22.0, 26.0, 23.0, 19.0, 26.0, 41.0, 53.0, 47.0, 32.0, 39.0, 30.0, 28.0, 44.0, 45.0, 36.0, 36.0, 40.0, 36.0, 33.0, 23.0, 33.0, 28.0, 22.0, 26.0, 11.0, 17.0, 10.0, 7.0, 12.0, 8.0, 4.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.870689392089844, -29.844736099243164, -28.818784713745117, -27.792831420898438, -26.76688003540039, -25.74092674255371, -24.71497344970703, -23.689022064208984, -22.663068771362305, -21.637115478515625, -20.611164093017578, -19.5852108001709, -18.55925750732422, -17.533306121826172, -16.507352828979492, -15.481400489807129, -14.455448150634766, -13.429495811462402, -12.403543472290039, -11.37759017944336, -10.351637840270996, -9.325685501098633, -8.299732208251953, -7.27377986907959, -6.247827529907227, -5.221875190734863, -4.195922374725342, -3.1699697971343994, -2.144017219543457, -1.1180648803710938, -0.09211206436157227, 0.9338407516479492, 1.9597930908203125, 2.985745668411255, 4.011698246002197, 5.037651062011719, 6.063603401184082, 7.089555740356445, 8.115509033203125, 9.141461372375488, 10.167413711547852, 11.193366050720215, 12.219318389892578, 13.245271682739258, 14.271224021911621, 15.297176361083984, 16.323129653930664, 17.349082946777344, 18.37503433227539, 19.40098762512207, 20.426939010620117, 21.452892303466797, 22.478843688964844, 23.504796981811523, 24.530750274658203, 25.55670166015625, 26.58265495300293, 27.60860824584961, 28.634559631347656, 29.660512924194336, 30.686466217041016, 31.712417602539062, 32.73836898803711, 33.76432418823242, 34.79027557373047]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 7.0, 7.0, 16.0, 14.0, 15.0, 22.0, 28.0, 31.0, 25.0, 48.0, 45.0, 54.0, 63.0, 51.0, 42.0, 60.0, 54.0, 52.0, 45.0, 56.0, 33.0, 37.0, 31.0, 41.0, 27.0, 27.0, 16.0, 11.0, 14.0, 11.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.31280517578125, -9.0709228515625, -8.82904052734375, -8.587158203125, -8.34527587890625, -8.1033935546875, -7.86151123046875, -7.61962890625, -7.37774658203125, -7.1358642578125, -6.89398193359375, -6.652099609375, -6.41021728515625, -6.1683349609375, -5.92645263671875, -5.6845703125, -5.44268798828125, -5.2008056640625, -4.95892333984375, -4.717041015625, -4.47515869140625, -4.2332763671875, -3.99139404296875, -3.74951171875, -3.50762939453125, -3.2657470703125, -3.02386474609375, -2.781982421875, -2.54010009765625, -2.2982177734375, -2.05633544921875, -1.814453125, -1.57257080078125, -1.3306884765625, -1.08880615234375, -0.846923828125, -0.60504150390625, -0.3631591796875, -0.12127685546875, 0.12060546875, 0.36248779296875, 0.6043701171875, 0.84625244140625, 1.088134765625, 1.33001708984375, 1.5718994140625, 1.81378173828125, 2.0556640625, 2.29754638671875, 2.5394287109375, 2.78131103515625, 3.023193359375, 3.26507568359375, 3.5069580078125, 3.74884033203125, 3.99072265625, 4.23260498046875, 4.4744873046875, 4.71636962890625, 4.958251953125, 5.20013427734375, 5.4420166015625, 5.68389892578125, 5.92578125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 5.0, 6.0, 10.0, 17.0, 17.0, 28.0, 29.0, 44.0, 63.0, 113.0, 197.0, 365.0, 668.0, 1162.0, 2264.0, 4427.0, 8598.0, 16684.0, 34170.0, 75649.0, 198682.0, 401942.0, 172688.0, 67376.0, 31252.0, 15623.0, 7778.0, 4133.0, 2071.0, 1163.0, 553.0, 305.0, 188.0, 118.0, 45.0, 38.0, 24.0, 18.0, 14.0, 10.0, 5.0, 9.0, 2.0, 1.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3427734375, -0.330718994140625, -0.31866455078125, -0.306610107421875, -0.2945556640625, -0.282501220703125, -0.27044677734375, -0.258392333984375, -0.246337890625, -0.234283447265625, -0.22222900390625, -0.210174560546875, -0.1981201171875, -0.186065673828125, -0.17401123046875, -0.161956787109375, -0.14990234375, -0.137847900390625, -0.12579345703125, -0.113739013671875, -0.1016845703125, -0.089630126953125, -0.07757568359375, -0.065521240234375, -0.053466796875, -0.041412353515625, -0.02935791015625, -0.017303466796875, -0.0052490234375, 0.006805419921875, 0.01885986328125, 0.030914306640625, 0.04296875, 0.055023193359375, 0.06707763671875, 0.079132080078125, 0.0911865234375, 0.103240966796875, 0.11529541015625, 0.127349853515625, 0.139404296875, 0.151458740234375, 0.16351318359375, 0.175567626953125, 0.1876220703125, 0.199676513671875, 0.21173095703125, 0.223785400390625, 0.23583984375, 0.247894287109375, 0.25994873046875, 0.272003173828125, 0.2840576171875, 0.296112060546875, 0.30816650390625, 0.320220947265625, 0.332275390625, 0.344329833984375, 0.35638427734375, 0.368438720703125, 0.3804931640625, 0.392547607421875, 0.40460205078125, 0.416656494140625, 0.4287109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 8.0, 7.0, 11.0, 7.0, 6.0, 16.0, 12.0, 16.0, 18.0, 18.0, 22.0, 23.0, 29.0, 31.0, 31.0, 28.0, 33.0, 35.0, 29.0, 26.0, 42.0, 33.0, 1049.0, 26.0, 52.0, 44.0, 34.0, 37.0, 25.0, 28.0, 20.0, 24.0, 24.0, 31.0, 23.0, 20.0, 13.0, 14.0, 9.0, 10.0, 8.0, 9.0, 2.0, 7.0, 4.0, 5.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.1484375, -3.04449462890625, -2.9405517578125, -2.83660888671875, -2.732666015625, -2.62872314453125, -2.5247802734375, -2.42083740234375, -2.31689453125, -2.21295166015625, -2.1090087890625, -2.00506591796875, -1.901123046875, -1.79718017578125, -1.6932373046875, -1.58929443359375, -1.4853515625, -1.38140869140625, -1.2774658203125, -1.17352294921875, -1.069580078125, -0.96563720703125, -0.8616943359375, -0.75775146484375, -0.65380859375, -0.54986572265625, -0.4459228515625, -0.34197998046875, -0.238037109375, -0.13409423828125, -0.0301513671875, 0.07379150390625, 0.177734375, 0.28167724609375, 0.3856201171875, 0.48956298828125, 0.593505859375, 0.69744873046875, 0.8013916015625, 0.90533447265625, 1.00927734375, 1.11322021484375, 1.2171630859375, 1.32110595703125, 1.425048828125, 1.52899169921875, 1.6329345703125, 1.73687744140625, 1.8408203125, 1.94476318359375, 2.0487060546875, 2.15264892578125, 2.256591796875, 2.36053466796875, 2.4644775390625, 2.56842041015625, 2.67236328125, 2.77630615234375, 2.8802490234375, 2.98419189453125, 3.088134765625, 3.19207763671875, 3.2960205078125, 3.39996337890625, 3.50390625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 7.0, 10.0, 18.0, 24.0, 31.0, 50.0, 68.0, 99.0, 133.0, 219.0, 313.0, 385.0, 565.0, 865.0, 1178.0, 1635.0, 2273.0, 3090.0, 4588.0, 6505.0, 9688.0, 14215.0, 21203.0, 31988.0, 50448.0, 85197.0, 163474.0, 1299211.0, 164090.0, 85760.0, 51022.0, 31940.0, 21136.0, 14082.0, 9654.0, 6573.0, 4445.0, 3169.0, 2209.0, 1608.0, 1138.0, 871.0, 628.0, 393.0, 305.0, 165.0, 136.0, 89.0, 81.0, 58.0, 43.0, 26.0, 15.0, 10.0, 7.0, 5.0, 5.0, 0.0, 1.0, 1.0], "bins": [-0.1937255859375, -0.1875762939453125, -0.181427001953125, -0.1752777099609375, -0.16912841796875, -0.1629791259765625, -0.156829833984375, -0.1506805419921875, -0.14453125, -0.1383819580078125, -0.132232666015625, -0.1260833740234375, -0.11993408203125, -0.1137847900390625, -0.107635498046875, -0.1014862060546875, -0.0953369140625, -0.0891876220703125, -0.083038330078125, -0.0768890380859375, -0.07073974609375, -0.0645904541015625, -0.058441162109375, -0.0522918701171875, -0.046142578125, -0.0399932861328125, -0.033843994140625, -0.0276947021484375, -0.02154541015625, -0.0153961181640625, -0.009246826171875, -0.0030975341796875, 0.0030517578125, 0.0092010498046875, 0.015350341796875, 0.0214996337890625, 0.02764892578125, 0.0337982177734375, 0.039947509765625, 0.0460968017578125, 0.05224609375, 0.0583953857421875, 0.064544677734375, 0.0706939697265625, 0.07684326171875, 0.0829925537109375, 0.089141845703125, 0.0952911376953125, 0.1014404296875, 0.1075897216796875, 0.113739013671875, 0.1198883056640625, 0.12603759765625, 0.1321868896484375, 0.138336181640625, 0.1444854736328125, 0.150634765625, 0.1567840576171875, 0.162933349609375, 0.1690826416015625, 0.17523193359375, 0.1813812255859375, 0.187530517578125, 0.1936798095703125, 0.1998291015625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 0.0, 8.0, 3.0, 4.0, 9.0, 6.0, 14.0, 16.0, 21.0, 17.0, 29.0, 35.0, 41.0, 41.0, 39.0, 43.0, 44.0, 40.0, 55.0, 53.0, 42.0, 64.0, 37.0, 58.0, 37.0, 46.0, 27.0, 21.0, 34.0, 16.0, 18.0, 11.0, 13.0, 12.0, 10.0, 10.0, 4.0, 4.0, 6.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.337860107421875e-05, -3.239419311285019e-05, -3.140978515148163e-05, -3.0425377190113068e-05, -2.9440969228744507e-05, -2.8456561267375946e-05, -2.7472153306007385e-05, -2.6487745344638824e-05, -2.5503337383270264e-05, -2.4518929421901703e-05, -2.3534521460533142e-05, -2.255011349916458e-05, -2.156570553779602e-05, -2.058129757642746e-05, -1.95968896150589e-05, -1.8612481653690338e-05, -1.7628073692321777e-05, -1.6643665730953217e-05, -1.5659257769584656e-05, -1.4674849808216095e-05, -1.3690441846847534e-05, -1.2706033885478973e-05, -1.1721625924110413e-05, -1.0737217962741852e-05, -9.752810001373291e-06, -8.76840204000473e-06, -7.78399407863617e-06, -6.799586117267609e-06, -5.815178155899048e-06, -4.830770194530487e-06, -3.846362233161926e-06, -2.8619542717933655e-06, -1.8775463104248047e-06, -8.931383490562439e-07, 9.12696123123169e-08, 1.0756775736808777e-06, 2.0600855350494385e-06, 3.0444934964179993e-06, 4.02890145778656e-06, 5.013309419155121e-06, 5.997717380523682e-06, 6.9821253418922424e-06, 7.966533303260803e-06, 8.950941264629364e-06, 9.935349225997925e-06, 1.0919757187366486e-05, 1.1904165148735046e-05, 1.2888573110103607e-05, 1.3872981071472168e-05, 1.4857389032840729e-05, 1.584179699420929e-05, 1.682620495557785e-05, 1.781061291694641e-05, 1.8795020878314972e-05, 1.9779428839683533e-05, 2.0763836801052094e-05, 2.1748244762420654e-05, 2.2732652723789215e-05, 2.3717060685157776e-05, 2.4701468646526337e-05, 2.5685876607894897e-05, 2.6670284569263458e-05, 2.765469253063202e-05, 2.863910049200058e-05, 2.962350845336914e-05]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 1.0, 6.0, 7.0, 13.0, 11.0, 21.0, 11.0, 26.0, 33.0, 45.0, 43.0, 72.0, 75.0, 106.0, 214.0, 511.0, 3133.0, 917054.0, 125052.0, 1095.0, 334.0, 185.0, 106.0, 83.0, 68.0, 49.0, 43.0, 33.0, 18.0, 24.0, 15.0, 13.0, 13.0, 12.0, 1.0, 2.0, 6.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006718635559082031, -0.0006500408053398132, -0.0006282180547714233, -0.0006063953042030334, -0.0005845725536346436, -0.0005627498030662537, -0.0005409270524978638, -0.0005191043019294739, -0.000497281551361084, -0.0004754588007926941, -0.0004536360502243042, -0.0004318132996559143, -0.0004099905490875244, -0.0003881677985191345, -0.00036634504795074463, -0.00034452229738235474, -0.00032269954681396484, -0.00030087679624557495, -0.00027905404567718506, -0.00025723129510879517, -0.00023540854454040527, -0.00021358579397201538, -0.0001917630434036255, -0.0001699402928352356, -0.0001481175422668457, -0.0001262947916984558, -0.00010447204113006592, -8.264929056167603e-05, -6.082653999328613e-05, -3.900378942489624e-05, -1.7181038856506348e-05, 4.641711711883545e-06, 2.6464462280273438e-05, 4.828721284866333e-05, 7.010996341705322e-05, 9.193271398544312e-05, 0.00011375546455383301, 0.0001355782151222229, 0.0001574009656906128, 0.00017922371625900269, 0.00020104646682739258, 0.00022286921739578247, 0.00024469196796417236, 0.00026651471853256226, 0.00028833746910095215, 0.00031016021966934204, 0.00033198297023773193, 0.0003538057208061218, 0.0003756284713745117, 0.0003974512219429016, 0.0004192739725112915, 0.0004410967230796814, 0.0004629194736480713, 0.0004847422242164612, 0.0005065649747848511, 0.000528387725353241, 0.0005502104759216309, 0.0005720332264900208, 0.0005938559770584106, 0.0006156787276268005, 0.0006375014781951904, 0.0006593242287635803, 0.0006811469793319702, 0.0007029697299003601, 0.00072479248046875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 23.0, 33.0, 87.0, 119.0, 142.0, 179.0, 132.0, 123.0, 72.0, 45.0, 21.0, 14.0, 11.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6474755941308104e-05, -2.5389859729330055e-05, -2.4304963517352007e-05, -2.322006730537396e-05, -2.213517109339591e-05, -2.1050274881417863e-05, -1.9965378669439815e-05, -1.8880482457461767e-05, -1.779558624548372e-05, -1.671069003350567e-05, -1.5625793821527623e-05, -1.4540897609549575e-05, -1.3456001397571526e-05, -1.2371105185593478e-05, -1.128620897361543e-05, -1.0201312761637382e-05, -9.116416549659334e-06, -8.031520337681286e-06, -6.946624125703238e-06, -5.86172791372519e-06, -4.776831701747142e-06, -3.6919354897690937e-06, -2.6070392777910456e-06, -1.5221430658129975e-06, -4.3724685383494943e-07, 6.476493581430987e-07, 1.7325455701211467e-06, 2.817441782099195e-06, 3.902337994077243e-06, 4.987234206055291e-06, 6.072130418033339e-06, 7.157026630011387e-06, 8.241921023000032e-06, 9.32681723497808e-06, 1.0411713446956128e-05, 1.1496609658934176e-05, 1.2581505870912224e-05, 1.3666402082890272e-05, 1.475129829486832e-05, 1.583619450684637e-05, 1.6921090718824416e-05, 1.8005986930802464e-05, 1.9090883142780513e-05, 2.017577935475856e-05, 2.126067556673661e-05, 2.2345571778714657e-05, 2.3430467990692705e-05, 2.4515364202670753e-05, 2.56002604146488e-05, 2.668515662662685e-05, 2.7770052838604897e-05, 2.8854949050582945e-05, 2.9939845262560993e-05, 3.102474147453904e-05, 3.210963768651709e-05, 3.319453389849514e-05, 3.4279430110473186e-05, 3.5364326322451234e-05, 3.644922253442928e-05, 3.753411874640733e-05, 3.861901495838538e-05, 3.9703911170363426e-05, 4.0788807382341474e-05, 4.187370359431952e-05, 4.295859980629757e-05]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 9.0, 9.0, 17.0, 17.0, 15.0, 15.0, 26.0, 25.0, 26.0, 21.0, 30.0, 25.0, 38.0, 35.0, 38.0, 50.0, 51.0, 36.0, 37.0, 38.0, 35.0, 49.0, 38.0, 45.0, 31.0, 24.0, 25.0, 28.0, 19.0, 24.0, 22.0, 13.0, 11.0, 15.0, 8.0, 8.0, 12.0, 8.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6450881958007812e-05, -1.592002809047699e-05, -1.5389174222946167e-05, -1.4858320355415344e-05, -1.4327466487884521e-05, -1.3796612620353699e-05, -1.3265758752822876e-05, -1.2734904885292053e-05, -1.220405101776123e-05, -1.1673197150230408e-05, -1.1142343282699585e-05, -1.0611489415168762e-05, -1.008063554763794e-05, -9.549781680107117e-06, -9.018927812576294e-06, -8.488073945045471e-06, -7.957220077514648e-06, -7.426366209983826e-06, -6.895512342453003e-06, -6.36465847492218e-06, -5.833804607391357e-06, -5.302950739860535e-06, -4.772096872329712e-06, -4.241243004798889e-06, -3.7103891372680664e-06, -3.1795352697372437e-06, -2.648681402206421e-06, -2.117827534675598e-06, -1.5869736671447754e-06, -1.0561197996139526e-06, -5.252659320831299e-07, 5.587935447692871e-09, 5.364418029785156e-07, 1.0672956705093384e-06, 1.5981495380401611e-06, 2.129003405570984e-06, 2.6598572731018066e-06, 3.1907111406326294e-06, 3.721565008163452e-06, 4.252418875694275e-06, 4.783272743225098e-06, 5.31412661075592e-06, 5.844980478286743e-06, 6.375834345817566e-06, 6.906688213348389e-06, 7.4375420808792114e-06, 7.968395948410034e-06, 8.499249815940857e-06, 9.03010368347168e-06, 9.560957551002502e-06, 1.0091811418533325e-05, 1.0622665286064148e-05, 1.115351915359497e-05, 1.1684373021125793e-05, 1.2215226888656616e-05, 1.2746080756187439e-05, 1.3276934623718262e-05, 1.3807788491249084e-05, 1.4338642358779907e-05, 1.486949622631073e-05, 1.5400350093841553e-05, 1.5931203961372375e-05, 1.6462057828903198e-05, 1.699291169643402e-05, 1.7523765563964844e-05]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 7.0, 7.0, 16.0, 14.0, 15.0, 22.0, 28.0, 31.0, 25.0, 48.0, 45.0, 54.0, 63.0, 51.0, 42.0, 60.0, 54.0, 52.0, 45.0, 56.0, 33.0, 37.0, 31.0, 41.0, 27.0, 27.0, 16.0, 11.0, 14.0, 11.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.31280517578125, -9.0709228515625, -8.82904052734375, -8.587158203125, -8.34527587890625, -8.1033935546875, -7.86151123046875, -7.61962890625, -7.37774658203125, -7.1358642578125, -6.89398193359375, -6.652099609375, -6.41021728515625, -6.1683349609375, -5.92645263671875, -5.6845703125, -5.44268798828125, -5.2008056640625, -4.95892333984375, -4.717041015625, -4.47515869140625, -4.2332763671875, -3.99139404296875, -3.74951171875, -3.50762939453125, -3.2657470703125, -3.02386474609375, -2.781982421875, -2.54010009765625, -2.2982177734375, -2.05633544921875, -1.814453125, -1.57257080078125, -1.3306884765625, -1.08880615234375, -0.846923828125, -0.60504150390625, -0.3631591796875, -0.12127685546875, 0.12060546875, 0.36248779296875, 0.6043701171875, 0.84625244140625, 1.088134765625, 1.33001708984375, 1.5718994140625, 1.81378173828125, 2.0556640625, 2.29754638671875, 2.5394287109375, 2.78131103515625, 3.023193359375, 3.26507568359375, 3.5069580078125, 3.74884033203125, 3.99072265625, 4.23260498046875, 4.4744873046875, 4.71636962890625, 4.958251953125, 5.20013427734375, 5.4420166015625, 5.68389892578125, 5.92578125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 9.0, 12.0, 18.0, 17.0, 30.0, 57.0, 114.0, 232.0, 528.0, 1308.0, 3495.0, 9699.0, 30969.0, 126064.0, 607829.0, 203450.0, 43875.0, 13316.0, 4572.0, 1713.0, 658.0, 258.0, 126.0, 73.0, 40.0, 25.0, 18.0, 14.0, 6.0, 8.0, 8.0, 8.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.5234375, -8.3187255859375, -8.114013671875, -7.9093017578125, -7.70458984375, -7.4998779296875, -7.295166015625, -7.0904541015625, -6.8857421875, -6.6810302734375, -6.476318359375, -6.2716064453125, -6.06689453125, -5.8621826171875, -5.657470703125, -5.4527587890625, -5.248046875, -5.0433349609375, -4.838623046875, -4.6339111328125, -4.42919921875, -4.2244873046875, -4.019775390625, -3.8150634765625, -3.6103515625, -3.4056396484375, -3.200927734375, -2.9962158203125, -2.79150390625, -2.5867919921875, -2.382080078125, -2.1773681640625, -1.97265625, -1.7679443359375, -1.563232421875, -1.3585205078125, -1.15380859375, -0.9490966796875, -0.744384765625, -0.5396728515625, -0.3349609375, -0.1302490234375, 0.074462890625, 0.2791748046875, 0.48388671875, 0.6885986328125, 0.893310546875, 1.0980224609375, 1.302734375, 1.5074462890625, 1.712158203125, 1.9168701171875, 2.12158203125, 2.3262939453125, 2.531005859375, 2.7357177734375, 2.9404296875, 3.1451416015625, 3.349853515625, 3.5545654296875, 3.75927734375, 3.9639892578125, 4.168701171875, 4.3734130859375, 4.578125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 5.0, 6.0, 7.0, 8.0, 15.0, 17.0, 9.0, 16.0, 18.0, 21.0, 31.0, 34.0, 37.0, 33.0, 59.0, 62.0, 90.0, 146.0, 1751.0, 167.0, 67.0, 80.0, 53.0, 55.0, 37.0, 36.0, 33.0, 39.0, 17.0, 24.0, 14.0, 13.0, 22.0, 10.0, 8.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.234375, -23.4658203125, -22.697265625, -21.9287109375, -21.16015625, -20.3916015625, -19.623046875, -18.8544921875, -18.0859375, -17.3173828125, -16.548828125, -15.7802734375, -15.01171875, -14.2431640625, -13.474609375, -12.7060546875, -11.9375, -11.1689453125, -10.400390625, -9.6318359375, -8.86328125, -8.0947265625, -7.326171875, -6.5576171875, -5.7890625, -5.0205078125, -4.251953125, -3.4833984375, -2.71484375, -1.9462890625, -1.177734375, -0.4091796875, 0.359375, 1.1279296875, 1.896484375, 2.6650390625, 3.43359375, 4.2021484375, 4.970703125, 5.7392578125, 6.5078125, 7.2763671875, 8.044921875, 8.8134765625, 9.58203125, 10.3505859375, 11.119140625, 11.8876953125, 12.65625, 13.4248046875, 14.193359375, 14.9619140625, 15.73046875, 16.4990234375, 17.267578125, 18.0361328125, 18.8046875, 19.5732421875, 20.341796875, 21.1103515625, 21.87890625, 22.6474609375, 23.416015625, 24.1845703125, 24.953125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 7.0, 7.0, 17.0, 27.0, 22.0, 22.0, 43.0, 68.0, 100.0, 146.0, 217.0, 288.0, 549.0, 2749.0, 3080196.0, 59039.0, 1140.0, 353.0, 202.0, 138.0, 106.0, 74.0, 53.0, 39.0, 26.0, 20.0, 17.0, 8.0, 13.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-83.5625, -81.35107421875, -79.1396484375, -76.92822265625, -74.716796875, -72.50537109375, -70.2939453125, -68.08251953125, -65.87109375, -63.65966796875, -61.4482421875, -59.23681640625, -57.025390625, -54.81396484375, -52.6025390625, -50.39111328125, -48.1796875, -45.96826171875, -43.7568359375, -41.54541015625, -39.333984375, -37.12255859375, -34.9111328125, -32.69970703125, -30.48828125, -28.27685546875, -26.0654296875, -23.85400390625, -21.642578125, -19.43115234375, -17.2197265625, -15.00830078125, -12.796875, -10.58544921875, -8.3740234375, -6.16259765625, -3.951171875, -1.73974609375, 0.4716796875, 2.68310546875, 4.89453125, 7.10595703125, 9.3173828125, 11.52880859375, 13.740234375, 15.95166015625, 18.1630859375, 20.37451171875, 22.5859375, 24.79736328125, 27.0087890625, 29.22021484375, 31.431640625, 33.64306640625, 35.8544921875, 38.06591796875, 40.27734375, 42.48876953125, 44.7001953125, 46.91162109375, 49.123046875, 51.33447265625, 53.5458984375, 55.75732421875, 57.96875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 19.0, 926.0, 70.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-424.1913757324219, -416.69989013671875, -409.2084045410156, -401.7169189453125, -394.2254333496094, -386.73394775390625, -379.2424621582031, -371.7509765625, -364.25946044921875, -356.7679748535156, -349.2764892578125, -341.7850036621094, -334.29351806640625, -326.8020324707031, -319.310546875, -311.81903076171875, -304.32757568359375, -296.8360900878906, -289.3446044921875, -281.8531188964844, -274.36163330078125, -266.8701477050781, -259.378662109375, -251.8871612548828, -244.3956756591797, -236.90419006347656, -229.41270446777344, -221.9212188720703, -214.42971801757812, -206.938232421875, -199.44674682617188, -191.95526123046875, -184.46377563476562, -176.9722900390625, -169.48080444335938, -161.98931884765625, -154.49783325195312, -147.00634765625, -139.5148468017578, -132.0233612060547, -124.5318832397461, -117.04039764404297, -109.54890441894531, -102.05741882324219, -94.56593322753906, -87.07444763183594, -79.58296203613281, -72.09146881103516, -64.59998321533203, -57.108497619628906, -49.617008209228516, -42.125518798828125, -34.634033203125, -27.142547607421875, -19.651058197021484, -12.159568786621094, -4.668083190917969, 2.823404312133789, 10.314891815185547, 17.806379318237305, 25.297866821289062, 32.78935241699219, 40.28084182739258, 47.77233123779297, 55.263816833496094]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 8.0, 3.0, 5.0, 10.0, 13.0, 12.0, 7.0, 22.0, 23.0, 22.0, 21.0, 24.0, 35.0, 26.0, 49.0, 34.0, 44.0, 38.0, 49.0, 52.0, 43.0, 42.0, 37.0, 41.0, 49.0, 32.0, 31.0, 35.0, 20.0, 29.0, 22.0, 24.0, 14.0, 12.0, 17.0, 12.0, 4.0, 7.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-60.3488883972168, -58.36864471435547, -56.38840103149414, -54.40815734863281, -52.427913665771484, -50.447669982910156, -48.467430114746094, -46.4871826171875, -44.50694274902344, -42.52669906616211, -40.54645538330078, -38.56621170043945, -36.585968017578125, -34.6057243347168, -32.62548065185547, -30.645238876342773, -28.664993286132812, -26.684749603271484, -24.704505920410156, -22.724262237548828, -20.7440185546875, -18.763774871826172, -16.783533096313477, -14.803289413452148, -12.82304573059082, -10.842802047729492, -8.862558364868164, -6.882315635681152, -4.902071952819824, -2.921828269958496, -0.9415855407714844, 1.0386581420898438, 3.0188980102539062, 4.999141693115234, 6.979384899139404, 8.959628105163574, 10.939871788024902, 12.92011547088623, 14.900358200073242, 16.88060188293457, 18.8608455657959, 20.841089248657227, 22.821332931518555, 24.80157470703125, 26.781818389892578, 28.762062072753906, 30.742305755615234, 32.72254943847656, 34.70279312133789, 36.68303680419922, 38.66328048706055, 40.643524169921875, 42.6237678527832, 44.60401153564453, 46.584251403808594, 48.56449890136719, 50.54473876953125, 52.52498245239258, 54.505226135253906, 56.485469818115234, 58.46571350097656, 60.44595718383789, 62.42620086669922, 64.40644073486328, 66.38668823242188]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 10.0, 8.0, 12.0, 17.0, 18.0, 27.0, 23.0, 36.0, 35.0, 52.0, 48.0, 42.0, 56.0, 54.0, 56.0, 46.0, 44.0, 54.0, 48.0, 49.0, 43.0, 34.0, 39.0, 27.0, 20.0, 23.0, 16.0, 19.0, 6.0, 11.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-9.5859375, -9.3406982421875, -9.095458984375, -8.8502197265625, -8.60498046875, -8.3597412109375, -8.114501953125, -7.8692626953125, -7.6240234375, -7.3787841796875, -7.133544921875, -6.8883056640625, -6.64306640625, -6.3978271484375, -6.152587890625, -5.9073486328125, -5.662109375, -5.4168701171875, -5.171630859375, -4.9263916015625, -4.68115234375, -4.4359130859375, -4.190673828125, -3.9454345703125, -3.7001953125, -3.4549560546875, -3.209716796875, -2.9644775390625, -2.71923828125, -2.4739990234375, -2.228759765625, -1.9835205078125, -1.73828125, -1.4930419921875, -1.247802734375, -1.0025634765625, -0.75732421875, -0.5120849609375, -0.266845703125, -0.0216064453125, 0.2236328125, 0.4688720703125, 0.714111328125, 0.9593505859375, 1.20458984375, 1.4498291015625, 1.695068359375, 1.9403076171875, 2.185546875, 2.4307861328125, 2.676025390625, 2.9212646484375, 3.16650390625, 3.4117431640625, 3.656982421875, 3.9022216796875, 4.1474609375, 4.3927001953125, 4.637939453125, 4.8831787109375, 5.12841796875, 5.3736572265625, 5.618896484375, 5.8641357421875, 6.109375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 2.0, 12.0, 7.0, 11.0, 20.0, 22.0, 28.0, 42.0, 59.0, 88.0, 102.0, 219.0, 551.0, 1902.0, 10848.0, 202340.0, 3439011.0, 515077.0, 19791.0, 2797.0, 687.0, 235.0, 129.0, 72.0, 57.0, 30.0, 35.0, 24.0, 23.0, 14.0, 14.0, 9.0, 7.0, 3.0, 0.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-25.625, -24.96142578125, -24.2978515625, -23.63427734375, -22.970703125, -22.30712890625, -21.6435546875, -20.97998046875, -20.31640625, -19.65283203125, -18.9892578125, -18.32568359375, -17.662109375, -16.99853515625, -16.3349609375, -15.67138671875, -15.0078125, -14.34423828125, -13.6806640625, -13.01708984375, -12.353515625, -11.68994140625, -11.0263671875, -10.36279296875, -9.69921875, -9.03564453125, -8.3720703125, -7.70849609375, -7.044921875, -6.38134765625, -5.7177734375, -5.05419921875, -4.390625, -3.72705078125, -3.0634765625, -2.39990234375, -1.736328125, -1.07275390625, -0.4091796875, 0.25439453125, 0.91796875, 1.58154296875, 2.2451171875, 2.90869140625, 3.572265625, 4.23583984375, 4.8994140625, 5.56298828125, 6.2265625, 6.89013671875, 7.5537109375, 8.21728515625, 8.880859375, 9.54443359375, 10.2080078125, 10.87158203125, 11.53515625, 12.19873046875, 12.8623046875, 13.52587890625, 14.189453125, 14.85302734375, 15.5166015625, 16.18017578125, 16.84375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 10.0, 8.0, 5.0, 13.0, 18.0, 16.0, 28.0, 41.0, 45.0, 66.0, 76.0, 99.0, 150.0, 211.0, 318.0, 401.0, 535.0, 543.0, 374.0, 320.0, 202.0, 158.0, 101.0, 84.0, 48.0, 47.0, 32.0, 34.0, 23.0, 11.0, 18.0, 8.0, 5.0, 6.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6484375, -11.315185546875, -10.98193359375, -10.648681640625, -10.3154296875, -9.982177734375, -9.64892578125, -9.315673828125, -8.982421875, -8.649169921875, -8.31591796875, -7.982666015625, -7.6494140625, -7.316162109375, -6.98291015625, -6.649658203125, -6.31640625, -5.983154296875, -5.64990234375, -5.316650390625, -4.9833984375, -4.650146484375, -4.31689453125, -3.983642578125, -3.650390625, -3.317138671875, -2.98388671875, -2.650634765625, -2.3173828125, -1.984130859375, -1.65087890625, -1.317626953125, -0.984375, -0.651123046875, -0.31787109375, 0.015380859375, 0.3486328125, 0.681884765625, 1.01513671875, 1.348388671875, 1.681640625, 2.014892578125, 2.34814453125, 2.681396484375, 3.0146484375, 3.347900390625, 3.68115234375, 4.014404296875, 4.34765625, 4.680908203125, 5.01416015625, 5.347412109375, 5.6806640625, 6.013916015625, 6.34716796875, 6.680419921875, 7.013671875, 7.346923828125, 7.68017578125, 8.013427734375, 8.3466796875, 8.679931640625, 9.01318359375, 9.346435546875, 9.6796875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 20.0, 28.0, 34.0, 51.0, 61.0, 107.0, 132.0, 234.0, 311.0, 775.0, 7137.0, 2743921.0, 1434561.0, 5224.0, 669.0, 310.0, 195.0, 139.0, 114.0, 76.0, 50.0, 32.0, 27.0, 12.0, 21.0, 8.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.6875, -61.81201171875, -59.9365234375, -58.06103515625, -56.185546875, -54.31005859375, -52.4345703125, -50.55908203125, -48.68359375, -46.80810546875, -44.9326171875, -43.05712890625, -41.181640625, -39.30615234375, -37.4306640625, -35.55517578125, -33.6796875, -31.80419921875, -29.9287109375, -28.05322265625, -26.177734375, -24.30224609375, -22.4267578125, -20.55126953125, -18.67578125, -16.80029296875, -14.9248046875, -13.04931640625, -11.173828125, -9.29833984375, -7.4228515625, -5.54736328125, -3.671875, -1.79638671875, 0.0791015625, 1.95458984375, 3.830078125, 5.70556640625, 7.5810546875, 9.45654296875, 11.33203125, 13.20751953125, 15.0830078125, 16.95849609375, 18.833984375, 20.70947265625, 22.5849609375, 24.46044921875, 26.3359375, 28.21142578125, 30.0869140625, 31.96240234375, 33.837890625, 35.71337890625, 37.5888671875, 39.46435546875, 41.33984375, 43.21533203125, 45.0908203125, 46.96630859375, 48.841796875, 50.71728515625, 52.5927734375, 54.46826171875, 56.34375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 44.0, 302.0, 492.0, 151.0, 25.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-330.3089294433594, -323.46893310546875, -316.6289367675781, -309.7889099121094, -302.94891357421875, -296.1089172363281, -289.2689208984375, -282.4289245605469, -275.58892822265625, -268.7489318847656, -261.908935546875, -255.0689239501953, -248.22891235351562, -241.388916015625, -234.54891967773438, -227.70892333984375, -220.868896484375, -214.02890014648438, -207.1888885498047, -200.34889221191406, -193.50888061523438, -186.66888427734375, -179.82888793945312, -172.9888916015625, -166.1488800048828, -159.3088836669922, -152.4688720703125, -145.62887573242188, -138.78887939453125, -131.94886779785156, -125.10887145996094, -118.26886749267578, -111.42884826660156, -104.5888442993164, -97.74884033203125, -90.90884399414062, -84.06884002685547, -77.22883605957031, -70.38883972167969, -63.54883575439453, -56.708831787109375, -49.86882781982422, -43.02882766723633, -36.18882751464844, -29.34882354736328, -22.508819580078125, -15.668819427490234, -8.828819274902344, -1.9888153076171875, 4.851186752319336, 11.69118881225586, 18.531190872192383, 25.371192932128906, 32.21119689941406, 39.05119705200195, 45.891197204589844, 52.731201171875, 59.571205139160156, 66.41120910644531, 73.25120544433594, 80.0912094116211, 86.93121337890625, 93.77120971679688, 100.61121368408203, 107.45121765136719]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 2.0, 2.0, 11.0, 10.0, 8.0, 9.0, 16.0, 8.0, 25.0, 15.0, 22.0, 33.0, 28.0, 32.0, 34.0, 33.0, 32.0, 55.0, 45.0, 37.0, 30.0, 45.0, 49.0, 44.0, 54.0, 31.0, 35.0, 27.0, 36.0, 29.0, 22.0, 23.0, 23.0, 16.0, 13.0, 6.0, 14.0, 12.0, 6.0, 9.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-37.93328857421875, -36.80702590942383, -35.680763244628906, -34.55450439453125, -33.42824172973633, -32.301979064941406, -31.175716400146484, -30.049453735351562, -28.923192977905273, -27.79693031311035, -26.670669555664062, -25.54440689086914, -24.41814422607422, -23.29188346862793, -22.165620803833008, -21.03936004638672, -19.913097381591797, -18.786834716796875, -17.660573959350586, -16.534311294555664, -15.408049583435059, -14.281787872314453, -13.155525207519531, -12.029263496398926, -10.90300178527832, -9.776740074157715, -8.65047836303711, -7.5242156982421875, -6.397953987121582, -5.271692276000977, -4.145430088043213, -3.019167900085449, -1.8929061889648438, -0.7666442394256592, 0.3596177101135254, 1.48587965965271, 2.6121416091918945, 3.7384033203125, 4.864665508270264, 5.990927696228027, 7.117189407348633, 8.243451118469238, 9.369712829589844, 10.495975494384766, 11.622237205505371, 12.748498916625977, 13.874761581420898, 15.001023292541504, 16.12728500366211, 17.25354766845703, 18.37980842590332, 19.506071090698242, 20.63233184814453, 21.758594512939453, 22.884857177734375, 24.011119842529297, 25.137380599975586, 26.263643264770508, 27.389904022216797, 28.51616668701172, 29.64242935180664, 30.76869010925293, 31.89495277404785, 33.02121353149414, 34.14747619628906]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 9.0, 13.0, 11.0, 9.0, 20.0, 19.0, 23.0, 27.0, 32.0, 32.0, 35.0, 48.0, 44.0, 47.0, 51.0, 58.0, 41.0, 50.0, 55.0, 51.0, 40.0, 42.0, 35.0, 35.0, 32.0, 22.0, 21.0, 20.0, 15.0, 16.0, 10.0, 8.0, 5.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0390625, -7.81182861328125, -7.5845947265625, -7.35736083984375, -7.130126953125, -6.90289306640625, -6.6756591796875, -6.44842529296875, -6.22119140625, -5.99395751953125, -5.7667236328125, -5.53948974609375, -5.312255859375, -5.08502197265625, -4.8577880859375, -4.63055419921875, -4.4033203125, -4.17608642578125, -3.9488525390625, -3.72161865234375, -3.494384765625, -3.26715087890625, -3.0399169921875, -2.81268310546875, -2.58544921875, -2.35821533203125, -2.1309814453125, -1.90374755859375, -1.676513671875, -1.44927978515625, -1.2220458984375, -0.99481201171875, -0.767578125, -0.54034423828125, -0.3131103515625, -0.08587646484375, 0.141357421875, 0.36859130859375, 0.5958251953125, 0.82305908203125, 1.05029296875, 1.27752685546875, 1.5047607421875, 1.73199462890625, 1.959228515625, 2.18646240234375, 2.4136962890625, 2.64093017578125, 2.8681640625, 3.09539794921875, 3.3226318359375, 3.54986572265625, 3.777099609375, 4.00433349609375, 4.2315673828125, 4.45880126953125, 4.68603515625, 4.91326904296875, 5.1405029296875, 5.36773681640625, 5.594970703125, 5.82220458984375, 6.0494384765625, 6.27667236328125, 6.50390625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 9.0, 11.0, 23.0, 22.0, 38.0, 71.0, 92.0, 137.0, 245.0, 361.0, 579.0, 998.0, 1528.0, 2622.0, 4207.0, 7049.0, 11870.0, 20499.0, 36260.0, 68852.0, 152549.0, 330827.0, 213680.0, 89649.0, 45067.0, 25111.0, 14501.0, 8497.0, 5122.0, 3109.0, 1936.0, 1153.0, 733.0, 419.0, 262.0, 156.0, 109.0, 62.0, 50.0, 28.0, 20.0, 16.0, 7.0, 5.0, 8.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.304443359375, -0.29512786865234375, -0.2858123779296875, -0.27649688720703125, -0.267181396484375, -0.25786590576171875, -0.2485504150390625, -0.23923492431640625, -0.22991943359375, -0.22060394287109375, -0.2112884521484375, -0.20197296142578125, -0.192657470703125, -0.18334197998046875, -0.1740264892578125, -0.16471099853515625, -0.1553955078125, -0.14608001708984375, -0.1367645263671875, -0.12744903564453125, -0.118133544921875, -0.10881805419921875, -0.0995025634765625, -0.09018707275390625, -0.08087158203125, -0.07155609130859375, -0.0622406005859375, -0.05292510986328125, -0.043609619140625, -0.03429412841796875, -0.0249786376953125, -0.01566314697265625, -0.00634765625, 0.00296783447265625, 0.0122833251953125, 0.02159881591796875, 0.030914306640625, 0.04022979736328125, 0.0495452880859375, 0.05886077880859375, 0.06817626953125, 0.07749176025390625, 0.0868072509765625, 0.09612274169921875, 0.105438232421875, 0.11475372314453125, 0.1240692138671875, 0.13338470458984375, 0.1427001953125, 0.15201568603515625, 0.1613311767578125, 0.17064666748046875, 0.179962158203125, 0.18927764892578125, 0.1985931396484375, 0.20790863037109375, 0.21722412109375, 0.22653961181640625, 0.2358551025390625, 0.24517059326171875, 0.254486083984375, 0.26380157470703125, 0.2731170654296875, 0.28243255615234375, 0.291748046875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 7.0, 13.0, 12.0, 11.0, 14.0, 15.0, 24.0, 30.0, 35.0, 23.0, 21.0, 35.0, 41.0, 39.0, 36.0, 32.0, 30.0, 29.0, 1064.0, 41.0, 53.0, 51.0, 42.0, 33.0, 43.0, 27.0, 30.0, 27.0, 28.0, 10.0, 23.0, 14.0, 16.0, 14.0, 9.0, 8.0, 11.0, 7.0, 3.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.0078125, -3.88079833984375, -3.7537841796875, -3.62677001953125, -3.499755859375, -3.37274169921875, -3.2457275390625, -3.11871337890625, -2.99169921875, -2.86468505859375, -2.7376708984375, -2.61065673828125, -2.483642578125, -2.35662841796875, -2.2296142578125, -2.10260009765625, -1.9755859375, -1.84857177734375, -1.7215576171875, -1.59454345703125, -1.467529296875, -1.34051513671875, -1.2135009765625, -1.08648681640625, -0.95947265625, -0.83245849609375, -0.7054443359375, -0.57843017578125, -0.451416015625, -0.32440185546875, -0.1973876953125, -0.07037353515625, 0.056640625, 0.18365478515625, 0.3106689453125, 0.43768310546875, 0.564697265625, 0.69171142578125, 0.8187255859375, 0.94573974609375, 1.07275390625, 1.19976806640625, 1.3267822265625, 1.45379638671875, 1.580810546875, 1.70782470703125, 1.8348388671875, 1.96185302734375, 2.0888671875, 2.21588134765625, 2.3428955078125, 2.46990966796875, 2.596923828125, 2.72393798828125, 2.8509521484375, 2.97796630859375, 3.10498046875, 3.23199462890625, 3.3590087890625, 3.48602294921875, 3.613037109375, 3.74005126953125, 3.8670654296875, 3.99407958984375, 4.12109375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 4.0, 10.0, 15.0, 24.0, 40.0, 40.0, 65.0, 84.0, 140.0, 215.0, 316.0, 386.0, 601.0, 880.0, 1273.0, 1919.0, 2868.0, 4159.0, 6211.0, 9432.0, 14605.0, 22616.0, 35478.0, 59789.0, 107632.0, 214059.0, 1297886.0, 131224.0, 70331.0, 41079.0, 25422.0, 16409.0, 10515.0, 6864.0, 4715.0, 3084.0, 2166.0, 1445.0, 955.0, 686.0, 457.0, 330.0, 204.0, 147.0, 112.0, 84.0, 50.0, 35.0, 18.0, 18.0, 11.0, 8.0, 3.0, 8.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.2301025390625, -0.2229442596435547, -0.21578598022460938, -0.20862770080566406, -0.20146942138671875, -0.19431114196777344, -0.18715286254882812, -0.1799945831298828, -0.1728363037109375, -0.1656780242919922, -0.15851974487304688, -0.15136146545410156, -0.14420318603515625, -0.13704490661621094, -0.12988662719726562, -0.12272834777832031, -0.115570068359375, -0.10841178894042969, -0.10125350952148438, -0.09409523010253906, -0.08693695068359375, -0.07977867126464844, -0.07262039184570312, -0.06546211242675781, -0.0583038330078125, -0.05114555358886719, -0.043987274169921875, -0.03682899475097656, -0.02967071533203125, -0.022512435913085938, -0.015354156494140625, -0.008195877075195312, -0.00103759765625, 0.0061206817626953125, 0.013278961181640625, 0.020437240600585938, 0.02759552001953125, 0.03475379943847656, 0.041912078857421875, 0.04907035827636719, 0.0562286376953125, 0.06338691711425781, 0.07054519653320312, 0.07770347595214844, 0.08486175537109375, 0.09202003479003906, 0.09917831420898438, 0.10633659362792969, 0.113494873046875, 0.12065315246582031, 0.12781143188476562, 0.13496971130371094, 0.14212799072265625, 0.14928627014160156, 0.15644454956054688, 0.1636028289794922, 0.1707611083984375, 0.1779193878173828, 0.18507766723632812, 0.19223594665527344, 0.19939422607421875, 0.20655250549316406, 0.21371078491210938, 0.2208690643310547, 0.22802734375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 2.0, 5.0, 7.0, 11.0, 4.0, 6.0, 14.0, 23.0, 22.0, 36.0, 37.0, 24.0, 43.0, 39.0, 58.0, 63.0, 75.0, 61.0, 45.0, 58.0, 48.0, 55.0, 41.0, 35.0, 30.0, 29.0, 32.0, 20.0, 14.0, 11.0, 9.0, 10.0, 7.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.2378902435302734e-05, -4.1116029024124146e-05, -3.985315561294556e-05, -3.859028220176697e-05, -3.732740879058838e-05, -3.606453537940979e-05, -3.48016619682312e-05, -3.353878855705261e-05, -3.2275915145874023e-05, -3.1013041734695435e-05, -2.9750168323516846e-05, -2.8487294912338257e-05, -2.7224421501159668e-05, -2.596154808998108e-05, -2.469867467880249e-05, -2.34358012676239e-05, -2.2172927856445312e-05, -2.0910054445266724e-05, -1.9647181034088135e-05, -1.8384307622909546e-05, -1.7121434211730957e-05, -1.5858560800552368e-05, -1.459568738937378e-05, -1.333281397819519e-05, -1.2069940567016602e-05, -1.0807067155838013e-05, -9.544193744659424e-06, -8.281320333480835e-06, -7.018446922302246e-06, -5.755573511123657e-06, -4.492700099945068e-06, -3.2298266887664795e-06, -1.9669532775878906e-06, -7.040798664093018e-07, 5.587935447692871e-07, 1.821666955947876e-06, 3.084540367126465e-06, 4.347413778305054e-06, 5.610287189483643e-06, 6.8731606006622314e-06, 8.13603401184082e-06, 9.39890742301941e-06, 1.0661780834197998e-05, 1.1924654245376587e-05, 1.3187527656555176e-05, 1.4450401067733765e-05, 1.5713274478912354e-05, 1.6976147890090942e-05, 1.823902130126953e-05, 1.950189471244812e-05, 2.076476812362671e-05, 2.2027641534805298e-05, 2.3290514945983887e-05, 2.4553388357162476e-05, 2.5816261768341064e-05, 2.7079135179519653e-05, 2.8342008590698242e-05, 2.960488200187683e-05, 3.086775541305542e-05, 3.213062882423401e-05, 3.33935022354126e-05, 3.4656375646591187e-05, 3.5919249057769775e-05, 3.7182122468948364e-05, 3.844499588012695e-05]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 5.0, 6.0, 14.0, 23.0, 13.0, 22.0, 38.0, 27.0, 39.0, 64.0, 64.0, 102.0, 170.0, 276.0, 716.0, 18931.0, 1020895.0, 5747.0, 580.0, 251.0, 140.0, 98.0, 71.0, 46.0, 44.0, 35.0, 27.0, 29.0, 11.0, 12.0, 5.0, 7.0, 8.0, 7.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00077056884765625, -0.0007452294230461121, -0.0007198899984359741, -0.0006945505738258362, -0.0006692111492156982, -0.0006438717246055603, -0.0006185322999954224, -0.0005931928753852844, -0.0005678534507751465, -0.0005425140261650085, -0.0005171746015548706, -0.0004918351769447327, -0.0004664957523345947, -0.0004411563277244568, -0.00041581690311431885, -0.0003904774785041809, -0.00036513805389404297, -0.00033979862928390503, -0.0003144592046737671, -0.00028911978006362915, -0.0002637803554534912, -0.00023844093084335327, -0.00021310150623321533, -0.0001877620816230774, -0.00016242265701293945, -0.00013708323240280151, -0.00011174380779266357, -8.640438318252563e-05, -6.10649585723877e-05, -3.5725533962249756e-05, -1.0386109352111816e-05, 1.4953315258026123e-05, 4.029273986816406e-05, 6.5632164478302e-05, 9.097158908843994e-05, 0.00011631101369857788, 0.00014165043830871582, 0.00016698986291885376, 0.0001923292875289917, 0.00021766871213912964, 0.00024300813674926758, 0.0002683475613594055, 0.00029368698596954346, 0.0003190264105796814, 0.00034436583518981934, 0.0003697052597999573, 0.0003950446844100952, 0.00042038410902023315, 0.0004457235336303711, 0.00047106295824050903, 0.000496402382850647, 0.0005217418074607849, 0.0005470812320709229, 0.0005724206566810608, 0.0005977600812911987, 0.0006230995059013367, 0.0006484389305114746, 0.0006737783551216125, 0.0006991177797317505, 0.0007244572043418884, 0.0007497966289520264, 0.0007751360535621643, 0.0008004754781723022, 0.0008258149027824402, 0.0008511543273925781]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 32.0, 72.0, 176.0, 233.0, 241.0, 157.0, 53.0, 28.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.698783883824944e-05, -7.534477481385693e-05, -7.370171078946441e-05, -7.205865404102951e-05, -7.0415590016637e-05, -6.877252599224448e-05, -6.712946196785197e-05, -6.548639794345945e-05, -6.384334119502455e-05, -6.220027717063203e-05, -6.0557216784218326e-05, -5.891415275982581e-05, -5.72710923734121e-05, -5.562802834901959e-05, -5.398496432462707e-05, -5.234190393821336e-05, -5.069883627584204e-05, -4.9055772251449525e-05, -4.741271186503582e-05, -4.57696478406433e-05, -4.412658745422959e-05, -4.248352342983708e-05, -4.084045940544456e-05, -3.9197399019030854e-05, -3.7554338632617146e-05, -3.591127460822463e-05, -3.426821422181092e-05, -3.2625150197418407e-05, -3.09820898110047e-05, -2.9339025786612183e-05, -2.769596358120907e-05, -2.605290137580596e-05, -2.4409839170402847e-05, -2.2766776964999735e-05, -2.1123714759596623e-05, -1.948065255419351e-05, -1.7837588529800996e-05, -1.6194526324397884e-05, -1.4551464118994772e-05, -1.2908401004096959e-05, -1.1265338798693847e-05, -9.622276593290735e-06, -7.979213478392921e-06, -6.3361512729898095e-06, -4.693088612839347e-06, -3.050025952688884e-06, -1.4069637472857721e-06, 2.3609936761204153e-07, 1.8791615730151534e-06, 3.522224233165616e-06, 5.165286893316079e-06, 6.808349098719191e-06, 8.451412213617004e-06, 1.0094474419020116e-05, 1.1737536624423228e-05, 1.3380599739321042e-05, 1.5023661944724154e-05, 1.6666725059621967e-05, 1.830978726502508e-05, 1.995284947042819e-05, 2.1595911675831303e-05, 2.323897570022382e-05, 2.4882036086637527e-05, 2.6525100111030042e-05, 2.8168162316433154e-05]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 3.0, 4.0, 5.0, 12.0, 9.0, 8.0, 11.0, 17.0, 13.0, 17.0, 20.0, 24.0, 33.0, 26.0, 35.0, 42.0, 43.0, 36.0, 42.0, 41.0, 41.0, 32.0, 37.0, 33.0, 36.0, 42.0, 34.0, 41.0, 28.0, 26.0, 36.0, 24.0, 24.0, 23.0, 22.0, 16.0, 16.0, 9.0, 10.0, 9.0, 5.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9729137420654297e-05, -1.9066035747528076e-05, -1.8402934074401855e-05, -1.7739832401275635e-05, -1.7076730728149414e-05, -1.6413629055023193e-05, -1.5750527381896973e-05, -1.5087425708770752e-05, -1.4424324035644531e-05, -1.376122236251831e-05, -1.309812068939209e-05, -1.2435019016265869e-05, -1.1771917343139648e-05, -1.1108815670013428e-05, -1.0445713996887207e-05, -9.782612323760986e-06, -9.119510650634766e-06, -8.456408977508545e-06, -7.793307304382324e-06, -7.1302056312561035e-06, -6.467103958129883e-06, -5.804002285003662e-06, -5.140900611877441e-06, -4.477798938751221e-06, -3.814697265625e-06, -3.1515955924987793e-06, -2.4884939193725586e-06, -1.8253922462463379e-06, -1.1622905731201172e-06, -4.991888999938965e-07, 1.6391277313232422e-07, 8.270144462585449e-07, 1.4901161193847656e-06, 2.1532177925109863e-06, 2.816319465637207e-06, 3.4794211387634277e-06, 4.1425228118896484e-06, 4.805624485015869e-06, 5.46872615814209e-06, 6.1318278312683105e-06, 6.794929504394531e-06, 7.458031177520752e-06, 8.121132850646973e-06, 8.784234523773193e-06, 9.447336196899414e-06, 1.0110437870025635e-05, 1.0773539543151855e-05, 1.1436641216278076e-05, 1.2099742889404297e-05, 1.2762844562530518e-05, 1.3425946235656738e-05, 1.4089047908782959e-05, 1.475214958190918e-05, 1.54152512550354e-05, 1.607835292816162e-05, 1.6741454601287842e-05, 1.7404556274414062e-05, 1.8067657947540283e-05, 1.8730759620666504e-05, 1.9393861293792725e-05, 2.0056962966918945e-05, 2.0720064640045166e-05, 2.1383166313171387e-05, 2.2046267986297607e-05, 2.2709369659423828e-05]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 9.0, 13.0, 11.0, 9.0, 20.0, 19.0, 23.0, 27.0, 32.0, 32.0, 35.0, 48.0, 44.0, 47.0, 51.0, 58.0, 41.0, 50.0, 55.0, 51.0, 40.0, 42.0, 35.0, 35.0, 32.0, 22.0, 21.0, 20.0, 15.0, 16.0, 10.0, 8.0, 5.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0390625, -7.81182861328125, -7.5845947265625, -7.35736083984375, -7.130126953125, -6.90289306640625, -6.6756591796875, -6.44842529296875, -6.22119140625, -5.99395751953125, -5.7667236328125, -5.53948974609375, -5.312255859375, -5.08502197265625, -4.8577880859375, -4.63055419921875, -4.4033203125, -4.17608642578125, -3.9488525390625, -3.72161865234375, -3.494384765625, -3.26715087890625, -3.0399169921875, -2.81268310546875, -2.58544921875, -2.35821533203125, -2.1309814453125, -1.90374755859375, -1.676513671875, -1.44927978515625, -1.2220458984375, -0.99481201171875, -0.767578125, -0.54034423828125, -0.3131103515625, -0.08587646484375, 0.141357421875, 0.36859130859375, 0.5958251953125, 0.82305908203125, 1.05029296875, 1.27752685546875, 1.5047607421875, 1.73199462890625, 1.959228515625, 2.18646240234375, 2.4136962890625, 2.64093017578125, 2.8681640625, 3.09539794921875, 3.3226318359375, 3.54986572265625, 3.777099609375, 4.00433349609375, 4.2315673828125, 4.45880126953125, 4.68603515625, 4.91326904296875, 5.1405029296875, 5.36773681640625, 5.594970703125, 5.82220458984375, 6.0494384765625, 6.27667236328125, 6.50390625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 9.0, 11.0, 18.0, 20.0, 32.0, 40.0, 60.0, 64.0, 98.0, 145.0, 216.0, 415.0, 753.0, 1561.0, 3498.0, 8757.0, 26094.0, 95301.0, 468030.0, 338655.0, 71256.0, 20566.0, 7041.0, 2897.0, 1299.0, 675.0, 357.0, 210.0, 136.0, 77.0, 70.0, 38.0, 34.0, 34.0, 18.0, 17.0, 13.0, 10.0, 6.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0], "bins": [-7.2265625, -7.01947021484375, -6.8123779296875, -6.60528564453125, -6.398193359375, -6.19110107421875, -5.9840087890625, -5.77691650390625, -5.56982421875, -5.36273193359375, -5.1556396484375, -4.94854736328125, -4.741455078125, -4.53436279296875, -4.3272705078125, -4.12017822265625, -3.9130859375, -3.70599365234375, -3.4989013671875, -3.29180908203125, -3.084716796875, -2.87762451171875, -2.6705322265625, -2.46343994140625, -2.25634765625, -2.04925537109375, -1.8421630859375, -1.63507080078125, -1.427978515625, -1.22088623046875, -1.0137939453125, -0.80670166015625, -0.599609375, -0.39251708984375, -0.1854248046875, 0.02166748046875, 0.228759765625, 0.43585205078125, 0.6429443359375, 0.85003662109375, 1.05712890625, 1.26422119140625, 1.4713134765625, 1.67840576171875, 1.885498046875, 2.09259033203125, 2.2996826171875, 2.50677490234375, 2.7138671875, 2.92095947265625, 3.1280517578125, 3.33514404296875, 3.542236328125, 3.74932861328125, 3.9564208984375, 4.16351318359375, 4.37060546875, 4.57769775390625, 4.7847900390625, 4.99188232421875, 5.198974609375, 5.40606689453125, 5.6131591796875, 5.82025146484375, 6.02734375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 2.0, 2.0, 9.0, 2.0, 14.0, 14.0, 10.0, 18.0, 25.0, 24.0, 34.0, 29.0, 29.0, 35.0, 43.0, 58.0, 62.0, 91.0, 371.0, 1642.0, 123.0, 52.0, 55.0, 53.0, 41.0, 35.0, 33.0, 23.0, 25.0, 16.0, 12.0, 10.0, 11.0, 8.0, 9.0, 8.0, 6.0, 9.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.15625, -26.424560546875, -25.69287109375, -24.961181640625, -24.2294921875, -23.497802734375, -22.76611328125, -22.034423828125, -21.302734375, -20.571044921875, -19.83935546875, -19.107666015625, -18.3759765625, -17.644287109375, -16.91259765625, -16.180908203125, -15.44921875, -14.717529296875, -13.98583984375, -13.254150390625, -12.5224609375, -11.790771484375, -11.05908203125, -10.327392578125, -9.595703125, -8.864013671875, -8.13232421875, -7.400634765625, -6.6689453125, -5.937255859375, -5.20556640625, -4.473876953125, -3.7421875, -3.010498046875, -2.27880859375, -1.547119140625, -0.8154296875, -0.083740234375, 0.64794921875, 1.379638671875, 2.111328125, 2.843017578125, 3.57470703125, 4.306396484375, 5.0380859375, 5.769775390625, 6.50146484375, 7.233154296875, 7.96484375, 8.696533203125, 9.42822265625, 10.159912109375, 10.8916015625, 11.623291015625, 12.35498046875, 13.086669921875, 13.818359375, 14.550048828125, 15.28173828125, 16.013427734375, 16.7451171875, 17.476806640625, 18.20849609375, 18.940185546875, 19.671875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 8.0, 12.0, 8.0, 14.0, 8.0, 14.0, 21.0, 25.0, 39.0, 45.0, 53.0, 77.0, 102.0, 139.0, 198.0, 318.0, 641.0, 3366.0, 2494593.0, 641850.0, 2504.0, 580.0, 304.0, 187.0, 141.0, 101.0, 69.0, 66.0, 53.0, 40.0, 31.0, 20.0, 22.0, 16.0, 8.0, 12.0, 4.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.0, -38.515625, -37.03125, -35.546875, -34.0625, -32.578125, -31.09375, -29.609375, -28.125, -26.640625, -25.15625, -23.671875, -22.1875, -20.703125, -19.21875, -17.734375, -16.25, -14.765625, -13.28125, -11.796875, -10.3125, -8.828125, -7.34375, -5.859375, -4.375, -2.890625, -1.40625, 0.078125, 1.5625, 3.046875, 4.53125, 6.015625, 7.5, 8.984375, 10.46875, 11.953125, 13.4375, 14.921875, 16.40625, 17.890625, 19.375, 20.859375, 22.34375, 23.828125, 25.3125, 26.796875, 28.28125, 29.765625, 31.25, 32.734375, 34.21875, 35.703125, 37.1875, 38.671875, 40.15625, 41.640625, 43.125, 44.609375, 46.09375, 47.578125, 49.0625, 50.546875, 52.03125, 53.515625, 55.0]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 143.0, 718.0, 148.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-223.02232360839844, -219.00196838378906, -214.98162841796875, -210.96127319335938, -206.94091796875, -202.9205780029297, -198.9002227783203, -194.8798828125, -190.85952758789062, -186.83917236328125, -182.81883239746094, -178.79847717285156, -174.77813720703125, -170.75778198242188, -166.7374267578125, -162.7170867919922, -158.6967315673828, -154.67637634277344, -150.65603637695312, -146.63568115234375, -142.61532592773438, -138.59498596191406, -134.5746307373047, -130.55429077148438, -126.533935546875, -122.51358795166016, -118.49324035644531, -114.47288513183594, -110.4525375366211, -106.43218994140625, -102.41183471679688, -98.39148712158203, -94.37115478515625, -90.3508071899414, -86.33045959472656, -82.31010437011719, -78.28975677490234, -74.2694091796875, -70.24905395507812, -66.22870635986328, -62.20835494995117, -58.18800354003906, -54.16765594482422, -50.147308349609375, -46.126956939697266, -42.106605529785156, -38.08625793457031, -34.06591033935547, -30.04555892944336, -26.025209426879883, -22.004859924316406, -17.98451042175293, -13.964160919189453, -9.943811416625977, -5.9234619140625, -1.9031124114990234, 2.117237091064453, 6.13758659362793, 10.157936096191406, 14.178285598754883, 18.19863510131836, 22.218984603881836, 26.239334106445312, 30.25968360900879, 34.280033111572266]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 4.0, 8.0, 5.0, 11.0, 11.0, 10.0, 18.0, 20.0, 20.0, 22.0, 16.0, 24.0, 25.0, 31.0, 35.0, 36.0, 49.0, 47.0, 50.0, 48.0, 48.0, 45.0, 40.0, 42.0, 32.0, 38.0, 33.0, 28.0, 25.0, 28.0, 25.0, 19.0, 19.0, 18.0, 7.0, 4.0, 12.0, 10.0, 5.0, 9.0, 2.0, 5.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-60.959716796875, -59.0357666015625, -57.111820220947266, -55.187870025634766, -53.26392364501953, -51.33997344970703, -49.41602325439453, -47.4920768737793, -45.56813049316406, -43.64418029785156, -41.72023391723633, -39.79628372192383, -37.872337341308594, -35.948387145996094, -34.024436950683594, -32.10049057006836, -30.17654037475586, -28.252592086791992, -26.328643798828125, -24.404693603515625, -22.48074722290039, -20.55679702758789, -18.632848739624023, -16.708900451660156, -14.784952163696289, -12.861003875732422, -10.937055587768555, -9.013106346130371, -7.089158058166504, -5.165209770202637, -3.241260528564453, -1.317312240600586, 0.6066360473632812, 2.5305845737457275, 4.454533100128174, 6.378481864929199, 8.302430152893066, 10.226378440856934, 12.150327682495117, 14.074275970458984, 15.998224258422852, 17.92217254638672, 19.846120834350586, 21.770069122314453, 23.694019317626953, 25.617965698242188, 27.541915893554688, 29.465864181518555, 31.389812469482422, 33.31376266479492, 35.237709045410156, 37.161659240722656, 39.08560562133789, 41.00955581665039, 42.933502197265625, 44.857452392578125, 46.781402587890625, 48.705352783203125, 50.62929916381836, 52.55324935913086, 54.477195739746094, 56.401145935058594, 58.325096130371094, 60.24904251098633, 62.17298889160156]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 5.0, 9.0, 13.0, 13.0, 11.0, 20.0, 19.0, 21.0, 24.0, 30.0, 30.0, 37.0, 43.0, 47.0, 40.0, 50.0, 58.0, 44.0, 38.0, 48.0, 54.0, 41.0, 43.0, 42.0, 35.0, 29.0, 29.0, 26.0, 20.0, 19.0, 9.0, 11.0, 8.0, 11.0, 5.0, 5.0, 1.0, 2.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.96502685546875, -7.7347412109375, -7.50445556640625, -7.274169921875, -7.04388427734375, -6.8135986328125, -6.58331298828125, -6.35302734375, -6.12274169921875, -5.8924560546875, -5.66217041015625, -5.431884765625, -5.20159912109375, -4.9713134765625, -4.74102783203125, -4.5107421875, -4.28045654296875, -4.0501708984375, -3.81988525390625, -3.589599609375, -3.35931396484375, -3.1290283203125, -2.89874267578125, -2.66845703125, -2.43817138671875, -2.2078857421875, -1.97760009765625, -1.747314453125, -1.51702880859375, -1.2867431640625, -1.05645751953125, -0.826171875, -0.59588623046875, -0.3656005859375, -0.13531494140625, 0.094970703125, 0.32525634765625, 0.5555419921875, 0.78582763671875, 1.01611328125, 1.24639892578125, 1.4766845703125, 1.70697021484375, 1.937255859375, 2.16754150390625, 2.3978271484375, 2.62811279296875, 2.8583984375, 3.08868408203125, 3.3189697265625, 3.54925537109375, 3.779541015625, 4.00982666015625, 4.2401123046875, 4.47039794921875, 4.70068359375, 4.93096923828125, 5.1612548828125, 5.39154052734375, 5.621826171875, 5.85211181640625, 6.0823974609375, 6.31268310546875, 6.54296875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 7.0, 6.0, 11.0, 4.0, 14.0, 16.0, 16.0, 35.0, 41.0, 46.0, 77.0, 109.0, 158.0, 277.0, 572.0, 1448.0, 5172.0, 32618.0, 647015.0, 3230400.0, 251620.0, 18931.0, 3505.0, 1025.0, 437.0, 210.0, 145.0, 109.0, 54.0, 52.0, 37.0, 25.0, 27.0, 12.0, 9.0, 7.0, 10.0, 6.0, 5.0, 2.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.765625, -20.178466796875, -19.59130859375, -19.004150390625, -18.4169921875, -17.829833984375, -17.24267578125, -16.655517578125, -16.068359375, -15.481201171875, -14.89404296875, -14.306884765625, -13.7197265625, -13.132568359375, -12.54541015625, -11.958251953125, -11.37109375, -10.783935546875, -10.19677734375, -9.609619140625, -9.0224609375, -8.435302734375, -7.84814453125, -7.260986328125, -6.673828125, -6.086669921875, -5.49951171875, -4.912353515625, -4.3251953125, -3.738037109375, -3.15087890625, -2.563720703125, -1.9765625, -1.389404296875, -0.80224609375, -0.215087890625, 0.3720703125, 0.959228515625, 1.54638671875, 2.133544921875, 2.720703125, 3.307861328125, 3.89501953125, 4.482177734375, 5.0693359375, 5.656494140625, 6.24365234375, 6.830810546875, 7.41796875, 8.005126953125, 8.59228515625, 9.179443359375, 9.7666015625, 10.353759765625, 10.94091796875, 11.528076171875, 12.115234375, 12.702392578125, 13.28955078125, 13.876708984375, 14.4638671875, 15.051025390625, 15.63818359375, 16.225341796875, 16.8125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 10.0, 23.0, 19.0, 46.0, 67.0, 109.0, 171.0, 344.0, 625.0, 948.0, 732.0, 426.0, 232.0, 133.0, 75.0, 37.0, 22.0, 20.0, 18.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.984375, -28.3499755859375, -27.715576171875, -27.0811767578125, -26.44677734375, -25.8123779296875, -25.177978515625, -24.5435791015625, -23.9091796875, -23.2747802734375, -22.640380859375, -22.0059814453125, -21.37158203125, -20.7371826171875, -20.102783203125, -19.4683837890625, -18.833984375, -18.1995849609375, -17.565185546875, -16.9307861328125, -16.29638671875, -15.6619873046875, -15.027587890625, -14.3931884765625, -13.7587890625, -13.1243896484375, -12.489990234375, -11.8555908203125, -11.22119140625, -10.5867919921875, -9.952392578125, -9.3179931640625, -8.68359375, -8.0491943359375, -7.414794921875, -6.7803955078125, -6.14599609375, -5.5115966796875, -4.877197265625, -4.2427978515625, -3.6083984375, -2.9739990234375, -2.339599609375, -1.7052001953125, -1.07080078125, -0.4364013671875, 0.197998046875, 0.8323974609375, 1.466796875, 2.1011962890625, 2.735595703125, 3.3699951171875, 4.00439453125, 4.6387939453125, 5.273193359375, 5.9075927734375, 6.5419921875, 7.1763916015625, 7.810791015625, 8.4451904296875, 9.07958984375, 9.7139892578125, 10.348388671875, 10.9827880859375, 11.6171875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 21.0, 15.0, 28.0, 84.0, 140.0, 240.0, 457.0, 2851.0, 3429290.0, 758325.0, 1863.0, 452.0, 209.0, 139.0, 74.0, 47.0, 21.0, 13.0, 9.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.78125, -55.31005859375, -51.8388671875, -48.36767578125, -44.896484375, -41.42529296875, -37.9541015625, -34.48291015625, -31.01171875, -27.54052734375, -24.0693359375, -20.59814453125, -17.126953125, -13.65576171875, -10.1845703125, -6.71337890625, -3.2421875, 0.22900390625, 3.7001953125, 7.17138671875, 10.642578125, 14.11376953125, 17.5849609375, 21.05615234375, 24.52734375, 27.99853515625, 31.4697265625, 34.94091796875, 38.412109375, 41.88330078125, 45.3544921875, 48.82568359375, 52.296875, 55.76806640625, 59.2392578125, 62.71044921875, 66.181640625, 69.65283203125, 73.1240234375, 76.59521484375, 80.06640625, 83.53759765625, 87.0087890625, 90.47998046875, 93.951171875, 97.42236328125, 100.8935546875, 104.36474609375, 107.8359375, 111.30712890625, 114.7783203125, 118.24951171875, 121.720703125, 125.19189453125, 128.6630859375, 132.13427734375, 135.60546875, 139.07666015625, 142.5478515625, 146.01904296875, 149.490234375, 152.96142578125, 156.4326171875, 159.90380859375, 163.375]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 11.0, 57.0, 77.0, 133.0, 226.0, 200.0, 148.0, 84.0, 32.0, 17.0, 11.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.05828094482422, -93.15733337402344, -90.25639343261719, -87.3554458618164, -84.45449829101562, -81.55355072021484, -78.65260314941406, -75.75166320800781, -72.85071563720703, -69.94976806640625, -67.048828125, -64.14788055419922, -61.24693298339844, -58.345985412597656, -55.44504165649414, -52.544097900390625, -49.643150329589844, -46.74220275878906, -43.84125900268555, -40.94031524658203, -38.03936767578125, -35.13842010498047, -32.23747634887695, -29.336530685424805, -26.435585021972656, -23.534639358520508, -20.63369369506836, -17.73274803161621, -14.831802368164062, -11.930856704711914, -9.029911041259766, -6.128965377807617, -3.22802734375, -0.32708168029785156, 2.573863983154297, 5.474809646606445, 8.375755310058594, 11.276700973510742, 14.17764663696289, 17.07859230041504, 19.979537963867188, 22.880483627319336, 25.781429290771484, 28.682374954223633, 31.58332061767578, 34.48426818847656, 37.38521194458008, 40.286155700683594, 43.187103271484375, 46.088050842285156, 48.98899459838867, 51.88993835449219, 54.79088592529297, 57.69183349609375, 60.592777252197266, 63.49372100830078, 66.39466857910156, 69.29561614990234, 72.19656372070312, 75.09750366210938, 77.99845123291016, 80.89939880371094, 83.80033874511719, 86.70128631591797, 89.60223388671875]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 8.0, 5.0, 5.0, 3.0, 10.0, 12.0, 19.0, 15.0, 22.0, 21.0, 13.0, 33.0, 31.0, 26.0, 30.0, 39.0, 36.0, 32.0, 35.0, 40.0, 40.0, 46.0, 42.0, 33.0, 37.0, 48.0, 35.0, 28.0, 29.0, 30.0, 23.0, 24.0, 27.0, 17.0, 20.0, 13.0, 12.0, 10.0, 12.0, 8.0, 9.0, 4.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-36.830474853515625, -35.69522476196289, -34.559974670410156, -33.424720764160156, -32.28947067260742, -31.154220581054688, -30.018970489501953, -28.883718490600586, -27.74846649169922, -26.613216400146484, -25.477964401245117, -24.342714309692383, -23.207462310791016, -22.07221221923828, -20.936962127685547, -19.80171012878418, -18.666460037231445, -17.53120994567871, -16.395957946777344, -15.26070785522461, -14.125455856323242, -12.990205764770508, -11.854954719543457, -10.719703674316406, -9.584452629089355, -8.449201583862305, -7.313950538635254, -6.178699970245361, -5.0434489250183105, -3.9081978797912598, -2.772947311401367, -1.6376962661743164, -0.5024452209472656, 0.6328057050704956, 1.7680566310882568, 2.9033074378967285, 4.038558483123779, 5.17380952835083, 6.309060096740723, 7.444311141967773, 8.579562187194824, 9.714813232421875, 10.850064277648926, 11.985315322875977, 13.120565414428711, 14.255817413330078, 15.391067504882812, 16.526317596435547, 17.661569595336914, 18.79681968688965, 19.932071685791016, 21.06732177734375, 22.202573776245117, 23.33782386779785, 24.47307586669922, 25.608325958251953, 26.743576049804688, 27.878826141357422, 29.01407814025879, 30.149328231811523, 31.28458023071289, 32.419830322265625, 33.55508041381836, 34.690330505371094, 35.825584411621094]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 6.0, 6.0, 2.0, 10.0, 7.0, 13.0, 17.0, 16.0, 23.0, 26.0, 25.0, 22.0, 25.0, 50.0, 37.0, 56.0, 55.0, 46.0, 37.0, 55.0, 65.0, 51.0, 36.0, 40.0, 42.0, 36.0, 29.0, 20.0, 33.0, 24.0, 22.0, 17.0, 20.0, 12.0, 8.0, 5.0, 2.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.6368408203125, -8.398681640625, -8.1605224609375, -7.92236328125, -7.6842041015625, -7.446044921875, -7.2078857421875, -6.9697265625, -6.7315673828125, -6.493408203125, -6.2552490234375, -6.01708984375, -5.7789306640625, -5.540771484375, -5.3026123046875, -5.064453125, -4.8262939453125, -4.588134765625, -4.3499755859375, -4.11181640625, -3.8736572265625, -3.635498046875, -3.3973388671875, -3.1591796875, -2.9210205078125, -2.682861328125, -2.4447021484375, -2.20654296875, -1.9683837890625, -1.730224609375, -1.4920654296875, -1.25390625, -1.0157470703125, -0.777587890625, -0.5394287109375, -0.30126953125, -0.0631103515625, 0.175048828125, 0.4132080078125, 0.6513671875, 0.8895263671875, 1.127685546875, 1.3658447265625, 1.60400390625, 1.8421630859375, 2.080322265625, 2.3184814453125, 2.556640625, 2.7947998046875, 3.032958984375, 3.2711181640625, 3.50927734375, 3.7474365234375, 3.985595703125, 4.2237548828125, 4.4619140625, 4.7000732421875, 4.938232421875, 5.1763916015625, 5.41455078125, 5.6527099609375, 5.890869140625, 6.1290283203125, 6.3671875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 10.0, 12.0, 35.0, 29.0, 48.0, 81.0, 140.0, 229.0, 364.0, 621.0, 1012.0, 1821.0, 2994.0, 5055.0, 8780.0, 15101.0, 26345.0, 49080.0, 99237.0, 247104.0, 321406.0, 131563.0, 61431.0, 32540.0, 18370.0, 10308.0, 6177.0, 3521.0, 2030.0, 1213.0, 703.0, 459.0, 299.0, 154.0, 88.0, 55.0, 45.0, 24.0, 19.0, 13.0, 8.0, 6.0, 9.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.31591796875, -0.3057823181152344, -0.29564666748046875, -0.2855110168457031, -0.2753753662109375, -0.2652397155761719, -0.25510406494140625, -0.24496841430664062, -0.234832763671875, -0.22469711303710938, -0.21456146240234375, -0.20442581176757812, -0.1942901611328125, -0.18415451049804688, -0.17401885986328125, -0.16388320922851562, -0.15374755859375, -0.14361190795898438, -0.13347625732421875, -0.12334060668945312, -0.1132049560546875, -0.10306930541992188, -0.09293365478515625, -0.08279800415039062, -0.072662353515625, -0.06252670288085938, -0.05239105224609375, -0.042255401611328125, -0.0321197509765625, -0.021984100341796875, -0.01184844970703125, -0.001712799072265625, 0.0084228515625, 0.018558502197265625, 0.02869415283203125, 0.038829803466796875, 0.0489654541015625, 0.059101104736328125, 0.06923675537109375, 0.07937240600585938, 0.089508056640625, 0.09964370727539062, 0.10977935791015625, 0.11991500854492188, 0.1300506591796875, 0.14018630981445312, 0.15032196044921875, 0.16045761108398438, 0.17059326171875, 0.18072891235351562, 0.19086456298828125, 0.20100021362304688, 0.2111358642578125, 0.22127151489257812, 0.23140716552734375, 0.24154281616210938, 0.251678466796875, 0.2618141174316406, 0.27194976806640625, 0.2820854187011719, 0.2922210693359375, 0.3023567199707031, 0.31249237060546875, 0.3226280212402344, 0.332763671875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 9.0, 5.0, 7.0, 17.0, 17.0, 12.0, 17.0, 17.0, 17.0, 25.0, 20.0, 23.0, 29.0, 23.0, 29.0, 24.0, 35.0, 30.0, 27.0, 40.0, 44.0, 34.0, 1051.0, 36.0, 37.0, 39.0, 33.0, 34.0, 35.0, 27.0, 26.0, 23.0, 19.0, 21.0, 17.0, 12.0, 18.0, 15.0, 19.0, 8.0, 5.0, 8.0, 9.0, 8.0, 8.0, 6.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.96484375, -3.845001220703125, -3.72515869140625, -3.605316162109375, -3.4854736328125, -3.365631103515625, -3.24578857421875, -3.125946044921875, -3.006103515625, -2.886260986328125, -2.76641845703125, -2.646575927734375, -2.5267333984375, -2.406890869140625, -2.28704833984375, -2.167205810546875, -2.04736328125, -1.927520751953125, -1.80767822265625, -1.687835693359375, -1.5679931640625, -1.448150634765625, -1.32830810546875, -1.208465576171875, -1.088623046875, -0.968780517578125, -0.84893798828125, -0.729095458984375, -0.6092529296875, -0.489410400390625, -0.36956787109375, -0.249725341796875, -0.1298828125, -0.010040283203125, 0.10980224609375, 0.229644775390625, 0.3494873046875, 0.469329833984375, 0.58917236328125, 0.709014892578125, 0.828857421875, 0.948699951171875, 1.06854248046875, 1.188385009765625, 1.3082275390625, 1.428070068359375, 1.54791259765625, 1.667755126953125, 1.78759765625, 1.907440185546875, 2.02728271484375, 2.147125244140625, 2.2669677734375, 2.386810302734375, 2.50665283203125, 2.626495361328125, 2.746337890625, 2.866180419921875, 2.98602294921875, 3.105865478515625, 3.2257080078125, 3.345550537109375, 3.46539306640625, 3.585235595703125, 3.705078125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 4.0, 10.0, 16.0, 13.0, 27.0, 30.0, 37.0, 84.0, 119.0, 146.0, 233.0, 276.0, 463.0, 637.0, 916.0, 1249.0, 1749.0, 2579.0, 3611.0, 5062.0, 7284.0, 10328.0, 14989.0, 22089.0, 32220.0, 49904.0, 82748.0, 154762.0, 1295258.0, 164813.0, 86534.0, 51637.0, 33503.0, 22489.0, 15608.0, 10686.0, 7426.0, 5125.0, 3672.0, 2556.0, 1834.0, 1329.0, 939.0, 618.0, 420.0, 376.0, 224.0, 138.0, 113.0, 76.0, 69.0, 36.0, 26.0, 18.0, 12.0, 10.0, 4.0, 4.0, 2.0, 2.0], "bins": [-0.22314453125, -0.21628761291503906, -0.20943069458007812, -0.2025737762451172, -0.19571685791015625, -0.1888599395751953, -0.18200302124023438, -0.17514610290527344, -0.1682891845703125, -0.16143226623535156, -0.15457534790039062, -0.1477184295654297, -0.14086151123046875, -0.1340045928955078, -0.12714767456054688, -0.12029075622558594, -0.113433837890625, -0.10657691955566406, -0.09972000122070312, -0.09286308288574219, -0.08600616455078125, -0.07914924621582031, -0.07229232788085938, -0.06543540954589844, -0.0585784912109375, -0.05172157287597656, -0.044864654541015625, -0.03800773620605469, -0.03115081787109375, -0.024293899536132812, -0.017436981201171875, -0.010580062866210938, -0.00372314453125, 0.0031337738037109375, 0.009990692138671875, 0.016847610473632812, 0.02370452880859375, 0.030561447143554688, 0.037418365478515625, 0.04427528381347656, 0.0511322021484375, 0.05798912048339844, 0.06484603881835938, 0.07170295715332031, 0.07855987548828125, 0.08541679382324219, 0.09227371215820312, 0.09913063049316406, 0.105987548828125, 0.11284446716308594, 0.11970138549804688, 0.1265583038330078, 0.13341522216796875, 0.1402721405029297, 0.14712905883789062, 0.15398597717285156, 0.1608428955078125, 0.16769981384277344, 0.17455673217773438, 0.1814136505126953, 0.18827056884765625, 0.1951274871826172, 0.20198440551757812, 0.20884132385253906, 0.2156982421875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 6.0, 9.0, 14.0, 6.0, 10.0, 17.0, 10.0, 23.0, 27.0, 20.0, 28.0, 33.0, 57.0, 45.0, 49.0, 66.0, 64.0, 46.0, 76.0, 52.0, 34.0, 49.0, 51.0, 37.0, 38.0, 25.0, 15.0, 12.0, 21.0, 11.0, 10.0, 7.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0471553802490234e-05, -3.917049616575241e-05, -3.786943852901459e-05, -3.6568380892276764e-05, -3.526732325553894e-05, -3.396626561880112e-05, -3.2665207982063293e-05, -3.136415034532547e-05, -3.0063092708587646e-05, -2.8762035071849823e-05, -2.7460977435112e-05, -2.6159919798374176e-05, -2.4858862161636353e-05, -2.355780452489853e-05, -2.2256746888160706e-05, -2.0955689251422882e-05, -1.965463161468506e-05, -1.8353573977947235e-05, -1.705251634120941e-05, -1.5751458704471588e-05, -1.4450401067733765e-05, -1.3149343430995941e-05, -1.1848285794258118e-05, -1.0547228157520294e-05, -9.24617052078247e-06, -7.945112884044647e-06, -6.644055247306824e-06, -5.342997610569e-06, -4.041939973831177e-06, -2.7408823370933533e-06, -1.4398247003555298e-06, -1.387670636177063e-07, 1.1622905731201172e-06, 2.4633482098579407e-06, 3.764405846595764e-06, 5.065463483333588e-06, 6.366521120071411e-06, 7.667578756809235e-06, 8.968636393547058e-06, 1.0269694030284882e-05, 1.1570751667022705e-05, 1.2871809303760529e-05, 1.4172866940498352e-05, 1.5473924577236176e-05, 1.6774982213974e-05, 1.8076039850711823e-05, 1.9377097487449646e-05, 2.067815512418747e-05, 2.1979212760925293e-05, 2.3280270397663116e-05, 2.458132803440094e-05, 2.5882385671138763e-05, 2.7183443307876587e-05, 2.848450094461441e-05, 2.9785558581352234e-05, 3.108661621809006e-05, 3.238767385482788e-05, 3.3688731491565704e-05, 3.498978912830353e-05, 3.629084676504135e-05, 3.7591904401779175e-05, 3.8892962038517e-05, 4.019401967525482e-05, 4.1495077311992645e-05, 4.279613494873047e-05]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 4.0, 7.0, 7.0, 11.0, 21.0, 21.0, 26.0, 32.0, 46.0, 71.0, 71.0, 115.0, 185.0, 340.0, 1109.0, 439975.0, 604270.0, 1283.0, 334.0, 174.0, 114.0, 69.0, 57.0, 40.0, 45.0, 24.0, 17.0, 17.0, 16.0, 11.0, 8.0, 8.0, 5.0, 9.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009493827819824219, -0.000919736921787262, -0.000890091061592102, -0.0008604452013969421, -0.0008307993412017822, -0.0008011534810066223, -0.0007715076208114624, -0.0007418617606163025, -0.0007122159004211426, -0.0006825700402259827, -0.0006529241800308228, -0.0006232783198356628, -0.0005936324596405029, -0.000563986599445343, -0.0005343407392501831, -0.0005046948790550232, -0.0004750490188598633, -0.00044540315866470337, -0.00041575729846954346, -0.00038611143827438354, -0.00035646557807922363, -0.0003268197178840637, -0.0002971738576889038, -0.0002675279974937439, -0.00023788213729858398, -0.00020823627710342407, -0.00017859041690826416, -0.00014894455671310425, -0.00011929869651794434, -8.965283632278442e-05, -6.000697612762451e-05, -3.03611159324646e-05, -7.152557373046875e-07, 2.8930604457855225e-05, 5.857646465301514e-05, 8.822232484817505e-05, 0.00011786818504333496, 0.00014751404523849487, 0.00017715990543365479, 0.0002068057656288147, 0.0002364516258239746, 0.0002660974860191345, 0.00029574334621429443, 0.00032538920640945435, 0.00035503506660461426, 0.00038468092679977417, 0.0004143267869949341, 0.000443972647190094, 0.0004736185073852539, 0.0005032643675804138, 0.0005329102277755737, 0.0005625560879707336, 0.0005922019481658936, 0.0006218478083610535, 0.0006514936685562134, 0.0006811395287513733, 0.0007107853889465332, 0.0007404312491416931, 0.000770077109336853, 0.0007997229695320129, 0.0008293688297271729, 0.0008590146899223328, 0.0008886605501174927, 0.0009183064103126526, 0.0009479522705078125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 52.0, 261.0, 400.0, 214.0, 63.0, 17.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2728581067640334e-05, -4.987321881344542e-05, -4.70178529212717e-05, -4.4162487029097974e-05, -4.130712477490306e-05, -3.8451762520708144e-05, -3.559639662853442e-05, -3.27410307363607e-05, -2.9885668482165784e-05, -2.7030304408981465e-05, -2.4174940335797146e-05, -2.1319576262612827e-05, -1.8464212189428508e-05, -1.560884811624419e-05, -1.275348404305987e-05, -9.898119969875552e-06, -7.042755896691233e-06, -4.187391823506914e-06, -1.3320277503225952e-06, 1.5233363228617236e-06, 4.3787003960460424e-06, 7.234064469230361e-06, 1.008942854241468e-05, 1.2944792615598999e-05, 1.5800156688783318e-05, 1.8655520761967637e-05, 2.1510884835151955e-05, 2.4366248908336274e-05, 2.7221612981520593e-05, 3.0076977054704912e-05, 3.293234112788923e-05, 3.578770702006295e-05, 3.864307655021548e-05, 4.14984388044104e-05, 4.435380469658412e-05, 4.720917058875784e-05, 5.006453284295276e-05, 5.291989509714767e-05, 5.5775260989321396e-05, 5.863062688149512e-05, 6.148598913569003e-05, 6.434135138988495e-05, 6.719671364407986e-05, 7.00520831742324e-05, 7.290744542842731e-05, 7.576280768262222e-05, 7.861817721277475e-05, 8.147353946696967e-05, 8.432890172116458e-05, 8.71842639753595e-05, 9.003962622955441e-05, 9.289499575970694e-05, 9.575035801390186e-05, 9.860572026809677e-05, 0.0001014610897982493, 0.00010431645205244422, 0.00010717181430663913, 0.00011002717656083405, 0.00011288253881502897, 0.0001157379083451815, 0.00011859327059937641, 0.00012144863285357133, 0.00012430400238372386, 0.00012715936463791877, 0.00013001472689211369]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 9.0, 9.0, 9.0, 5.0, 14.0, 8.0, 12.0, 17.0, 16.0, 21.0, 21.0, 31.0, 40.0, 34.0, 45.0, 41.0, 50.0, 45.0, 40.0, 42.0, 61.0, 42.0, 41.0, 33.0, 40.0, 34.0, 33.0, 35.0, 30.0, 30.0, 17.0, 16.0, 13.0, 13.0, 16.0, 9.0, 8.0, 7.0, 4.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.092123031616211e-05, -2.019573003053665e-05, -1.9470229744911194e-05, -1.8744729459285736e-05, -1.801922917366028e-05, -1.729372888803482e-05, -1.6568228602409363e-05, -1.5842728316783905e-05, -1.5117228031158447e-05, -1.439172774553299e-05, -1.3666227459907532e-05, -1.2940727174282074e-05, -1.2215226888656616e-05, -1.1489726603031158e-05, -1.07642263174057e-05, -1.0038726031780243e-05, -9.313225746154785e-06, -8.587725460529327e-06, -7.86222517490387e-06, -7.136724889278412e-06, -6.411224603652954e-06, -5.685724318027496e-06, -4.9602240324020386e-06, -4.234723746776581e-06, -3.509223461151123e-06, -2.7837231755256653e-06, -2.0582228899002075e-06, -1.3327226042747498e-06, -6.07222318649292e-07, 1.1827796697616577e-07, 8.437782526016235e-07, 1.5692785382270813e-06, 2.294778823852539e-06, 3.020279109477997e-06, 3.7457793951034546e-06, 4.471279680728912e-06, 5.19677996635437e-06, 5.922280251979828e-06, 6.647780537605286e-06, 7.373280823230743e-06, 8.098781108856201e-06, 8.824281394481659e-06, 9.549781680107117e-06, 1.0275281965732574e-05, 1.1000782251358032e-05, 1.172628253698349e-05, 1.2451782822608948e-05, 1.3177283108234406e-05, 1.3902783393859863e-05, 1.4628283679485321e-05, 1.535378396511078e-05, 1.6079284250736237e-05, 1.6804784536361694e-05, 1.7530284821987152e-05, 1.825578510761261e-05, 1.8981285393238068e-05, 1.9706785678863525e-05, 2.0432285964488983e-05, 2.115778625011444e-05, 2.18832865357399e-05, 2.2608786821365356e-05, 2.3334287106990814e-05, 2.4059787392616272e-05, 2.478528767824173e-05, 2.5510787963867188e-05]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 6.0, 6.0, 2.0, 10.0, 7.0, 13.0, 17.0, 16.0, 23.0, 26.0, 25.0, 22.0, 25.0, 50.0, 37.0, 56.0, 55.0, 46.0, 37.0, 55.0, 65.0, 51.0, 36.0, 40.0, 42.0, 36.0, 29.0, 20.0, 33.0, 24.0, 22.0, 17.0, 20.0, 12.0, 8.0, 5.0, 2.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.6368408203125, -8.398681640625, -8.1605224609375, -7.92236328125, -7.6842041015625, -7.446044921875, -7.2078857421875, -6.9697265625, -6.7315673828125, -6.493408203125, -6.2552490234375, -6.01708984375, -5.7789306640625, -5.540771484375, -5.3026123046875, -5.064453125, -4.8262939453125, -4.588134765625, -4.3499755859375, -4.11181640625, -3.8736572265625, -3.635498046875, -3.3973388671875, -3.1591796875, -2.9210205078125, -2.682861328125, -2.4447021484375, -2.20654296875, -1.9683837890625, -1.730224609375, -1.4920654296875, -1.25390625, -1.0157470703125, -0.777587890625, -0.5394287109375, -0.30126953125, -0.0631103515625, 0.175048828125, 0.4132080078125, 0.6513671875, 0.8895263671875, 1.127685546875, 1.3658447265625, 1.60400390625, 1.8421630859375, 2.080322265625, 2.3184814453125, 2.556640625, 2.7947998046875, 3.032958984375, 3.2711181640625, 3.50927734375, 3.7474365234375, 3.985595703125, 4.2237548828125, 4.4619140625, 4.7000732421875, 4.938232421875, 5.1763916015625, 5.41455078125, 5.6527099609375, 5.890869140625, 6.1290283203125, 6.3671875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 7.0, 4.0, 5.0, 9.0, 13.0, 17.0, 31.0, 33.0, 44.0, 57.0, 81.0, 125.0, 173.0, 332.0, 608.0, 1543.0, 4608.0, 20618.0, 258634.0, 710746.0, 39732.0, 7027.0, 2149.0, 868.0, 374.0, 222.0, 140.0, 85.0, 80.0, 43.0, 39.0, 32.0, 30.0, 15.0, 9.0, 7.0, 2.0, 5.0, 7.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-15.9140625, -15.48583984375, -15.0576171875, -14.62939453125, -14.201171875, -13.77294921875, -13.3447265625, -12.91650390625, -12.48828125, -12.06005859375, -11.6318359375, -11.20361328125, -10.775390625, -10.34716796875, -9.9189453125, -9.49072265625, -9.0625, -8.63427734375, -8.2060546875, -7.77783203125, -7.349609375, -6.92138671875, -6.4931640625, -6.06494140625, -5.63671875, -5.20849609375, -4.7802734375, -4.35205078125, -3.923828125, -3.49560546875, -3.0673828125, -2.63916015625, -2.2109375, -1.78271484375, -1.3544921875, -0.92626953125, -0.498046875, -0.06982421875, 0.3583984375, 0.78662109375, 1.21484375, 1.64306640625, 2.0712890625, 2.49951171875, 2.927734375, 3.35595703125, 3.7841796875, 4.21240234375, 4.640625, 5.06884765625, 5.4970703125, 5.92529296875, 6.353515625, 6.78173828125, 7.2099609375, 7.63818359375, 8.06640625, 8.49462890625, 8.9228515625, 9.35107421875, 9.779296875, 10.20751953125, 10.6357421875, 11.06396484375, 11.4921875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 10.0, 9.0, 11.0, 18.0, 17.0, 37.0, 33.0, 49.0, 46.0, 56.0, 40.0, 86.0, 285.0, 1805.0, 116.0, 73.0, 64.0, 62.0, 36.0, 46.0, 33.0, 23.0, 17.0, 20.0, 11.0, 11.0, 9.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.359375, -27.448974609375, -26.53857421875, -25.628173828125, -24.7177734375, -23.807373046875, -22.89697265625, -21.986572265625, -21.076171875, -20.165771484375, -19.25537109375, -18.344970703125, -17.4345703125, -16.524169921875, -15.61376953125, -14.703369140625, -13.79296875, -12.882568359375, -11.97216796875, -11.061767578125, -10.1513671875, -9.240966796875, -8.33056640625, -7.420166015625, -6.509765625, -5.599365234375, -4.68896484375, -3.778564453125, -2.8681640625, -1.957763671875, -1.04736328125, -0.136962890625, 0.7734375, 1.683837890625, 2.59423828125, 3.504638671875, 4.4150390625, 5.325439453125, 6.23583984375, 7.146240234375, 8.056640625, 8.967041015625, 9.87744140625, 10.787841796875, 11.6982421875, 12.608642578125, 13.51904296875, 14.429443359375, 15.33984375, 16.250244140625, 17.16064453125, 18.071044921875, 18.9814453125, 19.891845703125, 20.80224609375, 21.712646484375, 22.623046875, 23.533447265625, 24.44384765625, 25.354248046875, 26.2646484375, 27.175048828125, 28.08544921875, 28.995849609375, 29.90625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 9.0, 18.0, 21.0, 9.0, 31.0, 36.0, 56.0, 53.0, 115.0, 160.0, 295.0, 1047.0, 278579.0, 2863135.0, 1309.0, 311.0, 144.0, 94.0, 74.0, 46.0, 38.0, 27.0, 21.0, 17.0, 6.0, 11.0, 11.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-85.3125, -82.732421875, -80.15234375, -77.572265625, -74.9921875, -72.412109375, -69.83203125, -67.251953125, -64.671875, -62.091796875, -59.51171875, -56.931640625, -54.3515625, -51.771484375, -49.19140625, -46.611328125, -44.03125, -41.451171875, -38.87109375, -36.291015625, -33.7109375, -31.130859375, -28.55078125, -25.970703125, -23.390625, -20.810546875, -18.23046875, -15.650390625, -13.0703125, -10.490234375, -7.91015625, -5.330078125, -2.75, -0.169921875, 2.41015625, 4.990234375, 7.5703125, 10.150390625, 12.73046875, 15.310546875, 17.890625, 20.470703125, 23.05078125, 25.630859375, 28.2109375, 30.791015625, 33.37109375, 35.951171875, 38.53125, 41.111328125, 43.69140625, 46.271484375, 48.8515625, 51.431640625, 54.01171875, 56.591796875, 59.171875, 61.751953125, 64.33203125, 66.912109375, 69.4921875, 72.072265625, 74.65234375, 77.232421875, 79.8125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 85.0, 359.0, 389.0, 149.0, 20.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.793060302734375, -46.59760284423828, -44.40214538574219, -42.206687927246094, -40.01123046875, -37.815773010253906, -35.62031555175781, -33.42485809326172, -31.229400634765625, -29.03394317626953, -26.838485717773438, -24.643028259277344, -22.44757080078125, -20.252113342285156, -18.056655883789062, -15.861198425292969, -13.665740966796875, -11.470283508300781, -9.274826049804688, -7.079368591308594, -4.8839111328125, -2.6884536743164062, -0.4929962158203125, 1.7024612426757812, 3.897918701171875, 6.093376159667969, 8.288833618164062, 10.484291076660156, 12.67974853515625, 14.875205993652344, 17.070663452148438, 19.26612091064453, 21.461578369140625, 23.65703582763672, 25.852493286132812, 28.047950744628906, 30.243408203125, 32.438865661621094, 34.63432312011719, 36.82978057861328, 39.025238037109375, 41.22069549560547, 43.41615295410156, 45.611610412597656, 47.80706787109375, 50.002525329589844, 52.19798278808594, 54.39344024658203, 56.588897705078125, 58.78435516357422, 60.97981262207031, 63.175270080566406, 65.3707275390625, 67.5661849975586, 69.76164245605469, 71.95709991455078, 74.15255737304688, 76.34801483154297, 78.54347229003906, 80.73892974853516, 82.93438720703125, 85.12984466552734, 87.32530212402344, 89.52075958251953, 91.71621704101562]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 5.0, 9.0, 9.0, 9.0, 14.0, 11.0, 17.0, 17.0, 19.0, 22.0, 20.0, 25.0, 25.0, 22.0, 34.0, 32.0, 41.0, 43.0, 39.0, 41.0, 42.0, 49.0, 34.0, 36.0, 43.0, 33.0, 30.0, 36.0, 24.0, 33.0, 23.0, 26.0, 22.0, 15.0, 9.0, 18.0, 10.0, 18.0, 10.0, 6.0, 7.0, 5.0, 7.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-71.45466613769531, -69.3211669921875, -67.18766784667969, -65.05416870117188, -62.92066955566406, -60.78717041015625, -58.65366744995117, -56.52016830444336, -54.38666915893555, -52.253170013427734, -50.11967086791992, -47.98617172241211, -45.85266876220703, -43.71916961669922, -41.585670471191406, -39.452171325683594, -37.31867218017578, -35.18517303466797, -33.051673889160156, -30.91817283630371, -28.7846736907959, -26.651174545288086, -24.51767349243164, -22.384174346923828, -20.250675201416016, -18.117176055908203, -15.983675956726074, -13.850175857543945, -11.716676712036133, -9.58317756652832, -7.449677467346191, -5.3161773681640625, -3.1826705932617188, -1.049170970916748, 1.0843286514282227, 3.2178282737731934, 5.351327896118164, 7.484827041625977, 9.618327140808105, 11.751827239990234, 13.885326385498047, 16.01882553100586, 18.152324676513672, 20.285825729370117, 22.41932487487793, 24.552824020385742, 26.686325073242188, 28.81982421875, 30.953323364257812, 33.086822509765625, 35.22032165527344, 37.35382080078125, 39.48731994628906, 41.620819091796875, 43.75432205200195, 45.887821197509766, 48.02132034301758, 50.15481948852539, 52.2883186340332, 54.421817779541016, 56.555320739746094, 58.688819885253906, 60.82231903076172, 62.95581817626953, 65.08931732177734]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 2.0, 7.0, 5.0, 5.0, 12.0, 13.0, 19.0, 14.0, 25.0, 22.0, 32.0, 26.0, 36.0, 32.0, 42.0, 47.0, 40.0, 45.0, 39.0, 53.0, 56.0, 54.0, 44.0, 36.0, 37.0, 36.0, 20.0, 35.0, 28.0, 19.0, 21.0, 22.0, 12.0, 21.0, 10.0, 7.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.6328125, -8.39556884765625, -8.1583251953125, -7.92108154296875, -7.683837890625, -7.44659423828125, -7.2093505859375, -6.97210693359375, -6.73486328125, -6.49761962890625, -6.2603759765625, -6.02313232421875, -5.785888671875, -5.54864501953125, -5.3114013671875, -5.07415771484375, -4.8369140625, -4.59967041015625, -4.3624267578125, -4.12518310546875, -3.887939453125, -3.65069580078125, -3.4134521484375, -3.17620849609375, -2.93896484375, -2.70172119140625, -2.4644775390625, -2.22723388671875, -1.989990234375, -1.75274658203125, -1.5155029296875, -1.27825927734375, -1.041015625, -0.80377197265625, -0.5665283203125, -0.32928466796875, -0.092041015625, 0.14520263671875, 0.3824462890625, 0.61968994140625, 0.85693359375, 1.09417724609375, 1.3314208984375, 1.56866455078125, 1.805908203125, 2.04315185546875, 2.2803955078125, 2.51763916015625, 2.7548828125, 2.99212646484375, 3.2293701171875, 3.46661376953125, 3.703857421875, 3.94110107421875, 4.1783447265625, 4.41558837890625, 4.65283203125, 4.89007568359375, 5.1273193359375, 5.36456298828125, 5.601806640625, 5.83905029296875, 6.0762939453125, 6.31353759765625, 6.55078125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 2.0, 8.0, 11.0, 13.0, 30.0, 41.0, 62.0, 65.0, 105.0, 178.0, 285.0, 460.0, 730.0, 1318.0, 2477.0, 5180.0, 12089.0, 34759.0, 138259.0, 682386.0, 1858246.0, 1117847.0, 250841.0, 56970.0, 18076.0, 7033.0, 3104.0, 1531.0, 871.0, 500.0, 284.0, 158.0, 114.0, 86.0, 51.0, 44.0, 20.0, 14.0, 22.0, 4.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0], "bins": [-11.3828125, -11.08856201171875, -10.7943115234375, -10.50006103515625, -10.205810546875, -9.91156005859375, -9.6173095703125, -9.32305908203125, -9.02880859375, -8.73455810546875, -8.4403076171875, -8.14605712890625, -7.851806640625, -7.55755615234375, -7.2633056640625, -6.96905517578125, -6.6748046875, -6.38055419921875, -6.0863037109375, -5.79205322265625, -5.497802734375, -5.20355224609375, -4.9093017578125, -4.61505126953125, -4.32080078125, -4.02655029296875, -3.7322998046875, -3.43804931640625, -3.143798828125, -2.84954833984375, -2.5552978515625, -2.26104736328125, -1.966796875, -1.67254638671875, -1.3782958984375, -1.08404541015625, -0.789794921875, -0.49554443359375, -0.2012939453125, 0.09295654296875, 0.38720703125, 0.68145751953125, 0.9757080078125, 1.26995849609375, 1.564208984375, 1.85845947265625, 2.1527099609375, 2.44696044921875, 2.7412109375, 3.03546142578125, 3.3297119140625, 3.62396240234375, 3.918212890625, 4.21246337890625, 4.5067138671875, 4.80096435546875, 5.09521484375, 5.38946533203125, 5.6837158203125, 5.97796630859375, 6.272216796875, 6.56646728515625, 6.8607177734375, 7.15496826171875, 7.44921875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 8.0, 17.0, 33.0, 70.0, 67.0, 101.0, 127.0, 254.0, 361.0, 535.0, 658.0, 593.0, 397.0, 278.0, 195.0, 122.0, 77.0, 54.0, 29.0, 24.0, 30.0, 14.0, 7.0, 3.0, 8.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8984375, -11.3739013671875, -10.849365234375, -10.3248291015625, -9.80029296875, -9.2757568359375, -8.751220703125, -8.2266845703125, -7.7021484375, -7.1776123046875, -6.653076171875, -6.1285400390625, -5.60400390625, -5.0794677734375, -4.554931640625, -4.0303955078125, -3.505859375, -2.9813232421875, -2.456787109375, -1.9322509765625, -1.40771484375, -0.8831787109375, -0.358642578125, 0.1658935546875, 0.6904296875, 1.2149658203125, 1.739501953125, 2.2640380859375, 2.78857421875, 3.3131103515625, 3.837646484375, 4.3621826171875, 4.88671875, 5.4112548828125, 5.935791015625, 6.4603271484375, 6.98486328125, 7.5093994140625, 8.033935546875, 8.5584716796875, 9.0830078125, 9.6075439453125, 10.132080078125, 10.6566162109375, 11.18115234375, 11.7056884765625, 12.230224609375, 12.7547607421875, 13.279296875, 13.8038330078125, 14.328369140625, 14.8529052734375, 15.37744140625, 15.9019775390625, 16.426513671875, 16.9510498046875, 17.4755859375, 18.0001220703125, 18.524658203125, 19.0491943359375, 19.57373046875, 20.0982666015625, 20.622802734375, 21.1473388671875, 21.671875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 13.0, 13.0, 26.0, 41.0, 76.0, 93.0, 172.0, 256.0, 426.0, 854.0, 4091.0, 329236.0, 3839906.0, 16243.0, 1415.0, 566.0, 292.0, 207.0, 128.0, 84.0, 61.0, 27.0, 27.0, 8.0, 6.0, 2.0, 1.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.0625, -78.02099609375, -75.9794921875, -73.93798828125, -71.896484375, -69.85498046875, -67.8134765625, -65.77197265625, -63.73046875, -61.68896484375, -59.6474609375, -57.60595703125, -55.564453125, -53.52294921875, -51.4814453125, -49.43994140625, -47.3984375, -45.35693359375, -43.3154296875, -41.27392578125, -39.232421875, -37.19091796875, -35.1494140625, -33.10791015625, -31.06640625, -29.02490234375, -26.9833984375, -24.94189453125, -22.900390625, -20.85888671875, -18.8173828125, -16.77587890625, -14.734375, -12.69287109375, -10.6513671875, -8.60986328125, -6.568359375, -4.52685546875, -2.4853515625, -0.44384765625, 1.59765625, 3.63916015625, 5.6806640625, 7.72216796875, 9.763671875, 11.80517578125, 13.8466796875, 15.88818359375, 17.9296875, 19.97119140625, 22.0126953125, 24.05419921875, 26.095703125, 28.13720703125, 30.1787109375, 32.22021484375, 34.26171875, 36.30322265625, 38.3447265625, 40.38623046875, 42.427734375, 44.46923828125, 46.5107421875, 48.55224609375, 50.59375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 836.0, 180.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-677.7763061523438, -652.474365234375, -627.1724853515625, -601.8705444335938, -576.568603515625, -551.2666625976562, -525.9647216796875, -500.662841796875, -475.36090087890625, -450.0589599609375, -424.7570495605469, -399.45513916015625, -374.1531982421875, -348.85125732421875, -323.5493469238281, -298.2474365234375, -272.94549560546875, -247.64356994628906, -222.34164428710938, -197.0397186279297, -171.73779296875, -146.4358673095703, -121.13394165039062, -95.83201599121094, -70.53009033203125, -45.22816467285156, -19.926239013671875, 5.3756866455078125, 30.6776123046875, 55.97953796386719, 81.28146362304688, 106.58338928222656, 131.88531494140625, 157.18724060058594, 182.48916625976562, 207.7910919189453, 233.093017578125, 258.39495849609375, 283.6968688964844, 308.998779296875, 334.30072021484375, 359.6026611328125, 384.9045715332031, 410.20648193359375, 435.5084228515625, 460.81036376953125, 486.1122741699219, 511.4141845703125, 536.7161254882812, 562.01806640625, 587.3199462890625, 612.6218872070312, 637.923828125, 663.2257690429688, 688.5277099609375, 713.82958984375, 739.1315307617188, 764.4334716796875, 789.7353515625, 815.0372924804688, 840.3392333984375, 865.6411743164062, 890.943115234375, 916.2449951171875, 941.5469360351562]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 17.0, 13.0, 16.0, 20.0, 16.0, 30.0, 30.0, 27.0, 43.0, 48.0, 42.0, 60.0, 51.0, 75.0, 52.0, 47.0, 51.0, 35.0, 44.0, 49.0, 43.0, 34.0, 32.0, 22.0, 18.0, 17.0, 8.0, 12.0, 10.0, 9.0, 4.0, 8.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-65.6796875, -64.05743408203125, -62.4351806640625, -60.81292724609375, -59.190673828125, -57.56842041015625, -55.946163177490234, -54.323909759521484, -52.701656341552734, -51.079402923583984, -49.457149505615234, -47.834896087646484, -46.21263885498047, -44.59038543701172, -42.96813201904297, -41.34587860107422, -39.72362518310547, -38.10137176513672, -36.47911834716797, -34.85686492919922, -33.23461151123047, -31.612356185913086, -29.990100860595703, -28.367847442626953, -26.745594024658203, -25.123340606689453, -23.501087188720703, -21.87883186340332, -20.25657844543457, -18.63432502746582, -17.012069702148438, -15.389816284179688, -13.767559051513672, -12.145305633544922, -10.523051261901855, -8.900796890258789, -7.278543472290039, -5.656290054321289, -4.034035682678223, -2.4117813110351562, -0.7895278930664062, 0.832726001739502, 2.45497989654541, 4.077233791351318, 5.699487686157227, 7.321741104125977, 8.943995475769043, 10.56624984741211, 12.18850326538086, 13.81075668334961, 15.433011054992676, 17.055265426635742, 18.677518844604492, 20.299772262573242, 21.922027587890625, 23.544281005859375, 25.166534423828125, 26.788787841796875, 28.411041259765625, 30.033296585083008, 31.655550003051758, 33.277801513671875, 34.90005874633789, 36.52231216430664, 38.14456558227539]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 1.0, 7.0, 6.0, 6.0, 5.0, 2.0, 9.0, 20.0, 21.0, 27.0, 26.0, 24.0, 30.0, 26.0, 41.0, 48.0, 52.0, 41.0, 46.0, 51.0, 51.0, 57.0, 43.0, 41.0, 43.0, 46.0, 25.0, 31.0, 30.0, 27.0, 30.0, 22.0, 17.0, 7.0, 13.0, 15.0, 6.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.296875, -9.0469970703125, -8.797119140625, -8.5472412109375, -8.29736328125, -8.0474853515625, -7.797607421875, -7.5477294921875, -7.2978515625, -7.0479736328125, -6.798095703125, -6.5482177734375, -6.29833984375, -6.0484619140625, -5.798583984375, -5.5487060546875, -5.298828125, -5.0489501953125, -4.799072265625, -4.5491943359375, -4.29931640625, -4.0494384765625, -3.799560546875, -3.5496826171875, -3.2998046875, -3.0499267578125, -2.800048828125, -2.5501708984375, -2.30029296875, -2.0504150390625, -1.800537109375, -1.5506591796875, -1.30078125, -1.0509033203125, -0.801025390625, -0.5511474609375, -0.30126953125, -0.0513916015625, 0.198486328125, 0.4483642578125, 0.6982421875, 0.9481201171875, 1.197998046875, 1.4478759765625, 1.69775390625, 1.9476318359375, 2.197509765625, 2.4473876953125, 2.697265625, 2.9471435546875, 3.197021484375, 3.4468994140625, 3.69677734375, 3.9466552734375, 4.196533203125, 4.4464111328125, 4.6962890625, 4.9461669921875, 5.196044921875, 5.4459228515625, 5.69580078125, 5.9456787109375, 6.195556640625, 6.4454345703125, 6.6953125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 4.0, 5.0, 17.0, 22.0, 24.0, 40.0, 79.0, 90.0, 157.0, 239.0, 393.0, 712.0, 1296.0, 2225.0, 3950.0, 7367.0, 14102.0, 25867.0, 49792.0, 104143.0, 273715.0, 322682.0, 122175.0, 55806.0, 29153.0, 15755.0, 8449.0, 4521.0, 2470.0, 1351.0, 783.0, 454.0, 271.0, 168.0, 93.0, 71.0, 37.0, 27.0, 14.0, 13.0, 11.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.38720703125, -0.3751411437988281, -0.36307525634765625, -0.3510093688964844, -0.3389434814453125, -0.3268775939941406, -0.31481170654296875, -0.3027458190917969, -0.290679931640625, -0.2786140441894531, -0.26654815673828125, -0.2544822692871094, -0.2424163818359375, -0.23035049438476562, -0.21828460693359375, -0.20621871948242188, -0.19415283203125, -0.18208694458007812, -0.17002105712890625, -0.15795516967773438, -0.1458892822265625, -0.13382339477539062, -0.12175750732421875, -0.10969161987304688, -0.097625732421875, -0.08555984497070312, -0.07349395751953125, -0.061428070068359375, -0.0493621826171875, -0.037296295166015625, -0.02523040771484375, -0.013164520263671875, -0.0010986328125, 0.010967254638671875, 0.02303314208984375, 0.035099029541015625, 0.0471649169921875, 0.059230804443359375, 0.07129669189453125, 0.08336257934570312, 0.095428466796875, 0.10749435424804688, 0.11956024169921875, 0.13162612915039062, 0.1436920166015625, 0.15575790405273438, 0.16782379150390625, 0.17988967895507812, 0.19195556640625, 0.20402145385742188, 0.21608734130859375, 0.22815322875976562, 0.2402191162109375, 0.2522850036621094, 0.26435089111328125, 0.2764167785644531, 0.288482666015625, 0.3005485534667969, 0.31261444091796875, 0.3246803283691406, 0.3367462158203125, 0.3488121032714844, 0.36087799072265625, 0.3729438781738281, 0.385009765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 8.0, 12.0, 11.0, 11.0, 16.0, 17.0, 23.0, 16.0, 24.0, 25.0, 31.0, 32.0, 26.0, 44.0, 31.0, 51.0, 54.0, 46.0, 1057.0, 34.0, 41.0, 36.0, 43.0, 38.0, 30.0, 35.0, 26.0, 28.0, 21.0, 32.0, 22.0, 19.0, 13.0, 10.0, 9.0, 3.0, 6.0, 7.0, 8.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-5.23828125, -5.095245361328125, -4.95220947265625, -4.809173583984375, -4.6661376953125, -4.523101806640625, -4.38006591796875, -4.237030029296875, -4.093994140625, -3.950958251953125, -3.80792236328125, -3.664886474609375, -3.5218505859375, -3.378814697265625, -3.23577880859375, -3.092742919921875, -2.94970703125, -2.806671142578125, -2.66363525390625, -2.520599365234375, -2.3775634765625, -2.234527587890625, -2.09149169921875, -1.948455810546875, -1.805419921875, -1.662384033203125, -1.51934814453125, -1.376312255859375, -1.2332763671875, -1.090240478515625, -0.94720458984375, -0.804168701171875, -0.6611328125, -0.518096923828125, -0.37506103515625, -0.232025146484375, -0.0889892578125, 0.054046630859375, 0.19708251953125, 0.340118408203125, 0.483154296875, 0.626190185546875, 0.76922607421875, 0.912261962890625, 1.0552978515625, 1.198333740234375, 1.34136962890625, 1.484405517578125, 1.62744140625, 1.770477294921875, 1.91351318359375, 2.056549072265625, 2.1995849609375, 2.342620849609375, 2.48565673828125, 2.628692626953125, 2.771728515625, 2.914764404296875, 3.05780029296875, 3.200836181640625, 3.3438720703125, 3.486907958984375, 3.62994384765625, 3.772979736328125, 3.916015625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 10.0, 17.0, 33.0, 45.0, 59.0, 98.0, 150.0, 215.0, 307.0, 502.0, 699.0, 1088.0, 1576.0, 2476.0, 3765.0, 5936.0, 9017.0, 14675.0, 23720.0, 39703.0, 70990.0, 146617.0, 1345612.0, 207557.0, 93817.0, 50132.0, 29049.0, 18056.0, 11298.0, 6862.0, 4427.0, 2922.0, 1907.0, 1316.0, 837.0, 551.0, 336.0, 250.0, 147.0, 121.0, 77.0, 53.0, 35.0, 22.0, 10.0, 12.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2978515625, -0.2887458801269531, -0.27964019775390625, -0.2705345153808594, -0.2614288330078125, -0.2523231506347656, -0.24321746826171875, -0.23411178588867188, -0.225006103515625, -0.21590042114257812, -0.20679473876953125, -0.19768905639648438, -0.1885833740234375, -0.17947769165039062, -0.17037200927734375, -0.16126632690429688, -0.15216064453125, -0.14305496215820312, -0.13394927978515625, -0.12484359741210938, -0.1157379150390625, -0.10663223266601562, -0.09752655029296875, -0.08842086791992188, -0.079315185546875, -0.07020950317382812, -0.06110382080078125, -0.051998138427734375, -0.0428924560546875, -0.033786773681640625, -0.02468109130859375, -0.015575408935546875, -0.0064697265625, 0.002635955810546875, 0.01174163818359375, 0.020847320556640625, 0.0299530029296875, 0.039058685302734375, 0.04816436767578125, 0.057270050048828125, 0.066375732421875, 0.07548141479492188, 0.08458709716796875, 0.09369277954101562, 0.1027984619140625, 0.11190414428710938, 0.12100982666015625, 0.13011550903320312, 0.13922119140625, 0.14832687377929688, 0.15743255615234375, 0.16653823852539062, 0.1756439208984375, 0.18474960327148438, 0.19385528564453125, 0.20296096801757812, 0.212066650390625, 0.22117233276367188, 0.23027801513671875, 0.23938369750976562, 0.2484893798828125, 0.2575950622558594, 0.26670074462890625, 0.2758064270019531, 0.284912109375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 1.0, 4.0, 6.0, 7.0, 8.0, 13.0, 7.0, 14.0, 16.0, 20.0, 23.0, 20.0, 31.0, 28.0, 33.0, 48.0, 49.0, 50.0, 47.0, 45.0, 43.0, 33.0, 50.0, 46.0, 32.0, 42.0, 33.0, 46.0, 33.0, 34.0, 22.0, 23.0, 14.0, 11.0, 13.0, 11.0, 8.0, 4.0, 9.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.0040740966796875e-05, -2.9060058295726776e-05, -2.8079375624656677e-05, -2.709869295358658e-05, -2.611801028251648e-05, -2.513732761144638e-05, -2.4156644940376282e-05, -2.3175962269306183e-05, -2.2195279598236084e-05, -2.1214596927165985e-05, -2.0233914256095886e-05, -1.9253231585025787e-05, -1.827254891395569e-05, -1.729186624288559e-05, -1.631118357181549e-05, -1.5330500900745392e-05, -1.4349818229675293e-05, -1.3369135558605194e-05, -1.2388452887535095e-05, -1.1407770216464996e-05, -1.0427087545394897e-05, -9.446404874324799e-06, -8.4657222032547e-06, -7.485039532184601e-06, -6.504356861114502e-06, -5.523674190044403e-06, -4.542991518974304e-06, -3.5623088479042053e-06, -2.5816261768341064e-06, -1.6009435057640076e-06, -6.202608346939087e-07, 3.604218363761902e-07, 1.341104507446289e-06, 2.321787178516388e-06, 3.302469849586487e-06, 4.283152520656586e-06, 5.2638351917266846e-06, 6.2445178627967834e-06, 7.225200533866882e-06, 8.205883204936981e-06, 9.18656587600708e-06, 1.0167248547077179e-05, 1.1147931218147278e-05, 1.2128613889217377e-05, 1.3109296560287476e-05, 1.4089979231357574e-05, 1.5070661902427673e-05, 1.6051344573497772e-05, 1.703202724456787e-05, 1.801270991563797e-05, 1.899339258670807e-05, 1.9974075257778168e-05, 2.0954757928848267e-05, 2.1935440599918365e-05, 2.2916123270988464e-05, 2.3896805942058563e-05, 2.4877488613128662e-05, 2.585817128419876e-05, 2.683885395526886e-05, 2.781953662633896e-05, 2.8800219297409058e-05, 2.9780901968479156e-05, 3.0761584639549255e-05, 3.1742267310619354e-05, 3.272294998168945e-05]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 5.0, 12.0, 10.0, 16.0, 14.0, 17.0, 33.0, 46.0, 55.0, 69.0, 84.0, 84.0, 146.0, 225.0, 509.0, 3176.0, 952279.0, 89838.0, 908.0, 316.0, 174.0, 109.0, 95.0, 70.0, 44.0, 51.0, 27.0, 26.0, 19.0, 13.0, 17.0, 14.0, 11.0, 4.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007658004760742188, -0.0007431060075759888, -0.0007204115390777588, -0.0006977170705795288, -0.0006750226020812988, -0.0006523281335830688, -0.0006296336650848389, -0.0006069391965866089, -0.0005842447280883789, -0.0005615502595901489, -0.0005388557910919189, -0.000516161322593689, -0.000493466854095459, -0.000470772385597229, -0.000448077917098999, -0.00042538344860076904, -0.00040268898010253906, -0.0003799945116043091, -0.0003573000431060791, -0.0003346055746078491, -0.00031191110610961914, -0.00028921663761138916, -0.0002665221691131592, -0.0002438277006149292, -0.00022113323211669922, -0.00019843876361846924, -0.00017574429512023926, -0.00015304982662200928, -0.0001303553581237793, -0.00010766088962554932, -8.496642112731934e-05, -6.227195262908936e-05, -3.9577484130859375e-05, -1.6883015632629395e-05, 5.811452865600586e-06, 2.8505921363830566e-05, 5.120038986206055e-05, 7.389485836029053e-05, 9.658932685852051e-05, 0.00011928379535675049, 0.00014197826385498047, 0.00016467273235321045, 0.00018736720085144043, 0.0002100616693496704, 0.0002327561378479004, 0.00025545060634613037, 0.00027814507484436035, 0.00030083954334259033, 0.0003235340118408203, 0.0003462284803390503, 0.0003689229488372803, 0.00039161741733551025, 0.00041431188583374023, 0.0004370063543319702, 0.0004597008228302002, 0.0004823952913284302, 0.0005050897598266602, 0.0005277842283248901, 0.0005504786968231201, 0.0005731731653213501, 0.0005958676338195801, 0.0006185621023178101, 0.00064125657081604, 0.00066395103931427, 0.0006866455078125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 28.0, 67.0, 142.0, 215.0, 224.0, 195.0, 81.0, 31.0, 12.0, 5.0, 2.0, 3.0, 1.0], "bins": [-8.893430640455335e-05, -8.732097921893e-05, -8.570764475734904e-05, -8.40943175717257e-05, -8.248099038610235e-05, -8.086765592452139e-05, -7.925432873889804e-05, -7.764100155327469e-05, -7.602767436765134e-05, -7.4414347182028e-05, -7.280101272044703e-05, -7.118768553482369e-05, -6.957435834920034e-05, -6.796102388761938e-05, -6.634769670199603e-05, -6.473436951637268e-05, -6.312103505479172e-05, -6.150770786916837e-05, -5.9894377045566216e-05, -5.828104622196406e-05, -5.6667719036340714e-05, -5.505438821273856e-05, -5.3441057389136404e-05, -5.1827730203513056e-05, -5.02143993799109e-05, -4.8601068556308746e-05, -4.69877413706854e-05, -4.5374410547083244e-05, -4.376107972348109e-05, -4.214775253785774e-05, -4.0534421714255586e-05, -3.892109089065343e-05, -3.7307763705030084e-05, -3.569443288142793e-05, -3.408110569580458e-05, -3.2467774872202426e-05, -3.085444768657908e-05, -2.9241116862976924e-05, -2.762778603937477e-05, -2.6014457034762017e-05, -2.4401128030149266e-05, -2.2787799025536515e-05, -2.1174470020923764e-05, -1.956113919732161e-05, -1.7947810192708857e-05, -1.6334481188096106e-05, -1.4721151273988653e-05, -1.31078213598812e-05, -1.149449326476315e-05, -9.881163350655697e-06, -8.267834346042946e-06, -6.654504886682844e-06, -5.041175427322742e-06, -3.4278464227099903e-06, -1.8145165086025372e-06, -2.0118659449508414e-07, 1.4121424101176672e-06, 3.0254718694777694e-06, 4.6388013288378716e-06, 6.252130788197974e-06, 7.865460247558076e-06, 9.478789252170827e-06, 1.109211916627828e-05, 1.2705449080385733e-05, 1.4318778084998485e-05]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 6.0, 13.0, 15.0, 22.0, 15.0, 19.0, 21.0, 21.0, 13.0, 41.0, 38.0, 42.0, 43.0, 35.0, 37.0, 42.0, 44.0, 36.0, 52.0, 44.0, 55.0, 44.0, 39.0, 37.0, 34.0, 27.0, 17.0, 33.0, 22.0, 19.0, 13.0, 13.0, 8.0, 8.0, 6.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.467632293701172e-05, -2.4020671844482422e-05, -2.3365020751953125e-05, -2.2709369659423828e-05, -2.205371856689453e-05, -2.1398067474365234e-05, -2.0742416381835938e-05, -2.008676528930664e-05, -1.9431114196777344e-05, -1.8775463104248047e-05, -1.811981201171875e-05, -1.7464160919189453e-05, -1.6808509826660156e-05, -1.615285873413086e-05, -1.5497207641601562e-05, -1.4841556549072266e-05, -1.4185905456542969e-05, -1.3530254364013672e-05, -1.2874603271484375e-05, -1.2218952178955078e-05, -1.1563301086425781e-05, -1.0907649993896484e-05, -1.0251998901367188e-05, -9.59634780883789e-06, -8.940696716308594e-06, -8.285045623779297e-06, -7.62939453125e-06, -6.973743438720703e-06, -6.318092346191406e-06, -5.662441253662109e-06, -5.0067901611328125e-06, -4.351139068603516e-06, -3.6954879760742188e-06, -3.039836883544922e-06, -2.384185791015625e-06, -1.7285346984863281e-06, -1.0728836059570312e-06, -4.172325134277344e-07, 2.384185791015625e-07, 8.940696716308594e-07, 1.5497207641601562e-06, 2.205371856689453e-06, 2.86102294921875e-06, 3.516674041748047e-06, 4.172325134277344e-06, 4.827976226806641e-06, 5.4836273193359375e-06, 6.139278411865234e-06, 6.794929504394531e-06, 7.450580596923828e-06, 8.106231689453125e-06, 8.761882781982422e-06, 9.417533874511719e-06, 1.0073184967041016e-05, 1.0728836059570312e-05, 1.138448715209961e-05, 1.2040138244628906e-05, 1.2695789337158203e-05, 1.33514404296875e-05, 1.4007091522216797e-05, 1.4662742614746094e-05, 1.531839370727539e-05, 1.5974044799804688e-05, 1.6629695892333984e-05, 1.728534698486328e-05]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 1.0, 7.0, 6.0, 6.0, 5.0, 2.0, 9.0, 20.0, 21.0, 27.0, 26.0, 24.0, 30.0, 26.0, 41.0, 48.0, 52.0, 41.0, 46.0, 51.0, 51.0, 57.0, 43.0, 41.0, 43.0, 46.0, 25.0, 31.0, 30.0, 27.0, 30.0, 22.0, 17.0, 7.0, 13.0, 15.0, 6.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.296875, -9.0469970703125, -8.797119140625, -8.5472412109375, -8.29736328125, -8.0474853515625, -7.797607421875, -7.5477294921875, -7.2978515625, -7.0479736328125, -6.798095703125, -6.5482177734375, -6.29833984375, -6.0484619140625, -5.798583984375, -5.5487060546875, -5.298828125, -5.0489501953125, -4.799072265625, -4.5491943359375, -4.29931640625, -4.0494384765625, -3.799560546875, -3.5496826171875, -3.2998046875, -3.0499267578125, -2.800048828125, -2.5501708984375, -2.30029296875, -2.0504150390625, -1.800537109375, -1.5506591796875, -1.30078125, -1.0509033203125, -0.801025390625, -0.5511474609375, -0.30126953125, -0.0513916015625, 0.198486328125, 0.4483642578125, 0.6982421875, 0.9481201171875, 1.197998046875, 1.4478759765625, 1.69775390625, 1.9476318359375, 2.197509765625, 2.4473876953125, 2.697265625, 2.9471435546875, 3.197021484375, 3.4468994140625, 3.69677734375, 3.9466552734375, 4.196533203125, 4.4464111328125, 4.6962890625, 4.9461669921875, 5.196044921875, 5.4459228515625, 5.69580078125, 5.9456787109375, 6.195556640625, 6.4454345703125, 6.6953125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 6.0, 6.0, 6.0, 5.0, 9.0, 12.0, 20.0, 25.0, 45.0, 67.0, 131.0, 184.0, 395.0, 859.0, 1862.0, 4552.0, 11342.0, 30984.0, 91953.0, 332121.0, 404066.0, 110692.0, 36814.0, 13217.0, 5048.0, 2080.0, 975.0, 489.0, 240.0, 140.0, 81.0, 41.0, 23.0, 21.0, 17.0, 9.0, 9.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.8671875, -9.60107421875, -9.3349609375, -9.06884765625, -8.802734375, -8.53662109375, -8.2705078125, -8.00439453125, -7.73828125, -7.47216796875, -7.2060546875, -6.93994140625, -6.673828125, -6.40771484375, -6.1416015625, -5.87548828125, -5.609375, -5.34326171875, -5.0771484375, -4.81103515625, -4.544921875, -4.27880859375, -4.0126953125, -3.74658203125, -3.48046875, -3.21435546875, -2.9482421875, -2.68212890625, -2.416015625, -2.14990234375, -1.8837890625, -1.61767578125, -1.3515625, -1.08544921875, -0.8193359375, -0.55322265625, -0.287109375, -0.02099609375, 0.2451171875, 0.51123046875, 0.77734375, 1.04345703125, 1.3095703125, 1.57568359375, 1.841796875, 2.10791015625, 2.3740234375, 2.64013671875, 2.90625, 3.17236328125, 3.4384765625, 3.70458984375, 3.970703125, 4.23681640625, 4.5029296875, 4.76904296875, 5.03515625, 5.30126953125, 5.5673828125, 5.83349609375, 6.099609375, 6.36572265625, 6.6318359375, 6.89794921875, 7.1640625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 5.0, 8.0, 13.0, 8.0, 15.0, 24.0, 20.0, 37.0, 26.0, 47.0, 31.0, 40.0, 42.0, 54.0, 94.0, 395.0, 1612.0, 127.0, 59.0, 59.0, 53.0, 31.0, 46.0, 29.0, 40.0, 24.0, 17.0, 21.0, 12.0, 13.0, 12.0, 5.0, 6.0, 4.0, 7.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.0, -30.14208984375, -29.2841796875, -28.42626953125, -27.568359375, -26.71044921875, -25.8525390625, -24.99462890625, -24.13671875, -23.27880859375, -22.4208984375, -21.56298828125, -20.705078125, -19.84716796875, -18.9892578125, -18.13134765625, -17.2734375, -16.41552734375, -15.5576171875, -14.69970703125, -13.841796875, -12.98388671875, -12.1259765625, -11.26806640625, -10.41015625, -9.55224609375, -8.6943359375, -7.83642578125, -6.978515625, -6.12060546875, -5.2626953125, -4.40478515625, -3.546875, -2.68896484375, -1.8310546875, -0.97314453125, -0.115234375, 0.74267578125, 1.6005859375, 2.45849609375, 3.31640625, 4.17431640625, 5.0322265625, 5.89013671875, 6.748046875, 7.60595703125, 8.4638671875, 9.32177734375, 10.1796875, 11.03759765625, 11.8955078125, 12.75341796875, 13.611328125, 14.46923828125, 15.3271484375, 16.18505859375, 17.04296875, 17.90087890625, 18.7587890625, 19.61669921875, 20.474609375, 21.33251953125, 22.1904296875, 23.04833984375, 23.90625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 7.0, 6.0, 8.0, 14.0, 15.0, 20.0, 35.0, 41.0, 49.0, 87.0, 102.0, 113.0, 171.0, 251.0, 483.0, 2049.0, 80045.0, 3031025.0, 28700.0, 1238.0, 385.0, 214.0, 182.0, 113.0, 81.0, 70.0, 43.0, 39.0, 33.0, 16.0, 11.0, 12.0, 11.0, 8.0, 6.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.75, -38.35009765625, -36.9501953125, -35.55029296875, -34.150390625, -32.75048828125, -31.3505859375, -29.95068359375, -28.55078125, -27.15087890625, -25.7509765625, -24.35107421875, -22.951171875, -21.55126953125, -20.1513671875, -18.75146484375, -17.3515625, -15.95166015625, -14.5517578125, -13.15185546875, -11.751953125, -10.35205078125, -8.9521484375, -7.55224609375, -6.15234375, -4.75244140625, -3.3525390625, -1.95263671875, -0.552734375, 0.84716796875, 2.2470703125, 3.64697265625, 5.046875, 6.44677734375, 7.8466796875, 9.24658203125, 10.646484375, 12.04638671875, 13.4462890625, 14.84619140625, 16.24609375, 17.64599609375, 19.0458984375, 20.44580078125, 21.845703125, 23.24560546875, 24.6455078125, 26.04541015625, 27.4453125, 28.84521484375, 30.2451171875, 31.64501953125, 33.044921875, 34.44482421875, 35.8447265625, 37.24462890625, 38.64453125, 40.04443359375, 41.4443359375, 42.84423828125, 44.244140625, 45.64404296875, 47.0439453125, 48.44384765625, 49.84375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 18.0, 42.0, 125.0, 234.0, 280.0, 199.0, 71.0, 27.0, 10.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.68923950195312, -66.94086456298828, -65.19248962402344, -63.444114685058594, -61.695735931396484, -59.94736099243164, -58.1989860534668, -56.45061111450195, -54.702232360839844, -52.953857421875, -51.205482482910156, -49.45710754394531, -47.7087287902832, -45.96035385131836, -44.211978912353516, -42.46360397338867, -40.71522903442383, -38.966854095458984, -37.21847915649414, -35.47010040283203, -33.72172546386719, -31.973350524902344, -30.2249755859375, -28.476600646972656, -26.72822380065918, -24.979848861694336, -23.23147201538086, -21.483097076416016, -19.734722137451172, -17.986345291137695, -16.23797035217285, -14.489594459533691, -12.741218566894531, -10.992842674255371, -9.244466781616211, -7.496091842651367, -5.747715950012207, -3.999340057373047, -2.250965118408203, -0.502589225769043, 1.2457866668701172, 2.9941623210906982, 4.742537975311279, 6.490913391113281, 8.239289283752441, 9.987665176391602, 11.736040115356445, 13.484416007995605, 15.232791900634766, 16.98116683959961, 18.729543685913086, 20.47791862487793, 22.226295471191406, 23.97467041015625, 25.723045349121094, 27.471420288085938, 29.219797134399414, 30.968172073364258, 32.716548919677734, 34.46492385864258, 36.21329879760742, 37.96167755126953, 39.710052490234375, 41.45842742919922, 43.20680236816406]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 6.0, 8.0, 11.0, 5.0, 7.0, 14.0, 18.0, 25.0, 25.0, 31.0, 27.0, 21.0, 35.0, 44.0, 38.0, 30.0, 53.0, 43.0, 50.0, 48.0, 46.0, 42.0, 36.0, 33.0, 38.0, 30.0, 30.0, 28.0, 27.0, 21.0, 19.0, 15.0, 21.0, 12.0, 13.0, 13.0, 13.0, 3.0, 6.0, 4.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-70.6532211303711, -68.45073699951172, -66.24824523925781, -64.04576110839844, -61.84327697753906, -59.64078903198242, -57.43830108642578, -55.235816955566406, -53.033329010009766, -50.830841064453125, -48.62835693359375, -46.42586898803711, -44.22338104248047, -42.020896911621094, -39.81840896606445, -37.61592102050781, -35.41343688964844, -33.2109489440918, -31.008464813232422, -28.80597686767578, -26.603490829467773, -24.401004791259766, -22.198516845703125, -19.996030807495117, -17.79354476928711, -15.591058731079102, -13.388571739196777, -11.186084747314453, -8.983598709106445, -6.7811126708984375, -4.578625679016113, -2.376138687133789, -0.1736602783203125, 2.0288262367248535, 4.2313127517700195, 6.4337992668151855, 8.636285781860352, 10.83877182006836, 13.041258811950684, 15.243745803833008, 17.446231842041016, 19.648717880249023, 21.85120391845703, 24.053691864013672, 26.25617790222168, 28.458663940429688, 30.661151885986328, 32.86363983154297, 35.066123962402344, 37.268611907958984, 39.47109603881836, 41.673583984375, 43.876068115234375, 46.078556060791016, 48.281044006347656, 50.48352813720703, 52.68601608276367, 54.88850402832031, 57.09098815917969, 59.29347610473633, 61.49596405029297, 63.698448181152344, 65.90093231201172, 68.10342407226562, 70.305908203125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 5.0, 6.0, 6.0, 17.0, 9.0, 19.0, 25.0, 37.0, 23.0, 31.0, 20.0, 41.0, 42.0, 53.0, 57.0, 51.0, 49.0, 52.0, 47.0, 51.0, 45.0, 43.0, 26.0, 36.0, 29.0, 23.0, 36.0, 29.0, 22.0, 19.0, 10.0, 11.0, 7.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.265625, -9.001708984375, -8.73779296875, -8.473876953125, -8.2099609375, -7.946044921875, -7.68212890625, -7.418212890625, -7.154296875, -6.890380859375, -6.62646484375, -6.362548828125, -6.0986328125, -5.834716796875, -5.57080078125, -5.306884765625, -5.04296875, -4.779052734375, -4.51513671875, -4.251220703125, -3.9873046875, -3.723388671875, -3.45947265625, -3.195556640625, -2.931640625, -2.667724609375, -2.40380859375, -2.139892578125, -1.8759765625, -1.612060546875, -1.34814453125, -1.084228515625, -0.8203125, -0.556396484375, -0.29248046875, -0.028564453125, 0.2353515625, 0.499267578125, 0.76318359375, 1.027099609375, 1.291015625, 1.554931640625, 1.81884765625, 2.082763671875, 2.3466796875, 2.610595703125, 2.87451171875, 3.138427734375, 3.40234375, 3.666259765625, 3.93017578125, 4.194091796875, 4.4580078125, 4.721923828125, 4.98583984375, 5.249755859375, 5.513671875, 5.777587890625, 6.04150390625, 6.305419921875, 6.5693359375, 6.833251953125, 7.09716796875, 7.361083984375, 7.625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 8.0, 5.0, 9.0, 6.0, 9.0, 9.0, 15.0, 20.0, 20.0, 31.0, 44.0, 59.0, 109.0, 179.0, 308.0, 664.0, 1729.0, 6093.0, 32964.0, 477908.0, 3264440.0, 372147.0, 29329.0, 5298.0, 1528.0, 639.0, 273.0, 145.0, 70.0, 49.0, 31.0, 31.0, 36.0, 13.0, 13.0, 15.0, 6.0, 7.0, 5.0, 3.0, 7.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.75, -20.1298828125, -19.509765625, -18.8896484375, -18.26953125, -17.6494140625, -17.029296875, -16.4091796875, -15.7890625, -15.1689453125, -14.548828125, -13.9287109375, -13.30859375, -12.6884765625, -12.068359375, -11.4482421875, -10.828125, -10.2080078125, -9.587890625, -8.9677734375, -8.34765625, -7.7275390625, -7.107421875, -6.4873046875, -5.8671875, -5.2470703125, -4.626953125, -4.0068359375, -3.38671875, -2.7666015625, -2.146484375, -1.5263671875, -0.90625, -0.2861328125, 0.333984375, 0.9541015625, 1.57421875, 2.1943359375, 2.814453125, 3.4345703125, 4.0546875, 4.6748046875, 5.294921875, 5.9150390625, 6.53515625, 7.1552734375, 7.775390625, 8.3955078125, 9.015625, 9.6357421875, 10.255859375, 10.8759765625, 11.49609375, 12.1162109375, 12.736328125, 13.3564453125, 13.9765625, 14.5966796875, 15.216796875, 15.8369140625, 16.45703125, 17.0771484375, 17.697265625, 18.3173828125, 18.9375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 8.0, 7.0, 7.0, 10.0, 16.0, 15.0, 24.0, 35.0, 40.0, 78.0, 92.0, 102.0, 147.0, 221.0, 342.0, 448.0, 519.0, 521.0, 378.0, 271.0, 204.0, 152.0, 88.0, 104.0, 57.0, 49.0, 27.0, 23.0, 16.0, 18.0, 11.0, 13.0, 7.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.78125, -9.4027099609375, -9.024169921875, -8.6456298828125, -8.26708984375, -7.8885498046875, -7.510009765625, -7.1314697265625, -6.7529296875, -6.3743896484375, -5.995849609375, -5.6173095703125, -5.23876953125, -4.8602294921875, -4.481689453125, -4.1031494140625, -3.724609375, -3.3460693359375, -2.967529296875, -2.5889892578125, -2.21044921875, -1.8319091796875, -1.453369140625, -1.0748291015625, -0.6962890625, -0.3177490234375, 0.060791015625, 0.4393310546875, 0.81787109375, 1.1964111328125, 1.574951171875, 1.9534912109375, 2.33203125, 2.7105712890625, 3.089111328125, 3.4676513671875, 3.84619140625, 4.2247314453125, 4.603271484375, 4.9818115234375, 5.3603515625, 5.7388916015625, 6.117431640625, 6.4959716796875, 6.87451171875, 7.2530517578125, 7.631591796875, 8.0101318359375, 8.388671875, 8.7672119140625, 9.145751953125, 9.5242919921875, 9.90283203125, 10.2813720703125, 10.659912109375, 11.0384521484375, 11.4169921875, 11.7955322265625, 12.174072265625, 12.5526123046875, 12.93115234375, 13.3096923828125, 13.688232421875, 14.0667724609375, 14.4453125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 8.0, 11.0, 12.0, 18.0, 21.0, 19.0, 26.0, 39.0, 40.0, 67.0, 90.0, 123.0, 181.0, 227.0, 421.0, 1610.0, 11701.0, 313473.0, 3789335.0, 69855.0, 5007.0, 859.0, 330.0, 215.0, 141.0, 100.0, 79.0, 66.0, 54.0, 43.0, 31.0, 26.0, 16.0, 10.0, 10.0, 9.0, 7.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.125, -47.55615234375, -45.9873046875, -44.41845703125, -42.849609375, -41.28076171875, -39.7119140625, -38.14306640625, -36.57421875, -35.00537109375, -33.4365234375, -31.86767578125, -30.298828125, -28.72998046875, -27.1611328125, -25.59228515625, -24.0234375, -22.45458984375, -20.8857421875, -19.31689453125, -17.748046875, -16.17919921875, -14.6103515625, -13.04150390625, -11.47265625, -9.90380859375, -8.3349609375, -6.76611328125, -5.197265625, -3.62841796875, -2.0595703125, -0.49072265625, 1.078125, 2.64697265625, 4.2158203125, 5.78466796875, 7.353515625, 8.92236328125, 10.4912109375, 12.06005859375, 13.62890625, 15.19775390625, 16.7666015625, 18.33544921875, 19.904296875, 21.47314453125, 23.0419921875, 24.61083984375, 26.1796875, 27.74853515625, 29.3173828125, 30.88623046875, 32.455078125, 34.02392578125, 35.5927734375, 37.16162109375, 38.73046875, 40.29931640625, 41.8681640625, 43.43701171875, 45.005859375, 46.57470703125, 48.1435546875, 49.71240234375, 51.28125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.0, 490.0, 462.0, 35.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-441.9351806640625, -429.9822082519531, -418.02923583984375, -406.07623291015625, -394.1232604980469, -382.1702880859375, -370.21728515625, -358.2643127441406, -346.31134033203125, -334.3583679199219, -322.4053955078125, -310.452392578125, -298.4994201660156, -286.54644775390625, -274.59344482421875, -262.6404724121094, -250.6875, -238.73452758789062, -226.7815399169922, -214.82855224609375, -202.87557983398438, -190.922607421875, -178.96961975097656, -167.01663208007812, -155.06365966796875, -143.11068725585938, -131.15769958496094, -119.20471954345703, -107.25173950195312, -95.29875946044922, -83.34577941894531, -71.3927993774414, -59.4398193359375, -47.486839294433594, -35.53385925292969, -23.58087921142578, -11.627899169921875, 0.32508087158203125, 12.278060913085938, 24.231040954589844, 36.18402099609375, 48.137001037597656, 60.08998107910156, 72.04296112060547, 83.99594116210938, 95.94892120361328, 107.90190124511719, 119.8548812866211, 131.807861328125, 143.76083374023438, 155.7138214111328, 167.66680908203125, 179.61978149414062, 191.57275390625, 203.52574157714844, 215.47872924804688, 227.43170166015625, 239.38467407226562, 251.33766174316406, 263.2906494140625, 275.2436218261719, 287.19659423828125, 299.14959716796875, 311.1025695800781, 323.0555419921875]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 8.0, 5.0, 9.0, 8.0, 15.0, 16.0, 24.0, 18.0, 21.0, 26.0, 31.0, 30.0, 38.0, 43.0, 39.0, 46.0, 34.0, 46.0, 38.0, 49.0, 41.0, 35.0, 43.0, 36.0, 37.0, 43.0, 25.0, 27.0, 21.0, 27.0, 21.0, 19.0, 22.0, 11.0, 5.0, 7.0, 7.0, 5.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.18537521362305, -38.84290313720703, -37.50043487548828, -36.157962799072266, -34.81549072265625, -33.4730224609375, -32.130550384521484, -30.7880802154541, -29.44561004638672, -28.103139877319336, -26.760669708251953, -25.418197631835938, -24.075727462768555, -22.733257293701172, -21.390785217285156, -20.048315048217773, -18.70584487915039, -17.363374710083008, -16.020904541015625, -14.67843246459961, -13.335962295532227, -11.993492126464844, -10.651021003723145, -9.308549880981445, -7.9660797119140625, -6.6236090660095215, -5.2811384201049805, -3.9386677742004395, -2.5961971282958984, -1.2537264823913574, 0.0887441635131836, 1.4312152862548828, 2.7736892700195312, 4.116159915924072, 5.458630561828613, 6.801101207733154, 8.143571853637695, 9.486042022705078, 10.828513145446777, 12.170984268188477, 13.51345443725586, 14.855924606323242, 16.198394775390625, 17.54086685180664, 18.883337020874023, 20.225807189941406, 21.568279266357422, 22.910749435424805, 24.253219604492188, 25.59568977355957, 26.938159942626953, 28.28063201904297, 29.62310218811035, 30.965572357177734, 32.30804443359375, 33.6505126953125, 34.992984771728516, 36.33545684814453, 37.67792510986328, 39.0203971862793, 40.36286926269531, 41.70533752441406, 43.04780960083008, 44.390281677246094, 45.732749938964844]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 2.0, 4.0, 4.0, 8.0, 15.0, 9.0, 13.0, 16.0, 20.0, 30.0, 25.0, 29.0, 25.0, 33.0, 33.0, 33.0, 32.0, 38.0, 36.0, 42.0, 51.0, 46.0, 43.0, 43.0, 28.0, 35.0, 36.0, 21.0, 29.0, 21.0, 28.0, 24.0, 17.0, 13.0, 24.0, 20.0, 16.0, 9.0, 14.0, 4.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.81640625, -6.6019287109375, -6.387451171875, -6.1729736328125, -5.95849609375, -5.7440185546875, -5.529541015625, -5.3150634765625, -5.1005859375, -4.8861083984375, -4.671630859375, -4.4571533203125, -4.24267578125, -4.0281982421875, -3.813720703125, -3.5992431640625, -3.384765625, -3.1702880859375, -2.955810546875, -2.7413330078125, -2.52685546875, -2.3123779296875, -2.097900390625, -1.8834228515625, -1.6689453125, -1.4544677734375, -1.239990234375, -1.0255126953125, -0.81103515625, -0.5965576171875, -0.382080078125, -0.1676025390625, 0.046875, 0.2613525390625, 0.475830078125, 0.6903076171875, 0.90478515625, 1.1192626953125, 1.333740234375, 1.5482177734375, 1.7626953125, 1.9771728515625, 2.191650390625, 2.4061279296875, 2.62060546875, 2.8350830078125, 3.049560546875, 3.2640380859375, 3.478515625, 3.6929931640625, 3.907470703125, 4.1219482421875, 4.33642578125, 4.5509033203125, 4.765380859375, 4.9798583984375, 5.1943359375, 5.4088134765625, 5.623291015625, 5.8377685546875, 6.05224609375, 6.2667236328125, 6.481201171875, 6.6956787109375, 6.91015625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 9.0, 8.0, 20.0, 13.0, 25.0, 54.0, 70.0, 83.0, 177.0, 256.0, 396.0, 572.0, 913.0, 1417.0, 2190.0, 3333.0, 5294.0, 7969.0, 12149.0, 18827.0, 30262.0, 49770.0, 87737.0, 181942.0, 293552.0, 153241.0, 77270.0, 44555.0, 27460.0, 17452.0, 10960.0, 7161.0, 4738.0, 3039.0, 1953.0, 1244.0, 867.0, 532.0, 351.0, 242.0, 161.0, 107.0, 64.0, 44.0, 33.0, 13.0, 17.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.28466796875, -0.2756004333496094, -0.26653289794921875, -0.2574653625488281, -0.2483978271484375, -0.23933029174804688, -0.23026275634765625, -0.22119522094726562, -0.212127685546875, -0.20306015014648438, -0.19399261474609375, -0.18492507934570312, -0.1758575439453125, -0.16679000854492188, -0.15772247314453125, -0.14865493774414062, -0.13958740234375, -0.13051986694335938, -0.12145233154296875, -0.11238479614257812, -0.1033172607421875, -0.09424972534179688, -0.08518218994140625, -0.07611465454101562, -0.067047119140625, -0.057979583740234375, -0.04891204833984375, -0.039844512939453125, -0.0307769775390625, -0.021709442138671875, -0.01264190673828125, -0.003574371337890625, 0.0054931640625, 0.014560699462890625, 0.02362823486328125, 0.032695770263671875, 0.0417633056640625, 0.050830841064453125, 0.05989837646484375, 0.06896591186523438, 0.078033447265625, 0.08710098266601562, 0.09616851806640625, 0.10523605346679688, 0.1143035888671875, 0.12337112426757812, 0.13243865966796875, 0.14150619506835938, 0.15057373046875, 0.15964126586914062, 0.16870880126953125, 0.17777633666992188, 0.1868438720703125, 0.19591140747070312, 0.20497894287109375, 0.21404647827148438, 0.223114013671875, 0.23218154907226562, 0.24124908447265625, 0.2503166198730469, 0.2593841552734375, 0.2684516906738281, 0.27751922607421875, 0.2865867614746094, 0.295654296875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 7.0, 6.0, 9.0, 6.0, 5.0, 12.0, 14.0, 12.0, 14.0, 16.0, 21.0, 16.0, 33.0, 24.0, 26.0, 22.0, 32.0, 33.0, 39.0, 31.0, 43.0, 48.0, 1067.0, 35.0, 32.0, 38.0, 45.0, 30.0, 26.0, 31.0, 35.0, 28.0, 32.0, 22.0, 21.0, 17.0, 17.0, 13.0, 15.0, 7.0, 7.0, 8.0, 8.0, 7.0, 3.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.62890625, -4.4925537109375, -4.356201171875, -4.2198486328125, -4.08349609375, -3.9471435546875, -3.810791015625, -3.6744384765625, -3.5380859375, -3.4017333984375, -3.265380859375, -3.1290283203125, -2.99267578125, -2.8563232421875, -2.719970703125, -2.5836181640625, -2.447265625, -2.3109130859375, -2.174560546875, -2.0382080078125, -1.90185546875, -1.7655029296875, -1.629150390625, -1.4927978515625, -1.3564453125, -1.2200927734375, -1.083740234375, -0.9473876953125, -0.81103515625, -0.6746826171875, -0.538330078125, -0.4019775390625, -0.265625, -0.1292724609375, 0.007080078125, 0.1434326171875, 0.27978515625, 0.4161376953125, 0.552490234375, 0.6888427734375, 0.8251953125, 0.9615478515625, 1.097900390625, 1.2342529296875, 1.37060546875, 1.5069580078125, 1.643310546875, 1.7796630859375, 1.916015625, 2.0523681640625, 2.188720703125, 2.3250732421875, 2.46142578125, 2.5977783203125, 2.734130859375, 2.8704833984375, 3.0068359375, 3.1431884765625, 3.279541015625, 3.4158935546875, 3.55224609375, 3.6885986328125, 3.824951171875, 3.9613037109375, 4.09765625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 8.0, 13.0, 14.0, 31.0, 36.0, 68.0, 91.0, 118.0, 158.0, 222.0, 355.0, 513.0, 734.0, 1008.0, 1522.0, 2127.0, 3156.0, 4405.0, 6738.0, 10153.0, 15479.0, 23715.0, 37888.0, 63250.0, 115528.0, 758753.0, 764319.0, 115402.0, 63017.0, 37974.0, 23905.0, 15233.0, 10206.0, 6657.0, 4492.0, 3056.0, 2073.0, 1432.0, 1048.0, 700.0, 505.0, 304.0, 225.0, 165.0, 108.0, 70.0, 57.0, 36.0, 23.0, 21.0, 9.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.263916015625, -0.25566864013671875, -0.2474212646484375, -0.23917388916015625, -0.230926513671875, -0.22267913818359375, -0.2144317626953125, -0.20618438720703125, -0.19793701171875, -0.18968963623046875, -0.1814422607421875, -0.17319488525390625, -0.164947509765625, -0.15670013427734375, -0.1484527587890625, -0.14020538330078125, -0.1319580078125, -0.12371063232421875, -0.1154632568359375, -0.10721588134765625, -0.098968505859375, -0.09072113037109375, -0.0824737548828125, -0.07422637939453125, -0.06597900390625, -0.05773162841796875, -0.0494842529296875, -0.04123687744140625, -0.032989501953125, -0.02474212646484375, -0.0164947509765625, -0.00824737548828125, 0.0, 0.00824737548828125, 0.0164947509765625, 0.02474212646484375, 0.032989501953125, 0.04123687744140625, 0.0494842529296875, 0.05773162841796875, 0.06597900390625, 0.07422637939453125, 0.0824737548828125, 0.09072113037109375, 0.098968505859375, 0.10721588134765625, 0.1154632568359375, 0.12371063232421875, 0.1319580078125, 0.14020538330078125, 0.1484527587890625, 0.15670013427734375, 0.164947509765625, 0.17319488525390625, 0.1814422607421875, 0.18968963623046875, 0.19793701171875, 0.20618438720703125, 0.2144317626953125, 0.22267913818359375, 0.230926513671875, 0.23917388916015625, 0.2474212646484375, 0.25566864013671875, 0.263916015625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 9.0, 5.0, 17.0, 12.0, 8.0, 21.0, 27.0, 37.0, 43.0, 48.0, 58.0, 63.0, 63.0, 57.0, 64.0, 69.0, 53.0, 53.0, 58.0, 48.0, 35.0, 37.0, 25.0, 31.0, 14.0, 16.0, 9.0, 5.0, 6.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.389617919921875e-05, -6.204750388860703e-05, -6.01988285779953e-05, -5.8350153267383575e-05, -5.650147795677185e-05, -5.4652802646160126e-05, -5.28041273355484e-05, -5.0955452024936676e-05, -4.910677671432495e-05, -4.7258101403713226e-05, -4.54094260931015e-05, -4.3560750782489777e-05, -4.171207547187805e-05, -3.986340016126633e-05, -3.80147248506546e-05, -3.616604954004288e-05, -3.431737422943115e-05, -3.246869891881943e-05, -3.06200236082077e-05, -2.8771348297595978e-05, -2.6922672986984253e-05, -2.5073997676372528e-05, -2.3225322365760803e-05, -2.137664705514908e-05, -1.9527971744537354e-05, -1.767929643392563e-05, -1.5830621123313904e-05, -1.3981945812702179e-05, -1.2133270502090454e-05, -1.028459519147873e-05, -8.435919880867004e-06, -6.5872445702552795e-06, -4.738569259643555e-06, -2.88989394903183e-06, -1.041218638420105e-06, 8.074566721916199e-07, 2.6561319828033447e-06, 4.50480729341507e-06, 6.3534826040267944e-06, 8.20215791463852e-06, 1.0050833225250244e-05, 1.1899508535861969e-05, 1.3748183846473694e-05, 1.559685915708542e-05, 1.7445534467697144e-05, 1.929420977830887e-05, 2.1142885088920593e-05, 2.2991560399532318e-05, 2.4840235710144043e-05, 2.6688911020755768e-05, 2.8537586331367493e-05, 3.0386261641979218e-05, 3.223493695259094e-05, 3.408361226320267e-05, 3.593228757381439e-05, 3.778096288442612e-05, 3.962963819503784e-05, 4.147831350564957e-05, 4.332698881626129e-05, 4.5175664126873016e-05, 4.702433943748474e-05, 4.8873014748096466e-05, 5.072169005870819e-05, 5.2570365369319916e-05, 5.441904067993164e-05]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 10.0, 16.0, 25.0, 31.0, 47.0, 59.0, 76.0, 113.0, 163.0, 311.0, 1000.0, 780270.0, 264721.0, 836.0, 294.0, 161.0, 115.0, 72.0, 60.0, 39.0, 41.0, 18.0, 15.0, 19.0, 9.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00118255615234375, -0.0011416822671890259, -0.0011008083820343018, -0.0010599344968795776, -0.0010190606117248535, -0.0009781867265701294, -0.0009373128414154053, -0.0008964389562606812, -0.000855565071105957, -0.0008146911859512329, -0.0007738173007965088, -0.0007329434156417847, -0.0006920695304870605, -0.0006511956453323364, -0.0006103217601776123, -0.0005694478750228882, -0.0005285739898681641, -0.00048770010471343994, -0.0004468262195587158, -0.0004059523344039917, -0.0003650784492492676, -0.00032420456409454346, -0.00028333067893981934, -0.00024245679378509521, -0.0002015829086303711, -0.00016070902347564697, -0.00011983513832092285, -7.896125316619873e-05, -3.808736801147461e-05, 2.7865171432495117e-06, 4.366040229797363e-05, 8.453428745269775e-05, 0.00012540817260742188, 0.000166282057762146, 0.00020715594291687012, 0.00024802982807159424, 0.00028890371322631836, 0.0003297775983810425, 0.0003706514835357666, 0.0004115253686904907, 0.00045239925384521484, 0.000493273138999939, 0.0005341470241546631, 0.0005750209093093872, 0.0006158947944641113, 0.0006567686796188354, 0.0006976425647735596, 0.0007385164499282837, 0.0007793903350830078, 0.0008202642202377319, 0.0008611381053924561, 0.0009020119905471802, 0.0009428858757019043, 0.0009837597608566284, 0.0010246336460113525, 0.0010655075311660767, 0.0011063814163208008, 0.001147255301475525, 0.001188129186630249, 0.0012290030717849731, 0.0012698769569396973, 0.0013107508420944214, 0.0013516247272491455, 0.0013924986124038696, 0.0014333724975585938]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 11.0, 36.0, 59.0, 154.0, 232.0, 204.0, 168.0, 90.0, 31.0, 15.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.558579424454365e-05, -1.3874724572815467e-05, -1.2163654901087284e-05, -1.04525843198644e-05, -8.741514648136217e-06, -7.0304449764080346e-06, -5.31937439518515e-06, -3.6083047234569676e-06, -1.897235051728785e-06, -1.86165152626927e-07, 1.524904746474931e-06, 3.2359748729504645e-06, 4.947044544678647e-06, 6.65811421640683e-06, 8.369184797629714e-06, 1.0080254469357897e-05, 1.179132414108608e-05, 1.3502393812814262e-05, 1.5213463484542444e-05, 1.692453406576533e-05, 1.8635604646988213e-05, 2.0346673409221694e-05, 2.2057743990444578e-05, 2.3768814571667463e-05, 2.5479883333900943e-05, 2.7190953915123828e-05, 2.890202267735731e-05, 3.061309325858019e-05, 3.2324162020813674e-05, 3.403523442102596e-05, 3.574630318325944e-05, 3.745737194549292e-05, 3.916844434570521e-05, 4.087951310793869e-05, 4.259058550815098e-05, 4.430165427038446e-05, 4.601272303261794e-05, 4.772379179485142e-05, 4.943486419506371e-05, 5.114593295729719e-05, 5.285700171953067e-05, 5.456807048176415e-05, 5.627914288197644e-05, 5.799021164420992e-05, 5.97012804064434e-05, 6.141234916867688e-05, 6.312342156888917e-05, 6.483449396910146e-05, 6.654555909335613e-05, 6.825663149356842e-05, 6.99676966178231e-05, 7.167876901803538e-05, 7.338984141824767e-05, 7.510090654250234e-05, 7.681197894271463e-05, 7.852305134292692e-05, 8.023412374313921e-05, 8.19451961433515e-05, 8.365626126760617e-05, 8.536733366781846e-05, 8.707840606803074e-05, 8.878947119228542e-05, 9.05005435924977e-05, 9.221161599271e-05, 9.392268111696467e-05]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 2.0, 1.0, 6.0, 5.0, 5.0, 3.0, 6.0, 4.0, 13.0, 11.0, 10.0, 20.0, 19.0, 17.0, 16.0, 34.0, 28.0, 31.0, 30.0, 24.0, 37.0, 34.0, 37.0, 36.0, 43.0, 45.0, 34.0, 33.0, 46.0, 37.0, 22.0, 37.0, 27.0, 27.0, 29.0, 25.0, 29.0, 30.0, 20.0, 17.0, 19.0, 19.0, 9.0, 8.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.2351741790771484e-05, -2.1577812731266022e-05, -2.080388367176056e-05, -2.0029954612255096e-05, -1.9256025552749634e-05, -1.848209649324417e-05, -1.770816743373871e-05, -1.6934238374233246e-05, -1.6160309314727783e-05, -1.538638025522232e-05, -1.4612451195716858e-05, -1.3838522136211395e-05, -1.3064593076705933e-05, -1.229066401720047e-05, -1.1516734957695007e-05, -1.0742805898189545e-05, -9.968876838684082e-06, -9.19494777917862e-06, -8.421018719673157e-06, -7.647089660167694e-06, -6.8731606006622314e-06, -6.099231541156769e-06, -5.325302481651306e-06, -4.5513734221458435e-06, -3.777444362640381e-06, -3.0035153031349182e-06, -2.2295862436294556e-06, -1.455657184123993e-06, -6.817281246185303e-07, 9.220093488693237e-08, 8.66129994392395e-07, 1.6400590538978577e-06, 2.4139881134033203e-06, 3.187917172908783e-06, 3.961846232414246e-06, 4.735775291919708e-06, 5.509704351425171e-06, 6.2836334109306335e-06, 7.057562470436096e-06, 7.831491529941559e-06, 8.605420589447021e-06, 9.379349648952484e-06, 1.0153278708457947e-05, 1.092720776796341e-05, 1.1701136827468872e-05, 1.2475065886974335e-05, 1.3248994946479797e-05, 1.402292400598526e-05, 1.4796853065490723e-05, 1.5570782124996185e-05, 1.6344711184501648e-05, 1.711864024400711e-05, 1.7892569303512573e-05, 1.8666498363018036e-05, 1.94404274225235e-05, 2.021435648202896e-05, 2.0988285541534424e-05, 2.1762214601039886e-05, 2.253614366054535e-05, 2.3310072720050812e-05, 2.4084001779556274e-05, 2.4857930839061737e-05, 2.56318598985672e-05, 2.6405788958072662e-05, 2.7179718017578125e-05]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 2.0, 4.0, 4.0, 8.0, 15.0, 9.0, 13.0, 16.0, 20.0, 30.0, 25.0, 29.0, 25.0, 33.0, 33.0, 33.0, 32.0, 38.0, 36.0, 42.0, 51.0, 46.0, 43.0, 43.0, 28.0, 35.0, 36.0, 21.0, 29.0, 21.0, 28.0, 24.0, 17.0, 13.0, 24.0, 20.0, 16.0, 9.0, 14.0, 4.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.81640625, -6.6019287109375, -6.387451171875, -6.1729736328125, -5.95849609375, -5.7440185546875, -5.529541015625, -5.3150634765625, -5.1005859375, -4.8861083984375, -4.671630859375, -4.4571533203125, -4.24267578125, -4.0281982421875, -3.813720703125, -3.5992431640625, -3.384765625, -3.1702880859375, -2.955810546875, -2.7413330078125, -2.52685546875, -2.3123779296875, -2.097900390625, -1.8834228515625, -1.6689453125, -1.4544677734375, -1.239990234375, -1.0255126953125, -0.81103515625, -0.5965576171875, -0.382080078125, -0.1676025390625, 0.046875, 0.2613525390625, 0.475830078125, 0.6903076171875, 0.90478515625, 1.1192626953125, 1.333740234375, 1.5482177734375, 1.7626953125, 1.9771728515625, 2.191650390625, 2.4061279296875, 2.62060546875, 2.8350830078125, 3.049560546875, 3.2640380859375, 3.478515625, 3.6929931640625, 3.907470703125, 4.1219482421875, 4.33642578125, 4.5509033203125, 4.765380859375, 4.9798583984375, 5.1943359375, 5.4088134765625, 5.623291015625, 5.8377685546875, 6.05224609375, 6.2667236328125, 6.481201171875, 6.6956787109375, 6.91015625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 7.0, 2.0, 7.0, 3.0, 5.0, 6.0, 9.0, 17.0, 11.0, 25.0, 29.0, 46.0, 57.0, 83.0, 88.0, 134.0, 203.0, 314.0, 573.0, 1150.0, 3354.0, 12438.0, 83705.0, 716066.0, 199276.0, 22396.0, 4917.0, 1669.0, 760.0, 399.0, 243.0, 150.0, 96.0, 74.0, 48.0, 36.0, 28.0, 30.0, 28.0, 21.0, 11.0, 15.0, 6.0, 9.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.6953125, -13.262939453125, -12.83056640625, -12.398193359375, -11.9658203125, -11.533447265625, -11.10107421875, -10.668701171875, -10.236328125, -9.803955078125, -9.37158203125, -8.939208984375, -8.5068359375, -8.074462890625, -7.64208984375, -7.209716796875, -6.77734375, -6.344970703125, -5.91259765625, -5.480224609375, -5.0478515625, -4.615478515625, -4.18310546875, -3.750732421875, -3.318359375, -2.885986328125, -2.45361328125, -2.021240234375, -1.5888671875, -1.156494140625, -0.72412109375, -0.291748046875, 0.140625, 0.572998046875, 1.00537109375, 1.437744140625, 1.8701171875, 2.302490234375, 2.73486328125, 3.167236328125, 3.599609375, 4.031982421875, 4.46435546875, 4.896728515625, 5.3291015625, 5.761474609375, 6.19384765625, 6.626220703125, 7.05859375, 7.490966796875, 7.92333984375, 8.355712890625, 8.7880859375, 9.220458984375, 9.65283203125, 10.085205078125, 10.517578125, 10.949951171875, 11.38232421875, 11.814697265625, 12.2470703125, 12.679443359375, 13.11181640625, 13.544189453125, 13.9765625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 5.0, 4.0, 3.0, 9.0, 7.0, 13.0, 20.0, 14.0, 23.0, 31.0, 42.0, 43.0, 50.0, 54.0, 51.0, 77.0, 134.0, 1704.0, 313.0, 68.0, 60.0, 44.0, 49.0, 40.0, 32.0, 28.0, 10.0, 22.0, 19.0, 18.0, 7.0, 9.0, 8.0, 9.0, 10.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.28125, -27.390625, -26.5, -25.609375, -24.71875, -23.828125, -22.9375, -22.046875, -21.15625, -20.265625, -19.375, -18.484375, -17.59375, -16.703125, -15.8125, -14.921875, -14.03125, -13.140625, -12.25, -11.359375, -10.46875, -9.578125, -8.6875, -7.796875, -6.90625, -6.015625, -5.125, -4.234375, -3.34375, -2.453125, -1.5625, -0.671875, 0.21875, 1.109375, 2.0, 2.890625, 3.78125, 4.671875, 5.5625, 6.453125, 7.34375, 8.234375, 9.125, 10.015625, 10.90625, 11.796875, 12.6875, 13.578125, 14.46875, 15.359375, 16.25, 17.140625, 18.03125, 18.921875, 19.8125, 20.703125, 21.59375, 22.484375, 23.375, 24.265625, 25.15625, 26.046875, 26.9375, 27.828125, 28.71875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 10.0, 8.0, 10.0, 9.0, 7.0, 23.0, 17.0, 24.0, 24.0, 26.0, 60.0, 62.0, 98.0, 183.0, 378.0, 1756.0, 207117.0, 2931265.0, 3392.0, 543.0, 194.0, 146.0, 80.0, 70.0, 54.0, 41.0, 17.0, 19.0, 19.0, 8.0, 9.0, 8.0, 3.0, 5.0, 3.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-66.25, -64.1875, -62.125, -60.0625, -58.0, -55.9375, -53.875, -51.8125, -49.75, -47.6875, -45.625, -43.5625, -41.5, -39.4375, -37.375, -35.3125, -33.25, -31.1875, -29.125, -27.0625, -25.0, -22.9375, -20.875, -18.8125, -16.75, -14.6875, -12.625, -10.5625, -8.5, -6.4375, -4.375, -2.3125, -0.25, 1.8125, 3.875, 5.9375, 8.0, 10.0625, 12.125, 14.1875, 16.25, 18.3125, 20.375, 22.4375, 24.5, 26.5625, 28.625, 30.6875, 32.75, 34.8125, 36.875, 38.9375, 41.0, 43.0625, 45.125, 47.1875, 49.25, 51.3125, 53.375, 55.4375, 57.5, 59.5625, 61.625, 63.6875, 65.75]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 193.0, 767.0, 51.0, 1.0, 1.0], "bins": [-314.2157897949219, -309.0068054199219, -303.7978210449219, -298.5888366699219, -293.37982177734375, -288.17083740234375, -282.96185302734375, -277.75286865234375, -272.54388427734375, -267.33489990234375, -262.12591552734375, -256.91693115234375, -251.7079315185547, -246.4989471435547, -241.28994750976562, -236.08096313476562, -230.87197875976562, -225.66299438476562, -220.45399475097656, -215.24501037597656, -210.03602600097656, -204.82704162597656, -199.6180419921875, -194.4090576171875, -189.20005798339844, -183.99107360839844, -178.78207397460938, -173.57308959960938, -168.36410522460938, -163.15512084960938, -157.9461212158203, -152.7371368408203, -147.5281524658203, -142.3191680908203, -137.11016845703125, -131.90118408203125, -126.69219970703125, -121.48320770263672, -116.27421569824219, -111.06523132324219, -105.85624694824219, -100.64725494384766, -95.43827056884766, -90.22927856445312, -85.02029418945312, -79.8113021850586, -74.60231018066406, -69.39332580566406, -64.18434143066406, -58.9753532409668, -53.76636505126953, -48.557373046875, -43.348388671875, -38.13939666748047, -32.9304084777832, -27.721420288085938, -22.51243019104004, -17.303442001342773, -12.094452857971191, -6.885463714599609, -1.6764755249023438, 3.532512664794922, 8.74150276184082, 13.950490951538086, 19.15947914123535]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 5.0, 5.0, 10.0, 21.0, 13.0, 17.0, 16.0, 19.0, 22.0, 31.0, 28.0, 37.0, 39.0, 43.0, 38.0, 34.0, 44.0, 39.0, 38.0, 36.0, 45.0, 43.0, 34.0, 31.0, 36.0, 32.0, 31.0, 35.0, 24.0, 16.0, 20.0, 15.0, 15.0, 19.0, 10.0, 13.0, 7.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-68.42091369628906, -66.35364532470703, -64.286376953125, -62.21910858154297, -60.15184020996094, -58.084571838378906, -56.017303466796875, -53.950035095214844, -51.88276672363281, -49.81549835205078, -47.74822998046875, -45.68096160888672, -43.61369323730469, -41.546424865722656, -39.479156494140625, -37.411888122558594, -35.34461975097656, -33.27735137939453, -31.2100830078125, -29.14281463623047, -27.075546264648438, -25.008277893066406, -22.941009521484375, -20.873741149902344, -18.806472778320312, -16.73920440673828, -14.67193603515625, -12.604667663574219, -10.537399291992188, -8.470130920410156, -6.402862548828125, -4.335594177246094, -2.268329620361328, -0.20106124877929688, 1.8662071228027344, 3.9334754943847656, 6.000743865966797, 8.068012237548828, 10.13528060913086, 12.20254898071289, 14.269817352294922, 16.337085723876953, 18.404354095458984, 20.471622467041016, 22.538890838623047, 24.606159210205078, 26.67342758178711, 28.74069595336914, 30.807964324951172, 32.8752326965332, 34.942501068115234, 37.009769439697266, 39.0770378112793, 41.14430618286133, 43.21157455444336, 45.27884292602539, 47.34611129760742, 49.41337966918945, 51.480648040771484, 53.547916412353516, 55.61518478393555, 57.68245315551758, 59.74972152709961, 61.81698989868164, 63.88425827026367]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 3.0, 3.0, 4.0, 8.0, 17.0, 9.0, 13.0, 13.0, 25.0, 25.0, 21.0, 21.0, 20.0, 41.0, 17.0, 36.0, 31.0, 51.0, 44.0, 35.0, 38.0, 39.0, 42.0, 36.0, 40.0, 30.0, 36.0, 33.0, 24.0, 27.0, 23.0, 29.0, 21.0, 15.0, 8.0, 20.0, 19.0, 16.0, 12.0, 11.0, 8.0, 11.0, 2.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6171875, -6.4071044921875, -6.197021484375, -5.9869384765625, -5.77685546875, -5.5667724609375, -5.356689453125, -5.1466064453125, -4.9365234375, -4.7264404296875, -4.516357421875, -4.3062744140625, -4.09619140625, -3.8861083984375, -3.676025390625, -3.4659423828125, -3.255859375, -3.0457763671875, -2.835693359375, -2.6256103515625, -2.41552734375, -2.2054443359375, -1.995361328125, -1.7852783203125, -1.5751953125, -1.3651123046875, -1.155029296875, -0.9449462890625, -0.73486328125, -0.5247802734375, -0.314697265625, -0.1046142578125, 0.10546875, 0.3155517578125, 0.525634765625, 0.7357177734375, 0.94580078125, 1.1558837890625, 1.365966796875, 1.5760498046875, 1.7861328125, 1.9962158203125, 2.206298828125, 2.4163818359375, 2.62646484375, 2.8365478515625, 3.046630859375, 3.2567138671875, 3.466796875, 3.6768798828125, 3.886962890625, 4.0970458984375, 4.30712890625, 4.5172119140625, 4.727294921875, 4.9373779296875, 5.1474609375, 5.3575439453125, 5.567626953125, 5.7777099609375, 5.98779296875, 6.1978759765625, 6.407958984375, 6.6180419921875, 6.828125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 4.0, 11.0, 11.0, 10.0, 11.0, 21.0, 26.0, 33.0, 49.0, 76.0, 111.0, 182.0, 290.0, 619.0, 1049.0, 2190.0, 5470.0, 15726.0, 63065.0, 614171.0, 2813263.0, 589927.0, 62803.0, 15207.0, 5288.0, 2268.0, 1015.0, 556.0, 254.0, 207.0, 113.0, 64.0, 37.0, 45.0, 18.0, 20.0, 12.0, 15.0, 4.0, 12.0, 6.0, 6.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.0390625, -14.5615234375, -14.083984375, -13.6064453125, -13.12890625, -12.6513671875, -12.173828125, -11.6962890625, -11.21875, -10.7412109375, -10.263671875, -9.7861328125, -9.30859375, -8.8310546875, -8.353515625, -7.8759765625, -7.3984375, -6.9208984375, -6.443359375, -5.9658203125, -5.48828125, -5.0107421875, -4.533203125, -4.0556640625, -3.578125, -3.1005859375, -2.623046875, -2.1455078125, -1.66796875, -1.1904296875, -0.712890625, -0.2353515625, 0.2421875, 0.7197265625, 1.197265625, 1.6748046875, 2.15234375, 2.6298828125, 3.107421875, 3.5849609375, 4.0625, 4.5400390625, 5.017578125, 5.4951171875, 5.97265625, 6.4501953125, 6.927734375, 7.4052734375, 7.8828125, 8.3603515625, 8.837890625, 9.3154296875, 9.79296875, 10.2705078125, 10.748046875, 11.2255859375, 11.703125, 12.1806640625, 12.658203125, 13.1357421875, 13.61328125, 14.0908203125, 14.568359375, 15.0458984375, 15.5234375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 9.0, 5.0, 8.0, 14.0, 31.0, 39.0, 44.0, 59.0, 88.0, 106.0, 168.0, 222.0, 347.0, 480.0, 533.0, 585.0, 390.0, 298.0, 188.0, 116.0, 102.0, 71.0, 47.0, 38.0, 14.0, 19.0, 17.0, 8.0, 9.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.609375, -14.2115478515625, -13.813720703125, -13.4158935546875, -13.01806640625, -12.6202392578125, -12.222412109375, -11.8245849609375, -11.4267578125, -11.0289306640625, -10.631103515625, -10.2332763671875, -9.83544921875, -9.4376220703125, -9.039794921875, -8.6419677734375, -8.244140625, -7.8463134765625, -7.448486328125, -7.0506591796875, -6.65283203125, -6.2550048828125, -5.857177734375, -5.4593505859375, -5.0615234375, -4.6636962890625, -4.265869140625, -3.8680419921875, -3.47021484375, -3.0723876953125, -2.674560546875, -2.2767333984375, -1.87890625, -1.4810791015625, -1.083251953125, -0.6854248046875, -0.28759765625, 0.1102294921875, 0.508056640625, 0.9058837890625, 1.3037109375, 1.7015380859375, 2.099365234375, 2.4971923828125, 2.89501953125, 3.2928466796875, 3.690673828125, 4.0885009765625, 4.486328125, 4.8841552734375, 5.281982421875, 5.6798095703125, 6.07763671875, 6.4754638671875, 6.873291015625, 7.2711181640625, 7.6689453125, 8.0667724609375, 8.464599609375, 8.8624267578125, 9.26025390625, 9.6580810546875, 10.055908203125, 10.4537353515625, 10.8515625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 5.0, 12.0, 9.0, 15.0, 29.0, 33.0, 36.0, 51.0, 66.0, 83.0, 111.0, 161.0, 234.0, 550.0, 1591.0, 8261.0, 104694.0, 3685290.0, 371088.0, 17705.0, 2534.0, 660.0, 300.0, 171.0, 158.0, 99.0, 75.0, 62.0, 45.0, 17.0, 24.0, 22.0, 17.0, 20.0, 8.0, 5.0, 10.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-41.21875, -39.99462890625, -38.7705078125, -37.54638671875, -36.322265625, -35.09814453125, -33.8740234375, -32.64990234375, -31.42578125, -30.20166015625, -28.9775390625, -27.75341796875, -26.529296875, -25.30517578125, -24.0810546875, -22.85693359375, -21.6328125, -20.40869140625, -19.1845703125, -17.96044921875, -16.736328125, -15.51220703125, -14.2880859375, -13.06396484375, -11.83984375, -10.61572265625, -9.3916015625, -8.16748046875, -6.943359375, -5.71923828125, -4.4951171875, -3.27099609375, -2.046875, -0.82275390625, 0.4013671875, 1.62548828125, 2.849609375, 4.07373046875, 5.2978515625, 6.52197265625, 7.74609375, 8.97021484375, 10.1943359375, 11.41845703125, 12.642578125, 13.86669921875, 15.0908203125, 16.31494140625, 17.5390625, 18.76318359375, 19.9873046875, 21.21142578125, 22.435546875, 23.65966796875, 24.8837890625, 26.10791015625, 27.33203125, 28.55615234375, 29.7802734375, 31.00439453125, 32.228515625, 33.45263671875, 34.6767578125, 35.90087890625, 37.125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 22.0, 302.0, 588.0, 100.0, 6.0, 2.0, 1.0, 1.0], "bins": [-540.53515625, -531.2622680664062, -521.9893188476562, -512.7164306640625, -503.44354248046875, -494.1706237792969, -484.8977355957031, -475.62481689453125, -466.3519287109375, -457.0790100097656, -447.8061218261719, -438.533203125, -429.26031494140625, -419.9873962402344, -410.7145080566406, -401.44158935546875, -392.168701171875, -382.8957824707031, -373.6228942871094, -364.3499755859375, -355.07708740234375, -345.8041687011719, -336.5312805175781, -327.25836181640625, -317.9854431152344, -308.7125244140625, -299.43963623046875, -290.1667175292969, -280.8938293457031, -271.62091064453125, -262.3480224609375, -253.07510375976562, -243.80221557617188, -234.52931213378906, -225.25640869140625, -215.98350524902344, -206.71060180664062, -197.4376983642578, -188.164794921875, -178.89187622070312, -169.61898803710938, -160.34608459472656, -151.07318115234375, -141.80027770996094, -132.52737426757812, -123.25447082519531, -113.98155975341797, -104.70865631103516, -95.43575286865234, -86.16284942626953, -76.88994598388672, -67.61703491210938, -58.34413528442383, -49.071231842041016, -39.79832458496094, -30.525421142578125, -21.252517700195312, -11.979613304138184, -2.7067089080810547, 6.566196441650391, 15.839099884033203, 25.112003326416016, 34.384910583496094, 43.657814025878906, 52.93071746826172]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 2.0, 6.0, 8.0, 9.0, 10.0, 11.0, 17.0, 14.0, 15.0, 17.0, 28.0, 23.0, 28.0, 30.0, 33.0, 34.0, 47.0, 38.0, 38.0, 36.0, 41.0, 46.0, 43.0, 30.0, 38.0, 28.0, 50.0, 27.0, 28.0, 24.0, 27.0, 39.0, 15.0, 20.0, 16.0, 11.0, 14.0, 13.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0], "bins": [-38.980796813964844, -37.87997055053711, -36.779144287109375, -35.678321838378906, -34.57749557495117, -33.47666931152344, -32.3758430480957, -31.27501678466797, -30.174192428588867, -29.073366165161133, -27.97254180908203, -26.871715545654297, -25.770889282226562, -24.67006492614746, -23.569238662719727, -22.468414306640625, -21.36758804321289, -20.266761779785156, -19.165937423706055, -18.06511116027832, -16.96428680419922, -15.863460540771484, -14.76263427734375, -13.661808967590332, -12.560983657836914, -11.460158348083496, -10.359333038330078, -9.258506774902344, -8.157681465148926, -7.056856155395508, -5.956030368804932, -4.8552045822143555, -3.7543811798095703, -2.6535556316375732, -1.5527300834655762, -0.4519045352935791, 0.648921012878418, 1.749746322631836, 2.850572109222412, 3.9513978958129883, 5.052223205566406, 6.153048515319824, 7.2538743019104, 8.354700088500977, 9.455525398254395, 10.556350708007812, 11.657176971435547, 12.758002281188965, 13.858827590942383, 14.9596529006958, 16.06047821044922, 17.161304473876953, 18.262130737304688, 19.36295509338379, 20.463781356811523, 21.564605712890625, 22.66543197631836, 23.766258239746094, 24.867082595825195, 25.96790885925293, 27.06873321533203, 28.169559478759766, 29.2703857421875, 30.371212005615234, 31.472036361694336]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 1.0, 3.0, 11.0, 11.0, 9.0, 14.0, 11.0, 19.0, 18.0, 19.0, 25.0, 25.0, 36.0, 33.0, 36.0, 32.0, 35.0, 42.0, 40.0, 43.0, 49.0, 39.0, 37.0, 42.0, 30.0, 28.0, 36.0, 30.0, 26.0, 29.0, 20.0, 20.0, 17.0, 22.0, 21.0, 20.0, 13.0, 15.0, 12.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.4453125, -7.2249755859375, -7.004638671875, -6.7843017578125, -6.56396484375, -6.3436279296875, -6.123291015625, -5.9029541015625, -5.6826171875, -5.4622802734375, -5.241943359375, -5.0216064453125, -4.80126953125, -4.5809326171875, -4.360595703125, -4.1402587890625, -3.919921875, -3.6995849609375, -3.479248046875, -3.2589111328125, -3.03857421875, -2.8182373046875, -2.597900390625, -2.3775634765625, -2.1572265625, -1.9368896484375, -1.716552734375, -1.4962158203125, -1.27587890625, -1.0555419921875, -0.835205078125, -0.6148681640625, -0.39453125, -0.1741943359375, 0.046142578125, 0.2664794921875, 0.48681640625, 0.7071533203125, 0.927490234375, 1.1478271484375, 1.3681640625, 1.5885009765625, 1.808837890625, 2.0291748046875, 2.24951171875, 2.4698486328125, 2.690185546875, 2.9105224609375, 3.130859375, 3.3511962890625, 3.571533203125, 3.7918701171875, 4.01220703125, 4.2325439453125, 4.452880859375, 4.6732177734375, 4.8935546875, 5.1138916015625, 5.334228515625, 5.5545654296875, 5.77490234375, 5.9952392578125, 6.215576171875, 6.4359130859375, 6.65625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 1.0, 5.0, 9.0, 15.0, 11.0, 26.0, 42.0, 42.0, 90.0, 107.0, 145.0, 239.0, 368.0, 568.0, 786.0, 1252.0, 1954.0, 2792.0, 4388.0, 6516.0, 9615.0, 14855.0, 23875.0, 38374.0, 64155.0, 119390.0, 243239.0, 234552.0, 114762.0, 63240.0, 37672.0, 22900.0, 14529.0, 9067.0, 6325.0, 4117.0, 2800.0, 1881.0, 1303.0, 805.0, 583.0, 380.0, 237.0, 168.0, 121.0, 99.0, 66.0, 40.0, 15.0, 16.0, 14.0, 1.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.28955078125, -0.28076934814453125, -0.2719879150390625, -0.26320648193359375, -0.254425048828125, -0.24564361572265625, -0.2368621826171875, -0.22808074951171875, -0.21929931640625, -0.21051788330078125, -0.2017364501953125, -0.19295501708984375, -0.184173583984375, -0.17539215087890625, -0.1666107177734375, -0.15782928466796875, -0.1490478515625, -0.14026641845703125, -0.1314849853515625, -0.12270355224609375, -0.113922119140625, -0.10514068603515625, -0.0963592529296875, -0.08757781982421875, -0.07879638671875, -0.07001495361328125, -0.0612335205078125, -0.05245208740234375, -0.043670654296875, -0.03488922119140625, -0.0261077880859375, -0.01732635498046875, -0.008544921875, 0.00023651123046875, 0.0090179443359375, 0.01779937744140625, 0.026580810546875, 0.03536224365234375, 0.0441436767578125, 0.05292510986328125, 0.06170654296875, 0.07048797607421875, 0.0792694091796875, 0.08805084228515625, 0.096832275390625, 0.10561370849609375, 0.1143951416015625, 0.12317657470703125, 0.1319580078125, 0.14073944091796875, 0.1495208740234375, 0.15830230712890625, 0.167083740234375, 0.17586517333984375, 0.1846466064453125, 0.19342803955078125, 0.20220947265625, 0.21099090576171875, 0.2197723388671875, 0.22855377197265625, 0.237335205078125, 0.24611663818359375, 0.2548980712890625, 0.26367950439453125, 0.2724609375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 4.0, 8.0, 5.0, 10.0, 16.0, 13.0, 21.0, 22.0, 21.0, 22.0, 33.0, 34.0, 31.0, 44.0, 40.0, 47.0, 43.0, 51.0, 1065.0, 35.0, 43.0, 32.0, 47.0, 57.0, 39.0, 33.0, 26.0, 22.0, 34.0, 21.0, 17.0, 18.0, 12.0, 10.0, 12.0, 3.0, 10.0, 3.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83203125, -4.6759033203125, -4.519775390625, -4.3636474609375, -4.20751953125, -4.0513916015625, -3.895263671875, -3.7391357421875, -3.5830078125, -3.4268798828125, -3.270751953125, -3.1146240234375, -2.95849609375, -2.8023681640625, -2.646240234375, -2.4901123046875, -2.333984375, -2.1778564453125, -2.021728515625, -1.8656005859375, -1.70947265625, -1.5533447265625, -1.397216796875, -1.2410888671875, -1.0849609375, -0.9288330078125, -0.772705078125, -0.6165771484375, -0.46044921875, -0.3043212890625, -0.148193359375, 0.0079345703125, 0.1640625, 0.3201904296875, 0.476318359375, 0.6324462890625, 0.78857421875, 0.9447021484375, 1.100830078125, 1.2569580078125, 1.4130859375, 1.5692138671875, 1.725341796875, 1.8814697265625, 2.03759765625, 2.1937255859375, 2.349853515625, 2.5059814453125, 2.662109375, 2.8182373046875, 2.974365234375, 3.1304931640625, 3.28662109375, 3.4427490234375, 3.598876953125, 3.7550048828125, 3.9111328125, 4.0672607421875, 4.223388671875, 4.3795166015625, 4.53564453125, 4.6917724609375, 4.847900390625, 5.0040283203125, 5.16015625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 11.0, 20.0, 12.0, 29.0, 55.0, 81.0, 100.0, 131.0, 199.0, 305.0, 385.0, 619.0, 865.0, 1244.0, 1815.0, 2830.0, 4185.0, 6216.0, 9784.0, 15306.0, 24514.0, 40728.0, 71121.0, 141020.0, 1320282.0, 212115.0, 101060.0, 54314.0, 32051.0, 19473.0, 12309.0, 8022.0, 5263.0, 3380.0, 2325.0, 1498.0, 1067.0, 742.0, 467.0, 366.0, 241.0, 194.0, 107.0, 82.0, 58.0, 36.0, 29.0, 27.0, 16.0, 10.0, 6.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.269287109375, -0.26053619384765625, -0.2517852783203125, -0.24303436279296875, -0.234283447265625, -0.22553253173828125, -0.2167816162109375, -0.20803070068359375, -0.19927978515625, -0.19052886962890625, -0.1817779541015625, -0.17302703857421875, -0.164276123046875, -0.15552520751953125, -0.1467742919921875, -0.13802337646484375, -0.1292724609375, -0.12052154541015625, -0.1117706298828125, -0.10301971435546875, -0.094268798828125, -0.08551788330078125, -0.0767669677734375, -0.06801605224609375, -0.05926513671875, -0.05051422119140625, -0.0417633056640625, -0.03301239013671875, -0.024261474609375, -0.01551055908203125, -0.0067596435546875, 0.00199127197265625, 0.0107421875, 0.01949310302734375, 0.0282440185546875, 0.03699493408203125, 0.045745849609375, 0.05449676513671875, 0.0632476806640625, 0.07199859619140625, 0.08074951171875, 0.08950042724609375, 0.0982513427734375, 0.10700225830078125, 0.115753173828125, 0.12450408935546875, 0.1332550048828125, 0.14200592041015625, 0.1507568359375, 0.15950775146484375, 0.1682586669921875, 0.17700958251953125, 0.185760498046875, 0.19451141357421875, 0.2032623291015625, 0.21201324462890625, 0.22076416015625, 0.22951507568359375, 0.2382659912109375, 0.24701690673828125, 0.255767822265625, 0.26451873779296875, 0.2732696533203125, 0.28202056884765625, 0.290771484375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 6.0, 6.0, 11.0, 16.0, 15.0, 22.0, 13.0, 17.0, 30.0, 39.0, 44.0, 42.0, 65.0, 50.0, 58.0, 49.0, 52.0, 47.0, 73.0, 56.0, 45.0, 47.0, 27.0, 29.0, 31.0, 13.0, 25.0, 15.0, 18.0, 9.0, 7.0, 6.0, 2.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.7326087951660156e-05, -4.5903027057647705e-05, -4.4479966163635254e-05, -4.30569052696228e-05, -4.163384437561035e-05, -4.02107834815979e-05, -3.878772258758545e-05, -3.7364661693573e-05, -3.594160079956055e-05, -3.4518539905548096e-05, -3.3095479011535645e-05, -3.167241811752319e-05, -3.0249357223510742e-05, -2.882629632949829e-05, -2.740323543548584e-05, -2.598017454147339e-05, -2.4557113647460938e-05, -2.3134052753448486e-05, -2.1710991859436035e-05, -2.0287930965423584e-05, -1.8864870071411133e-05, -1.744180917739868e-05, -1.601874828338623e-05, -1.459568738937378e-05, -1.3172626495361328e-05, -1.1749565601348877e-05, -1.0326504707336426e-05, -8.903443813323975e-06, -7.4803829193115234e-06, -6.057322025299072e-06, -4.634261131286621e-06, -3.21120023727417e-06, -1.7881393432617188e-06, -3.650784492492676e-07, 1.0579824447631836e-06, 2.4810433387756348e-06, 3.904104232788086e-06, 5.327165126800537e-06, 6.750226020812988e-06, 8.17328691482544e-06, 9.59634780883789e-06, 1.1019408702850342e-05, 1.2442469596862793e-05, 1.3865530490875244e-05, 1.5288591384887695e-05, 1.6711652278900146e-05, 1.8134713172912598e-05, 1.955777406692505e-05, 2.09808349609375e-05, 2.240389585494995e-05, 2.3826956748962402e-05, 2.5250017642974854e-05, 2.6673078536987305e-05, 2.8096139430999756e-05, 2.9519200325012207e-05, 3.094226121902466e-05, 3.236532211303711e-05, 3.378838300704956e-05, 3.521144390106201e-05, 3.663450479507446e-05, 3.8057565689086914e-05, 3.9480626583099365e-05, 4.0903687477111816e-05, 4.232674837112427e-05, 4.374980926513672e-05]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 16.0, 9.0, 12.0, 19.0, 29.0, 31.0, 38.0, 58.0, 67.0, 80.0, 114.0, 199.0, 394.0, 951.0, 253726.0, 790240.0, 1331.0, 439.0, 246.0, 132.0, 92.0, 58.0, 72.0, 36.0, 49.0, 17.0, 25.0, 15.0, 17.0, 9.0, 6.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000904083251953125, -0.0008740425109863281, -0.0008440017700195312, -0.0008139610290527344, -0.0007839202880859375, -0.0007538795471191406, -0.0007238388061523438, -0.0006937980651855469, -0.00066375732421875, -0.0006337165832519531, -0.0006036758422851562, -0.0005736351013183594, -0.0005435943603515625, -0.0005135536193847656, -0.00048351287841796875, -0.0004534721374511719, -0.000423431396484375, -0.0003933906555175781, -0.00036334991455078125, -0.0003333091735839844, -0.0003032684326171875, -0.0002732276916503906, -0.00024318695068359375, -0.00021314620971679688, -0.00018310546875, -0.00015306472778320312, -0.00012302398681640625, -9.298324584960938e-05, -6.29425048828125e-05, -3.2901763916015625e-05, -2.86102294921875e-06, 2.7179718017578125e-05, 5.7220458984375e-05, 8.726119995117188e-05, 0.00011730194091796875, 0.00014734268188476562, 0.0001773834228515625, 0.00020742416381835938, 0.00023746490478515625, 0.0002675056457519531, 0.00029754638671875, 0.0003275871276855469, 0.00035762786865234375, 0.0003876686096191406, 0.0004177093505859375, 0.0004477500915527344, 0.00047779083251953125, 0.0005078315734863281, 0.000537872314453125, 0.0005679130554199219, 0.0005979537963867188, 0.0006279945373535156, 0.0006580352783203125, 0.0006880760192871094, 0.0007181167602539062, 0.0007481575012207031, 0.0007781982421875, 0.0008082389831542969, 0.0008382797241210938, 0.0008683204650878906, 0.0008983612060546875, 0.0009284019470214844, 0.0009584426879882812, 0.0009884834289550781, 0.001018524169921875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 67.0, 808.0, 137.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.702547686174512e-05, -8.932573109632358e-05, -8.162598533090204e-05, -7.392624684143811e-05, -6.622650107601658e-05, -5.8526755310595036e-05, -5.08270131831523e-05, -4.312727105570957e-05, -3.542752529028803e-05, -2.7727781343855895e-05, -2.002803739742376e-05, -1.2328293450991623e-05, -4.628549504559487e-06, 3.0711962608620524e-06, 1.0770938388304785e-05, 1.8470680515747517e-05, 2.6170426281169057e-05, 3.3870172046590596e-05, 4.156991417403333e-05, 4.926965630147606e-05, 5.69694020668976e-05, 6.466914783231914e-05, 7.236888632178307e-05, 8.00686320872046e-05, 8.776837785262614e-05, 9.546812361804768e-05, 0.00010316786938346922, 0.00011086760787293315, 0.00011856735363835469, 0.00012626709940377623, 0.00013396683789324015, 0.0001416665909346193, 0.00014936630032025278, 0.0001570660388097167, 0.00016476579185109586, 0.00017246553034055978, 0.00018016528338193893, 0.00018786502187140286, 0.00019556476036086679, 0.0002032644988503307, 0.00021096425189170986, 0.0002186639903811738, 0.00022636374342255294, 0.00023406348191201687, 0.0002417632204014808, 0.0002494629588909447, 0.0002571627264842391, 0.000264862464973703, 0.00027256220346316695, 0.0002802619419526309, 0.0002879616804420948, 0.0002956614480353892, 0.0003033611865248531, 0.00031106092501431704, 0.00031876066350378096, 0.0003264604019932449, 0.00033416016958653927, 0.0003418599080760032, 0.0003495596465654671, 0.0003572594141587615, 0.0003649591526482254, 0.00037265889113768935, 0.0003803586296271533, 0.0003880583681166172, 0.00039575810660608113]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 0.0, 1.0, 3.0, 8.0, 2.0, 7.0, 9.0, 18.0, 18.0, 20.0, 17.0, 14.0, 21.0, 29.0, 28.0, 32.0, 23.0, 32.0, 34.0, 33.0, 26.0, 37.0, 35.0, 46.0, 40.0, 48.0, 44.0, 28.0, 29.0, 27.0, 27.0, 34.0, 38.0, 21.0, 29.0, 28.0, 19.0, 18.0, 12.0, 7.0, 13.0, 9.0, 12.0, 3.0, 5.0, 5.0, 2.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.2113323211669922e-05, -2.1422281861305237e-05, -2.0731240510940552e-05, -2.0040199160575867e-05, -1.934915781021118e-05, -1.8658116459846497e-05, -1.796707510948181e-05, -1.7276033759117126e-05, -1.658499240875244e-05, -1.5893951058387756e-05, -1.5202909708023071e-05, -1.4511868357658386e-05, -1.3820827007293701e-05, -1.3129785656929016e-05, -1.2438744306564331e-05, -1.1747702956199646e-05, -1.1056661605834961e-05, -1.0365620255470276e-05, -9.67457890510559e-06, -8.983537554740906e-06, -8.29249620437622e-06, -7.601454854011536e-06, -6.910413503646851e-06, -6.2193721532821655e-06, -5.5283308029174805e-06, -4.837289452552795e-06, -4.14624810218811e-06, -3.4552067518234253e-06, -2.7641654014587402e-06, -2.073124051094055e-06, -1.3820827007293701e-06, -6.910413503646851e-07, 0.0, 6.910413503646851e-07, 1.3820827007293701e-06, 2.073124051094055e-06, 2.7641654014587402e-06, 3.4552067518234253e-06, 4.14624810218811e-06, 4.837289452552795e-06, 5.5283308029174805e-06, 6.2193721532821655e-06, 6.910413503646851e-06, 7.601454854011536e-06, 8.29249620437622e-06, 8.983537554740906e-06, 9.67457890510559e-06, 1.0365620255470276e-05, 1.1056661605834961e-05, 1.1747702956199646e-05, 1.2438744306564331e-05, 1.3129785656929016e-05, 1.3820827007293701e-05, 1.4511868357658386e-05, 1.5202909708023071e-05, 1.5893951058387756e-05, 1.658499240875244e-05, 1.7276033759117126e-05, 1.796707510948181e-05, 1.8658116459846497e-05, 1.934915781021118e-05, 2.0040199160575867e-05, 2.0731240510940552e-05, 2.1422281861305237e-05, 2.2113323211669922e-05]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 1.0, 3.0, 11.0, 11.0, 9.0, 14.0, 11.0, 19.0, 18.0, 19.0, 25.0, 25.0, 36.0, 33.0, 36.0, 32.0, 35.0, 42.0, 40.0, 43.0, 49.0, 39.0, 37.0, 42.0, 30.0, 28.0, 36.0, 30.0, 26.0, 29.0, 20.0, 20.0, 17.0, 22.0, 21.0, 20.0, 13.0, 15.0, 12.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.4453125, -7.2249755859375, -7.004638671875, -6.7843017578125, -6.56396484375, -6.3436279296875, -6.123291015625, -5.9029541015625, -5.6826171875, -5.4622802734375, -5.241943359375, -5.0216064453125, -4.80126953125, -4.5809326171875, -4.360595703125, -4.1402587890625, -3.919921875, -3.6995849609375, -3.479248046875, -3.2589111328125, -3.03857421875, -2.8182373046875, -2.597900390625, -2.3775634765625, -2.1572265625, -1.9368896484375, -1.716552734375, -1.4962158203125, -1.27587890625, -1.0555419921875, -0.835205078125, -0.6148681640625, -0.39453125, -0.1741943359375, 0.046142578125, 0.2664794921875, 0.48681640625, 0.7071533203125, 0.927490234375, 1.1478271484375, 1.3681640625, 1.5885009765625, 1.808837890625, 2.0291748046875, 2.24951171875, 2.4698486328125, 2.690185546875, 2.9105224609375, 3.130859375, 3.3511962890625, 3.571533203125, 3.7918701171875, 4.01220703125, 4.2325439453125, 4.452880859375, 4.6732177734375, 4.8935546875, 5.1138916015625, 5.334228515625, 5.5545654296875, 5.77490234375, 5.9952392578125, 6.215576171875, 6.4359130859375, 6.65625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 8.0, 4.0, 6.0, 19.0, 20.0, 22.0, 34.0, 30.0, 43.0, 61.0, 89.0, 107.0, 190.0, 251.0, 328.0, 483.0, 682.0, 1297.0, 3532.0, 12261.0, 64127.0, 740137.0, 189159.0, 24694.0, 6059.0, 1984.0, 943.0, 582.0, 363.0, 252.0, 191.0, 126.0, 102.0, 80.0, 57.0, 50.0, 46.0, 29.0, 27.0, 20.0, 17.0, 11.0, 6.0, 7.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-18.421875, -17.875732421875, -17.32958984375, -16.783447265625, -16.2373046875, -15.691162109375, -15.14501953125, -14.598876953125, -14.052734375, -13.506591796875, -12.96044921875, -12.414306640625, -11.8681640625, -11.322021484375, -10.77587890625, -10.229736328125, -9.68359375, -9.137451171875, -8.59130859375, -8.045166015625, -7.4990234375, -6.952880859375, -6.40673828125, -5.860595703125, -5.314453125, -4.768310546875, -4.22216796875, -3.676025390625, -3.1298828125, -2.583740234375, -2.03759765625, -1.491455078125, -0.9453125, -0.399169921875, 0.14697265625, 0.693115234375, 1.2392578125, 1.785400390625, 2.33154296875, 2.877685546875, 3.423828125, 3.969970703125, 4.51611328125, 5.062255859375, 5.6083984375, 6.154541015625, 6.70068359375, 7.246826171875, 7.79296875, 8.339111328125, 8.88525390625, 9.431396484375, 9.9775390625, 10.523681640625, 11.06982421875, 11.615966796875, 12.162109375, 12.708251953125, 13.25439453125, 13.800537109375, 14.3466796875, 14.892822265625, 15.43896484375, 15.985107421875, 16.53125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 6.0, 6.0, 4.0, 9.0, 6.0, 13.0, 20.0, 28.0, 30.0, 29.0, 43.0, 32.0, 51.0, 30.0, 47.0, 81.0, 203.0, 1759.0, 208.0, 66.0, 66.0, 53.0, 42.0, 37.0, 48.0, 24.0, 18.0, 25.0, 16.0, 7.0, 11.0, 7.0, 8.0, 4.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.546875, -29.7099609375, -28.873046875, -28.0361328125, -27.19921875, -26.3623046875, -25.525390625, -24.6884765625, -23.8515625, -23.0146484375, -22.177734375, -21.3408203125, -20.50390625, -19.6669921875, -18.830078125, -17.9931640625, -17.15625, -16.3193359375, -15.482421875, -14.6455078125, -13.80859375, -12.9716796875, -12.134765625, -11.2978515625, -10.4609375, -9.6240234375, -8.787109375, -7.9501953125, -7.11328125, -6.2763671875, -5.439453125, -4.6025390625, -3.765625, -2.9287109375, -2.091796875, -1.2548828125, -0.41796875, 0.4189453125, 1.255859375, 2.0927734375, 2.9296875, 3.7666015625, 4.603515625, 5.4404296875, 6.27734375, 7.1142578125, 7.951171875, 8.7880859375, 9.625, 10.4619140625, 11.298828125, 12.1357421875, 12.97265625, 13.8095703125, 14.646484375, 15.4833984375, 16.3203125, 17.1572265625, 17.994140625, 18.8310546875, 19.66796875, 20.5048828125, 21.341796875, 22.1787109375, 23.015625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 2.0, 8.0, 13.0, 9.0, 13.0, 22.0, 23.0, 25.0, 46.0, 61.0, 62.0, 114.0, 164.0, 452.0, 5036.0, 3082937.0, 54968.0, 1005.0, 272.0, 100.0, 82.0, 50.0, 54.0, 38.0, 34.0, 35.0, 19.0, 7.0, 11.0, 9.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.96875, -60.69873046875, -58.4287109375, -56.15869140625, -53.888671875, -51.61865234375, -49.3486328125, -47.07861328125, -44.80859375, -42.53857421875, -40.2685546875, -37.99853515625, -35.728515625, -33.45849609375, -31.1884765625, -28.91845703125, -26.6484375, -24.37841796875, -22.1083984375, -19.83837890625, -17.568359375, -15.29833984375, -13.0283203125, -10.75830078125, -8.48828125, -6.21826171875, -3.9482421875, -1.67822265625, 0.591796875, 2.86181640625, 5.1318359375, 7.40185546875, 9.671875, 11.94189453125, 14.2119140625, 16.48193359375, 18.751953125, 21.02197265625, 23.2919921875, 25.56201171875, 27.83203125, 30.10205078125, 32.3720703125, 34.64208984375, 36.912109375, 39.18212890625, 41.4521484375, 43.72216796875, 45.9921875, 48.26220703125, 50.5322265625, 52.80224609375, 55.072265625, 57.34228515625, 59.6123046875, 61.88232421875, 64.15234375, 66.42236328125, 68.6923828125, 70.96240234375, 73.232421875, 75.50244140625, 77.7724609375, 80.04248046875, 82.3125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 186.0, 690.0, 139.0], "bins": [-277.3063049316406, -272.86236572265625, -268.41845703125, -263.9745178222656, -259.5306091308594, -255.086669921875, -250.64276123046875, -246.19882202148438, -241.75489807128906, -237.31097412109375, -232.86705017089844, -228.42312622070312, -223.9792022705078, -219.5352783203125, -215.09133911132812, -210.6474151611328, -206.2034912109375, -201.7595672607422, -197.31564331054688, -192.87171936035156, -188.42779541015625, -183.98385620117188, -179.53994750976562, -175.09600830078125, -170.652099609375, -166.2081756591797, -161.76425170898438, -157.32032775878906, -152.87640380859375, -148.43246459960938, -143.98855590820312, -139.54461669921875, -135.10069274902344, -130.65676879882812, -126.21284484863281, -121.7689208984375, -117.32498931884766, -112.88106536865234, -108.43714141845703, -103.99321746826172, -99.54928588867188, -95.10536193847656, -90.66143798828125, -86.21751403808594, -81.7735824584961, -77.32965850830078, -72.88573455810547, -68.44181060791016, -63.99787902832031, -59.553955078125, -55.11002731323242, -50.66610336303711, -46.22217559814453, -41.77825164794922, -37.334327697753906, -32.890403747558594, -28.44647789001465, -24.002552032470703, -19.55862808227539, -15.114702224731445, -10.6707763671875, -6.226850509643555, -1.7829265594482422, 2.660999298095703, 7.104925155639648]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 10.0, 11.0, 11.0, 23.0, 21.0, 22.0, 20.0, 30.0, 27.0, 32.0, 29.0, 46.0, 41.0, 47.0, 35.0, 39.0, 47.0, 57.0, 47.0, 34.0, 39.0, 36.0, 39.0, 23.0, 27.0, 26.0, 25.0, 30.0, 16.0, 20.0, 19.0, 17.0, 7.0, 8.0, 10.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-64.79795837402344, -62.87803268432617, -60.95810317993164, -59.038177490234375, -57.11825180053711, -55.198326110839844, -53.27839660644531, -51.35847091674805, -49.43854522705078, -47.518619537353516, -45.598690032958984, -43.67876434326172, -41.75883865356445, -39.83891296386719, -37.918983459472656, -35.99905776977539, -34.07912826538086, -32.159202575683594, -30.239274978637695, -28.319347381591797, -26.39942169189453, -24.479494094848633, -22.559566497802734, -20.63964080810547, -18.71971321105957, -16.799785614013672, -14.879859924316406, -12.959932327270508, -11.040005683898926, -9.120079040527344, -7.200151443481445, -5.280224800109863, -3.3602943420410156, -1.4403674602508545, 0.47955942153930664, 2.399486541748047, 4.319413185119629, 6.239339828491211, 8.15926742553711, 10.079194068908691, 11.999120712280273, 13.919047355651855, 15.838973999023438, 17.758901596069336, 19.678829193115234, 21.5987548828125, 23.5186824798584, 25.438610076904297, 27.358535766601562, 29.27846336364746, 31.198389053344727, 33.118316650390625, 35.03824234008789, 36.958168029785156, 38.87809753417969, 40.79802322387695, 42.71794891357422, 44.637874603271484, 46.557804107666016, 48.47772979736328, 50.39765548706055, 52.31758117675781, 54.237510681152344, 56.15743637084961, 58.07736587524414]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 7.0, 14.0, 6.0, 7.0, 18.0, 21.0, 16.0, 25.0, 32.0, 35.0, 27.0, 37.0, 33.0, 43.0, 34.0, 50.0, 45.0, 48.0, 40.0, 37.0, 52.0, 32.0, 29.0, 34.0, 38.0, 25.0, 25.0, 26.0, 18.0, 19.0, 30.0, 18.0, 17.0, 9.0, 7.0, 10.0, 11.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.58984375, -7.35247802734375, -7.1151123046875, -6.87774658203125, -6.640380859375, -6.40301513671875, -6.1656494140625, -5.92828369140625, -5.69091796875, -5.45355224609375, -5.2161865234375, -4.97882080078125, -4.741455078125, -4.50408935546875, -4.2667236328125, -4.02935791015625, -3.7919921875, -3.55462646484375, -3.3172607421875, -3.07989501953125, -2.842529296875, -2.60516357421875, -2.3677978515625, -2.13043212890625, -1.89306640625, -1.65570068359375, -1.4183349609375, -1.18096923828125, -0.943603515625, -0.70623779296875, -0.4688720703125, -0.23150634765625, 0.005859375, 0.24322509765625, 0.4805908203125, 0.71795654296875, 0.955322265625, 1.19268798828125, 1.4300537109375, 1.66741943359375, 1.90478515625, 2.14215087890625, 2.3795166015625, 2.61688232421875, 2.854248046875, 3.09161376953125, 3.3289794921875, 3.56634521484375, 3.8037109375, 4.04107666015625, 4.2784423828125, 4.51580810546875, 4.753173828125, 4.99053955078125, 5.2279052734375, 5.46527099609375, 5.70263671875, 5.94000244140625, 6.1773681640625, 6.41473388671875, 6.652099609375, 6.88946533203125, 7.1268310546875, 7.36419677734375, 7.6015625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 8.0, 8.0, 16.0, 22.0, 21.0, 31.0, 37.0, 49.0, 75.0, 101.0, 140.0, 200.0, 269.0, 420.0, 671.0, 1184.0, 2041.0, 4085.0, 9267.0, 25551.0, 106657.0, 808325.0, 2429619.0, 669369.0, 94816.0, 23596.0, 8710.0, 3888.0, 1908.0, 1091.0, 653.0, 457.0, 274.0, 184.0, 152.0, 102.0, 72.0, 50.0, 40.0, 35.0, 23.0, 14.0, 14.0, 9.0, 7.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.359375, -10.9737548828125, -10.588134765625, -10.2025146484375, -9.81689453125, -9.4312744140625, -9.045654296875, -8.6600341796875, -8.2744140625, -7.8887939453125, -7.503173828125, -7.1175537109375, -6.73193359375, -6.3463134765625, -5.960693359375, -5.5750732421875, -5.189453125, -4.8038330078125, -4.418212890625, -4.0325927734375, -3.64697265625, -3.2613525390625, -2.875732421875, -2.4901123046875, -2.1044921875, -1.7188720703125, -1.333251953125, -0.9476318359375, -0.56201171875, -0.1763916015625, 0.209228515625, 0.5948486328125, 0.98046875, 1.3660888671875, 1.751708984375, 2.1373291015625, 2.52294921875, 2.9085693359375, 3.294189453125, 3.6798095703125, 4.0654296875, 4.4510498046875, 4.836669921875, 5.2222900390625, 5.60791015625, 5.9935302734375, 6.379150390625, 6.7647705078125, 7.150390625, 7.5360107421875, 7.921630859375, 8.3072509765625, 8.69287109375, 9.0784912109375, 9.464111328125, 9.8497314453125, 10.2353515625, 10.6209716796875, 11.006591796875, 11.3922119140625, 11.77783203125, 12.1634521484375, 12.549072265625, 12.9346923828125, 13.3203125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 4.0, 6.0, 9.0, 12.0, 21.0, 19.0, 32.0, 51.0, 54.0, 85.0, 146.0, 209.0, 323.0, 492.0, 697.0, 661.0, 435.0, 303.0, 161.0, 116.0, 83.0, 41.0, 32.0, 22.0, 14.0, 12.0, 16.0, 8.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.953125, -14.510986328125, -14.06884765625, -13.626708984375, -13.1845703125, -12.742431640625, -12.30029296875, -11.858154296875, -11.416015625, -10.973876953125, -10.53173828125, -10.089599609375, -9.6474609375, -9.205322265625, -8.76318359375, -8.321044921875, -7.87890625, -7.436767578125, -6.99462890625, -6.552490234375, -6.1103515625, -5.668212890625, -5.22607421875, -4.783935546875, -4.341796875, -3.899658203125, -3.45751953125, -3.015380859375, -2.5732421875, -2.131103515625, -1.68896484375, -1.246826171875, -0.8046875, -0.362548828125, 0.07958984375, 0.521728515625, 0.9638671875, 1.406005859375, 1.84814453125, 2.290283203125, 2.732421875, 3.174560546875, 3.61669921875, 4.058837890625, 4.5009765625, 4.943115234375, 5.38525390625, 5.827392578125, 6.26953125, 6.711669921875, 7.15380859375, 7.595947265625, 8.0380859375, 8.480224609375, 8.92236328125, 9.364501953125, 9.806640625, 10.248779296875, 10.69091796875, 11.133056640625, 11.5751953125, 12.017333984375, 12.45947265625, 12.901611328125, 13.34375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 4.0, 7.0, 5.0, 7.0, 8.0, 18.0, 24.0, 31.0, 54.0, 86.0, 121.0, 151.0, 308.0, 865.0, 3777.0, 42913.0, 3196934.0, 924312.0, 20889.0, 2300.0, 614.0, 271.0, 167.0, 125.0, 81.0, 55.0, 40.0, 38.0, 25.0, 12.0, 12.0, 8.0, 8.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.65625, -31.28857421875, -29.9208984375, -28.55322265625, -27.185546875, -25.81787109375, -24.4501953125, -23.08251953125, -21.71484375, -20.34716796875, -18.9794921875, -17.61181640625, -16.244140625, -14.87646484375, -13.5087890625, -12.14111328125, -10.7734375, -9.40576171875, -8.0380859375, -6.67041015625, -5.302734375, -3.93505859375, -2.5673828125, -1.19970703125, 0.16796875, 1.53564453125, 2.9033203125, 4.27099609375, 5.638671875, 7.00634765625, 8.3740234375, 9.74169921875, 11.109375, 12.47705078125, 13.8447265625, 15.21240234375, 16.580078125, 17.94775390625, 19.3154296875, 20.68310546875, 22.05078125, 23.41845703125, 24.7861328125, 26.15380859375, 27.521484375, 28.88916015625, 30.2568359375, 31.62451171875, 32.9921875, 34.35986328125, 35.7275390625, 37.09521484375, 38.462890625, 39.83056640625, 41.1982421875, 42.56591796875, 43.93359375, 45.30126953125, 46.6689453125, 48.03662109375, 49.404296875, 50.77197265625, 52.1396484375, 53.50732421875, 54.875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 250.0, 718.0, 47.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-729.0388793945312, -716.0861206054688, -703.1334228515625, -690.1806640625, -677.2279663085938, -664.2752075195312, -651.3224487304688, -638.3697509765625, -625.4169921875, -612.4642333984375, -599.5115356445312, -586.5587768554688, -573.6060791015625, -560.6533203125, -547.7005615234375, -534.7478637695312, -521.7951049804688, -508.8423767089844, -495.8896484375, -482.9368896484375, -469.9841613769531, -457.03143310546875, -444.0787048339844, -431.1259765625, -418.1732482910156, -405.22052001953125, -392.2677917480469, -379.3150329589844, -366.3623046875, -353.4095764160156, -340.45684814453125, -327.50408935546875, -314.5513610839844, -301.5986328125, -288.6459045410156, -275.6931457519531, -262.74041748046875, -249.78768920898438, -236.8349609375, -223.88221740722656, -210.92947387695312, -197.97674560546875, -185.0240020751953, -172.07127380371094, -159.1185302734375, -146.16580200195312, -133.21307373046875, -120.26033020019531, -107.3075942993164, -94.3548583984375, -81.4021224975586, -68.44938659667969, -55.49665451049805, -42.543922424316406, -29.5911865234375, -16.638450622558594, -3.6857147216796875, 9.267020225524902, 22.219755172729492, 35.172489166259766, 48.12522506713867, 61.07795715332031, 74.03069305419922, 86.98342895507812, 99.93616485595703]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 4.0, 12.0, 11.0, 10.0, 23.0, 25.0, 20.0, 26.0, 31.0, 32.0, 20.0, 36.0, 36.0, 34.0, 44.0, 51.0, 51.0, 49.0, 39.0, 43.0, 57.0, 35.0, 30.0, 31.0, 36.0, 24.0, 31.0, 30.0, 18.0, 21.0, 16.0, 7.0, 15.0, 9.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 2.0], "bins": [-46.636356353759766, -45.42142868041992, -44.20650100708008, -42.991573333740234, -41.77664566040039, -40.56171798706055, -39.3467903137207, -38.13186264038086, -36.916934967041016, -35.70200729370117, -34.48707962036133, -33.272151947021484, -32.05722427368164, -30.842296600341797, -29.627368927001953, -28.41244125366211, -27.197511672973633, -25.98258399963379, -24.767656326293945, -23.5527286529541, -22.337800979614258, -21.122873306274414, -19.907943725585938, -18.693016052246094, -17.47808837890625, -16.263160705566406, -15.048233032226562, -13.833305358886719, -12.618377685546875, -11.403450012207031, -10.188521385192871, -8.973593711853027, -7.758668899536133, -6.543741226196289, -5.328813552856445, -4.113885402679443, -2.8989577293395996, -1.6840300559997559, -0.4691019058227539, 0.7458257675170898, 1.9607534408569336, 3.1756811141967773, 4.390608787536621, 5.605536937713623, 6.820464611053467, 8.035392761230469, 9.250320434570312, 10.465248107910156, 11.68017578125, 12.895103454589844, 14.110031127929688, 15.324958801269531, 16.539886474609375, 17.75481414794922, 18.969741821289062, 20.184669494628906, 21.39959716796875, 22.614524841308594, 23.829452514648438, 25.04438018798828, 26.259307861328125, 27.47423553466797, 28.689163208007812, 29.904090881347656, 31.119020462036133]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 2.0, 5.0, 9.0, 15.0, 12.0, 7.0, 18.0, 9.0, 20.0, 19.0, 20.0, 37.0, 23.0, 30.0, 38.0, 26.0, 39.0, 56.0, 30.0, 38.0, 48.0, 44.0, 43.0, 45.0, 32.0, 32.0, 34.0, 32.0, 25.0, 21.0, 25.0, 31.0, 23.0, 19.0, 16.0, 23.0, 10.0, 6.0, 15.0, 4.0, 4.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.0859375, -7.85247802734375, -7.6190185546875, -7.38555908203125, -7.152099609375, -6.91864013671875, -6.6851806640625, -6.45172119140625, -6.21826171875, -5.98480224609375, -5.7513427734375, -5.51788330078125, -5.284423828125, -5.05096435546875, -4.8175048828125, -4.58404541015625, -4.3505859375, -4.11712646484375, -3.8836669921875, -3.65020751953125, -3.416748046875, -3.18328857421875, -2.9498291015625, -2.71636962890625, -2.48291015625, -2.24945068359375, -2.0159912109375, -1.78253173828125, -1.549072265625, -1.31561279296875, -1.0821533203125, -0.84869384765625, -0.615234375, -0.38177490234375, -0.1483154296875, 0.08514404296875, 0.318603515625, 0.55206298828125, 0.7855224609375, 1.01898193359375, 1.25244140625, 1.48590087890625, 1.7193603515625, 1.95281982421875, 2.186279296875, 2.41973876953125, 2.6531982421875, 2.88665771484375, 3.1201171875, 3.35357666015625, 3.5870361328125, 3.82049560546875, 4.053955078125, 4.28741455078125, 4.5208740234375, 4.75433349609375, 4.98779296875, 5.22125244140625, 5.4547119140625, 5.68817138671875, 5.921630859375, 6.15509033203125, 6.3885498046875, 6.62200927734375, 6.85546875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 10.0, 14.0, 29.0, 35.0, 44.0, 76.0, 120.0, 142.0, 206.0, 321.0, 504.0, 775.0, 1201.0, 1640.0, 2585.0, 3904.0, 5970.0, 9136.0, 13563.0, 20814.0, 32468.0, 52433.0, 92693.0, 189801.0, 273605.0, 146662.0, 75021.0, 43861.0, 27933.0, 18106.0, 11753.0, 7794.0, 5111.0, 3415.0, 2252.0, 1519.0, 983.0, 707.0, 443.0, 292.0, 201.0, 131.0, 93.0, 57.0, 50.0, 32.0, 19.0, 11.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.313232421875, -0.304107666015625, -0.29498291015625, -0.285858154296875, -0.2767333984375, -0.267608642578125, -0.25848388671875, -0.249359130859375, -0.240234375, -0.231109619140625, -0.22198486328125, -0.212860107421875, -0.2037353515625, -0.194610595703125, -0.18548583984375, -0.176361083984375, -0.167236328125, -0.158111572265625, -0.14898681640625, -0.139862060546875, -0.1307373046875, -0.121612548828125, -0.11248779296875, -0.103363037109375, -0.09423828125, -0.085113525390625, -0.07598876953125, -0.066864013671875, -0.0577392578125, -0.048614501953125, -0.03948974609375, -0.030364990234375, -0.021240234375, -0.012115478515625, -0.00299072265625, 0.006134033203125, 0.0152587890625, 0.024383544921875, 0.03350830078125, 0.042633056640625, 0.0517578125, 0.060882568359375, 0.07000732421875, 0.079132080078125, 0.0882568359375, 0.097381591796875, 0.10650634765625, 0.115631103515625, 0.124755859375, 0.133880615234375, 0.14300537109375, 0.152130126953125, 0.1612548828125, 0.170379638671875, 0.17950439453125, 0.188629150390625, 0.19775390625, 0.206878662109375, 0.21600341796875, 0.225128173828125, 0.2342529296875, 0.243377685546875, 0.25250244140625, 0.261627197265625, 0.270751953125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 6.0, 5.0, 11.0, 8.0, 12.0, 15.0, 19.0, 20.0, 27.0, 28.0, 18.0, 28.0, 21.0, 39.0, 37.0, 34.0, 43.0, 34.0, 33.0, 1060.0, 36.0, 42.0, 50.0, 28.0, 43.0, 41.0, 38.0, 27.0, 29.0, 27.0, 28.0, 16.0, 22.0, 19.0, 8.0, 11.0, 8.0, 7.0, 7.0, 6.0, 6.0, 4.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.91015625, -4.7552490234375, -4.600341796875, -4.4454345703125, -4.29052734375, -4.1356201171875, -3.980712890625, -3.8258056640625, -3.6708984375, -3.5159912109375, -3.361083984375, -3.2061767578125, -3.05126953125, -2.8963623046875, -2.741455078125, -2.5865478515625, -2.431640625, -2.2767333984375, -2.121826171875, -1.9669189453125, -1.81201171875, -1.6571044921875, -1.502197265625, -1.3472900390625, -1.1923828125, -1.0374755859375, -0.882568359375, -0.7276611328125, -0.57275390625, -0.4178466796875, -0.262939453125, -0.1080322265625, 0.046875, 0.2017822265625, 0.356689453125, 0.5115966796875, 0.66650390625, 0.8214111328125, 0.976318359375, 1.1312255859375, 1.2861328125, 1.4410400390625, 1.595947265625, 1.7508544921875, 1.90576171875, 2.0606689453125, 2.215576171875, 2.3704833984375, 2.525390625, 2.6802978515625, 2.835205078125, 2.9901123046875, 3.14501953125, 3.2999267578125, 3.454833984375, 3.6097412109375, 3.7646484375, 3.9195556640625, 4.074462890625, 4.2293701171875, 4.38427734375, 4.5391845703125, 4.694091796875, 4.8489990234375, 5.00390625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 5.0, 9.0, 8.0, 14.0, 19.0, 33.0, 31.0, 48.0, 70.0, 108.0, 145.0, 219.0, 277.0, 411.0, 598.0, 800.0, 1139.0, 1626.0, 2436.0, 3343.0, 4887.0, 7506.0, 11311.0, 16753.0, 25927.0, 41785.0, 69884.0, 130757.0, 1299417.0, 210611.0, 104483.0, 58351.0, 35991.0, 22884.0, 14520.0, 9818.0, 6362.0, 4445.0, 3038.0, 2084.0, 1466.0, 1025.0, 721.0, 505.0, 368.0, 270.0, 202.0, 118.0, 93.0, 80.0, 41.0, 33.0, 16.0, 17.0, 13.0, 5.0, 5.0, 8.0, 0.0, 2.0, 3.0], "bins": [-0.28173828125, -0.27288818359375, -0.2640380859375, -0.25518798828125, -0.246337890625, -0.23748779296875, -0.2286376953125, -0.21978759765625, -0.2109375, -0.20208740234375, -0.1932373046875, -0.18438720703125, -0.175537109375, -0.16668701171875, -0.1578369140625, -0.14898681640625, -0.14013671875, -0.13128662109375, -0.1224365234375, -0.11358642578125, -0.104736328125, -0.09588623046875, -0.0870361328125, -0.07818603515625, -0.0693359375, -0.06048583984375, -0.0516357421875, -0.04278564453125, -0.033935546875, -0.02508544921875, -0.0162353515625, -0.00738525390625, 0.00146484375, 0.01031494140625, 0.0191650390625, 0.02801513671875, 0.036865234375, 0.04571533203125, 0.0545654296875, 0.06341552734375, 0.072265625, 0.08111572265625, 0.0899658203125, 0.09881591796875, 0.107666015625, 0.11651611328125, 0.1253662109375, 0.13421630859375, 0.14306640625, 0.15191650390625, 0.1607666015625, 0.16961669921875, 0.178466796875, 0.18731689453125, 0.1961669921875, 0.20501708984375, 0.2138671875, 0.22271728515625, 0.2315673828125, 0.24041748046875, 0.249267578125, 0.25811767578125, 0.2669677734375, 0.27581787109375, 0.28466796875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 5.0, 2.0, 7.0, 7.0, 8.0, 12.0, 16.0, 11.0, 22.0, 17.0, 21.0, 15.0, 28.0, 33.0, 38.0, 39.0, 45.0, 33.0, 39.0, 42.0, 49.0, 62.0, 38.0, 40.0, 47.0, 42.0, 40.0, 38.0, 32.0, 19.0, 33.0, 27.0, 21.0, 15.0, 14.0, 7.0, 9.0, 3.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.719329833984375e-05, -3.600027412176132e-05, -3.4807249903678894e-05, -3.3614225685596466e-05, -3.242120146751404e-05, -3.122817724943161e-05, -3.0035153031349182e-05, -2.8842128813266754e-05, -2.7649104595184326e-05, -2.6456080377101898e-05, -2.526305615901947e-05, -2.4070031940937042e-05, -2.2877007722854614e-05, -2.1683983504772186e-05, -2.0490959286689758e-05, -1.929793506860733e-05, -1.8104910850524902e-05, -1.6911886632442474e-05, -1.5718862414360046e-05, -1.4525838196277618e-05, -1.333281397819519e-05, -1.2139789760112762e-05, -1.0946765542030334e-05, -9.753741323947906e-06, -8.560717105865479e-06, -7.3676928877830505e-06, -6.1746686697006226e-06, -4.981644451618195e-06, -3.7886202335357666e-06, -2.5955960154533386e-06, -1.4025717973709106e-06, -2.0954757928848267e-07, 9.834766387939453e-07, 2.1765008568763733e-06, 3.3695250749588013e-06, 4.562549293041229e-06, 5.755573511123657e-06, 6.948597729206085e-06, 8.141621947288513e-06, 9.334646165370941e-06, 1.0527670383453369e-05, 1.1720694601535797e-05, 1.2913718819618225e-05, 1.4106743037700653e-05, 1.529976725578308e-05, 1.649279147386551e-05, 1.7685815691947937e-05, 1.8878839910030365e-05, 2.0071864128112793e-05, 2.126488834619522e-05, 2.245791256427765e-05, 2.3650936782360077e-05, 2.4843961000442505e-05, 2.6036985218524933e-05, 2.723000943660736e-05, 2.842303365468979e-05, 2.9616057872772217e-05, 3.0809082090854645e-05, 3.200210630893707e-05, 3.31951305270195e-05, 3.438815474510193e-05, 3.558117896318436e-05, 3.6774203181266785e-05, 3.796722739934921e-05, 3.916025161743164e-05]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 2.0, 5.0, 13.0, 12.0, 20.0, 21.0, 33.0, 46.0, 45.0, 67.0, 65.0, 84.0, 103.0, 163.0, 230.0, 425.0, 1110.0, 139280.0, 902855.0, 2483.0, 529.0, 282.0, 160.0, 108.0, 67.0, 60.0, 48.0, 41.0, 35.0, 35.0, 27.0, 22.0, 11.0, 15.0, 5.0, 13.0, 5.0, 3.0, 4.0, 9.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008502006530761719, -0.0008245855569839478, -0.0007989704608917236, -0.0007733553647994995, -0.0007477402687072754, -0.0007221251726150513, -0.0006965100765228271, -0.000670894980430603, -0.0006452798843383789, -0.0006196647882461548, -0.0005940496921539307, -0.0005684345960617065, -0.0005428194999694824, -0.0005172044038772583, -0.0004915893077850342, -0.00046597421169281006, -0.00044035911560058594, -0.0004147440195083618, -0.0003891289234161377, -0.0003635138273239136, -0.00033789873123168945, -0.00031228363513946533, -0.0002866685390472412, -0.0002610534429550171, -0.00023543834686279297, -0.00020982325077056885, -0.00018420815467834473, -0.0001585930585861206, -0.00013297796249389648, -0.00010736286640167236, -8.174777030944824e-05, -5.613267421722412e-05, -3.0517578125e-05, -4.902482032775879e-06, 2.0712614059448242e-05, 4.632771015167236e-05, 7.194280624389648e-05, 9.75579023361206e-05, 0.00012317299842834473, 0.00014878809452056885, 0.00017440319061279297, 0.0002000182867050171, 0.0002256333827972412, 0.00025124847888946533, 0.00027686357498168945, 0.0003024786710739136, 0.0003280937671661377, 0.0003537088632583618, 0.00037932395935058594, 0.00040493905544281006, 0.0004305541515350342, 0.0004561692476272583, 0.0004817843437194824, 0.0005073994398117065, 0.0005330145359039307, 0.0005586296319961548, 0.0005842447280883789, 0.000609859824180603, 0.0006354749202728271, 0.0006610900163650513, 0.0006867051124572754, 0.0007123202085494995, 0.0007379353046417236, 0.0007635504007339478, 0.0007891654968261719]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 17.0, 71.0, 196.0, 317.0, 254.0, 116.0, 34.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.061084837303497e-05, -3.817475226242095e-05, -3.573865251382813e-05, -3.330255640321411e-05, -3.0866460292600095e-05, -2.843036418198608e-05, -2.599426625238266e-05, -2.3558168322779238e-05, -2.112207221216522e-05, -1.8685976101551205e-05, -1.6249878171947785e-05, -1.3813781151839066e-05, -1.1377684131730348e-05, -8.94158711162163e-06, -6.505490091512911e-06, -4.069392161909491e-06, -1.6332960512954742e-06, 8.028009688132443e-07, 3.2388979889219627e-06, 5.674995009030681e-06, 8.1110920291394e-06, 1.0547189049248118e-05, 1.2983286069356836e-05, 1.5419383998960257e-05, 1.7855480109574273e-05, 2.029157622018829e-05, 2.272767414979171e-05, 2.516377207939513e-05, 2.7599868190009147e-05, 3.0035964300623164e-05, 3.247206041123718e-05, 3.4908160159830004e-05, 3.7344252632465214e-05, 3.978034874307923e-05, 4.221644485369325e-05, 4.465254460228607e-05, 4.708864071290009e-05, 4.9524736823514104e-05, 5.196083657210693e-05, 5.4396932682720944e-05, 5.683302879333496e-05, 5.926912490394898e-05, 6.1705221014563e-05, 6.414132076315582e-05, 6.657741323579103e-05, 6.901351298438385e-05, 7.144961273297668e-05, 7.388570520561188e-05, 7.632180495420471e-05, 7.875790470279753e-05, 8.119399717543274e-05, 8.363009692402557e-05, 8.606619667261839e-05, 8.85022891452536e-05, 9.093838889384642e-05, 9.337448864243925e-05, 9.581058111507446e-05, 9.824668086366728e-05, 0.00010068277333630249, 0.00010311887308489531, 0.00010555496555753052, 0.00010799106530612335, 0.00011042716505471617, 0.00011286325752735138, 0.0001152993572759442]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 5.0, 5.0, 9.0, 7.0, 11.0, 18.0, 13.0, 6.0, 22.0, 18.0, 28.0, 20.0, 34.0, 31.0, 35.0, 32.0, 54.0, 33.0, 41.0, 39.0, 36.0, 39.0, 58.0, 43.0, 47.0, 38.0, 31.0, 19.0, 31.0, 15.0, 20.0, 17.0, 18.0, 19.0, 17.0, 13.0, 16.0, 15.0, 10.0, 4.0, 6.0, 10.0, 3.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2470951080322266e-05, -2.1785497665405273e-05, -2.110004425048828e-05, -2.041459083557129e-05, -1.9729137420654297e-05, -1.9043684005737305e-05, -1.8358230590820312e-05, -1.767277717590332e-05, -1.6987323760986328e-05, -1.6301870346069336e-05, -1.5616416931152344e-05, -1.4930963516235352e-05, -1.424551010131836e-05, -1.3560056686401367e-05, -1.2874603271484375e-05, -1.2189149856567383e-05, -1.150369644165039e-05, -1.0818243026733398e-05, -1.0132789611816406e-05, -9.447336196899414e-06, -8.761882781982422e-06, -8.07642936706543e-06, -7.3909759521484375e-06, -6.705522537231445e-06, -6.020069122314453e-06, -5.334615707397461e-06, -4.649162292480469e-06, -3.9637088775634766e-06, -3.2782554626464844e-06, -2.592802047729492e-06, -1.9073486328125e-06, -1.2218952178955078e-06, -5.364418029785156e-07, 1.4901161193847656e-07, 8.344650268554688e-07, 1.519918441772461e-06, 2.205371856689453e-06, 2.8908252716064453e-06, 3.5762786865234375e-06, 4.26173210144043e-06, 4.947185516357422e-06, 5.632638931274414e-06, 6.318092346191406e-06, 7.0035457611083984e-06, 7.68899917602539e-06, 8.374452590942383e-06, 9.059906005859375e-06, 9.745359420776367e-06, 1.043081283569336e-05, 1.1116266250610352e-05, 1.1801719665527344e-05, 1.2487173080444336e-05, 1.3172626495361328e-05, 1.385807991027832e-05, 1.4543533325195312e-05, 1.5228986740112305e-05, 1.5914440155029297e-05, 1.659989356994629e-05, 1.728534698486328e-05, 1.7970800399780273e-05, 1.8656253814697266e-05, 1.9341707229614258e-05, 2.002716064453125e-05, 2.0712614059448242e-05, 2.1398067474365234e-05]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 2.0, 5.0, 9.0, 15.0, 12.0, 7.0, 18.0, 9.0, 20.0, 19.0, 20.0, 37.0, 23.0, 30.0, 38.0, 26.0, 39.0, 56.0, 30.0, 38.0, 48.0, 44.0, 43.0, 45.0, 32.0, 32.0, 34.0, 32.0, 25.0, 21.0, 25.0, 31.0, 23.0, 19.0, 16.0, 23.0, 10.0, 6.0, 15.0, 4.0, 4.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.0859375, -7.85247802734375, -7.6190185546875, -7.38555908203125, -7.152099609375, -6.91864013671875, -6.6851806640625, -6.45172119140625, -6.21826171875, -5.98480224609375, -5.7513427734375, -5.51788330078125, -5.284423828125, -5.05096435546875, -4.8175048828125, -4.58404541015625, -4.3505859375, -4.11712646484375, -3.8836669921875, -3.65020751953125, -3.416748046875, -3.18328857421875, -2.9498291015625, -2.71636962890625, -2.48291015625, -2.24945068359375, -2.0159912109375, -1.78253173828125, -1.549072265625, -1.31561279296875, -1.0821533203125, -0.84869384765625, -0.615234375, -0.38177490234375, -0.1483154296875, 0.08514404296875, 0.318603515625, 0.55206298828125, 0.7855224609375, 1.01898193359375, 1.25244140625, 1.48590087890625, 1.7193603515625, 1.95281982421875, 2.186279296875, 2.41973876953125, 2.6531982421875, 2.88665771484375, 3.1201171875, 3.35357666015625, 3.5870361328125, 3.82049560546875, 4.053955078125, 4.28741455078125, 4.5208740234375, 4.75433349609375, 4.98779296875, 5.22125244140625, 5.4547119140625, 5.68817138671875, 5.921630859375, 6.15509033203125, 6.3885498046875, 6.62200927734375, 6.85546875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 6.0, 8.0, 3.0, 9.0, 16.0, 7.0, 25.0, 33.0, 41.0, 56.0, 72.0, 83.0, 115.0, 160.0, 242.0, 385.0, 645.0, 1085.0, 1900.0, 3599.0, 7245.0, 16559.0, 45827.0, 155888.0, 474128.0, 234690.0, 64496.0, 21834.0, 9006.0, 4397.0, 2389.0, 1356.0, 774.0, 456.0, 313.0, 192.0, 134.0, 96.0, 75.0, 62.0, 43.0, 23.0, 26.0, 25.0, 12.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.109375, -9.817626953125, -9.52587890625, -9.234130859375, -8.9423828125, -8.650634765625, -8.35888671875, -8.067138671875, -7.775390625, -7.483642578125, -7.19189453125, -6.900146484375, -6.6083984375, -6.316650390625, -6.02490234375, -5.733154296875, -5.44140625, -5.149658203125, -4.85791015625, -4.566162109375, -4.2744140625, -3.982666015625, -3.69091796875, -3.399169921875, -3.107421875, -2.815673828125, -2.52392578125, -2.232177734375, -1.9404296875, -1.648681640625, -1.35693359375, -1.065185546875, -0.7734375, -0.481689453125, -0.18994140625, 0.101806640625, 0.3935546875, 0.685302734375, 0.97705078125, 1.268798828125, 1.560546875, 1.852294921875, 2.14404296875, 2.435791015625, 2.7275390625, 3.019287109375, 3.31103515625, 3.602783203125, 3.89453125, 4.186279296875, 4.47802734375, 4.769775390625, 5.0615234375, 5.353271484375, 5.64501953125, 5.936767578125, 6.228515625, 6.520263671875, 6.81201171875, 7.103759765625, 7.3955078125, 7.687255859375, 7.97900390625, 8.270751953125, 8.5625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 7.0, 5.0, 10.0, 7.0, 8.0, 10.0, 15.0, 16.0, 22.0, 19.0, 19.0, 30.0, 33.0, 35.0, 46.0, 36.0, 47.0, 57.0, 106.0, 301.0, 1521.0, 185.0, 86.0, 61.0, 55.0, 47.0, 32.0, 37.0, 25.0, 30.0, 31.0, 15.0, 16.0, 13.0, 8.0, 12.0, 11.0, 9.0, 7.0, 4.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.796875, -21.14306640625, -20.4892578125, -19.83544921875, -19.181640625, -18.52783203125, -17.8740234375, -17.22021484375, -16.56640625, -15.91259765625, -15.2587890625, -14.60498046875, -13.951171875, -13.29736328125, -12.6435546875, -11.98974609375, -11.3359375, -10.68212890625, -10.0283203125, -9.37451171875, -8.720703125, -8.06689453125, -7.4130859375, -6.75927734375, -6.10546875, -5.45166015625, -4.7978515625, -4.14404296875, -3.490234375, -2.83642578125, -2.1826171875, -1.52880859375, -0.875, -0.22119140625, 0.4326171875, 1.08642578125, 1.740234375, 2.39404296875, 3.0478515625, 3.70166015625, 4.35546875, 5.00927734375, 5.6630859375, 6.31689453125, 6.970703125, 7.62451171875, 8.2783203125, 8.93212890625, 9.5859375, 10.23974609375, 10.8935546875, 11.54736328125, 12.201171875, 12.85498046875, 13.5087890625, 14.16259765625, 14.81640625, 15.47021484375, 16.1240234375, 16.77783203125, 17.431640625, 18.08544921875, 18.7392578125, 19.39306640625, 20.046875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 8.0, 10.0, 23.0, 20.0, 32.0, 48.0, 67.0, 94.0, 133.0, 189.0, 368.0, 1111.0, 7516.0, 213723.0, 2887636.0, 30661.0, 2680.0, 596.0, 275.0, 160.0, 106.0, 65.0, 54.0, 32.0, 25.0, 15.0, 12.0, 9.0, 12.0, 3.0, 3.0, 9.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.9375, -34.75, -33.5625, -32.375, -31.1875, -30.0, -28.8125, -27.625, -26.4375, -25.25, -24.0625, -22.875, -21.6875, -20.5, -19.3125, -18.125, -16.9375, -15.75, -14.5625, -13.375, -12.1875, -11.0, -9.8125, -8.625, -7.4375, -6.25, -5.0625, -3.875, -2.6875, -1.5, -0.3125, 0.875, 2.0625, 3.25, 4.4375, 5.625, 6.8125, 8.0, 9.1875, 10.375, 11.5625, 12.75, 13.9375, 15.125, 16.3125, 17.5, 18.6875, 19.875, 21.0625, 22.25, 23.4375, 24.625, 25.8125, 27.0, 28.1875, 29.375, 30.5625, 31.75, 32.9375, 34.125, 35.3125, 36.5, 37.6875, 38.875, 40.0625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 242.0, 760.0, 14.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.68547821044922, -106.94771575927734, -98.20995330810547, -89.4721908569336, -80.73442840576172, -71.99666595458984, -63.25890350341797, -54.521141052246094, -45.78337860107422, -37.045616149902344, -28.30785369873047, -19.570091247558594, -10.832328796386719, -2.0945663452148438, 6.643196105957031, 15.380958557128906, 24.11872100830078, 32.856483459472656, 41.59424591064453, 50.332008361816406, 59.06977081298828, 67.80753326416016, 76.54529571533203, 85.2830581665039, 94.02082061767578, 102.75858306884766, 111.49634552001953, 120.2341079711914, 128.97186279296875, 137.70962524414062, 146.4473876953125, 155.18515014648438, 163.92291259765625, 172.66067504882812, 181.3984375, 190.13619995117188, 198.87396240234375, 207.61172485351562, 216.3494873046875, 225.08724975585938, 233.82501220703125, 242.56277465820312, 251.300537109375, 260.0382995605469, 268.77606201171875, 277.5138244628906, 286.2515869140625, 294.9893493652344, 303.72711181640625, 312.4648742675781, 321.20263671875, 329.9403991699219, 338.67816162109375, 347.4159240722656, 356.1536865234375, 364.8914489746094, 373.62921142578125, 382.3669738769531, 391.104736328125, 399.8424987792969, 408.58026123046875, 417.3180236816406, 426.0557861328125, 434.7935485839844, 443.53131103515625]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 2.0, 5.0, 3.0, 8.0, 8.0, 11.0, 9.0, 17.0, 12.0, 20.0, 21.0, 17.0, 21.0, 21.0, 32.0, 39.0, 31.0, 24.0, 44.0, 43.0, 44.0, 42.0, 37.0, 34.0, 33.0, 44.0, 38.0, 36.0, 26.0, 34.0, 28.0, 32.0, 23.0, 22.0, 15.0, 22.0, 17.0, 17.0, 14.0, 10.0, 10.0, 18.0, 5.0, 4.0, 6.0, 5.0, 4.0, 1.0, 5.0], "bins": [-57.76106643676758, -56.302818298339844, -54.84457015991211, -53.386322021484375, -51.928077697753906, -50.46982955932617, -49.01158142089844, -47.5533332824707, -46.09508514404297, -44.636837005615234, -43.1785888671875, -41.720340728759766, -40.26209259033203, -38.80384826660156, -37.34560012817383, -35.887351989746094, -34.42910385131836, -32.970855712890625, -31.51260757446289, -30.05436134338379, -28.596113204956055, -27.13786506652832, -25.67961883544922, -24.221370697021484, -22.76312255859375, -21.304874420166016, -19.84662628173828, -18.38838005065918, -16.930131912231445, -15.471883773803711, -14.013636589050293, -12.555389404296875, -11.097137451171875, -9.63888931274414, -8.180642127990723, -6.7223944664001465, -5.26414680480957, -3.805899143218994, -2.347651481628418, -0.889404296875, 0.5688438415527344, 2.0270915031433105, 3.4853391647338867, 4.943586826324463, 6.401834487915039, 7.860082149505615, 9.318329811096191, 10.77657699584961, 12.234825134277344, 13.693073272705078, 15.151320457458496, 16.609567642211914, 18.06781578063965, 19.526063919067383, 20.984310150146484, 22.44255828857422, 23.900806427001953, 25.359054565429688, 26.817302703857422, 28.275548934936523, 29.733797073364258, 31.192045211791992, 32.650291442871094, 34.10853958129883, 35.56678771972656]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 5.0, 8.0, 7.0, 4.0, 10.0, 16.0, 18.0, 10.0, 13.0, 19.0, 11.0, 24.0, 37.0, 27.0, 37.0, 29.0, 24.0, 36.0, 46.0, 42.0, 40.0, 46.0, 40.0, 40.0, 44.0, 24.0, 34.0, 39.0, 29.0, 28.0, 24.0, 30.0, 14.0, 21.0, 29.0, 16.0, 16.0, 12.0, 4.0, 12.0, 7.0, 3.0, 6.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0], "bins": [-8.234375, -8.003173828125, -7.77197265625, -7.540771484375, -7.3095703125, -7.078369140625, -6.84716796875, -6.615966796875, -6.384765625, -6.153564453125, -5.92236328125, -5.691162109375, -5.4599609375, -5.228759765625, -4.99755859375, -4.766357421875, -4.53515625, -4.303955078125, -4.07275390625, -3.841552734375, -3.6103515625, -3.379150390625, -3.14794921875, -2.916748046875, -2.685546875, -2.454345703125, -2.22314453125, -1.991943359375, -1.7607421875, -1.529541015625, -1.29833984375, -1.067138671875, -0.8359375, -0.604736328125, -0.37353515625, -0.142333984375, 0.0888671875, 0.320068359375, 0.55126953125, 0.782470703125, 1.013671875, 1.244873046875, 1.47607421875, 1.707275390625, 1.9384765625, 2.169677734375, 2.40087890625, 2.632080078125, 2.86328125, 3.094482421875, 3.32568359375, 3.556884765625, 3.7880859375, 4.019287109375, 4.25048828125, 4.481689453125, 4.712890625, 4.944091796875, 5.17529296875, 5.406494140625, 5.6376953125, 5.868896484375, 6.10009765625, 6.331298828125, 6.5625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 0.0, 8.0, 10.0, 3.0, 14.0, 18.0, 23.0, 19.0, 21.0, 24.0, 43.0, 61.0, 101.0, 172.0, 273.0, 507.0, 1177.0, 2727.0, 7350.0, 23423.0, 118384.0, 1247699.0, 2412959.0, 315803.0, 43837.0, 12027.0, 4163.0, 1682.0, 740.0, 370.0, 224.0, 124.0, 76.0, 59.0, 40.0, 22.0, 14.0, 18.0, 14.0, 6.0, 11.0, 5.0, 6.0, 1.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-15.5234375, -15.0560302734375, -14.588623046875, -14.1212158203125, -13.65380859375, -13.1864013671875, -12.718994140625, -12.2515869140625, -11.7841796875, -11.3167724609375, -10.849365234375, -10.3819580078125, -9.91455078125, -9.4471435546875, -8.979736328125, -8.5123291015625, -8.044921875, -7.5775146484375, -7.110107421875, -6.6427001953125, -6.17529296875, -5.7078857421875, -5.240478515625, -4.7730712890625, -4.3056640625, -3.8382568359375, -3.370849609375, -2.9034423828125, -2.43603515625, -1.9686279296875, -1.501220703125, -1.0338134765625, -0.56640625, -0.0989990234375, 0.368408203125, 0.8358154296875, 1.30322265625, 1.7706298828125, 2.238037109375, 2.7054443359375, 3.1728515625, 3.6402587890625, 4.107666015625, 4.5750732421875, 5.04248046875, 5.5098876953125, 5.977294921875, 6.4447021484375, 6.912109375, 7.3795166015625, 7.846923828125, 8.3143310546875, 8.78173828125, 9.2491455078125, 9.716552734375, 10.1839599609375, 10.6513671875, 11.1187744140625, 11.586181640625, 12.0535888671875, 12.52099609375, 12.9884033203125, 13.455810546875, 13.9232177734375, 14.390625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 6.0, 9.0, 9.0, 11.0, 23.0, 21.0, 27.0, 29.0, 40.0, 60.0, 81.0, 129.0, 178.0, 259.0, 393.0, 497.0, 567.0, 445.0, 342.0, 258.0, 170.0, 114.0, 90.0, 66.0, 66.0, 38.0, 32.0, 28.0, 17.0, 11.0, 10.0, 8.0, 6.0, 5.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.0859375, -8.7762451171875, -8.466552734375, -8.1568603515625, -7.84716796875, -7.5374755859375, -7.227783203125, -6.9180908203125, -6.6083984375, -6.2987060546875, -5.989013671875, -5.6793212890625, -5.36962890625, -5.0599365234375, -4.750244140625, -4.4405517578125, -4.130859375, -3.8211669921875, -3.511474609375, -3.2017822265625, -2.89208984375, -2.5823974609375, -2.272705078125, -1.9630126953125, -1.6533203125, -1.3436279296875, -1.033935546875, -0.7242431640625, -0.41455078125, -0.1048583984375, 0.204833984375, 0.5145263671875, 0.82421875, 1.1339111328125, 1.443603515625, 1.7532958984375, 2.06298828125, 2.3726806640625, 2.682373046875, 2.9920654296875, 3.3017578125, 3.6114501953125, 3.921142578125, 4.2308349609375, 4.54052734375, 4.8502197265625, 5.159912109375, 5.4696044921875, 5.779296875, 6.0889892578125, 6.398681640625, 6.7083740234375, 7.01806640625, 7.3277587890625, 7.637451171875, 7.9471435546875, 8.2568359375, 8.5665283203125, 8.876220703125, 9.1859130859375, 9.49560546875, 9.8052978515625, 10.114990234375, 10.4246826171875, 10.734375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 10.0, 9.0, 15.0, 21.0, 24.0, 42.0, 61.0, 90.0, 197.0, 593.0, 1781.0, 7050.0, 33839.0, 276939.0, 3425043.0, 393297.0, 43328.0, 8452.0, 2225.0, 678.0, 259.0, 129.0, 65.0, 44.0, 30.0, 15.0, 15.0, 10.0, 8.0, 4.0, 3.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.40625, -26.61328125, -25.8203125, -25.02734375, -24.234375, -23.44140625, -22.6484375, -21.85546875, -21.0625, -20.26953125, -19.4765625, -18.68359375, -17.890625, -17.09765625, -16.3046875, -15.51171875, -14.71875, -13.92578125, -13.1328125, -12.33984375, -11.546875, -10.75390625, -9.9609375, -9.16796875, -8.375, -7.58203125, -6.7890625, -5.99609375, -5.203125, -4.41015625, -3.6171875, -2.82421875, -2.03125, -1.23828125, -0.4453125, 0.34765625, 1.140625, 1.93359375, 2.7265625, 3.51953125, 4.3125, 5.10546875, 5.8984375, 6.69140625, 7.484375, 8.27734375, 9.0703125, 9.86328125, 10.65625, 11.44921875, 12.2421875, 13.03515625, 13.828125, 14.62109375, 15.4140625, 16.20703125, 17.0, 17.79296875, 18.5859375, 19.37890625, 20.171875, 20.96484375, 21.7578125, 22.55078125, 23.34375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 9.0, 178.0, 669.0, 150.0, 12.0, 0.0, 1.0], "bins": [-546.9300537109375, -537.7235717773438, -528.51708984375, -519.3106079101562, -510.1041564941406, -500.8976745605469, -491.69122314453125, -482.4847412109375, -473.27825927734375, -464.07177734375, -454.86529541015625, -445.6588439941406, -436.4523620605469, -427.2458801269531, -418.0394287109375, -408.83294677734375, -399.62646484375, -390.41998291015625, -381.2135009765625, -372.0070495605469, -362.8005676269531, -353.5940856933594, -344.38763427734375, -335.18115234375, -325.97467041015625, -316.7681884765625, -307.56170654296875, -298.3552551269531, -289.1487731933594, -279.9422912597656, -270.73583984375, -261.52935791015625, -252.32284545898438, -243.11636352539062, -233.90989685058594, -224.70343017578125, -215.4969482421875, -206.29046630859375, -197.08399963378906, -187.87753295898438, -178.67105102539062, -169.46456909179688, -160.2581024169922, -151.0516357421875, -141.84515380859375, -132.638671875, -123.43220520019531, -114.2257308959961, -105.01925659179688, -95.81278228759766, -86.60630798339844, -77.39983367919922, -68.193359375, -58.98688507080078, -49.78041076660156, -40.573936462402344, -31.367462158203125, -22.160987854003906, -12.954513549804688, -3.7480392456054688, 5.45843505859375, 14.664909362792969, 23.871383666992188, 33.077857971191406, 42.284332275390625]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 6.0, 3.0, 4.0, 1.0, 8.0, 5.0, 8.0, 8.0, 8.0, 8.0, 17.0, 14.0, 14.0, 21.0, 11.0, 17.0, 14.0, 26.0, 27.0, 26.0, 27.0, 22.0, 26.0, 30.0, 27.0, 44.0, 34.0, 35.0, 38.0, 37.0, 37.0, 32.0, 38.0, 32.0, 25.0, 28.0, 27.0, 28.0, 24.0, 22.0, 15.0, 21.0, 14.0, 19.0, 16.0, 11.0, 9.0, 9.0, 9.0, 9.0, 3.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-29.99409294128418, -29.009191513061523, -28.024290084838867, -27.039386749267578, -26.054485321044922, -25.069583892822266, -24.08468246459961, -23.099781036376953, -22.114879608154297, -21.12997817993164, -20.145076751708984, -19.160175323486328, -18.17527198791504, -17.190370559692383, -16.205469131469727, -15.22056770324707, -14.235664367675781, -13.250762939453125, -12.265860557556152, -11.280959129333496, -10.296056747436523, -9.311155319213867, -8.326253890991211, -7.3413519859313965, -6.356450080871582, -5.371548175811768, -4.386646270751953, -3.401744842529297, -2.4168429374694824, -1.431941032409668, -0.4470396041870117, 0.5378623008728027, 1.52276611328125, 2.5076680183410645, 3.4925696849823, 4.477471351623535, 5.46237325668335, 6.447275161743164, 7.43217658996582, 8.417078018188477, 9.40198040008545, 10.386881828308105, 11.371784210205078, 12.356685638427734, 13.34158706665039, 14.326489448547363, 15.31139087677002, 16.296293258666992, 17.28119468688965, 18.266096115112305, 19.25099754333496, 20.23590087890625, 21.220802307128906, 22.205703735351562, 23.19060516357422, 24.175506591796875, 25.16040802001953, 26.145309448242188, 27.130210876464844, 28.1151123046875, 29.10001564025879, 30.084917068481445, 31.0698184967041, 32.05472183227539, 33.03962326049805]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 13.0, 7.0, 5.0, 10.0, 9.0, 18.0, 19.0, 19.0, 20.0, 35.0, 23.0, 39.0, 33.0, 43.0, 40.0, 35.0, 36.0, 38.0, 43.0, 44.0, 35.0, 53.0, 43.0, 42.0, 31.0, 28.0, 33.0, 26.0, 26.0, 22.0, 21.0, 20.0, 10.0, 15.0, 11.0, 10.0, 7.0, 7.0, 10.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.57421875, -7.32110595703125, -7.0679931640625, -6.81488037109375, -6.561767578125, -6.30865478515625, -6.0555419921875, -5.80242919921875, -5.54931640625, -5.29620361328125, -5.0430908203125, -4.78997802734375, -4.536865234375, -4.28375244140625, -4.0306396484375, -3.77752685546875, -3.5244140625, -3.27130126953125, -3.0181884765625, -2.76507568359375, -2.511962890625, -2.25885009765625, -2.0057373046875, -1.75262451171875, -1.49951171875, -1.24639892578125, -0.9932861328125, -0.74017333984375, -0.487060546875, -0.23394775390625, 0.0191650390625, 0.27227783203125, 0.525390625, 0.77850341796875, 1.0316162109375, 1.28472900390625, 1.537841796875, 1.79095458984375, 2.0440673828125, 2.29718017578125, 2.55029296875, 2.80340576171875, 3.0565185546875, 3.30963134765625, 3.562744140625, 3.81585693359375, 4.0689697265625, 4.32208251953125, 4.5751953125, 4.82830810546875, 5.0814208984375, 5.33453369140625, 5.587646484375, 5.84075927734375, 6.0938720703125, 6.34698486328125, 6.60009765625, 6.85321044921875, 7.1063232421875, 7.35943603515625, 7.612548828125, 7.86566162109375, 8.1187744140625, 8.37188720703125, 8.625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 4.0, 7.0, 14.0, 14.0, 21.0, 46.0, 56.0, 104.0, 128.0, 186.0, 320.0, 463.0, 620.0, 903.0, 1339.0, 1909.0, 2845.0, 3981.0, 5918.0, 8491.0, 12397.0, 18353.0, 27832.0, 43344.0, 71616.0, 130623.0, 243114.0, 200301.0, 103175.0, 59332.0, 36740.0, 23791.0, 15861.0, 10918.0, 7303.0, 5032.0, 3532.0, 2522.0, 1687.0, 1145.0, 828.0, 597.0, 382.0, 280.0, 163.0, 121.0, 70.0, 41.0, 35.0, 21.0, 13.0, 11.0, 11.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2685546875, -0.2595481872558594, -0.25054168701171875, -0.24153518676757812, -0.2325286865234375, -0.22352218627929688, -0.21451568603515625, -0.20550918579101562, -0.196502685546875, -0.18749618530273438, -0.17848968505859375, -0.16948318481445312, -0.1604766845703125, -0.15147018432617188, -0.14246368408203125, -0.13345718383789062, -0.12445068359375, -0.11544418334960938, -0.10643768310546875, -0.09743118286132812, -0.0884246826171875, -0.07941818237304688, -0.07041168212890625, -0.061405181884765625, -0.052398681640625, -0.043392181396484375, -0.03438568115234375, -0.025379180908203125, -0.0163726806640625, -0.007366180419921875, 0.00164031982421875, 0.010646820068359375, 0.0196533203125, 0.028659820556640625, 0.03766632080078125, 0.046672821044921875, 0.0556793212890625, 0.06468582153320312, 0.07369232177734375, 0.08269882202148438, 0.091705322265625, 0.10071182250976562, 0.10971832275390625, 0.11872482299804688, 0.1277313232421875, 0.13673782348632812, 0.14574432373046875, 0.15475082397460938, 0.16375732421875, 0.17276382446289062, 0.18177032470703125, 0.19077682495117188, 0.1997833251953125, 0.20878982543945312, 0.21779632568359375, 0.22680282592773438, 0.235809326171875, 0.24481582641601562, 0.25382232666015625, 0.2628288269042969, 0.2718353271484375, 0.2808418273925781, 0.28984832763671875, 0.2988548278808594, 0.307861328125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 4.0, 8.0, 9.0, 11.0, 12.0, 12.0, 17.0, 16.0, 26.0, 17.0, 34.0, 35.0, 27.0, 36.0, 41.0, 42.0, 54.0, 48.0, 41.0, 1061.0, 39.0, 35.0, 35.0, 33.0, 43.0, 32.0, 32.0, 30.0, 29.0, 26.0, 22.0, 20.0, 15.0, 18.0, 14.0, 15.0, 3.0, 9.0, 6.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.765625, -5.5914306640625, -5.417236328125, -5.2430419921875, -5.06884765625, -4.8946533203125, -4.720458984375, -4.5462646484375, -4.3720703125, -4.1978759765625, -4.023681640625, -3.8494873046875, -3.67529296875, -3.5010986328125, -3.326904296875, -3.1527099609375, -2.978515625, -2.8043212890625, -2.630126953125, -2.4559326171875, -2.28173828125, -2.1075439453125, -1.933349609375, -1.7591552734375, -1.5849609375, -1.4107666015625, -1.236572265625, -1.0623779296875, -0.88818359375, -0.7139892578125, -0.539794921875, -0.3656005859375, -0.19140625, -0.0172119140625, 0.156982421875, 0.3311767578125, 0.50537109375, 0.6795654296875, 0.853759765625, 1.0279541015625, 1.2021484375, 1.3763427734375, 1.550537109375, 1.7247314453125, 1.89892578125, 2.0731201171875, 2.247314453125, 2.4215087890625, 2.595703125, 2.7698974609375, 2.944091796875, 3.1182861328125, 3.29248046875, 3.4666748046875, 3.640869140625, 3.8150634765625, 3.9892578125, 4.1634521484375, 4.337646484375, 4.5118408203125, 4.68603515625, 4.8602294921875, 5.034423828125, 5.2086181640625, 5.3828125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 17.0, 11.0, 21.0, 18.0, 25.0, 48.0, 61.0, 97.0, 157.0, 223.0, 247.0, 397.0, 648.0, 836.0, 1243.0, 1874.0, 2785.0, 4174.0, 6160.0, 9515.0, 14650.0, 23187.0, 37172.0, 62623.0, 118633.0, 1297936.0, 239202.0, 113194.0, 60504.0, 36035.0, 22851.0, 14350.0, 9270.0, 6122.0, 4132.0, 2782.0, 1841.0, 1283.0, 836.0, 621.0, 404.0, 297.0, 203.0, 126.0, 85.0, 72.0, 62.0, 35.0, 21.0, 14.0, 8.0, 11.0, 3.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.328125, -0.3181724548339844, -0.30821990966796875, -0.2982673645019531, -0.2883148193359375, -0.2783622741699219, -0.26840972900390625, -0.2584571838378906, -0.248504638671875, -0.23855209350585938, -0.22859954833984375, -0.21864700317382812, -0.2086944580078125, -0.19874191284179688, -0.18878936767578125, -0.17883682250976562, -0.16888427734375, -0.15893173217773438, -0.14897918701171875, -0.13902664184570312, -0.1290740966796875, -0.11912155151367188, -0.10916900634765625, -0.09921646118164062, -0.089263916015625, -0.07931137084960938, -0.06935882568359375, -0.059406280517578125, -0.0494537353515625, -0.039501190185546875, -0.02954864501953125, -0.019596099853515625, -0.0096435546875, 0.000308990478515625, 0.01026153564453125, 0.020214080810546875, 0.0301666259765625, 0.040119171142578125, 0.05007171630859375, 0.060024261474609375, 0.069976806640625, 0.07992935180664062, 0.08988189697265625, 0.09983444213867188, 0.1097869873046875, 0.11973953247070312, 0.12969207763671875, 0.13964462280273438, 0.14959716796875, 0.15954971313476562, 0.16950225830078125, 0.17945480346679688, 0.1894073486328125, 0.19935989379882812, 0.20931243896484375, 0.21926498413085938, 0.229217529296875, 0.23917007446289062, 0.24912261962890625, 0.2590751647949219, 0.2690277099609375, 0.2789802551269531, 0.28893280029296875, 0.2988853454589844, 0.308837890625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 5.0, 10.0, 10.0, 10.0, 22.0, 13.0, 17.0, 16.0, 26.0, 33.0, 44.0, 31.0, 33.0, 40.0, 43.0, 45.0, 41.0, 48.0, 45.0, 42.0, 41.0, 30.0, 47.0, 41.0, 31.0, 35.0, 19.0, 25.0, 31.0, 19.0, 18.0, 12.0, 13.0, 16.0, 7.0, 11.0, 9.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.184246063232422e-05, -4.064291715621948e-05, -3.9443373680114746e-05, -3.824383020401001e-05, -3.7044286727905273e-05, -3.584474325180054e-05, -3.46451997756958e-05, -3.3445656299591064e-05, -3.224611282348633e-05, -3.104656934738159e-05, -2.9847025871276855e-05, -2.864748239517212e-05, -2.7447938919067383e-05, -2.6248395442962646e-05, -2.504885196685791e-05, -2.3849308490753174e-05, -2.2649765014648438e-05, -2.14502215385437e-05, -2.0250678062438965e-05, -1.905113458633423e-05, -1.7851591110229492e-05, -1.6652047634124756e-05, -1.545250415802002e-05, -1.4252960681915283e-05, -1.3053417205810547e-05, -1.185387372970581e-05, -1.0654330253601074e-05, -9.454786777496338e-06, -8.255243301391602e-06, -7.055699825286865e-06, -5.856156349182129e-06, -4.656612873077393e-06, -3.4570693969726562e-06, -2.25752592086792e-06, -1.0579824447631836e-06, 1.4156103134155273e-07, 1.341104507446289e-06, 2.5406479835510254e-06, 3.7401914596557617e-06, 4.939734935760498e-06, 6.139278411865234e-06, 7.338821887969971e-06, 8.538365364074707e-06, 9.737908840179443e-06, 1.093745231628418e-05, 1.2136995792388916e-05, 1.3336539268493652e-05, 1.4536082744598389e-05, 1.5735626220703125e-05, 1.693516969680786e-05, 1.8134713172912598e-05, 1.9334256649017334e-05, 2.053380012512207e-05, 2.1733343601226807e-05, 2.2932887077331543e-05, 2.413243055343628e-05, 2.5331974029541016e-05, 2.6531517505645752e-05, 2.7731060981750488e-05, 2.8930604457855225e-05, 3.013014793395996e-05, 3.13296914100647e-05, 3.2529234886169434e-05, 3.372877836227417e-05, 3.4928321838378906e-05]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 5.0, 14.0, 3.0, 7.0, 17.0, 24.0, 24.0, 23.0, 35.0, 37.0, 37.0, 50.0, 60.0, 62.0, 78.0, 123.0, 167.0, 239.0, 377.0, 782.0, 18314.0, 994658.0, 31175.0, 871.0, 387.0, 247.0, 165.0, 115.0, 69.0, 73.0, 46.0, 49.0, 44.0, 34.0, 33.0, 23.0, 12.0, 16.0, 13.0, 10.0, 8.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00066375732421875, -0.0006412863731384277, -0.0006188154220581055, -0.0005963444709777832, -0.0005738735198974609, -0.0005514025688171387, -0.0005289316177368164, -0.0005064606666564941, -0.0004839897155761719, -0.0004615187644958496, -0.00043904781341552734, -0.0004165768623352051, -0.0003941059112548828, -0.00037163496017456055, -0.0003491640090942383, -0.000326693058013916, -0.00030422210693359375, -0.0002817511558532715, -0.0002592802047729492, -0.00023680925369262695, -0.0002143383026123047, -0.00019186735153198242, -0.00016939640045166016, -0.0001469254493713379, -0.00012445449829101562, -0.00010198354721069336, -7.95125961303711e-05, -5.704164505004883e-05, -3.457069396972656e-05, -1.2099742889404297e-05, 1.0371208190917969e-05, 3.2842159271240234e-05, 5.53131103515625e-05, 7.778406143188477e-05, 0.00010025501251220703, 0.0001227259635925293, 0.00014519691467285156, 0.00016766786575317383, 0.0001901388168334961, 0.00021260976791381836, 0.00023508071899414062, 0.0002575516700744629, 0.00028002262115478516, 0.0003024935722351074, 0.0003249645233154297, 0.00034743547439575195, 0.0003699064254760742, 0.0003923773765563965, 0.00041484832763671875, 0.000437319278717041, 0.0004597902297973633, 0.00048226118087768555, 0.0005047321319580078, 0.0005272030830383301, 0.0005496740341186523, 0.0005721449851989746, 0.0005946159362792969, 0.0006170868873596191, 0.0006395578384399414, 0.0006620287895202637, 0.0006844997406005859, 0.0007069706916809082, 0.0007294416427612305, 0.0007519125938415527, 0.000774383544921875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 13.0, 18.0, 65.0, 134.0, 212.0, 223.0, 157.0, 113.0, 52.0, 15.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.637664849520661e-05, -3.458403443801217e-05, -3.2791420380817726e-05, -3.0998806323623285e-05, -2.9206192266428843e-05, -2.74135782092344e-05, -2.5620962333050556e-05, -2.3828348275856115e-05, -2.2035734218661673e-05, -2.0243120161467232e-05, -1.845050610427279e-05, -1.6657890228088945e-05, -1.4865277080389205e-05, -1.3072663023194764e-05, -1.128004805650562e-05, -9.487433999311179e-06, -7.694819942116737e-06, -5.902205884922296e-06, -4.109591372980503e-06, -2.316976861038711e-06, -5.243628038442694e-07, 1.2682512533501722e-06, 3.0608662200393155e-06, 4.853480277233757e-06, 6.646094334428199e-06, 8.43870839162264e-06, 1.0231322448817082e-05, 1.2023937415506225e-05, 1.3816551472700667e-05, 1.560916643938981e-05, 1.740178049658425e-05, 1.9194394553778693e-05, 2.0987004972994328e-05, 2.277961903018877e-05, 2.457223308738321e-05, 2.6364847144577652e-05, 2.8157461201772094e-05, 2.9950075258966535e-05, 3.174268931616098e-05, 3.353530337335542e-05, 3.532791743054986e-05, 3.71205314877443e-05, 3.891314554493874e-05, 4.0705759602133185e-05, 4.2498373659327626e-05, 4.429098771652207e-05, 4.608360177371651e-05, 4.787621583091095e-05, 4.96688335260842e-05, 5.146144758327864e-05, 5.325406164047308e-05, 5.5046675697667524e-05, 5.6839289754861966e-05, 5.863190381205641e-05, 6.0424521507229656e-05, 6.22171355644241e-05, 6.400974962161854e-05, 6.580236367881298e-05, 6.759497773600742e-05, 6.938759179320186e-05, 7.11802058503963e-05, 7.297281990759075e-05, 7.476543396478519e-05, 7.655804802197963e-05, 7.835066207917407e-05]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 7.0, 15.0, 6.0, 10.0, 17.0, 19.0, 22.0, 22.0, 18.0, 18.0, 21.0, 18.0, 18.0, 30.0, 44.0, 47.0, 32.0, 35.0, 37.0, 36.0, 38.0, 40.0, 42.0, 38.0, 44.0, 26.0, 25.0, 29.0, 32.0, 21.0, 20.0, 28.0, 20.0, 22.0, 12.0, 17.0, 14.0, 6.0, 6.0, 11.0, 5.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.092123031616211e-05, -2.0256265997886658e-05, -1.9591301679611206e-05, -1.8926337361335754e-05, -1.8261373043060303e-05, -1.759640872478485e-05, -1.69314444065094e-05, -1.6266480088233948e-05, -1.5601515769958496e-05, -1.4936551451683044e-05, -1.4271587133407593e-05, -1.3606622815132141e-05, -1.294165849685669e-05, -1.2276694178581238e-05, -1.1611729860305786e-05, -1.0946765542030334e-05, -1.0281801223754883e-05, -9.616836905479431e-06, -8.95187258720398e-06, -8.286908268928528e-06, -7.621943950653076e-06, -6.9569796323776245e-06, -6.292015314102173e-06, -5.627050995826721e-06, -4.9620866775512695e-06, -4.297122359275818e-06, -3.632158041000366e-06, -2.9671937227249146e-06, -2.302229404449463e-06, -1.6372650861740112e-06, -9.723007678985596e-07, -3.073364496231079e-07, 3.5762786865234375e-07, 1.0225921869277954e-06, 1.687556505203247e-06, 2.3525208234786987e-06, 3.0174851417541504e-06, 3.682449460029602e-06, 4.347413778305054e-06, 5.012378096580505e-06, 5.677342414855957e-06, 6.342306733131409e-06, 7.00727105140686e-06, 7.672235369682312e-06, 8.337199687957764e-06, 9.002164006233215e-06, 9.667128324508667e-06, 1.0332092642784119e-05, 1.099705696105957e-05, 1.1662021279335022e-05, 1.2326985597610474e-05, 1.2991949915885925e-05, 1.3656914234161377e-05, 1.4321878552436829e-05, 1.498684287071228e-05, 1.5651807188987732e-05, 1.6316771507263184e-05, 1.6981735825538635e-05, 1.7646700143814087e-05, 1.831166446208954e-05, 1.897662878036499e-05, 1.9641593098640442e-05, 2.0306557416915894e-05, 2.0971521735191345e-05, 2.1636486053466797e-05]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 13.0, 7.0, 5.0, 10.0, 9.0, 18.0, 19.0, 19.0, 20.0, 35.0, 23.0, 39.0, 33.0, 43.0, 40.0, 35.0, 36.0, 38.0, 43.0, 44.0, 35.0, 53.0, 43.0, 42.0, 31.0, 28.0, 33.0, 26.0, 26.0, 22.0, 21.0, 20.0, 10.0, 15.0, 11.0, 10.0, 7.0, 7.0, 10.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.57421875, -7.32110595703125, -7.0679931640625, -6.81488037109375, -6.561767578125, -6.30865478515625, -6.0555419921875, -5.80242919921875, -5.54931640625, -5.29620361328125, -5.0430908203125, -4.78997802734375, -4.536865234375, -4.28375244140625, -4.0306396484375, -3.77752685546875, -3.5244140625, -3.27130126953125, -3.0181884765625, -2.76507568359375, -2.511962890625, -2.25885009765625, -2.0057373046875, -1.75262451171875, -1.49951171875, -1.24639892578125, -0.9932861328125, -0.74017333984375, -0.487060546875, -0.23394775390625, 0.0191650390625, 0.27227783203125, 0.525390625, 0.77850341796875, 1.0316162109375, 1.28472900390625, 1.537841796875, 1.79095458984375, 2.0440673828125, 2.29718017578125, 2.55029296875, 2.80340576171875, 3.0565185546875, 3.30963134765625, 3.562744140625, 3.81585693359375, 4.0689697265625, 4.32208251953125, 4.5751953125, 4.82830810546875, 5.0814208984375, 5.33453369140625, 5.587646484375, 5.84075927734375, 6.0938720703125, 6.34698486328125, 6.60009765625, 6.85321044921875, 7.1063232421875, 7.35943603515625, 7.612548828125, 7.86566162109375, 8.1187744140625, 8.37188720703125, 8.625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 1.0, 9.0, 7.0, 11.0, 18.0, 26.0, 28.0, 31.0, 54.0, 68.0, 82.0, 117.0, 172.0, 261.0, 403.0, 716.0, 1156.0, 1948.0, 3463.0, 6199.0, 11944.0, 24988.0, 62788.0, 213019.0, 463120.0, 161893.0, 51215.0, 21262.0, 10401.0, 5619.0, 3012.0, 1716.0, 1012.0, 600.0, 357.0, 230.0, 167.0, 109.0, 85.0, 71.0, 45.0, 35.0, 24.0, 18.0, 8.0, 15.0, 8.0, 9.0, 9.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0], "bins": [-9.796875, -9.5035400390625, -9.210205078125, -8.9168701171875, -8.62353515625, -8.3302001953125, -8.036865234375, -7.7435302734375, -7.4501953125, -7.1568603515625, -6.863525390625, -6.5701904296875, -6.27685546875, -5.9835205078125, -5.690185546875, -5.3968505859375, -5.103515625, -4.8101806640625, -4.516845703125, -4.2235107421875, -3.93017578125, -3.6368408203125, -3.343505859375, -3.0501708984375, -2.7568359375, -2.4635009765625, -2.170166015625, -1.8768310546875, -1.58349609375, -1.2901611328125, -0.996826171875, -0.7034912109375, -0.41015625, -0.1168212890625, 0.176513671875, 0.4698486328125, 0.76318359375, 1.0565185546875, 1.349853515625, 1.6431884765625, 1.9365234375, 2.2298583984375, 2.523193359375, 2.8165283203125, 3.10986328125, 3.4031982421875, 3.696533203125, 3.9898681640625, 4.283203125, 4.5765380859375, 4.869873046875, 5.1632080078125, 5.45654296875, 5.7498779296875, 6.043212890625, 6.3365478515625, 6.6298828125, 6.9232177734375, 7.216552734375, 7.5098876953125, 7.80322265625, 8.0965576171875, 8.389892578125, 8.6832275390625, 8.9765625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 9.0, 10.0, 10.0, 14.0, 16.0, 16.0, 25.0, 26.0, 25.0, 39.0, 35.0, 26.0, 43.0, 54.0, 68.0, 125.0, 335.0, 1473.0, 156.0, 90.0, 66.0, 54.0, 43.0, 35.0, 35.0, 30.0, 23.0, 25.0, 21.0, 23.0, 15.0, 13.0, 10.0, 11.0, 8.0, 6.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-21.890625, -21.229736328125, -20.56884765625, -19.907958984375, -19.2470703125, -18.586181640625, -17.92529296875, -17.264404296875, -16.603515625, -15.942626953125, -15.28173828125, -14.620849609375, -13.9599609375, -13.299072265625, -12.63818359375, -11.977294921875, -11.31640625, -10.655517578125, -9.99462890625, -9.333740234375, -8.6728515625, -8.011962890625, -7.35107421875, -6.690185546875, -6.029296875, -5.368408203125, -4.70751953125, -4.046630859375, -3.3857421875, -2.724853515625, -2.06396484375, -1.403076171875, -0.7421875, -0.081298828125, 0.57958984375, 1.240478515625, 1.9013671875, 2.562255859375, 3.22314453125, 3.884033203125, 4.544921875, 5.205810546875, 5.86669921875, 6.527587890625, 7.1884765625, 7.849365234375, 8.51025390625, 9.171142578125, 9.83203125, 10.492919921875, 11.15380859375, 11.814697265625, 12.4755859375, 13.136474609375, 13.79736328125, 14.458251953125, 15.119140625, 15.780029296875, 16.44091796875, 17.101806640625, 17.7626953125, 18.423583984375, 19.08447265625, 19.745361328125, 20.40625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 2.0, 7.0, 6.0, 7.0, 7.0, 14.0, 12.0, 22.0, 30.0, 43.0, 67.0, 96.0, 125.0, 180.0, 358.0, 941.0, 6945.0, 296823.0, 2818628.0, 18650.0, 1610.0, 449.0, 229.0, 128.0, 100.0, 55.0, 40.0, 33.0, 22.0, 20.0, 13.0, 10.0, 8.0, 8.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.21875, -34.8349609375, -33.451171875, -32.0673828125, -30.68359375, -29.2998046875, -27.916015625, -26.5322265625, -25.1484375, -23.7646484375, -22.380859375, -20.9970703125, -19.61328125, -18.2294921875, -16.845703125, -15.4619140625, -14.078125, -12.6943359375, -11.310546875, -9.9267578125, -8.54296875, -7.1591796875, -5.775390625, -4.3916015625, -3.0078125, -1.6240234375, -0.240234375, 1.1435546875, 2.52734375, 3.9111328125, 5.294921875, 6.6787109375, 8.0625, 9.4462890625, 10.830078125, 12.2138671875, 13.59765625, 14.9814453125, 16.365234375, 17.7490234375, 19.1328125, 20.5166015625, 21.900390625, 23.2841796875, 24.66796875, 26.0517578125, 27.435546875, 28.8193359375, 30.203125, 31.5869140625, 32.970703125, 34.3544921875, 35.73828125, 37.1220703125, 38.505859375, 39.8896484375, 41.2734375, 42.6572265625, 44.041015625, 45.4248046875, 46.80859375, 48.1923828125, 49.576171875, 50.9599609375, 52.34375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 22.0, 51.0, 92.0, 170.0, 208.0, 198.0, 139.0, 71.0, 32.0, 15.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.14478302001953, -64.75980377197266, -63.374820709228516, -61.989837646484375, -60.6048583984375, -59.219879150390625, -57.834896087646484, -56.449913024902344, -55.06493377685547, -53.679954528808594, -52.29497146606445, -50.90998840332031, -49.52500915527344, -48.14002990722656, -46.75504684448242, -45.37006378173828, -43.985084533691406, -42.60010528564453, -41.21512222290039, -39.83013916015625, -38.445159912109375, -37.0601806640625, -35.67519760131836, -34.29021453857422, -32.905235290527344, -31.520254135131836, -30.135272979736328, -28.75029182434082, -27.365310668945312, -25.980329513549805, -24.595348358154297, -23.21036720275879, -21.82538604736328, -20.440404891967773, -19.055423736572266, -17.670442581176758, -16.28546142578125, -14.900480270385742, -13.515499114990234, -12.130517959594727, -10.745536804199219, -9.360555648803711, -7.975574493408203, -6.590593338012695, -5.2056121826171875, -3.8206310272216797, -2.435649871826172, -1.050668716430664, 0.33431243896484375, 1.7192935943603516, 3.1042747497558594, 4.489255905151367, 5.874237060546875, 7.259218215942383, 8.64419937133789, 10.029180526733398, 11.414161682128906, 12.799142837524414, 14.184123992919922, 15.56910514831543, 16.954086303710938, 18.339067459106445, 19.724048614501953, 21.10902976989746, 22.49401092529297]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 10.0, 9.0, 19.0, 12.0, 22.0, 11.0, 17.0, 28.0, 21.0, 32.0, 38.0, 33.0, 39.0, 56.0, 53.0, 31.0, 41.0, 43.0, 47.0, 43.0, 47.0, 40.0, 44.0, 29.0, 49.0, 30.0, 23.0, 21.0, 18.0, 19.0, 8.0, 13.0, 12.0, 10.0, 6.0, 8.0, 4.0, 2.0, 7.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.21969985961914, -47.57644271850586, -45.93318557739258, -44.2899284362793, -42.646671295166016, -41.00341033935547, -39.36015319824219, -37.716896057128906, -36.073638916015625, -34.430381774902344, -32.78712463378906, -31.14386749267578, -29.500608444213867, -27.857351303100586, -26.214094161987305, -24.57083511352539, -22.927579879760742, -21.28432273864746, -19.64106559753418, -17.997806549072266, -16.354549407958984, -14.711292266845703, -13.068035125732422, -11.424777030944824, -9.781519889831543, -8.138262748718262, -6.495004653930664, -4.851747512817383, -3.2084898948669434, -1.565232276916504, 0.07802486419677734, 1.721282958984375, 3.3645401000976562, 5.007797718048096, 6.651055335998535, 8.294312477111816, 9.937570571899414, 11.580827713012695, 13.224084854125977, 14.867342948913574, 16.510601043701172, 18.153858184814453, 19.797115325927734, 21.440372467041016, 23.08363151550293, 24.72688865661621, 26.370145797729492, 28.013404846191406, 29.656660079956055, 31.299917221069336, 32.94317626953125, 34.58643341064453, 36.22969055175781, 37.872947692871094, 39.516204833984375, 41.159461975097656, 42.80271911621094, 44.44597625732422, 46.0892333984375, 47.73249053955078, 49.37574768066406, 51.019004821777344, 52.662261962890625, 54.30552291870117, 55.94878005981445]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 5.0, 5.0, 9.0, 6.0, 16.0, 10.0, 11.0, 15.0, 15.0, 30.0, 22.0, 33.0, 28.0, 40.0, 42.0, 30.0, 36.0, 32.0, 34.0, 42.0, 44.0, 42.0, 51.0, 40.0, 42.0, 30.0, 26.0, 30.0, 32.0, 27.0, 15.0, 22.0, 30.0, 19.0, 9.0, 15.0, 11.0, 7.0, 4.0, 9.0, 7.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.5, -8.2520751953125, -8.004150390625, -7.7562255859375, -7.50830078125, -7.2603759765625, -7.012451171875, -6.7645263671875, -6.5166015625, -6.2686767578125, -6.020751953125, -5.7728271484375, -5.52490234375, -5.2769775390625, -5.029052734375, -4.7811279296875, -4.533203125, -4.2852783203125, -4.037353515625, -3.7894287109375, -3.54150390625, -3.2935791015625, -3.045654296875, -2.7977294921875, -2.5498046875, -2.3018798828125, -2.053955078125, -1.8060302734375, -1.55810546875, -1.3101806640625, -1.062255859375, -0.8143310546875, -0.56640625, -0.3184814453125, -0.070556640625, 0.1773681640625, 0.42529296875, 0.6732177734375, 0.921142578125, 1.1690673828125, 1.4169921875, 1.6649169921875, 1.912841796875, 2.1607666015625, 2.40869140625, 2.6566162109375, 2.904541015625, 3.1524658203125, 3.400390625, 3.6483154296875, 3.896240234375, 4.1441650390625, 4.39208984375, 4.6400146484375, 4.887939453125, 5.1358642578125, 5.3837890625, 5.6317138671875, 5.879638671875, 6.1275634765625, 6.37548828125, 6.6234130859375, 6.871337890625, 7.1192626953125, 7.3671875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 9.0, 4.0, 6.0, 12.0, 14.0, 23.0, 17.0, 24.0, 36.0, 22.0, 42.0, 61.0, 57.0, 100.0, 121.0, 164.0, 203.0, 283.0, 322.0, 520.0, 21724.0, 4166185.0, 2384.0, 502.0, 341.0, 280.0, 186.0, 145.0, 120.0, 75.0, 59.0, 51.0, 39.0, 24.0, 23.0, 20.0, 18.0, 17.0, 9.0, 5.0, 6.0, 4.0, 3.0, 4.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-128.375, -124.40234375, -120.4296875, -116.45703125, -112.484375, -108.51171875, -104.5390625, -100.56640625, -96.59375, -92.62109375, -88.6484375, -84.67578125, -80.703125, -76.73046875, -72.7578125, -68.78515625, -64.8125, -60.83984375, -56.8671875, -52.89453125, -48.921875, -44.94921875, -40.9765625, -37.00390625, -33.03125, -29.05859375, -25.0859375, -21.11328125, -17.140625, -13.16796875, -9.1953125, -5.22265625, -1.25, 2.72265625, 6.6953125, 10.66796875, 14.640625, 18.61328125, 22.5859375, 26.55859375, 30.53125, 34.50390625, 38.4765625, 42.44921875, 46.421875, 50.39453125, 54.3671875, 58.33984375, 62.3125, 66.28515625, 70.2578125, 74.23046875, 78.203125, 82.17578125, 86.1484375, 90.12109375, 94.09375, 98.06640625, 102.0390625, 106.01171875, 109.984375, 113.95703125, 117.9296875, 121.90234375, 125.875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 9.0, 8.0, 11.0, 16.0, 14.0, 23.0, 25.0, 31.0, 39.0, 50.0, 78.0, 85.0, 130.0, 212.0, 359.0, 527.0, 623.0, 560.0, 412.0, 250.0, 176.0, 119.0, 80.0, 51.0, 46.0, 42.0, 32.0, 14.0, 9.0, 4.0, 4.0, 6.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-13.3125, -12.9488525390625, -12.585205078125, -12.2215576171875, -11.85791015625, -11.4942626953125, -11.130615234375, -10.7669677734375, -10.4033203125, -10.0396728515625, -9.676025390625, -9.3123779296875, -8.94873046875, -8.5850830078125, -8.221435546875, -7.8577880859375, -7.494140625, -7.1304931640625, -6.766845703125, -6.4031982421875, -6.03955078125, -5.6759033203125, -5.312255859375, -4.9486083984375, -4.5849609375, -4.2213134765625, -3.857666015625, -3.4940185546875, -3.13037109375, -2.7667236328125, -2.403076171875, -2.0394287109375, -1.67578125, -1.3121337890625, -0.948486328125, -0.5848388671875, -0.22119140625, 0.1424560546875, 0.506103515625, 0.8697509765625, 1.2333984375, 1.5970458984375, 1.960693359375, 2.3243408203125, 2.68798828125, 3.0516357421875, 3.415283203125, 3.7789306640625, 4.142578125, 4.5062255859375, 4.869873046875, 5.2335205078125, 5.59716796875, 5.9608154296875, 6.324462890625, 6.6881103515625, 7.0517578125, 7.4154052734375, 7.779052734375, 8.1427001953125, 8.50634765625, 8.8699951171875, 9.233642578125, 9.5972900390625, 9.9609375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 7.0, 3.0, 7.0, 7.0, 16.0, 20.0, 19.0, 18.0, 27.0, 38.0, 44.0, 41.0, 59.0, 114.0, 494.0, 16237.0, 4068703.0, 106629.0, 1166.0, 198.0, 102.0, 58.0, 50.0, 42.0, 35.0, 36.0, 25.0, 17.0, 12.0, 13.0, 9.0, 6.0, 3.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-85.0625, -82.677734375, -80.29296875, -77.908203125, -75.5234375, -73.138671875, -70.75390625, -68.369140625, -65.984375, -63.599609375, -61.21484375, -58.830078125, -56.4453125, -54.060546875, -51.67578125, -49.291015625, -46.90625, -44.521484375, -42.13671875, -39.751953125, -37.3671875, -34.982421875, -32.59765625, -30.212890625, -27.828125, -25.443359375, -23.05859375, -20.673828125, -18.2890625, -15.904296875, -13.51953125, -11.134765625, -8.75, -6.365234375, -3.98046875, -1.595703125, 0.7890625, 3.173828125, 5.55859375, 7.943359375, 10.328125, 12.712890625, 15.09765625, 17.482421875, 19.8671875, 22.251953125, 24.63671875, 27.021484375, 29.40625, 31.791015625, 34.17578125, 36.560546875, 38.9453125, 41.330078125, 43.71484375, 46.099609375, 48.484375, 50.869140625, 53.25390625, 55.638671875, 58.0234375, 60.408203125, 62.79296875, 65.177734375, 67.5625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 8.0, 18.0, 53.0, 83.0, 144.0, 201.0, 197.0, 151.0, 72.0, 46.0, 25.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.45285034179688, -98.22171783447266, -95.99059295654297, -93.75946044921875, -91.52833557128906, -89.29720306396484, -87.06607818603516, -84.83494567871094, -82.60382080078125, -80.37268829345703, -78.14156341552734, -75.91043090820312, -73.67930603027344, -71.44817352294922, -69.21704864501953, -66.98591613769531, -64.7547836303711, -62.52365493774414, -60.29252624511719, -58.061397552490234, -55.83026885986328, -53.59913635253906, -51.36800765991211, -49.136878967285156, -46.9057502746582, -44.67462158203125, -42.4434928894043, -40.212364196777344, -37.981231689453125, -35.75010681152344, -33.51897430419922, -31.287845611572266, -29.056720733642578, -26.825592041015625, -24.594463348388672, -22.363332748413086, -20.132204055786133, -17.90107536315918, -15.66994571685791, -13.43881607055664, -11.207687377929688, -8.976558685302734, -6.745429039001465, -4.5142998695373535, -2.283170700073242, -0.05204200744628906, 2.1790876388549805, 4.41021728515625, 6.641345977783203, 8.872474670410156, 11.103604316711426, 13.334733963012695, 15.565862655639648, 17.7969913482666, 20.028121948242188, 22.25925064086914, 24.490379333496094, 26.721508026123047, 28.95263671875, 31.183767318725586, 33.414894104003906, 35.646026611328125, 37.87715530395508, 40.10828399658203, 42.339412689208984]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 5.0, 3.0, 6.0, 11.0, 8.0, 15.0, 13.0, 12.0, 28.0, 28.0, 28.0, 33.0, 29.0, 23.0, 28.0, 41.0, 37.0, 44.0, 46.0, 51.0, 34.0, 58.0, 38.0, 33.0, 43.0, 41.0, 35.0, 30.0, 30.0, 25.0, 23.0, 13.0, 15.0, 20.0, 17.0, 10.0, 7.0, 5.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-36.95637512207031, -35.78951644897461, -34.622657775878906, -33.4557991027832, -32.2889404296875, -31.122081756591797, -29.95522117614746, -28.788362503051758, -27.621503829956055, -26.45464515686035, -25.28778648376465, -24.120927810668945, -22.95406723022461, -21.787208557128906, -20.620349884033203, -19.4534912109375, -18.286632537841797, -17.119773864746094, -15.95291519165039, -14.786055564880371, -13.619196891784668, -12.452338218688965, -11.285478591918945, -10.118619918823242, -8.951761245727539, -7.784902572631836, -6.618043422698975, -5.451184272766113, -4.28432559967041, -3.117466926574707, -1.9506077766418457, -0.7837486267089844, 0.3831138610839844, 1.5499727725982666, 2.716831684112549, 3.883690595626831, 5.050549507141113, 6.217408180236816, 7.384267330169678, 8.551126480102539, 9.717985153198242, 10.884843826293945, 12.051702499389648, 13.218562126159668, 14.385420799255371, 15.552279472351074, 16.719139099121094, 17.885997772216797, 19.0528564453125, 20.219715118408203, 21.386573791503906, 22.55343246459961, 23.720291137695312, 24.887149810791016, 26.05401039123535, 27.220869064331055, 28.387727737426758, 29.55458641052246, 30.721445083618164, 31.888303756713867, 33.0551643371582, 34.222023010253906, 35.38888168334961, 36.55574035644531, 37.722599029541016]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 6.0, 3.0, 12.0, 11.0, 13.0, 11.0, 14.0, 27.0, 26.0, 17.0, 28.0, 36.0, 36.0, 40.0, 39.0, 35.0, 38.0, 42.0, 38.0, 39.0, 42.0, 40.0, 51.0, 30.0, 39.0, 25.0, 29.0, 35.0, 25.0, 26.0, 23.0, 20.0, 28.0, 8.0, 10.0, 11.0, 10.0, 13.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.4453125, -8.19189453125, -7.9384765625, -7.68505859375, -7.431640625, -7.17822265625, -6.9248046875, -6.67138671875, -6.41796875, -6.16455078125, -5.9111328125, -5.65771484375, -5.404296875, -5.15087890625, -4.8974609375, -4.64404296875, -4.390625, -4.13720703125, -3.8837890625, -3.63037109375, -3.376953125, -3.12353515625, -2.8701171875, -2.61669921875, -2.36328125, -2.10986328125, -1.8564453125, -1.60302734375, -1.349609375, -1.09619140625, -0.8427734375, -0.58935546875, -0.3359375, -0.08251953125, 0.1708984375, 0.42431640625, 0.677734375, 0.93115234375, 1.1845703125, 1.43798828125, 1.69140625, 1.94482421875, 2.1982421875, 2.45166015625, 2.705078125, 2.95849609375, 3.2119140625, 3.46533203125, 3.71875, 3.97216796875, 4.2255859375, 4.47900390625, 4.732421875, 4.98583984375, 5.2392578125, 5.49267578125, 5.74609375, 5.99951171875, 6.2529296875, 6.50634765625, 6.759765625, 7.01318359375, 7.2666015625, 7.52001953125, 7.7734375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 11.0, 20.0, 17.0, 19.0, 54.0, 64.0, 97.0, 173.0, 246.0, 381.0, 659.0, 1022.0, 1627.0, 2557.0, 4358.0, 7280.0, 12311.0, 21552.0, 38592.0, 73118.0, 156537.0, 312727.0, 209812.0, 94298.0, 47548.0, 26169.0, 15004.0, 8811.0, 5100.0, 3266.0, 1926.0, 1126.0, 724.0, 523.0, 289.0, 179.0, 106.0, 72.0, 50.0, 39.0, 31.0, 20.0, 8.0, 9.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.397705078125, -0.385894775390625, -0.37408447265625, -0.362274169921875, -0.3504638671875, -0.338653564453125, -0.32684326171875, -0.315032958984375, -0.30322265625, -0.291412353515625, -0.27960205078125, -0.267791748046875, -0.2559814453125, -0.244171142578125, -0.23236083984375, -0.220550537109375, -0.208740234375, -0.196929931640625, -0.18511962890625, -0.173309326171875, -0.1614990234375, -0.149688720703125, -0.13787841796875, -0.126068115234375, -0.1142578125, -0.102447509765625, -0.09063720703125, -0.078826904296875, -0.0670166015625, -0.055206298828125, -0.04339599609375, -0.031585693359375, -0.019775390625, -0.007965087890625, 0.00384521484375, 0.015655517578125, 0.0274658203125, 0.039276123046875, 0.05108642578125, 0.062896728515625, 0.07470703125, 0.086517333984375, 0.09832763671875, 0.110137939453125, 0.1219482421875, 0.133758544921875, 0.14556884765625, 0.157379150390625, 0.169189453125, 0.180999755859375, 0.19281005859375, 0.204620361328125, 0.2164306640625, 0.228240966796875, 0.24005126953125, 0.251861572265625, 0.263671875, 0.275482177734375, 0.28729248046875, 0.299102783203125, 0.3109130859375, 0.322723388671875, 0.33453369140625, 0.346343994140625, 0.358154296875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 5.0, 5.0, 7.0, 8.0, 11.0, 16.0, 13.0, 14.0, 21.0, 25.0, 25.0, 19.0, 29.0, 34.0, 32.0, 31.0, 36.0, 33.0, 27.0, 32.0, 37.0, 1058.0, 33.0, 38.0, 42.0, 34.0, 27.0, 42.0, 36.0, 26.0, 30.0, 22.0, 25.0, 24.0, 18.0, 14.0, 13.0, 10.0, 13.0, 8.0, 10.0, 7.0, 7.0, 4.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0], "bins": [-4.24609375, -4.10284423828125, -3.9595947265625, -3.81634521484375, -3.673095703125, -3.52984619140625, -3.3865966796875, -3.24334716796875, -3.10009765625, -2.95684814453125, -2.8135986328125, -2.67034912109375, -2.527099609375, -2.38385009765625, -2.2406005859375, -2.09735107421875, -1.9541015625, -1.81085205078125, -1.6676025390625, -1.52435302734375, -1.381103515625, -1.23785400390625, -1.0946044921875, -0.95135498046875, -0.80810546875, -0.66485595703125, -0.5216064453125, -0.37835693359375, -0.235107421875, -0.09185791015625, 0.0513916015625, 0.19464111328125, 0.337890625, 0.48114013671875, 0.6243896484375, 0.76763916015625, 0.910888671875, 1.05413818359375, 1.1973876953125, 1.34063720703125, 1.48388671875, 1.62713623046875, 1.7703857421875, 1.91363525390625, 2.056884765625, 2.20013427734375, 2.3433837890625, 2.48663330078125, 2.6298828125, 2.77313232421875, 2.9163818359375, 3.05963134765625, 3.202880859375, 3.34613037109375, 3.4893798828125, 3.63262939453125, 3.77587890625, 3.91912841796875, 4.0623779296875, 4.20562744140625, 4.348876953125, 4.49212646484375, 4.6353759765625, 4.77862548828125, 4.921875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 12.0, 15.0, 29.0, 45.0, 60.0, 76.0, 120.0, 161.0, 205.0, 315.0, 453.0, 671.0, 969.0, 1430.0, 2052.0, 2939.0, 4401.0, 6494.0, 10032.0, 15447.0, 24287.0, 38884.0, 64325.0, 118659.0, 755600.0, 757672.0, 118695.0, 64418.0, 38771.0, 24357.0, 15237.0, 9846.0, 6562.0, 4352.0, 3092.0, 1935.0, 1395.0, 878.0, 692.0, 447.0, 333.0, 257.0, 162.0, 105.0, 73.0, 51.0, 23.0, 23.0, 22.0, 13.0, 15.0, 6.0, 7.0, 7.0, 2.0, 3.0, 1.0], "bins": [-0.28759765625, -0.2786102294921875, -0.269622802734375, -0.2606353759765625, -0.25164794921875, -0.2426605224609375, -0.233673095703125, -0.2246856689453125, -0.2156982421875, -0.2067108154296875, -0.197723388671875, -0.1887359619140625, -0.17974853515625, -0.1707611083984375, -0.161773681640625, -0.1527862548828125, -0.143798828125, -0.1348114013671875, -0.125823974609375, -0.1168365478515625, -0.10784912109375, -0.0988616943359375, -0.089874267578125, -0.0808868408203125, -0.0718994140625, -0.0629119873046875, -0.053924560546875, -0.0449371337890625, -0.03594970703125, -0.0269622802734375, -0.017974853515625, -0.0089874267578125, 0.0, 0.0089874267578125, 0.017974853515625, 0.0269622802734375, 0.03594970703125, 0.0449371337890625, 0.053924560546875, 0.0629119873046875, 0.0718994140625, 0.0808868408203125, 0.089874267578125, 0.0988616943359375, 0.10784912109375, 0.1168365478515625, 0.125823974609375, 0.1348114013671875, 0.143798828125, 0.1527862548828125, 0.161773681640625, 0.1707611083984375, 0.17974853515625, 0.1887359619140625, 0.197723388671875, 0.2067108154296875, 0.2156982421875, 0.2246856689453125, 0.233673095703125, 0.2426605224609375, 0.25164794921875, 0.2606353759765625, 0.269622802734375, 0.2786102294921875, 0.28759765625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 10.0, 6.0, 8.0, 10.0, 12.0, 16.0, 24.0, 25.0, 35.0, 32.0, 28.0, 37.0, 33.0, 53.0, 43.0, 44.0, 39.0, 46.0, 50.0, 51.0, 40.0, 36.0, 42.0, 33.0, 37.0, 40.0, 34.0, 25.0, 23.0, 23.0, 10.0, 7.0, 6.0, 6.0, 6.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.40614128112793e-05, -5.254708230495453e-05, -5.103275179862976e-05, -4.951842129230499e-05, -4.8004090785980225e-05, -4.6489760279655457e-05, -4.497542977333069e-05, -4.346109926700592e-05, -4.194676876068115e-05, -4.0432438254356384e-05, -3.8918107748031616e-05, -3.740377724170685e-05, -3.588944673538208e-05, -3.437511622905731e-05, -3.2860785722732544e-05, -3.1346455216407776e-05, -2.9832124710083008e-05, -2.831779420375824e-05, -2.680346369743347e-05, -2.5289133191108704e-05, -2.3774802684783936e-05, -2.2260472178459167e-05, -2.07461416721344e-05, -1.923181116580963e-05, -1.7717480659484863e-05, -1.6203150153160095e-05, -1.4688819646835327e-05, -1.3174489140510559e-05, -1.1660158634185791e-05, -1.0145828127861023e-05, -8.631497621536255e-06, -7.117167115211487e-06, -5.602836608886719e-06, -4.088506102561951e-06, -2.5741755962371826e-06, -1.0598450899124146e-06, 4.544854164123535e-07, 1.9688159227371216e-06, 3.4831464290618896e-06, 4.997476935386658e-06, 6.511807441711426e-06, 8.026137948036194e-06, 9.540468454360962e-06, 1.105479896068573e-05, 1.2569129467010498e-05, 1.4083459973335266e-05, 1.5597790479660034e-05, 1.7112120985984802e-05, 1.862645149230957e-05, 2.014078199863434e-05, 2.1655112504959106e-05, 2.3169443011283875e-05, 2.4683773517608643e-05, 2.619810402393341e-05, 2.771243453025818e-05, 2.9226765036582947e-05, 3.0741095542907715e-05, 3.225542604923248e-05, 3.376975655555725e-05, 3.528408706188202e-05, 3.679841756820679e-05, 3.8312748074531555e-05, 3.982707858085632e-05, 4.134140908718109e-05, 4.285573959350586e-05]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 1.0, 3.0, 4.0, 7.0, 11.0, 11.0, 10.0, 19.0, 10.0, 25.0, 32.0, 44.0, 82.0, 87.0, 94.0, 120.0, 163.0, 274.0, 431.0, 919.0, 18124.0, 1018490.0, 7306.0, 827.0, 455.0, 275.0, 160.0, 116.0, 83.0, 65.0, 61.0, 55.0, 41.0, 28.0, 21.0, 22.0, 15.0, 13.0, 9.0, 10.0, 7.0, 8.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008196830749511719, -0.0007908567786216736, -0.0007620304822921753, -0.000733204185962677, -0.0007043778896331787, -0.0006755515933036804, -0.0006467252969741821, -0.0006178990006446838, -0.0005890727043151855, -0.0005602464079856873, -0.000531420111656189, -0.0005025938153266907, -0.0004737675189971924, -0.0004449412226676941, -0.0004161149263381958, -0.0003872886300086975, -0.0003584623336791992, -0.00032963603734970093, -0.00030080974102020264, -0.00027198344469070435, -0.00024315714836120605, -0.00021433085203170776, -0.00018550455570220947, -0.00015667825937271118, -0.0001278519630432129, -9.90256667137146e-05, -7.019937038421631e-05, -4.137307405471802e-05, -1.2546777725219727e-05, 1.6279518604278564e-05, 4.5105814933776855e-05, 7.393211126327515e-05, 0.00010275840759277344, 0.00013158470392227173, 0.00016041100025177002, 0.0001892372965812683, 0.0002180635929107666, 0.0002468898892402649, 0.0002757161855697632, 0.0003045424818992615, 0.00033336877822875977, 0.00036219507455825806, 0.00039102137088775635, 0.00041984766721725464, 0.00044867396354675293, 0.0004775002598762512, 0.0005063265562057495, 0.0005351528525352478, 0.0005639791488647461, 0.0005928054451942444, 0.0006216317415237427, 0.000650458037853241, 0.0006792843341827393, 0.0007081106305122375, 0.0007369369268417358, 0.0007657632231712341, 0.0007945895195007324, 0.0008234158158302307, 0.000852242112159729, 0.0008810684084892273, 0.0009098947048187256, 0.0009387210011482239, 0.0009675472974777222, 0.0009963735938072205, 0.0010251998901367188]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 44.0, 726.0, 236.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.995835716836154e-05, -9.209144627675414e-05, -8.422453538514674e-05, -7.635762449353933e-05, -6.849071360193193e-05, -6.0623802710324526e-05, -5.275689181871712e-05, -4.488998092710972e-05, -3.7023070035502315e-05, -2.915615914389491e-05, -2.1289248252287507e-05, -1.3422337360680103e-05, -5.5554264690726995e-06, 2.311484422534704e-06, 1.0178395314142108e-05, 1.8045306205749512e-05, 2.5912217097356915e-05, 3.377912798896432e-05, 4.164603888057172e-05, 4.951294977217913e-05, 5.737986066378653e-05, 6.524677155539393e-05, 7.311368244700134e-05, 8.098059333860874e-05, 8.884750423021615e-05, 9.671441512182355e-05, 0.00010458132601343095, 0.00011244823690503836, 0.00012031514779664576, 0.00012818205868825316, 0.00013604896957986057, 0.00014391588047146797, 0.00015178279136307538, 0.00015964970225468278, 0.00016751661314629018, 0.0001753835240378976, 0.000183250434929505, 0.0001911173458211124, 0.0001989842567127198, 0.0002068511676043272, 0.0002147180784959346, 0.000222584989387542, 0.0002304519002791494, 0.00023831881117075682, 0.0002461857220623642, 0.0002540526329539716, 0.00026191954384557903, 0.00026978645473718643, 0.00027765336562879384, 0.00028552027652040124, 0.00029338718741200864, 0.00030125409830361605, 0.00030912100919522345, 0.00031698792008683085, 0.00032485483097843826, 0.00033272174187004566, 0.00034058865276165307, 0.00034845556365326047, 0.0003563224745448679, 0.0003641893854364753, 0.0003720562963280827, 0.0003799232072196901, 0.0003877901181112975, 0.0003956570290029049, 0.0004035239398945123]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 8.0, 4.0, 3.0, 6.0, 11.0, 7.0, 17.0, 19.0, 17.0, 18.0, 20.0, 25.0, 37.0, 41.0, 34.0, 56.0, 42.0, 44.0, 46.0, 50.0, 46.0, 38.0, 47.0, 57.0, 39.0, 38.0, 36.0, 34.0, 26.0, 23.0, 22.0, 20.0, 14.0, 11.0, 14.0, 10.0, 6.0, 6.0, 3.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9742717742919922e-05, -2.8721988201141357e-05, -2.7701258659362793e-05, -2.668052911758423e-05, -2.5659799575805664e-05, -2.46390700340271e-05, -2.3618340492248535e-05, -2.259761095046997e-05, -2.1576881408691406e-05, -2.0556151866912842e-05, -1.9535422325134277e-05, -1.8514692783355713e-05, -1.749396324157715e-05, -1.6473233699798584e-05, -1.545250415802002e-05, -1.4431774616241455e-05, -1.341104507446289e-05, -1.2390315532684326e-05, -1.1369585990905762e-05, -1.0348856449127197e-05, -9.328126907348633e-06, -8.307397365570068e-06, -7.286667823791504e-06, -6.2659382820129395e-06, -5.245208740234375e-06, -4.2244791984558105e-06, -3.203749656677246e-06, -2.1830201148986816e-06, -1.1622905731201172e-06, -1.4156103134155273e-07, 8.791685104370117e-07, 1.8998980522155762e-06, 2.9206275939941406e-06, 3.941357135772705e-06, 4.9620866775512695e-06, 5.982816219329834e-06, 7.0035457611083984e-06, 8.024275302886963e-06, 9.045004844665527e-06, 1.0065734386444092e-05, 1.1086463928222656e-05, 1.210719347000122e-05, 1.3127923011779785e-05, 1.414865255355835e-05, 1.5169382095336914e-05, 1.619011163711548e-05, 1.7210841178894043e-05, 1.8231570720672607e-05, 1.9252300262451172e-05, 2.0273029804229736e-05, 2.12937593460083e-05, 2.2314488887786865e-05, 2.333521842956543e-05, 2.4355947971343994e-05, 2.537667751312256e-05, 2.6397407054901123e-05, 2.7418136596679688e-05, 2.8438866138458252e-05, 2.9459595680236816e-05, 3.048032522201538e-05, 3.1501054763793945e-05, 3.252178430557251e-05, 3.3542513847351074e-05, 3.456324338912964e-05, 3.55839729309082e-05]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 6.0, 3.0, 12.0, 11.0, 13.0, 11.0, 14.0, 27.0, 26.0, 17.0, 28.0, 36.0, 36.0, 40.0, 39.0, 35.0, 38.0, 42.0, 38.0, 39.0, 42.0, 40.0, 51.0, 30.0, 39.0, 25.0, 29.0, 35.0, 25.0, 26.0, 23.0, 20.0, 28.0, 8.0, 10.0, 11.0, 10.0, 13.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.4453125, -8.19189453125, -7.9384765625, -7.68505859375, -7.431640625, -7.17822265625, -6.9248046875, -6.67138671875, -6.41796875, -6.16455078125, -5.9111328125, -5.65771484375, -5.404296875, -5.15087890625, -4.8974609375, -4.64404296875, -4.390625, -4.13720703125, -3.8837890625, -3.63037109375, -3.376953125, -3.12353515625, -2.8701171875, -2.61669921875, -2.36328125, -2.10986328125, -1.8564453125, -1.60302734375, -1.349609375, -1.09619140625, -0.8427734375, -0.58935546875, -0.3359375, -0.08251953125, 0.1708984375, 0.42431640625, 0.677734375, 0.93115234375, 1.1845703125, 1.43798828125, 1.69140625, 1.94482421875, 2.1982421875, 2.45166015625, 2.705078125, 2.95849609375, 3.2119140625, 3.46533203125, 3.71875, 3.97216796875, 4.2255859375, 4.47900390625, 4.732421875, 4.98583984375, 5.2392578125, 5.49267578125, 5.74609375, 5.99951171875, 6.2529296875, 6.50634765625, 6.759765625, 7.01318359375, 7.2666015625, 7.52001953125, 7.7734375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 7.0, 8.0, 5.0, 7.0, 12.0, 12.0, 23.0, 32.0, 46.0, 70.0, 87.0, 103.0, 136.0, 185.0, 243.0, 333.0, 440.0, 533.0, 752.0, 1037.0, 1550.0, 2806.0, 6885.0, 22648.0, 97631.0, 420038.0, 374657.0, 84148.0, 19924.0, 6068.0, 2689.0, 1490.0, 991.0, 714.0, 543.0, 430.0, 317.0, 236.0, 176.0, 133.0, 110.0, 67.0, 71.0, 47.0, 34.0, 20.0, 17.0, 17.0, 7.0, 8.0, 4.0, 2.0, 0.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-12.828125, -12.4266357421875, -12.025146484375, -11.6236572265625, -11.22216796875, -10.8206787109375, -10.419189453125, -10.0177001953125, -9.6162109375, -9.2147216796875, -8.813232421875, -8.4117431640625, -8.01025390625, -7.6087646484375, -7.207275390625, -6.8057861328125, -6.404296875, -6.0028076171875, -5.601318359375, -5.1998291015625, -4.79833984375, -4.3968505859375, -3.995361328125, -3.5938720703125, -3.1923828125, -2.7908935546875, -2.389404296875, -1.9879150390625, -1.58642578125, -1.1849365234375, -0.783447265625, -0.3819580078125, 0.01953125, 0.4210205078125, 0.822509765625, 1.2239990234375, 1.62548828125, 2.0269775390625, 2.428466796875, 2.8299560546875, 3.2314453125, 3.6329345703125, 4.034423828125, 4.4359130859375, 4.83740234375, 5.2388916015625, 5.640380859375, 6.0418701171875, 6.443359375, 6.8448486328125, 7.246337890625, 7.6478271484375, 8.04931640625, 8.4508056640625, 8.852294921875, 9.2537841796875, 9.6552734375, 10.0567626953125, 10.458251953125, 10.8597412109375, 11.26123046875, 11.6627197265625, 12.064208984375, 12.4656982421875, 12.8671875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 8.0, 6.0, 6.0, 2.0, 10.0, 23.0, 24.0, 35.0, 38.0, 36.0, 47.0, 81.0, 98.0, 143.0, 1527.0, 388.0, 143.0, 91.0, 54.0, 57.0, 49.0, 37.0, 30.0, 30.0, 17.0, 12.0, 10.0, 5.0, 9.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.84375, -28.937255859375, -28.03076171875, -27.124267578125, -26.2177734375, -25.311279296875, -24.40478515625, -23.498291015625, -22.591796875, -21.685302734375, -20.77880859375, -19.872314453125, -18.9658203125, -18.059326171875, -17.15283203125, -16.246337890625, -15.33984375, -14.433349609375, -13.52685546875, -12.620361328125, -11.7138671875, -10.807373046875, -9.90087890625, -8.994384765625, -8.087890625, -7.181396484375, -6.27490234375, -5.368408203125, -4.4619140625, -3.555419921875, -2.64892578125, -1.742431640625, -0.8359375, 0.070556640625, 0.97705078125, 1.883544921875, 2.7900390625, 3.696533203125, 4.60302734375, 5.509521484375, 6.416015625, 7.322509765625, 8.22900390625, 9.135498046875, 10.0419921875, 10.948486328125, 11.85498046875, 12.761474609375, 13.66796875, 14.574462890625, 15.48095703125, 16.387451171875, 17.2939453125, 18.200439453125, 19.10693359375, 20.013427734375, 20.919921875, 21.826416015625, 22.73291015625, 23.639404296875, 24.5458984375, 25.452392578125, 26.35888671875, 27.265380859375, 28.171875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 7.0, 3.0, 6.0, 7.0, 3.0, 7.0, 7.0, 12.0, 14.0, 16.0, 27.0, 15.0, 39.0, 43.0, 79.0, 114.0, 183.0, 282.0, 601.0, 1381.0, 35159.0, 3101556.0, 4116.0, 942.0, 412.0, 184.0, 158.0, 92.0, 67.0, 36.0, 35.0, 15.0, 18.0, 17.0, 8.0, 8.0, 8.0, 12.0, 4.0, 9.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-70.9375, -68.671875, -66.40625, -64.140625, -61.875, -59.609375, -57.34375, -55.078125, -52.8125, -50.546875, -48.28125, -46.015625, -43.75, -41.484375, -39.21875, -36.953125, -34.6875, -32.421875, -30.15625, -27.890625, -25.625, -23.359375, -21.09375, -18.828125, -16.5625, -14.296875, -12.03125, -9.765625, -7.5, -5.234375, -2.96875, -0.703125, 1.5625, 3.828125, 6.09375, 8.359375, 10.625, 12.890625, 15.15625, 17.421875, 19.6875, 21.953125, 24.21875, 26.484375, 28.75, 31.015625, 33.28125, 35.546875, 37.8125, 40.078125, 42.34375, 44.609375, 46.875, 49.140625, 51.40625, 53.671875, 55.9375, 58.203125, 60.46875, 62.734375, 65.0, 67.265625, 69.53125, 71.796875, 74.0625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 45.0, 589.0, 363.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.72169494628906, -103.73809051513672, -96.75448608398438, -89.77088928222656, -82.78728485107422, -75.80368041992188, -68.82008361816406, -61.83647918701172, -54.852874755859375, -47.86927032470703, -40.88566970825195, -33.902069091796875, -26.91846466064453, -19.934860229492188, -12.95125961303711, -5.967658996582031, 1.0159454345703125, 7.999547958374023, 14.983150482177734, 21.966753005981445, 28.950355529785156, 35.9339599609375, 42.91756057739258, 49.901161193847656, 56.884765625, 63.868370056152344, 70.85197448730469, 77.8355712890625, 84.81917572021484, 91.80278015136719, 98.786376953125, 105.76998138427734, 112.75357055664062, 119.73717498779297, 126.72077941894531, 133.70437622070312, 140.68798828125, 147.6715850830078, 154.65518188476562, 161.6387939453125, 168.6223907470703, 175.60598754882812, 182.589599609375, 189.5731964111328, 196.55679321289062, 203.5404052734375, 210.5240020751953, 217.50759887695312, 224.4912109375, 231.4748077392578, 238.4584197998047, 245.4420166015625, 252.42562866210938, 259.40924072265625, 266.392822265625, 273.3764343261719, 280.36004638671875, 287.3436584472656, 294.3272399902344, 301.31085205078125, 308.2944641113281, 315.278076171875, 322.26165771484375, 329.2452697753906, 336.2288513183594]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 10.0, 11.0, 13.0, 10.0, 12.0, 23.0, 16.0, 21.0, 33.0, 34.0, 38.0, 47.0, 39.0, 42.0, 43.0, 53.0, 54.0, 43.0, 55.0, 51.0, 41.0, 46.0, 44.0, 48.0, 22.0, 22.0, 30.0, 23.0, 13.0, 16.0, 8.0, 11.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.75548553466797, -68.21150207519531, -65.66751861572266, -63.123538970947266, -60.57955551147461, -58.03557205200195, -55.49159240722656, -52.947608947753906, -50.40362548828125, -47.859642028808594, -45.31565856933594, -42.77167892456055, -40.22769546508789, -37.683712005615234, -35.139732360839844, -32.59574890136719, -30.05176544189453, -27.507781982421875, -24.96380043029785, -22.419818878173828, -19.875835418701172, -17.331851959228516, -14.787870407104492, -12.243888854980469, -9.699905395507812, -7.155922889709473, -4.611940383911133, -2.067957878112793, 0.4760246276855469, 3.0200071334838867, 5.563989639282227, 8.10797119140625, 10.651962280273438, 13.195944786071777, 15.739927291870117, 18.28390884399414, 20.827892303466797, 23.371875762939453, 25.915857315063477, 28.4598388671875, 31.003822326660156, 33.54780578613281, 36.09178924560547, 38.63576889038086, 41.179752349853516, 43.72373580932617, 46.26771545410156, 48.81169891357422, 51.355682373046875, 53.89966583251953, 56.44364929199219, 58.98762893676758, 61.531612396240234, 64.07559204101562, 66.61957550048828, 69.16355895996094, 71.7075424194336, 74.25152587890625, 76.7955093383789, 79.33949279785156, 81.88346862792969, 84.42745208740234, 86.971435546875, 89.51541900634766, 92.05940246582031]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 3.0, 7.0, 3.0, 8.0, 16.0, 9.0, 9.0, 17.0, 19.0, 20.0, 22.0, 25.0, 38.0, 45.0, 36.0, 41.0, 43.0, 44.0, 36.0, 40.0, 42.0, 37.0, 45.0, 43.0, 41.0, 40.0, 32.0, 26.0, 22.0, 29.0, 25.0, 30.0, 18.0, 18.0, 10.0, 11.0, 11.0, 6.0, 10.0, 1.0, 4.0, 8.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0], "bins": [-9.6015625, -9.33587646484375, -9.0701904296875, -8.80450439453125, -8.538818359375, -8.27313232421875, -8.0074462890625, -7.74176025390625, -7.47607421875, -7.21038818359375, -6.9447021484375, -6.67901611328125, -6.413330078125, -6.14764404296875, -5.8819580078125, -5.61627197265625, -5.3505859375, -5.08489990234375, -4.8192138671875, -4.55352783203125, -4.287841796875, -4.02215576171875, -3.7564697265625, -3.49078369140625, -3.22509765625, -2.95941162109375, -2.6937255859375, -2.42803955078125, -2.162353515625, -1.89666748046875, -1.6309814453125, -1.36529541015625, -1.099609375, -0.83392333984375, -0.5682373046875, -0.30255126953125, -0.036865234375, 0.22882080078125, 0.4945068359375, 0.76019287109375, 1.02587890625, 1.29156494140625, 1.5572509765625, 1.82293701171875, 2.088623046875, 2.35430908203125, 2.6199951171875, 2.88568115234375, 3.1513671875, 3.41705322265625, 3.6827392578125, 3.94842529296875, 4.214111328125, 4.47979736328125, 4.7454833984375, 5.01116943359375, 5.27685546875, 5.54254150390625, 5.8082275390625, 6.07391357421875, 6.339599609375, 6.60528564453125, 6.8709716796875, 7.13665771484375, 7.40234375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 3.0, 8.0, 15.0, 11.0, 13.0, 15.0, 23.0, 27.0, 40.0, 51.0, 53.0, 89.0, 141.0, 193.0, 340.0, 624.0, 1273.0, 3214.0, 11462.0, 74065.0, 1192348.0, 2644281.0, 234211.0, 22944.0, 5095.0, 1799.0, 719.0, 454.0, 223.0, 155.0, 104.0, 62.0, 42.0, 43.0, 37.0, 23.0, 20.0, 13.0, 10.0, 8.0, 6.0, 2.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.578125, -17.942138671875, -17.30615234375, -16.670166015625, -16.0341796875, -15.398193359375, -14.76220703125, -14.126220703125, -13.490234375, -12.854248046875, -12.21826171875, -11.582275390625, -10.9462890625, -10.310302734375, -9.67431640625, -9.038330078125, -8.40234375, -7.766357421875, -7.13037109375, -6.494384765625, -5.8583984375, -5.222412109375, -4.58642578125, -3.950439453125, -3.314453125, -2.678466796875, -2.04248046875, -1.406494140625, -0.7705078125, -0.134521484375, 0.50146484375, 1.137451171875, 1.7734375, 2.409423828125, 3.04541015625, 3.681396484375, 4.3173828125, 4.953369140625, 5.58935546875, 6.225341796875, 6.861328125, 7.497314453125, 8.13330078125, 8.769287109375, 9.4052734375, 10.041259765625, 10.67724609375, 11.313232421875, 11.94921875, 12.585205078125, 13.22119140625, 13.857177734375, 14.4931640625, 15.129150390625, 15.76513671875, 16.401123046875, 17.037109375, 17.673095703125, 18.30908203125, 18.945068359375, 19.5810546875, 20.217041015625, 20.85302734375, 21.489013671875, 22.125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 3.0, 7.0, 15.0, 14.0, 18.0, 24.0, 44.0, 50.0, 91.0, 133.0, 243.0, 340.0, 661.0, 899.0, 626.0, 328.0, 219.0, 123.0, 85.0, 54.0, 35.0, 18.0, 13.0, 8.0, 8.0, 7.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-26.984375, -26.300537109375, -25.61669921875, -24.932861328125, -24.2490234375, -23.565185546875, -22.88134765625, -22.197509765625, -21.513671875, -20.829833984375, -20.14599609375, -19.462158203125, -18.7783203125, -18.094482421875, -17.41064453125, -16.726806640625, -16.04296875, -15.359130859375, -14.67529296875, -13.991455078125, -13.3076171875, -12.623779296875, -11.93994140625, -11.256103515625, -10.572265625, -9.888427734375, -9.20458984375, -8.520751953125, -7.8369140625, -7.153076171875, -6.46923828125, -5.785400390625, -5.1015625, -4.417724609375, -3.73388671875, -3.050048828125, -2.3662109375, -1.682373046875, -0.99853515625, -0.314697265625, 0.369140625, 1.052978515625, 1.73681640625, 2.420654296875, 3.1044921875, 3.788330078125, 4.47216796875, 5.156005859375, 5.83984375, 6.523681640625, 7.20751953125, 7.891357421875, 8.5751953125, 9.259033203125, 9.94287109375, 10.626708984375, 11.310546875, 11.994384765625, 12.67822265625, 13.362060546875, 14.0458984375, 14.729736328125, 15.41357421875, 16.097412109375, 16.78125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 5.0, 12.0, 9.0, 17.0, 26.0, 21.0, 56.0, 89.0, 159.0, 307.0, 571.0, 1478.0, 6820.0, 97326.0, 3592226.0, 473155.0, 17602.0, 2640.0, 805.0, 404.0, 205.0, 124.0, 57.0, 57.0, 34.0, 21.0, 14.0, 13.0, 8.0, 6.0, 8.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.546875, -28.397705078125, -27.24853515625, -26.099365234375, -24.9501953125, -23.801025390625, -22.65185546875, -21.502685546875, -20.353515625, -19.204345703125, -18.05517578125, -16.906005859375, -15.7568359375, -14.607666015625, -13.45849609375, -12.309326171875, -11.16015625, -10.010986328125, -8.86181640625, -7.712646484375, -6.5634765625, -5.414306640625, -4.26513671875, -3.115966796875, -1.966796875, -0.817626953125, 0.33154296875, 1.480712890625, 2.6298828125, 3.779052734375, 4.92822265625, 6.077392578125, 7.2265625, 8.375732421875, 9.52490234375, 10.674072265625, 11.8232421875, 12.972412109375, 14.12158203125, 15.270751953125, 16.419921875, 17.569091796875, 18.71826171875, 19.867431640625, 21.0166015625, 22.165771484375, 23.31494140625, 24.464111328125, 25.61328125, 26.762451171875, 27.91162109375, 29.060791015625, 30.2099609375, 31.359130859375, 32.50830078125, 33.657470703125, 34.806640625, 35.955810546875, 37.10498046875, 38.254150390625, 39.4033203125, 40.552490234375, 41.70166015625, 42.850830078125, 44.0]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 36.0, 761.0, 214.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-523.7356567382812, -508.21014404296875, -492.6846618652344, -477.1591491699219, -461.6336669921875, -446.108154296875, -430.5826416015625, -415.0571594238281, -399.53167724609375, -384.00616455078125, -368.4806823730469, -352.9551696777344, -337.4296875, -321.9041748046875, -306.378662109375, -290.8531799316406, -275.3276672363281, -259.8021545410156, -244.27667236328125, -228.75115966796875, -213.22567749023438, -197.70016479492188, -182.17466735839844, -166.649169921875, -151.12367248535156, -135.59817504882812, -120.07267761230469, -104.54717254638672, -89.02167510986328, -73.49617767333984, -57.970672607421875, -42.44517517089844, -26.919647216796875, -11.394147872924805, 4.131351470947266, 19.65685272216797, 35.182350158691406, 50.707847595214844, 66.23335266113281, 81.75885009765625, 97.28434753417969, 112.80984497070312, 128.33534240722656, 143.86083984375, 159.3863525390625, 174.91183471679688, 190.43734741210938, 205.9628448486328, 221.48834228515625, 237.0138397216797, 252.53933715820312, 268.0648498535156, 283.59033203125, 299.1158447265625, 314.641357421875, 330.1668395996094, 345.69232177734375, 361.21783447265625, 376.7433166503906, 392.2688293457031, 407.7943115234375, 423.31982421875, 438.8453369140625, 454.3708190917969, 469.8963317871094]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 6.0, 6.0, 9.0, 15.0, 17.0, 20.0, 17.0, 19.0, 33.0, 38.0, 31.0, 36.0, 41.0, 47.0, 48.0, 58.0, 42.0, 49.0, 57.0, 48.0, 49.0, 35.0, 41.0, 28.0, 43.0, 13.0, 21.0, 19.0, 15.0, 13.0, 23.0, 12.0, 12.0, 13.0, 9.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.2219009399414, -65.24609375, -63.270286560058594, -61.29447937011719, -59.31867218017578, -57.342864990234375, -55.36705780029297, -53.3912467956543, -51.41543960571289, -49.439632415771484, -47.46382522583008, -45.48801803588867, -43.512210845947266, -41.536399841308594, -39.56059265136719, -37.58478546142578, -35.608978271484375, -33.63317108154297, -31.657363891601562, -29.681556701660156, -27.705747604370117, -25.72994041442871, -23.754133224487305, -21.778324127197266, -19.802520751953125, -17.82671356201172, -15.850905418395996, -13.87509822845459, -11.899290084838867, -9.923482894897461, -7.947675704956055, -5.971867561340332, -3.9960594177246094, -2.020251750946045, -0.04444432258605957, 1.9313631057739258, 3.9071707725524902, 5.882978439331055, 7.858785629272461, 9.834593772888184, 11.81040096282959, 13.786208152770996, 15.762016296386719, 17.737823486328125, 19.71363067626953, 21.689437866210938, 23.665245056152344, 25.641054153442383, 27.61686134338379, 29.592668533325195, 31.5684757232666, 33.54428482055664, 35.52009201049805, 37.49589920043945, 39.47170639038086, 41.447513580322266, 43.42332077026367, 45.39912796020508, 47.374935150146484, 49.35074234008789, 51.3265495300293, 53.30236053466797, 55.278167724609375, 57.25397491455078, 59.22978210449219]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 11.0, 6.0, 9.0, 10.0, 17.0, 14.0, 21.0, 23.0, 31.0, 31.0, 27.0, 32.0, 38.0, 45.0, 34.0, 40.0, 37.0, 48.0, 29.0, 44.0, 47.0, 35.0, 33.0, 40.0, 29.0, 32.0, 35.0, 23.0, 29.0, 23.0, 10.0, 15.0, 21.0, 11.0, 11.0, 15.0, 6.0, 3.0, 5.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-6.84765625, -6.64874267578125, -6.4498291015625, -6.25091552734375, -6.052001953125, -5.85308837890625, -5.6541748046875, -5.45526123046875, -5.25634765625, -5.05743408203125, -4.8585205078125, -4.65960693359375, -4.460693359375, -4.26177978515625, -4.0628662109375, -3.86395263671875, -3.6650390625, -3.46612548828125, -3.2672119140625, -3.06829833984375, -2.869384765625, -2.67047119140625, -2.4715576171875, -2.27264404296875, -2.07373046875, -1.87481689453125, -1.6759033203125, -1.47698974609375, -1.278076171875, -1.07916259765625, -0.8802490234375, -0.68133544921875, -0.482421875, -0.28350830078125, -0.0845947265625, 0.11431884765625, 0.313232421875, 0.51214599609375, 0.7110595703125, 0.90997314453125, 1.10888671875, 1.30780029296875, 1.5067138671875, 1.70562744140625, 1.904541015625, 2.10345458984375, 2.3023681640625, 2.50128173828125, 2.7001953125, 2.89910888671875, 3.0980224609375, 3.29693603515625, 3.495849609375, 3.69476318359375, 3.8936767578125, 4.09259033203125, 4.29150390625, 4.49041748046875, 4.6893310546875, 4.88824462890625, 5.087158203125, 5.28607177734375, 5.4849853515625, 5.68389892578125, 5.8828125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 10.0, 12.0, 13.0, 31.0, 46.0, 40.0, 79.0, 121.0, 179.0, 299.0, 438.0, 646.0, 1022.0, 1506.0, 2266.0, 3540.0, 5515.0, 8477.0, 13768.0, 22257.0, 37591.0, 66733.0, 131757.0, 263708.0, 230698.0, 111812.0, 58601.0, 33276.0, 19935.0, 12260.0, 7809.0, 4907.0, 3124.0, 2043.0, 1318.0, 879.0, 595.0, 402.0, 282.0, 174.0, 117.0, 97.0, 54.0, 40.0, 29.0, 11.0, 13.0, 12.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.2939453125, -0.28527069091796875, -0.2765960693359375, -0.26792144775390625, -0.259246826171875, -0.25057220458984375, -0.2418975830078125, -0.23322296142578125, -0.22454833984375, -0.21587371826171875, -0.2071990966796875, -0.19852447509765625, -0.189849853515625, -0.18117523193359375, -0.1725006103515625, -0.16382598876953125, -0.1551513671875, -0.14647674560546875, -0.1378021240234375, -0.12912750244140625, -0.120452880859375, -0.11177825927734375, -0.1031036376953125, -0.09442901611328125, -0.08575439453125, -0.07707977294921875, -0.0684051513671875, -0.05973052978515625, -0.051055908203125, -0.04238128662109375, -0.0337066650390625, -0.02503204345703125, -0.016357421875, -0.00768280029296875, 0.0009918212890625, 0.00966644287109375, 0.018341064453125, 0.02701568603515625, 0.0356903076171875, 0.04436492919921875, 0.05303955078125, 0.06171417236328125, 0.0703887939453125, 0.07906341552734375, 0.087738037109375, 0.09641265869140625, 0.1050872802734375, 0.11376190185546875, 0.1224365234375, 0.13111114501953125, 0.1397857666015625, 0.14846038818359375, 0.157135009765625, 0.16580963134765625, 0.1744842529296875, 0.18315887451171875, 0.19183349609375, 0.20050811767578125, 0.2091827392578125, 0.21785736083984375, 0.226531982421875, 0.23520660400390625, 0.2438812255859375, 0.25255584716796875, 0.26123046875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 3.0, 4.0, 5.0, 16.0, 9.0, 11.0, 25.0, 19.0, 29.0, 27.0, 27.0, 36.0, 31.0, 32.0, 48.0, 41.0, 51.0, 39.0, 1075.0, 45.0, 51.0, 40.0, 32.0, 44.0, 34.0, 41.0, 29.0, 27.0, 18.0, 19.0, 18.0, 25.0, 17.0, 15.0, 9.0, 10.0, 5.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.21484375, -4.07421875, -3.93359375, -3.79296875, -3.65234375, -3.51171875, -3.37109375, -3.23046875, -3.08984375, -2.94921875, -2.80859375, -2.66796875, -2.52734375, -2.38671875, -2.24609375, -2.10546875, -1.96484375, -1.82421875, -1.68359375, -1.54296875, -1.40234375, -1.26171875, -1.12109375, -0.98046875, -0.83984375, -0.69921875, -0.55859375, -0.41796875, -0.27734375, -0.13671875, 0.00390625, 0.14453125, 0.28515625, 0.42578125, 0.56640625, 0.70703125, 0.84765625, 0.98828125, 1.12890625, 1.26953125, 1.41015625, 1.55078125, 1.69140625, 1.83203125, 1.97265625, 2.11328125, 2.25390625, 2.39453125, 2.53515625, 2.67578125, 2.81640625, 2.95703125, 3.09765625, 3.23828125, 3.37890625, 3.51953125, 3.66015625, 3.80078125, 3.94140625, 4.08203125, 4.22265625, 4.36328125, 4.50390625, 4.64453125, 4.78515625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 10.0, 17.0, 18.0, 30.0, 49.0, 64.0, 87.0, 142.0, 190.0, 289.0, 395.0, 633.0, 975.0, 1420.0, 2193.0, 3445.0, 5267.0, 8403.0, 13625.0, 22074.0, 37417.0, 66615.0, 134640.0, 1327184.0, 230572.0, 104324.0, 54415.0, 31556.0, 18841.0, 11382.0, 7392.0, 4662.0, 2982.0, 1888.0, 1269.0, 824.0, 592.0, 385.0, 254.0, 184.0, 116.0, 93.0, 63.0, 44.0, 30.0, 28.0, 12.0, 8.0, 9.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.255859375, -0.24756240844726562, -0.23926544189453125, -0.23096847534179688, -0.2226715087890625, -0.21437454223632812, -0.20607757568359375, -0.19778060913085938, -0.189483642578125, -0.18118667602539062, -0.17288970947265625, -0.16459274291992188, -0.1562957763671875, -0.14799880981445312, -0.13970184326171875, -0.13140487670898438, -0.12310791015625, -0.11481094360351562, -0.10651397705078125, -0.09821701049804688, -0.0899200439453125, -0.08162307739257812, -0.07332611083984375, -0.06502914428710938, -0.056732177734375, -0.048435211181640625, -0.04013824462890625, -0.031841278076171875, -0.0235443115234375, -0.015247344970703125, -0.00695037841796875, 0.001346588134765625, 0.0096435546875, 0.017940521240234375, 0.02623748779296875, 0.034534454345703125, 0.0428314208984375, 0.051128387451171875, 0.05942535400390625, 0.06772232055664062, 0.076019287109375, 0.08431625366210938, 0.09261322021484375, 0.10091018676757812, 0.1092071533203125, 0.11750411987304688, 0.12580108642578125, 0.13409805297851562, 0.14239501953125, 0.15069198608398438, 0.15898895263671875, 0.16728591918945312, 0.1755828857421875, 0.18387985229492188, 0.19217681884765625, 0.20047378540039062, 0.208770751953125, 0.21706771850585938, 0.22536468505859375, 0.23366165161132812, 0.2419586181640625, 0.2502555847167969, 0.25855255126953125, 0.2668495178222656, 0.275146484375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 6.0, 15.0, 9.0, 28.0, 28.0, 25.0, 41.0, 42.0, 44.0, 51.0, 65.0, 69.0, 63.0, 59.0, 73.0, 59.0, 52.0, 36.0, 39.0, 40.0, 33.0, 28.0, 15.0, 12.0, 9.0, 12.0, 7.0, 6.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.3882598876953125e-05, -5.239620804786682e-05, -5.090981721878052e-05, -4.9423426389694214e-05, -4.793703556060791e-05, -4.6450644731521606e-05, -4.49642539024353e-05, -4.3477863073349e-05, -4.1991472244262695e-05, -4.050508141517639e-05, -3.901869058609009e-05, -3.7532299757003784e-05, -3.604590892791748e-05, -3.455951809883118e-05, -3.307312726974487e-05, -3.158673644065857e-05, -3.0100345611572266e-05, -2.8613954782485962e-05, -2.7127563953399658e-05, -2.5641173124313354e-05, -2.415478229522705e-05, -2.2668391466140747e-05, -2.1182000637054443e-05, -1.969560980796814e-05, -1.8209218978881836e-05, -1.6722828149795532e-05, -1.5236437320709229e-05, -1.3750046491622925e-05, -1.2263655662536621e-05, -1.0777264833450317e-05, -9.290874004364014e-06, -7.80448317527771e-06, -6.318092346191406e-06, -4.8317015171051025e-06, -3.345310688018799e-06, -1.8589198589324951e-06, -3.725290298461914e-07, 1.1138617992401123e-06, 2.600252628326416e-06, 4.08664345741272e-06, 5.5730342864990234e-06, 7.059425115585327e-06, 8.545815944671631e-06, 1.0032206773757935e-05, 1.1518597602844238e-05, 1.3004988431930542e-05, 1.4491379261016846e-05, 1.597777009010315e-05, 1.7464160919189453e-05, 1.8950551748275757e-05, 2.043694257736206e-05, 2.1923333406448364e-05, 2.3409724235534668e-05, 2.489611506462097e-05, 2.6382505893707275e-05, 2.786889672279358e-05, 2.9355287551879883e-05, 3.0841678380966187e-05, 3.232806921005249e-05, 3.3814460039138794e-05, 3.53008508682251e-05, 3.67872416973114e-05, 3.8273632526397705e-05, 3.976002335548401e-05, 4.124641418457031e-05]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 2.0, 9.0, 3.0, 10.0, 8.0, 14.0, 19.0, 18.0, 27.0, 36.0, 62.0, 83.0, 89.0, 136.0, 165.0, 315.0, 657.0, 2908.0, 1020681.0, 21248.0, 792.0, 441.0, 243.0, 156.0, 103.0, 76.0, 64.0, 37.0, 40.0, 26.0, 23.0, 15.0, 14.0, 12.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0007872581481933594, -0.0007587894797325134, -0.0007303208112716675, -0.0007018521428108215, -0.0006733834743499756, -0.0006449148058891296, -0.0006164461374282837, -0.0005879774689674377, -0.0005595088005065918, -0.0005310401320457458, -0.0005025714635848999, -0.00047410279512405396, -0.000445634126663208, -0.00041716545820236206, -0.0003886967897415161, -0.00036022812128067017, -0.0003317594528198242, -0.00030329078435897827, -0.0002748221158981323, -0.0002463534474372864, -0.00021788477897644043, -0.00018941611051559448, -0.00016094744205474854, -0.0001324787735939026, -0.00010401010513305664, -7.55414366722107e-05, -4.7072768211364746e-05, -1.86040997505188e-05, 9.864568710327148e-06, 3.8333237171173096e-05, 6.680190563201904e-05, 9.527057409286499e-05, 0.00012373924255371094, 0.00015220791101455688, 0.00018067657947540283, 0.00020914524793624878, 0.00023761391639709473, 0.0002660825848579407, 0.0002945512533187866, 0.00032301992177963257, 0.0003514885902404785, 0.00037995725870132446, 0.0004084259271621704, 0.00043689459562301636, 0.0004653632640838623, 0.0004938319325447083, 0.0005223006010055542, 0.0005507692694664001, 0.0005792379379272461, 0.000607706606388092, 0.000636175274848938, 0.0006646439433097839, 0.0006931126117706299, 0.0007215812802314758, 0.0007500499486923218, 0.0007785186171531677, 0.0008069872856140137, 0.0008354559540748596, 0.0008639246225357056, 0.0008923932909965515, 0.0009208619594573975, 0.0009493306279182434, 0.0009777992963790894, 0.0010062679648399353, 0.0010347366333007812]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 23.0, 82.0, 202.0, 255.0, 250.0, 127.0, 42.0, 13.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.117852510418743e-05, -6.939018931007013e-05, -6.760186079191044e-05, -6.581352499779314e-05, -6.402519647963345e-05, -6.223686068551615e-05, -6.0448528529377654e-05, -5.866019637323916e-05, -5.6871864217100665e-05, -5.508353206096217e-05, -5.3295199904823676e-05, -5.150686774868518e-05, -4.971853195456788e-05, -4.793020343640819e-05, -4.614186764229089e-05, -4.4353535486152396e-05, -4.25652033300139e-05, -4.0776871173875406e-05, -3.898853901773691e-05, -3.720020686159842e-05, -3.541187470545992e-05, -3.362353891134262e-05, -3.1835206755204126e-05, -3.004687459906563e-05, -2.8258542442927137e-05, -2.6470210286788642e-05, -2.4681878130650148e-05, -2.289354415552225e-05, -2.1105211999383755e-05, -1.931687984324526e-05, -1.7528545868117362e-05, -1.5740213711978868e-05, -1.3951877917861566e-05, -1.2163545761723071e-05, -1.0375212696089875e-05, -8.586879630456679e-06, -6.798547474318184e-06, -5.010215318179689e-06, -3.221882252546493e-06, -1.4335491869132966e-06, 3.5478296922519803e-07, 2.1431155801110435e-06, 3.931448190996889e-06, 5.7197808018827345e-06, 7.50811341276858e-06, 9.296445568907075e-06, 1.1084778634540271e-05, 1.2873111700173467e-05, 1.4661443856311962e-05, 1.6449776012450457e-05, 1.823810816858895e-05, 2.002644214371685e-05, 2.1814774299855344e-05, 2.360310645599384e-05, 2.5391440431121737e-05, 2.717977258726023e-05, 2.8968104743398726e-05, 3.075643689953722e-05, 3.2544769055675715e-05, 3.433310121181421e-05, 3.6121433367952704e-05, 3.7909769162070006e-05, 3.96981013182085e-05, 4.1486433474346995e-05, 4.327476563048549e-05]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 6.0, 4.0, 4.0, 8.0, 7.0, 5.0, 13.0, 16.0, 11.0, 27.0, 17.0, 33.0, 26.0, 33.0, 28.0, 40.0, 39.0, 50.0, 46.0, 44.0, 42.0, 56.0, 31.0, 32.0, 35.0, 33.0, 41.0, 37.0, 37.0, 23.0, 27.0, 21.0, 23.0, 15.0, 16.0, 16.0, 9.0, 12.0, 7.0, 8.0, 8.0, 6.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0444393157958984e-05, -1.976173371076584e-05, -1.9079074263572693e-05, -1.8396414816379547e-05, -1.77137553691864e-05, -1.7031095921993256e-05, -1.634843647480011e-05, -1.5665777027606964e-05, -1.4983117580413818e-05, -1.4300458133220673e-05, -1.3617798686027527e-05, -1.2935139238834381e-05, -1.2252479791641235e-05, -1.156982034444809e-05, -1.0887160897254944e-05, -1.0204501450061798e-05, -9.521842002868652e-06, -8.839182555675507e-06, -8.15652310848236e-06, -7.473863661289215e-06, -6.791204214096069e-06, -6.108544766902924e-06, -5.425885319709778e-06, -4.743225872516632e-06, -4.060566425323486e-06, -3.3779069781303406e-06, -2.695247530937195e-06, -2.012588083744049e-06, -1.3299286365509033e-06, -6.472691893577576e-07, 3.5390257835388184e-08, 7.180497050285339e-07, 1.4007091522216797e-06, 2.0833685994148254e-06, 2.766028046607971e-06, 3.448687493801117e-06, 4.131346940994263e-06, 4.8140063881874084e-06, 5.496665835380554e-06, 6.1793252825737e-06, 6.861984729766846e-06, 7.5446441769599915e-06, 8.227303624153137e-06, 8.909963071346283e-06, 9.592622518539429e-06, 1.0275281965732574e-05, 1.095794141292572e-05, 1.1640600860118866e-05, 1.2323260307312012e-05, 1.3005919754505157e-05, 1.3688579201698303e-05, 1.4371238648891449e-05, 1.5053898096084595e-05, 1.573655754327774e-05, 1.6419216990470886e-05, 1.7101876437664032e-05, 1.7784535884857178e-05, 1.8467195332050323e-05, 1.914985477924347e-05, 1.9832514226436615e-05, 2.051517367362976e-05, 2.1197833120822906e-05, 2.1880492568016052e-05, 2.2563152015209198e-05, 2.3245811462402344e-05]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 11.0, 6.0, 9.0, 10.0, 17.0, 14.0, 21.0, 23.0, 31.0, 31.0, 27.0, 32.0, 38.0, 45.0, 34.0, 40.0, 37.0, 48.0, 29.0, 44.0, 47.0, 35.0, 33.0, 40.0, 29.0, 32.0, 35.0, 23.0, 29.0, 23.0, 10.0, 15.0, 21.0, 11.0, 11.0, 15.0, 6.0, 3.0, 5.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-6.84765625, -6.64874267578125, -6.4498291015625, -6.25091552734375, -6.052001953125, -5.85308837890625, -5.6541748046875, -5.45526123046875, -5.25634765625, -5.05743408203125, -4.8585205078125, -4.65960693359375, -4.460693359375, -4.26177978515625, -4.0628662109375, -3.86395263671875, -3.6650390625, -3.46612548828125, -3.2672119140625, -3.06829833984375, -2.869384765625, -2.67047119140625, -2.4715576171875, -2.27264404296875, -2.07373046875, -1.87481689453125, -1.6759033203125, -1.47698974609375, -1.278076171875, -1.07916259765625, -0.8802490234375, -0.68133544921875, -0.482421875, -0.28350830078125, -0.0845947265625, 0.11431884765625, 0.313232421875, 0.51214599609375, 0.7110595703125, 0.90997314453125, 1.10888671875, 1.30780029296875, 1.5067138671875, 1.70562744140625, 1.904541015625, 2.10345458984375, 2.3023681640625, 2.50128173828125, 2.7001953125, 2.89910888671875, 3.0980224609375, 3.29693603515625, 3.495849609375, 3.69476318359375, 3.8936767578125, 4.09259033203125, 4.29150390625, 4.49041748046875, 4.6893310546875, 4.88824462890625, 5.087158203125, 5.28607177734375, 5.4849853515625, 5.68389892578125, 5.8828125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 10.0, 11.0, 9.0, 9.0, 23.0, 21.0, 35.0, 43.0, 65.0, 87.0, 107.0, 162.0, 238.0, 309.0, 453.0, 602.0, 905.0, 1475.0, 2401.0, 4575.0, 12241.0, 62719.0, 553809.0, 349278.0, 39661.0, 9223.0, 3800.0, 2019.0, 1377.0, 919.0, 531.0, 390.0, 293.0, 207.0, 151.0, 99.0, 84.0, 56.0, 32.0, 39.0, 24.0, 18.0, 11.0, 8.0, 9.0, 2.0, 7.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.46875, -13.9677734375, -13.466796875, -12.9658203125, -12.46484375, -11.9638671875, -11.462890625, -10.9619140625, -10.4609375, -9.9599609375, -9.458984375, -8.9580078125, -8.45703125, -7.9560546875, -7.455078125, -6.9541015625, -6.453125, -5.9521484375, -5.451171875, -4.9501953125, -4.44921875, -3.9482421875, -3.447265625, -2.9462890625, -2.4453125, -1.9443359375, -1.443359375, -0.9423828125, -0.44140625, 0.0595703125, 0.560546875, 1.0615234375, 1.5625, 2.0634765625, 2.564453125, 3.0654296875, 3.56640625, 4.0673828125, 4.568359375, 5.0693359375, 5.5703125, 6.0712890625, 6.572265625, 7.0732421875, 7.57421875, 8.0751953125, 8.576171875, 9.0771484375, 9.578125, 10.0791015625, 10.580078125, 11.0810546875, 11.58203125, 12.0830078125, 12.583984375, 13.0849609375, 13.5859375, 14.0869140625, 14.587890625, 15.0888671875, 15.58984375, 16.0908203125, 16.591796875, 17.0927734375, 17.59375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 8.0, 10.0, 10.0, 11.0, 17.0, 22.0, 26.0, 33.0, 30.0, 41.0, 41.0, 57.0, 66.0, 96.0, 235.0, 1666.0, 217.0, 69.0, 71.0, 54.0, 45.0, 28.0, 45.0, 28.0, 19.0, 19.0, 15.0, 15.0, 13.0, 11.0, 3.0, 11.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.625, -19.946044921875, -19.26708984375, -18.588134765625, -17.9091796875, -17.230224609375, -16.55126953125, -15.872314453125, -15.193359375, -14.514404296875, -13.83544921875, -13.156494140625, -12.4775390625, -11.798583984375, -11.11962890625, -10.440673828125, -9.76171875, -9.082763671875, -8.40380859375, -7.724853515625, -7.0458984375, -6.366943359375, -5.68798828125, -5.009033203125, -4.330078125, -3.651123046875, -2.97216796875, -2.293212890625, -1.6142578125, -0.935302734375, -0.25634765625, 0.422607421875, 1.1015625, 1.780517578125, 2.45947265625, 3.138427734375, 3.8173828125, 4.496337890625, 5.17529296875, 5.854248046875, 6.533203125, 7.212158203125, 7.89111328125, 8.570068359375, 9.2490234375, 9.927978515625, 10.60693359375, 11.285888671875, 11.96484375, 12.643798828125, 13.32275390625, 14.001708984375, 14.6806640625, 15.359619140625, 16.03857421875, 16.717529296875, 17.396484375, 18.075439453125, 18.75439453125, 19.433349609375, 20.1123046875, 20.791259765625, 21.47021484375, 22.149169921875, 22.828125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 12.0, 18.0, 16.0, 25.0, 25.0, 39.0, 45.0, 61.0, 78.0, 105.0, 151.0, 206.0, 319.0, 652.0, 1942.0, 194644.0, 2942260.0, 3028.0, 819.0, 426.0, 227.0, 153.0, 114.0, 77.0, 63.0, 40.0, 44.0, 20.0, 20.0, 12.0, 10.0, 12.0, 4.0, 8.0, 5.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-60.3125, -58.68798828125, -57.0634765625, -55.43896484375, -53.814453125, -52.18994140625, -50.5654296875, -48.94091796875, -47.31640625, -45.69189453125, -44.0673828125, -42.44287109375, -40.818359375, -39.19384765625, -37.5693359375, -35.94482421875, -34.3203125, -32.69580078125, -31.0712890625, -29.44677734375, -27.822265625, -26.19775390625, -24.5732421875, -22.94873046875, -21.32421875, -19.69970703125, -18.0751953125, -16.45068359375, -14.826171875, -13.20166015625, -11.5771484375, -9.95263671875, -8.328125, -6.70361328125, -5.0791015625, -3.45458984375, -1.830078125, -0.20556640625, 1.4189453125, 3.04345703125, 4.66796875, 6.29248046875, 7.9169921875, 9.54150390625, 11.166015625, 12.79052734375, 14.4150390625, 16.03955078125, 17.6640625, 19.28857421875, 20.9130859375, 22.53759765625, 24.162109375, 25.78662109375, 27.4111328125, 29.03564453125, 30.66015625, 32.28466796875, 33.9091796875, 35.53369140625, 37.158203125, 38.78271484375, 40.4072265625, 42.03173828125, 43.65625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 293.0, 651.0, 61.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-303.8982849121094, -297.026611328125, -290.15496826171875, -283.2832946777344, -276.41162109375, -269.53997802734375, -262.6683044433594, -255.79664611816406, -248.92498779296875, -242.05332946777344, -235.18167114257812, -228.30999755859375, -221.43833923339844, -214.56668090820312, -207.69500732421875, -200.82334899902344, -193.95169067382812, -187.0800323486328, -180.2083740234375, -173.33670043945312, -166.4650421142578, -159.5933837890625, -152.72171020507812, -145.8500518798828, -138.9783935546875, -132.1067352294922, -125.23506927490234, -118.3634033203125, -111.49174499511719, -104.62008666992188, -97.74842071533203, -90.87675476074219, -84.00508117675781, -77.1334228515625, -70.26175689697266, -63.39009475708008, -56.5184326171875, -49.64677047729492, -42.775108337402344, -35.903446197509766, -29.031784057617188, -22.16012191772461, -15.288459777832031, -8.416797637939453, -1.545135498046875, 5.326526641845703, 12.198188781738281, 19.06985092163086, 25.941513061523438, 32.813175201416016, 39.684837341308594, 46.55649948120117, 53.42816162109375, 60.29982376098633, 67.1714859008789, 74.04315185546875, 80.91481018066406, 87.78646850585938, 94.65813446044922, 101.52980041503906, 108.40145874023438, 115.27311706542969, 122.14478302001953, 129.01644897460938, 135.8881072998047]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 5.0, 0.0, 3.0, 6.0, 8.0, 7.0, 7.0, 11.0, 13.0, 14.0, 11.0, 22.0, 32.0, 33.0, 25.0, 34.0, 33.0, 28.0, 38.0, 41.0, 44.0, 50.0, 46.0, 45.0, 47.0, 45.0, 32.0, 36.0, 41.0, 27.0, 24.0, 37.0, 19.0, 16.0, 21.0, 12.0, 14.0, 20.0, 9.0, 7.0, 12.0, 8.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-50.88621139526367, -49.14295196533203, -47.399696350097656, -45.656436920166016, -43.91318130493164, -42.169921875, -40.426666259765625, -38.683406829833984, -36.940147399902344, -35.1968879699707, -33.45363235473633, -31.710372924804688, -29.967117309570312, -28.223857879638672, -26.480600357055664, -24.737342834472656, -22.99408721923828, -21.250829696655273, -19.507572174072266, -17.764312744140625, -16.02105712890625, -14.277798652648926, -12.534540176391602, -10.791282653808594, -9.048025131225586, -7.304767608642578, -5.561509609222412, -3.818251609802246, -2.0749940872192383, -0.33173656463623047, 1.4115219116210938, 3.1547794342041016, 4.898033142089844, 6.641290664672852, 8.38454818725586, 10.127806663513184, 11.871064186096191, 13.6143217086792, 15.357580184936523, 17.10083770751953, 18.84409523010254, 20.587352752685547, 22.330610275268555, 24.073867797851562, 25.817127227783203, 27.560382843017578, 29.30364227294922, 31.046899795532227, 32.790157318115234, 34.533416748046875, 36.27667236328125, 38.01993179321289, 39.763187408447266, 41.506446838378906, 43.24970245361328, 44.99296188354492, 46.73622131347656, 48.4794807434082, 50.22273635864258, 51.96599578857422, 53.709251403808594, 55.452510833740234, 57.195770263671875, 58.93902587890625, 60.682281494140625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 7.0, 6.0, 7.0, 9.0, 12.0, 25.0, 17.0, 28.0, 24.0, 24.0, 23.0, 26.0, 38.0, 42.0, 30.0, 35.0, 48.0, 37.0, 30.0, 42.0, 46.0, 41.0, 50.0, 41.0, 42.0, 35.0, 23.0, 22.0, 29.0, 25.0, 20.0, 15.0, 8.0, 11.0, 17.0, 10.0, 18.0, 7.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.125, -6.9095458984375, -6.694091796875, -6.4786376953125, -6.26318359375, -6.0477294921875, -5.832275390625, -5.6168212890625, -5.4013671875, -5.1859130859375, -4.970458984375, -4.7550048828125, -4.53955078125, -4.3240966796875, -4.108642578125, -3.8931884765625, -3.677734375, -3.4622802734375, -3.246826171875, -3.0313720703125, -2.81591796875, -2.6004638671875, -2.385009765625, -2.1695556640625, -1.9541015625, -1.7386474609375, -1.523193359375, -1.3077392578125, -1.09228515625, -0.8768310546875, -0.661376953125, -0.4459228515625, -0.23046875, -0.0150146484375, 0.200439453125, 0.4158935546875, 0.63134765625, 0.8468017578125, 1.062255859375, 1.2777099609375, 1.4931640625, 1.7086181640625, 1.924072265625, 2.1395263671875, 2.35498046875, 2.5704345703125, 2.785888671875, 3.0013427734375, 3.216796875, 3.4322509765625, 3.647705078125, 3.8631591796875, 4.07861328125, 4.2940673828125, 4.509521484375, 4.7249755859375, 4.9404296875, 5.1558837890625, 5.371337890625, 5.5867919921875, 5.80224609375, 6.0177001953125, 6.233154296875, 6.4486083984375, 6.6640625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 9.0, 9.0, 14.0, 16.0, 22.0, 37.0, 58.0, 92.0, 128.0, 197.0, 307.0, 505.0, 798.0, 1426.0, 2453.0, 4105.0, 8451.0, 20396.0, 98129.0, 876980.0, 2460010.0, 616764.0, 69781.0, 17223.0, 7298.0, 3722.0, 2132.0, 1212.0, 782.0, 457.0, 273.0, 183.0, 119.0, 63.0, 50.0, 26.0, 21.0, 6.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.875, -12.477783203125, -12.08056640625, -11.683349609375, -11.2861328125, -10.888916015625, -10.49169921875, -10.094482421875, -9.697265625, -9.300048828125, -8.90283203125, -8.505615234375, -8.1083984375, -7.711181640625, -7.31396484375, -6.916748046875, -6.51953125, -6.122314453125, -5.72509765625, -5.327880859375, -4.9306640625, -4.533447265625, -4.13623046875, -3.739013671875, -3.341796875, -2.944580078125, -2.54736328125, -2.150146484375, -1.7529296875, -1.355712890625, -0.95849609375, -0.561279296875, -0.1640625, 0.233154296875, 0.63037109375, 1.027587890625, 1.4248046875, 1.822021484375, 2.21923828125, 2.616455078125, 3.013671875, 3.410888671875, 3.80810546875, 4.205322265625, 4.6025390625, 4.999755859375, 5.39697265625, 5.794189453125, 6.19140625, 6.588623046875, 6.98583984375, 7.383056640625, 7.7802734375, 8.177490234375, 8.57470703125, 8.971923828125, 9.369140625, 9.766357421875, 10.16357421875, 10.560791015625, 10.9580078125, 11.355224609375, 11.75244140625, 12.149658203125, 12.546875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 11.0, 60.0, 435.0, 2564.0, 878.0, 116.0, 15.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.6875, -78.359375, -76.03125, -73.703125, -71.375, -69.046875, -66.71875, -64.390625, -62.0625, -59.734375, -57.40625, -55.078125, -52.75, -50.421875, -48.09375, -45.765625, -43.4375, -41.109375, -38.78125, -36.453125, -34.125, -31.796875, -29.46875, -27.140625, -24.8125, -22.484375, -20.15625, -17.828125, -15.5, -13.171875, -10.84375, -8.515625, -6.1875, -3.859375, -1.53125, 0.796875, 3.125, 5.453125, 7.78125, 10.109375, 12.4375, 14.765625, 17.09375, 19.421875, 21.75, 24.078125, 26.40625, 28.734375, 31.0625, 33.390625, 35.71875, 38.046875, 40.375, 42.703125, 45.03125, 47.359375, 49.6875, 52.015625, 54.34375, 56.671875, 59.0, 61.328125, 63.65625, 65.984375, 68.3125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 7.0, 41.0, 131.0, 573.0, 6654.0, 4183093.0, 3200.0, 414.0, 126.0, 25.0, 9.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.1875, -118.0322265625, -113.876953125, -109.7216796875, -105.56640625, -101.4111328125, -97.255859375, -93.1005859375, -88.9453125, -84.7900390625, -80.634765625, -76.4794921875, -72.32421875, -68.1689453125, -64.013671875, -59.8583984375, -55.703125, -51.5478515625, -47.392578125, -43.2373046875, -39.08203125, -34.9267578125, -30.771484375, -26.6162109375, -22.4609375, -18.3056640625, -14.150390625, -9.9951171875, -5.83984375, -1.6845703125, 2.470703125, 6.6259765625, 10.78125, 14.9365234375, 19.091796875, 23.2470703125, 27.40234375, 31.5576171875, 35.712890625, 39.8681640625, 44.0234375, 48.1787109375, 52.333984375, 56.4892578125, 60.64453125, 64.7998046875, 68.955078125, 73.1103515625, 77.265625, 81.4208984375, 85.576171875, 89.7314453125, 93.88671875, 98.0419921875, 102.197265625, 106.3525390625, 110.5078125, 114.6630859375, 118.818359375, 122.9736328125, 127.12890625, 131.2841796875, 135.439453125, 139.5947265625, 143.75]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 34.0, 341.0, 542.0, 92.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-393.16925048828125, -384.27490234375, -375.38055419921875, -366.4862365722656, -357.5918884277344, -348.6975402832031, -339.8031921386719, -330.90887451171875, -322.0145263671875, -313.12017822265625, -304.225830078125, -295.3315124511719, -286.4371643066406, -277.5428161621094, -268.6484680175781, -259.754150390625, -250.8597869873047, -241.96543884277344, -233.07110595703125, -224.1767578125, -215.2824249267578, -206.38807678222656, -197.49374389648438, -188.59939575195312, -179.70504760742188, -170.81069946289062, -161.91636657714844, -153.0220184326172, -144.127685546875, -135.23333740234375, -126.33899688720703, -117.44465637207031, -108.55030822753906, -99.65596771240234, -90.76162719726562, -81.86727905273438, -72.97294616699219, -64.07859802246094, -55.18425750732422, -46.2899169921875, -37.39557647705078, -28.501235961914062, -19.60689353942871, -10.71255111694336, -1.8182106018066406, 7.076129913330078, 15.970474243164062, 24.86481475830078, 33.7591552734375, 42.65349578857422, 51.54783630371094, 60.44218063354492, 69.33651733398438, 78.23086547851562, 87.12520599365234, 96.01954650878906, 104.91388702392578, 113.8082275390625, 122.70256805419922, 131.59690856933594, 140.4912567138672, 149.38558959960938, 158.27993774414062, 167.17428588867188, 176.06861877441406]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 9.0, 10.0, 4.0, 12.0, 16.0, 11.0, 17.0, 12.0, 19.0, 33.0, 36.0, 25.0, 38.0, 31.0, 41.0, 36.0, 44.0, 36.0, 38.0, 35.0, 51.0, 39.0, 40.0, 35.0, 38.0, 33.0, 40.0, 35.0, 29.0, 26.0, 15.0, 19.0, 17.0, 17.0, 11.0, 8.0, 11.0, 4.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-60.02388381958008, -58.277339935302734, -56.530799865722656, -54.78425598144531, -53.03771209716797, -51.291168212890625, -49.54462814331055, -47.7980842590332, -46.051544189453125, -44.30500030517578, -42.5584602355957, -40.81191635131836, -39.065372467041016, -37.31883239746094, -35.572288513183594, -33.82574462890625, -32.079200744628906, -30.332658767700195, -28.58611488342285, -26.83957290649414, -25.093029022216797, -23.346487045288086, -21.599945068359375, -19.85340118408203, -18.10685920715332, -16.36031723022461, -14.613773345947266, -12.867231369018555, -11.120688438415527, -9.3741455078125, -7.627603530883789, -5.881060600280762, -4.134513854980469, -2.3879711627960205, -0.6414284706115723, 1.1051139831542969, 2.851656913757324, 4.598199844360352, 6.3447418212890625, 8.09128475189209, 9.837827682495117, 11.584370613098145, 13.330913543701172, 15.077455520629883, 16.823997497558594, 18.570541381835938, 20.31708335876465, 22.06362533569336, 23.810169219970703, 25.556711196899414, 27.303255081176758, 29.04979705810547, 30.796340942382812, 32.542884826660156, 34.289424896240234, 36.03596878051758, 37.782508850097656, 39.529052734375, 41.27559280395508, 43.02213668823242, 44.768680572509766, 46.515220642089844, 48.26176452636719, 50.00830841064453, 51.754852294921875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 7.0, 4.0, 6.0, 7.0, 10.0, 15.0, 5.0, 13.0, 15.0, 14.0, 19.0, 16.0, 20.0, 13.0, 30.0, 24.0, 27.0, 27.0, 22.0, 28.0, 32.0, 40.0, 35.0, 38.0, 25.0, 34.0, 51.0, 33.0, 31.0, 38.0, 36.0, 33.0, 22.0, 22.0, 20.0, 23.0, 14.0, 22.0, 22.0, 19.0, 17.0, 14.0, 10.0, 8.0, 11.0, 5.0, 6.0, 3.0, 4.0, 5.0, 5.0, 1.0, 5.0, 0.0, 0.0, 5.0], "bins": [-5.4765625, -5.3099365234375, -5.143310546875, -4.9766845703125, -4.81005859375, -4.6434326171875, -4.476806640625, -4.3101806640625, -4.1435546875, -3.9769287109375, -3.810302734375, -3.6436767578125, -3.47705078125, -3.3104248046875, -3.143798828125, -2.9771728515625, -2.810546875, -2.6439208984375, -2.477294921875, -2.3106689453125, -2.14404296875, -1.9774169921875, -1.810791015625, -1.6441650390625, -1.4775390625, -1.3109130859375, -1.144287109375, -0.9776611328125, -0.81103515625, -0.6444091796875, -0.477783203125, -0.3111572265625, -0.14453125, 0.0220947265625, 0.188720703125, 0.3553466796875, 0.52197265625, 0.6885986328125, 0.855224609375, 1.0218505859375, 1.1884765625, 1.3551025390625, 1.521728515625, 1.6883544921875, 1.85498046875, 2.0216064453125, 2.188232421875, 2.3548583984375, 2.521484375, 2.6881103515625, 2.854736328125, 3.0213623046875, 3.18798828125, 3.3546142578125, 3.521240234375, 3.6878662109375, 3.8544921875, 4.0211181640625, 4.187744140625, 4.3543701171875, 4.52099609375, 4.6876220703125, 4.854248046875, 5.0208740234375, 5.1875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 11.0, 25.0, 33.0, 43.0, 58.0, 78.0, 123.0, 160.0, 252.0, 363.0, 556.0, 794.0, 1119.0, 1530.0, 2254.0, 3111.0, 4528.0, 6319.0, 9288.0, 12867.0, 19210.0, 28106.0, 43002.0, 69946.0, 127399.0, 236289.0, 200789.0, 103574.0, 59057.0, 37405.0, 24733.0, 16729.0, 11457.0, 8171.0, 5782.0, 4010.0, 2863.0, 1924.0, 1416.0, 972.0, 650.0, 478.0, 349.0, 228.0, 169.0, 101.0, 61.0, 61.0, 37.0, 23.0, 16.0, 13.0, 9.0, 5.0, 1.0, 4.0, 3.0], "bins": [-0.212890625, -0.2064075469970703, -0.19992446899414062, -0.19344139099121094, -0.18695831298828125, -0.18047523498535156, -0.17399215698242188, -0.1675090789794922, -0.1610260009765625, -0.1545429229736328, -0.14805984497070312, -0.14157676696777344, -0.13509368896484375, -0.12861061096191406, -0.12212753295898438, -0.11564445495605469, -0.109161376953125, -0.10267829895019531, -0.09619522094726562, -0.08971214294433594, -0.08322906494140625, -0.07674598693847656, -0.07026290893554688, -0.06377983093261719, -0.0572967529296875, -0.05081367492675781, -0.044330596923828125, -0.03784751892089844, -0.03136444091796875, -0.024881362915039062, -0.018398284912109375, -0.011915206909179688, -0.00543212890625, 0.0010509490966796875, 0.007534027099609375, 0.014017105102539062, 0.02050018310546875, 0.026983261108398438, 0.033466339111328125, 0.03994941711425781, 0.0464324951171875, 0.05291557312011719, 0.059398651123046875, 0.06588172912597656, 0.07236480712890625, 0.07884788513183594, 0.08533096313476562, 0.09181404113769531, 0.098297119140625, 0.10478019714355469, 0.11126327514648438, 0.11774635314941406, 0.12422943115234375, 0.13071250915527344, 0.13719558715820312, 0.1436786651611328, 0.1501617431640625, 0.1566448211669922, 0.16312789916992188, 0.16961097717285156, 0.17609405517578125, 0.18257713317871094, 0.18906021118164062, 0.1955432891845703, 0.2020263671875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 8.0, 7.0, 8.0, 13.0, 18.0, 14.0, 14.0, 16.0, 13.0, 27.0, 28.0, 21.0, 20.0, 36.0, 37.0, 42.0, 52.0, 44.0, 37.0, 48.0, 1068.0, 45.0, 29.0, 32.0, 37.0, 37.0, 33.0, 25.0, 26.0, 29.0, 25.0, 27.0, 22.0, 13.0, 14.0, 7.0, 13.0, 13.0, 10.0, 3.0, 5.0, 5.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.875732421875, -3.74755859375, -3.619384765625, -3.4912109375, -3.363037109375, -3.23486328125, -3.106689453125, -2.978515625, -2.850341796875, -2.72216796875, -2.593994140625, -2.4658203125, -2.337646484375, -2.20947265625, -2.081298828125, -1.953125, -1.824951171875, -1.69677734375, -1.568603515625, -1.4404296875, -1.312255859375, -1.18408203125, -1.055908203125, -0.927734375, -0.799560546875, -0.67138671875, -0.543212890625, -0.4150390625, -0.286865234375, -0.15869140625, -0.030517578125, 0.09765625, 0.225830078125, 0.35400390625, 0.482177734375, 0.6103515625, 0.738525390625, 0.86669921875, 0.994873046875, 1.123046875, 1.251220703125, 1.37939453125, 1.507568359375, 1.6357421875, 1.763916015625, 1.89208984375, 2.020263671875, 2.1484375, 2.276611328125, 2.40478515625, 2.532958984375, 2.6611328125, 2.789306640625, 2.91748046875, 3.045654296875, 3.173828125, 3.302001953125, 3.43017578125, 3.558349609375, 3.6865234375, 3.814697265625, 3.94287109375, 4.071044921875, 4.19921875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 9.0, 11.0, 13.0, 15.0, 28.0, 30.0, 37.0, 67.0, 90.0, 143.0, 178.0, 304.0, 441.0, 615.0, 882.0, 1274.0, 1901.0, 2859.0, 4216.0, 6291.0, 9374.0, 14351.0, 22613.0, 35442.0, 58700.0, 109119.0, 233863.0, 1303353.0, 120680.0, 63484.0, 37473.0, 23911.0, 15381.0, 9832.0, 6688.0, 4329.0, 2980.0, 1999.0, 1373.0, 864.0, 597.0, 409.0, 289.0, 200.0, 157.0, 93.0, 49.0, 49.0, 29.0, 18.0, 12.0, 5.0, 10.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2261962890625, -0.2189159393310547, -0.21163558959960938, -0.20435523986816406, -0.19707489013671875, -0.18979454040527344, -0.18251419067382812, -0.1752338409423828, -0.1679534912109375, -0.1606731414794922, -0.15339279174804688, -0.14611244201660156, -0.13883209228515625, -0.13155174255371094, -0.12427139282226562, -0.11699104309082031, -0.109710693359375, -0.10243034362792969, -0.09514999389648438, -0.08786964416503906, -0.08058929443359375, -0.07330894470214844, -0.06602859497070312, -0.05874824523925781, -0.0514678955078125, -0.04418754577636719, -0.036907196044921875, -0.029626846313476562, -0.02234649658203125, -0.015066146850585938, -0.007785797119140625, -0.0005054473876953125, 0.00677490234375, 0.014055252075195312, 0.021335601806640625, 0.028615951538085938, 0.03589630126953125, 0.04317665100097656, 0.050457000732421875, 0.05773735046386719, 0.0650177001953125, 0.07229804992675781, 0.07957839965820312, 0.08685874938964844, 0.09413909912109375, 0.10141944885253906, 0.10869979858398438, 0.11598014831542969, 0.123260498046875, 0.1305408477783203, 0.13782119750976562, 0.14510154724121094, 0.15238189697265625, 0.15966224670410156, 0.16694259643554688, 0.1742229461669922, 0.1815032958984375, 0.1887836456298828, 0.19606399536132812, 0.20334434509277344, 0.21062469482421875, 0.21790504455566406, 0.22518539428710938, 0.2324657440185547, 0.23974609375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 2.0, 6.0, 4.0, 12.0, 9.0, 10.0, 22.0, 16.0, 18.0, 24.0, 41.0, 36.0, 48.0, 45.0, 45.0, 43.0, 53.0, 52.0, 67.0, 73.0, 48.0, 59.0, 33.0, 33.0, 24.0, 30.0, 28.0, 20.0, 14.0, 16.0, 15.0, 6.0, 8.0, 11.0, 6.0, 5.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.750490188598633e-05, -4.61135059595108e-05, -4.472211003303528e-05, -4.3330714106559753e-05, -4.193931818008423e-05, -4.0547922253608704e-05, -3.915652632713318e-05, -3.7765130400657654e-05, -3.637373447418213e-05, -3.4982338547706604e-05, -3.359094262123108e-05, -3.2199546694755554e-05, -3.080815076828003e-05, -2.9416754841804504e-05, -2.802535891532898e-05, -2.6633962988853455e-05, -2.524256706237793e-05, -2.3851171135902405e-05, -2.245977520942688e-05, -2.1068379282951355e-05, -1.967698335647583e-05, -1.8285587430000305e-05, -1.689419150352478e-05, -1.5502795577049255e-05, -1.411139965057373e-05, -1.2720003724098206e-05, -1.132860779762268e-05, -9.937211871147156e-06, -8.545815944671631e-06, -7.154420018196106e-06, -5.763024091720581e-06, -4.371628165245056e-06, -2.9802322387695312e-06, -1.5888363122940063e-06, -1.9744038581848145e-07, 1.1939555406570435e-06, 2.5853514671325684e-06, 3.976747393608093e-06, 5.368143320083618e-06, 6.759539246559143e-06, 8.150935173034668e-06, 9.542331099510193e-06, 1.0933727025985718e-05, 1.2325122952461243e-05, 1.3716518878936768e-05, 1.5107914805412292e-05, 1.6499310731887817e-05, 1.7890706658363342e-05, 1.9282102584838867e-05, 2.0673498511314392e-05, 2.2064894437789917e-05, 2.3456290364265442e-05, 2.4847686290740967e-05, 2.6239082217216492e-05, 2.7630478143692017e-05, 2.902187407016754e-05, 3.0413269996643066e-05, 3.180466592311859e-05, 3.3196061849594116e-05, 3.458745777606964e-05, 3.5978853702545166e-05, 3.737024962902069e-05, 3.8761645555496216e-05, 4.015304148197174e-05, 4.1544437408447266e-05]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 5.0, 0.0, 2.0, 7.0, 12.0, 10.0, 7.0, 17.0, 16.0, 12.0, 22.0, 38.0, 40.0, 39.0, 57.0, 77.0, 82.0, 115.0, 204.0, 294.0, 452.0, 962.0, 21525.0, 1019161.0, 3223.0, 748.0, 413.0, 243.0, 188.0, 150.0, 93.0, 80.0, 51.0, 45.0, 31.0, 28.0, 28.0, 22.0, 15.0, 11.0, 7.0, 6.0, 7.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.0007410049438476562, -0.0007165893912315369, -0.0006921738386154175, -0.0006677582859992981, -0.0006433427333831787, -0.0006189271807670593, -0.0005945116281509399, -0.0005700960755348206, -0.0005456805229187012, -0.0005212649703025818, -0.0004968494176864624, -0.000472433865070343, -0.00044801831245422363, -0.00042360275983810425, -0.00039918720722198486, -0.0003747716546058655, -0.0003503561019897461, -0.0003259405493736267, -0.0003015249967575073, -0.00027710944414138794, -0.00025269389152526855, -0.00022827833890914917, -0.00020386278629302979, -0.0001794472336769104, -0.00015503168106079102, -0.00013061612844467163, -0.00010620057582855225, -8.178502321243286e-05, -5.7369470596313477e-05, -3.295391798019409e-05, -8.538365364074707e-06, 1.5877187252044678e-05, 4.029273986816406e-05, 6.470829248428345e-05, 8.912384510040283e-05, 0.00011353939771652222, 0.0001379549503326416, 0.00016237050294876099, 0.00018678605556488037, 0.00021120160818099976, 0.00023561716079711914, 0.0002600327134132385, 0.0002844482660293579, 0.0003088638186454773, 0.0003332793712615967, 0.00035769492387771606, 0.00038211047649383545, 0.00040652602910995483, 0.0004309415817260742, 0.0004553571343421936, 0.000479772686958313, 0.0005041882395744324, 0.0005286037921905518, 0.0005530193448066711, 0.0005774348974227905, 0.0006018504500389099, 0.0006262660026550293, 0.0006506815552711487, 0.0006750971078872681, 0.0006995126605033875, 0.0007239282131195068, 0.0007483437657356262, 0.0007727593183517456, 0.000797174870967865, 0.0008215904235839844]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 13.0, 74.0, 248.0, 419.0, 200.0, 51.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.832685615634546e-05, -3.5987362934974954e-05, -3.364786971360445e-05, -3.130837649223395e-05, -2.8968883270863444e-05, -2.662939004949294e-05, -2.4289896828122437e-05, -2.1950403606751934e-05, -1.961091038538143e-05, -1.7271417164010927e-05, -1.4931923942640424e-05, -1.259243072126992e-05, -1.0252937499899417e-05, -7.913444278528914e-06, -5.5739510571584105e-06, -3.2344578357879072e-06, -8.949646144174039e-07, 1.4445286069530994e-06, 3.7840218283236027e-06, 6.123515049694106e-06, 8.46300827106461e-06, 1.0802501492435113e-05, 1.3141994713805616e-05, 1.548148793517612e-05, 1.7820981156546623e-05, 2.0160474377917126e-05, 2.249996759928763e-05, 2.4839460820658132e-05, 2.7178954042028636e-05, 2.951844726339914e-05, 3.185794048476964e-05, 3.4197433706140146e-05, 3.6536919651553035e-05, 3.887641287292354e-05, 4.121590609429404e-05, 4.3555399315664545e-05, 4.589489253703505e-05, 4.823438575840555e-05, 5.0573878979776055e-05, 5.291337220114656e-05, 5.525286542251706e-05, 5.7592358643887565e-05, 5.993185186525807e-05, 6.227134144864976e-05, 6.461083830799907e-05, 6.695033516734838e-05, 6.928982475074008e-05, 7.162931433413178e-05, 7.396881119348109e-05, 7.63083080528304e-05, 7.86477976362221e-05, 8.098728721961379e-05, 8.33267840789631e-05, 8.566628093831241e-05, 8.800577052170411e-05, 9.03452601050958e-05, 9.268475696444511e-05, 9.502425382379442e-05, 9.736374340718612e-05, 9.970323299057782e-05, 0.00010204272984992713, 0.00010438222670927644, 0.00010672171629266813, 0.00010906120587605983, 0.00011140070273540914]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 2.0, 4.0, 6.0, 7.0, 8.0, 8.0, 10.0, 12.0, 32.0, 24.0, 14.0, 26.0, 42.0, 30.0, 31.0, 36.0, 34.0, 44.0, 43.0, 28.0, 32.0, 35.0, 38.0, 40.0, 38.0, 42.0, 37.0, 32.0, 36.0, 30.0, 24.0, 18.0, 17.0, 27.0, 22.0, 16.0, 13.0, 13.0, 10.0, 12.0, 5.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1755695343017578e-05, -2.1027401089668274e-05, -2.029910683631897e-05, -1.9570812582969666e-05, -1.884251832962036e-05, -1.8114224076271057e-05, -1.7385929822921753e-05, -1.665763556957245e-05, -1.5929341316223145e-05, -1.520104706287384e-05, -1.4472752809524536e-05, -1.3744458556175232e-05, -1.3016164302825928e-05, -1.2287870049476624e-05, -1.155957579612732e-05, -1.0831281542778015e-05, -1.0102987289428711e-05, -9.374693036079407e-06, -8.646398782730103e-06, -7.918104529380798e-06, -7.189810276031494e-06, -6.46151602268219e-06, -5.733221769332886e-06, -5.0049275159835815e-06, -4.276633262634277e-06, -3.548339009284973e-06, -2.820044755935669e-06, -2.0917505025863647e-06, -1.3634562492370605e-06, -6.351619958877563e-07, 9.313225746154785e-08, 8.21426510810852e-07, 1.5497207641601562e-06, 2.2780150175094604e-06, 3.0063092708587646e-06, 3.734603524208069e-06, 4.462897777557373e-06, 5.191192030906677e-06, 5.9194862842559814e-06, 6.647780537605286e-06, 7.37607479095459e-06, 8.104369044303894e-06, 8.832663297653198e-06, 9.560957551002502e-06, 1.0289251804351807e-05, 1.101754605770111e-05, 1.1745840311050415e-05, 1.247413456439972e-05, 1.3202428817749023e-05, 1.3930723071098328e-05, 1.4659017324447632e-05, 1.5387311577796936e-05, 1.611560583114624e-05, 1.6843900084495544e-05, 1.757219433784485e-05, 1.8300488591194153e-05, 1.9028782844543457e-05, 1.975707709789276e-05, 2.0485371351242065e-05, 2.121366560459137e-05, 2.1941959857940674e-05, 2.2670254111289978e-05, 2.3398548364639282e-05, 2.4126842617988586e-05, 2.485513687133789e-05]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 7.0, 4.0, 6.0, 7.0, 10.0, 15.0, 5.0, 13.0, 15.0, 16.0, 18.0, 15.0, 20.0, 13.0, 30.0, 24.0, 28.0, 26.0, 22.0, 28.0, 32.0, 40.0, 35.0, 39.0, 24.0, 34.0, 51.0, 33.0, 31.0, 39.0, 35.0, 33.0, 23.0, 21.0, 21.0, 22.0, 14.0, 22.0, 23.0, 18.0, 17.0, 14.0, 11.0, 7.0, 11.0, 5.0, 6.0, 3.0, 4.0, 5.0, 5.0, 1.0, 5.0, 0.0, 0.0, 5.0], "bins": [-5.47265625, -5.30609130859375, -5.1395263671875, -4.97296142578125, -4.806396484375, -4.63983154296875, -4.4732666015625, -4.30670166015625, -4.14013671875, -3.97357177734375, -3.8070068359375, -3.64044189453125, -3.473876953125, -3.30731201171875, -3.1407470703125, -2.97418212890625, -2.8076171875, -2.64105224609375, -2.4744873046875, -2.30792236328125, -2.141357421875, -1.97479248046875, -1.8082275390625, -1.64166259765625, -1.47509765625, -1.30853271484375, -1.1419677734375, -0.97540283203125, -0.808837890625, -0.64227294921875, -0.4757080078125, -0.30914306640625, -0.142578125, 0.02398681640625, 0.1905517578125, 0.35711669921875, 0.523681640625, 0.69024658203125, 0.8568115234375, 1.02337646484375, 1.18994140625, 1.35650634765625, 1.5230712890625, 1.68963623046875, 1.856201171875, 2.02276611328125, 2.1893310546875, 2.35589599609375, 2.5224609375, 2.68902587890625, 2.8555908203125, 3.02215576171875, 3.188720703125, 3.35528564453125, 3.5218505859375, 3.68841552734375, 3.85498046875, 4.02154541015625, 4.1881103515625, 4.35467529296875, 4.521240234375, 4.68780517578125, 4.8543701171875, 5.02093505859375, 5.1875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 5.0, 6.0, 8.0, 12.0, 23.0, 17.0, 25.0, 34.0, 61.0, 56.0, 85.0, 97.0, 139.0, 195.0, 293.0, 459.0, 728.0, 1144.0, 2082.0, 4371.0, 11408.0, 38343.0, 169309.0, 571914.0, 184637.0, 40504.0, 12246.0, 4735.0, 2187.0, 1167.0, 738.0, 419.0, 311.0, 201.0, 147.0, 113.0, 76.0, 63.0, 40.0, 40.0, 24.0, 17.0, 19.0, 11.0, 10.0, 11.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0], "bins": [-10.3046875, -9.997314453125, -9.68994140625, -9.382568359375, -9.0751953125, -8.767822265625, -8.46044921875, -8.153076171875, -7.845703125, -7.538330078125, -7.23095703125, -6.923583984375, -6.6162109375, -6.308837890625, -6.00146484375, -5.694091796875, -5.38671875, -5.079345703125, -4.77197265625, -4.464599609375, -4.1572265625, -3.849853515625, -3.54248046875, -3.235107421875, -2.927734375, -2.620361328125, -2.31298828125, -2.005615234375, -1.6982421875, -1.390869140625, -1.08349609375, -0.776123046875, -0.46875, -0.161376953125, 0.14599609375, 0.453369140625, 0.7607421875, 1.068115234375, 1.37548828125, 1.682861328125, 1.990234375, 2.297607421875, 2.60498046875, 2.912353515625, 3.2197265625, 3.527099609375, 3.83447265625, 4.141845703125, 4.44921875, 4.756591796875, 5.06396484375, 5.371337890625, 5.6787109375, 5.986083984375, 6.29345703125, 6.600830078125, 6.908203125, 7.215576171875, 7.52294921875, 7.830322265625, 8.1376953125, 8.445068359375, 8.75244140625, 9.059814453125, 9.3671875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 12.0, 5.0, 9.0, 12.0, 18.0, 25.0, 32.0, 30.0, 49.0, 51.0, 81.0, 102.0, 221.0, 1642.0, 287.0, 120.0, 79.0, 59.0, 43.0, 35.0, 35.0, 24.0, 18.0, 15.0, 6.0, 8.0, 7.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.515625, -27.6142578125, -26.712890625, -25.8115234375, -24.91015625, -24.0087890625, -23.107421875, -22.2060546875, -21.3046875, -20.4033203125, -19.501953125, -18.6005859375, -17.69921875, -16.7978515625, -15.896484375, -14.9951171875, -14.09375, -13.1923828125, -12.291015625, -11.3896484375, -10.48828125, -9.5869140625, -8.685546875, -7.7841796875, -6.8828125, -5.9814453125, -5.080078125, -4.1787109375, -3.27734375, -2.3759765625, -1.474609375, -0.5732421875, 0.328125, 1.2294921875, 2.130859375, 3.0322265625, 3.93359375, 4.8349609375, 5.736328125, 6.6376953125, 7.5390625, 8.4404296875, 9.341796875, 10.2431640625, 11.14453125, 12.0458984375, 12.947265625, 13.8486328125, 14.75, 15.6513671875, 16.552734375, 17.4541015625, 18.35546875, 19.2568359375, 20.158203125, 21.0595703125, 21.9609375, 22.8623046875, 23.763671875, 24.6650390625, 25.56640625, 26.4677734375, 27.369140625, 28.2705078125, 29.171875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 5.0, 9.0, 10.0, 30.0, 25.0, 52.0, 88.0, 180.0, 361.0, 1036.0, 49237.0, 3092058.0, 1569.0, 491.0, 244.0, 104.0, 64.0, 43.0, 25.0, 21.0, 10.0, 10.0, 6.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.375, -84.658203125, -81.94140625, -79.224609375, -76.5078125, -73.791015625, -71.07421875, -68.357421875, -65.640625, -62.923828125, -60.20703125, -57.490234375, -54.7734375, -52.056640625, -49.33984375, -46.623046875, -43.90625, -41.189453125, -38.47265625, -35.755859375, -33.0390625, -30.322265625, -27.60546875, -24.888671875, -22.171875, -19.455078125, -16.73828125, -14.021484375, -11.3046875, -8.587890625, -5.87109375, -3.154296875, -0.4375, 2.279296875, 4.99609375, 7.712890625, 10.4296875, 13.146484375, 15.86328125, 18.580078125, 21.296875, 24.013671875, 26.73046875, 29.447265625, 32.1640625, 34.880859375, 37.59765625, 40.314453125, 43.03125, 45.748046875, 48.46484375, 51.181640625, 53.8984375, 56.615234375, 59.33203125, 62.048828125, 64.765625, 67.482421875, 70.19921875, 72.916015625, 75.6328125, 78.349609375, 81.06640625, 83.783203125, 86.5]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 64.0, 946.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-652.4319458007812, -639.9717407226562, -627.5115356445312, -615.0513305664062, -602.5911254882812, -590.1309814453125, -577.6707763671875, -565.2105712890625, -552.7503662109375, -540.2901611328125, -527.8299560546875, -515.3697509765625, -502.9095764160156, -490.4493713378906, -477.9891662597656, -465.52899169921875, -453.06878662109375, -440.60858154296875, -428.14837646484375, -415.6882019042969, -403.2279968261719, -390.7677917480469, -378.3075866699219, -365.847412109375, -353.3871765136719, -340.9269714355469, -328.4667663574219, -316.006591796875, -303.54638671875, -291.086181640625, -278.6259765625, -266.165771484375, -253.70559692382812, -241.24539184570312, -228.7852020263672, -216.3249969482422, -203.86480712890625, -191.40460205078125, -178.94439697265625, -166.4842071533203, -154.02401733398438, -141.56381225585938, -129.10362243652344, -116.64341735839844, -104.1832275390625, -91.7230224609375, -79.26282501220703, -66.80262756347656, -54.34242248535156, -41.882225036621094, -29.422025680541992, -16.96182632446289, -4.501628875732422, 7.958568572998047, 20.41876983642578, 32.87896728515625, 45.33916473388672, 57.79936218261719, 70.25955963134766, 82.71975708007812, 95.17996215820312, 107.64015197753906, 120.10035705566406, 132.560546875, 145.020751953125]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 5.0, 2.0, 3.0, 3.0, 11.0, 14.0, 16.0, 11.0, 10.0, 19.0, 10.0, 23.0, 19.0, 31.0, 26.0, 25.0, 31.0, 33.0, 36.0, 35.0, 41.0, 47.0, 44.0, 40.0, 41.0, 47.0, 52.0, 30.0, 33.0, 37.0, 28.0, 24.0, 22.0, 24.0, 18.0, 19.0, 13.0, 11.0, 12.0, 14.0, 9.0, 9.0, 7.0, 5.0, 6.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-58.724098205566406, -57.130638122558594, -55.537174224853516, -53.9437141418457, -52.350250244140625, -50.75679016113281, -49.163330078125, -47.56986618041992, -45.97640609741211, -44.3829460144043, -42.78948211669922, -41.196022033691406, -39.60255813598633, -38.009098052978516, -36.41563415527344, -34.822174072265625, -33.22871398925781, -31.635251998901367, -30.041790008544922, -28.44832992553711, -26.854867935180664, -25.26140594482422, -23.667943954467773, -22.074481964111328, -20.48101806640625, -18.887556076049805, -17.29409408569336, -15.70063304901123, -14.107172012329102, -12.513710021972656, -10.920248031616211, -9.326786994934082, -7.733325958251953, -6.139864444732666, -4.546402931213379, -2.9529409408569336, -1.3594794273376465, 0.23398208618164062, 1.827444076538086, 3.420905113220215, 5.01436710357666, 6.607828617095947, 8.201290130615234, 9.79475212097168, 11.388214111328125, 12.981675148010254, 14.5751371383667, 16.168598175048828, 17.762060165405273, 19.35552215576172, 20.948984146118164, 22.54244613647461, 24.135906219482422, 25.729368209838867, 27.322830200195312, 28.916290283203125, 30.509754180908203, 32.103214263916016, 33.696678161621094, 35.290138244628906, 36.883602142333984, 38.4770622253418, 40.070526123046875, 41.66398620605469, 43.2574462890625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 3.0, 12.0, 8.0, 6.0, 18.0, 10.0, 17.0, 18.0, 15.0, 22.0, 18.0, 23.0, 30.0, 34.0, 28.0, 29.0, 30.0, 27.0, 39.0, 39.0, 48.0, 64.0, 49.0, 33.0, 35.0, 38.0, 32.0, 28.0, 33.0, 30.0, 21.0, 16.0, 26.0, 24.0, 13.0, 16.0, 19.0, 8.0, 5.0, 12.0, 3.0, 4.0, 5.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.42578125, -6.2099609375, -5.994140625, -5.7783203125, -5.5625, -5.3466796875, -5.130859375, -4.9150390625, -4.69921875, -4.4833984375, -4.267578125, -4.0517578125, -3.8359375, -3.6201171875, -3.404296875, -3.1884765625, -2.97265625, -2.7568359375, -2.541015625, -2.3251953125, -2.109375, -1.8935546875, -1.677734375, -1.4619140625, -1.24609375, -1.0302734375, -0.814453125, -0.5986328125, -0.3828125, -0.1669921875, 0.048828125, 0.2646484375, 0.48046875, 0.6962890625, 0.912109375, 1.1279296875, 1.34375, 1.5595703125, 1.775390625, 1.9912109375, 2.20703125, 2.4228515625, 2.638671875, 2.8544921875, 3.0703125, 3.2861328125, 3.501953125, 3.7177734375, 3.93359375, 4.1494140625, 4.365234375, 4.5810546875, 4.796875, 5.0126953125, 5.228515625, 5.4443359375, 5.66015625, 5.8759765625, 6.091796875, 6.3076171875, 6.5234375, 6.7392578125, 6.955078125, 7.1708984375, 7.38671875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 6.0, 8.0, 18.0, 9.0, 13.0, 29.0, 21.0, 40.0, 40.0, 52.0, 78.0, 76.0, 113.0, 167.0, 190.0, 234.0, 375.0, 588.0, 1082.0, 3205.0, 48617.0, 3491304.0, 634712.0, 9105.0, 1634.0, 807.0, 472.0, 342.0, 240.0, 159.0, 122.0, 92.0, 64.0, 64.0, 46.0, 39.0, 25.0, 30.0, 16.0, 12.0, 16.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-44.59375, -43.23193359375, -41.8701171875, -40.50830078125, -39.146484375, -37.78466796875, -36.4228515625, -35.06103515625, -33.69921875, -32.33740234375, -30.9755859375, -29.61376953125, -28.251953125, -26.89013671875, -25.5283203125, -24.16650390625, -22.8046875, -21.44287109375, -20.0810546875, -18.71923828125, -17.357421875, -15.99560546875, -14.6337890625, -13.27197265625, -11.91015625, -10.54833984375, -9.1865234375, -7.82470703125, -6.462890625, -5.10107421875, -3.7392578125, -2.37744140625, -1.015625, 0.34619140625, 1.7080078125, 3.06982421875, 4.431640625, 5.79345703125, 7.1552734375, 8.51708984375, 9.87890625, 11.24072265625, 12.6025390625, 13.96435546875, 15.326171875, 16.68798828125, 18.0498046875, 19.41162109375, 20.7734375, 22.13525390625, 23.4970703125, 24.85888671875, 26.220703125, 27.58251953125, 28.9443359375, 30.30615234375, 31.66796875, 33.02978515625, 34.3916015625, 35.75341796875, 37.115234375, 38.47705078125, 39.8388671875, 41.20068359375, 42.5625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 19.0, 34.0, 95.0, 248.0, 662.0, 1319.0, 1015.0, 392.0, 172.0, 66.0, 29.0, 11.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.34375, -37.240234375, -36.13671875, -35.033203125, -33.9296875, -32.826171875, -31.72265625, -30.619140625, -29.515625, -28.412109375, -27.30859375, -26.205078125, -25.1015625, -23.998046875, -22.89453125, -21.791015625, -20.6875, -19.583984375, -18.48046875, -17.376953125, -16.2734375, -15.169921875, -14.06640625, -12.962890625, -11.859375, -10.755859375, -9.65234375, -8.548828125, -7.4453125, -6.341796875, -5.23828125, -4.134765625, -3.03125, -1.927734375, -0.82421875, 0.279296875, 1.3828125, 2.486328125, 3.58984375, 4.693359375, 5.796875, 6.900390625, 8.00390625, 9.107421875, 10.2109375, 11.314453125, 12.41796875, 13.521484375, 14.625, 15.728515625, 16.83203125, 17.935546875, 19.0390625, 20.142578125, 21.24609375, 22.349609375, 23.453125, 24.556640625, 25.66015625, 26.763671875, 27.8671875, 28.970703125, 30.07421875, 31.177734375, 32.28125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 1.0, 5.0, 5.0, 3.0, 10.0, 16.0, 19.0, 29.0, 37.0, 62.0, 105.0, 128.0, 209.0, 456.0, 1073.0, 3531.0, 16707.0, 142313.0, 2507626.0, 1420260.0, 85799.0, 11377.0, 2602.0, 911.0, 401.0, 219.0, 108.0, 95.0, 51.0, 38.0, 20.0, 22.0, 7.0, 12.0, 8.0, 9.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.34375, -17.75, -17.15625, -16.5625, -15.96875, -15.375, -14.78125, -14.1875, -13.59375, -13.0, -12.40625, -11.8125, -11.21875, -10.625, -10.03125, -9.4375, -8.84375, -8.25, -7.65625, -7.0625, -6.46875, -5.875, -5.28125, -4.6875, -4.09375, -3.5, -2.90625, -2.3125, -1.71875, -1.125, -0.53125, 0.0625, 0.65625, 1.25, 1.84375, 2.4375, 3.03125, 3.625, 4.21875, 4.8125, 5.40625, 6.0, 6.59375, 7.1875, 7.78125, 8.375, 8.96875, 9.5625, 10.15625, 10.75, 11.34375, 11.9375, 12.53125, 13.125, 13.71875, 14.3125, 14.90625, 15.5, 16.09375, 16.6875, 17.28125, 17.875, 18.46875, 19.0625, 19.65625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 7.0, 8.0, 12.0, 25.0, 27.0, 49.0, 71.0, 93.0, 104.0, 149.0, 127.0, 85.0, 76.0, 44.0, 41.0, 30.0, 14.0, 19.0, 9.0, 3.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.96427154541016, -68.47563934326172, -64.98700714111328, -61.498374938964844, -58.009742736816406, -54.52111053466797, -51.03247833251953, -47.543846130371094, -44.055213928222656, -40.56658172607422, -37.07794952392578, -33.589317321777344, -30.100685119628906, -26.61205291748047, -23.12342071533203, -19.634788513183594, -16.146156311035156, -12.657524108886719, -9.168891906738281, -5.680259704589844, -2.1916275024414062, 1.2970046997070312, 4.785636901855469, 8.274269104003906, 11.762901306152344, 15.251533508300781, 18.74016571044922, 22.228797912597656, 25.717430114746094, 29.20606231689453, 32.69469451904297, 36.183326721191406, 39.671966552734375, 43.16059875488281, 46.64923095703125, 50.13786315917969, 53.626495361328125, 57.11512756347656, 60.603759765625, 64.09239196777344, 67.58102416992188, 71.06965637207031, 74.55828857421875, 78.04692077636719, 81.53555297851562, 85.02418518066406, 88.5128173828125, 92.00144958496094, 95.49008178710938, 98.97871398925781, 102.46734619140625, 105.95597839355469, 109.44461059570312, 112.93324279785156, 116.421875, 119.91050720214844, 123.39913940429688, 126.88777160644531, 130.37640380859375, 133.8650360107422, 137.35366821289062, 140.84230041503906, 144.3309326171875, 147.81956481933594, 151.30819702148438]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 9.0, 11.0, 11.0, 10.0, 13.0, 14.0, 20.0, 32.0, 21.0, 30.0, 30.0, 31.0, 31.0, 45.0, 46.0, 44.0, 44.0, 48.0, 40.0, 53.0, 44.0, 45.0, 31.0, 37.0, 39.0, 31.0, 26.0, 22.0, 22.0, 14.0, 16.0, 19.0, 16.0, 10.0, 12.0, 6.0, 4.0, 4.0, 4.0, 4.0, 0.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.928001403808594, -47.194942474365234, -45.461883544921875, -43.728824615478516, -41.995765686035156, -40.2627067565918, -38.52964782714844, -36.79658508300781, -35.06352996826172, -33.33047103881836, -31.597412109375, -29.86435317993164, -28.13129425048828, -26.398235321044922, -24.66517448425293, -22.93211555480957, -21.199054718017578, -19.46599578857422, -17.73293685913086, -15.999876976013184, -14.266818046569824, -12.533759117126465, -10.800699234008789, -9.06764030456543, -7.33458137512207, -5.601522445678711, -3.8684630393981934, -2.135403633117676, -0.4023447036743164, 1.330714225769043, 3.0637741088867188, 4.796833038330078, 6.529895782470703, 8.262954711914062, 9.996013641357422, 11.729073524475098, 13.462132453918457, 15.195191383361816, 16.928251266479492, 18.66131019592285, 20.39436912536621, 22.12742805480957, 23.86048698425293, 25.593547821044922, 27.32660675048828, 29.05966567993164, 30.792724609375, 32.52578353881836, 34.25884246826172, 35.99190139770508, 37.72496032714844, 39.4580192565918, 41.191078186035156, 42.924137115478516, 44.657196044921875, 46.3902587890625, 48.123313903808594, 49.85637283325195, 51.58943176269531, 53.32249069213867, 55.05554962158203, 56.78860855102539, 58.52166748046875, 60.254730224609375, 61.987789154052734]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 6.0, 11.0, 9.0, 13.0, 11.0, 16.0, 23.0, 18.0, 23.0, 28.0, 29.0, 25.0, 34.0, 44.0, 34.0, 48.0, 49.0, 50.0, 41.0, 44.0, 49.0, 38.0, 40.0, 41.0, 18.0, 42.0, 33.0, 25.0, 24.0, 22.0, 15.0, 16.0, 5.0, 10.0, 17.0, 9.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-87.1875, -84.24609375, -81.3046875, -78.36328125, -75.421875, -72.48046875, -69.5390625, -66.59765625, -63.65625, -60.71484375, -57.7734375, -54.83203125, -51.890625, -48.94921875, -46.0078125, -43.06640625, -40.125, -37.18359375, -34.2421875, -31.30078125, -28.359375, -25.41796875, -22.4765625, -19.53515625, -16.59375, -13.65234375, -10.7109375, -7.76953125, -4.828125, -1.88671875, 1.0546875, 3.99609375, 6.9375, 9.87890625, 12.8203125, 15.76171875, 18.703125, 21.64453125, 24.5859375, 27.52734375, 30.46875, 33.41015625, 36.3515625, 39.29296875, 42.234375, 45.17578125, 48.1171875, 51.05859375, 54.0, 56.94140625, 59.8828125, 62.82421875, 65.765625, 68.70703125, 71.6484375, 74.58984375, 77.53125, 80.47265625, 83.4140625, 86.35546875, 89.296875, 92.23828125, 95.1796875, 98.12109375, 101.0625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 5.0, 12.0, 14.0, 23.0, 43.0, 40.0, 45.0, 58.0, 87.0, 128.0, 179.0, 237.0, 321.0, 423.0, 663.0, 891.0, 1129.0, 1648.0, 2272.0, 3345.0, 4818.0, 7013.0, 10348.0, 15598.0, 24385.0, 39233.0, 68079.0, 131645.0, 258320.0, 216286.0, 106083.0, 56681.0, 33822.0, 20977.0, 13759.0, 9209.0, 6127.0, 4267.0, 2972.0, 2116.0, 1466.0, 1019.0, 759.0, 565.0, 386.0, 272.0, 233.0, 132.0, 109.0, 104.0, 79.0, 47.0, 32.0, 20.0, 15.0, 8.0, 5.0, 5.0, 2.0, 6.0, 2.0, 2.0], "bins": [-3.775390625, -3.652984619140625, -3.53057861328125, -3.408172607421875, -3.2857666015625, -3.163360595703125, -3.04095458984375, -2.918548583984375, -2.796142578125, -2.673736572265625, -2.55133056640625, -2.428924560546875, -2.3065185546875, -2.184112548828125, -2.06170654296875, -1.939300537109375, -1.81689453125, -1.694488525390625, -1.57208251953125, -1.449676513671875, -1.3272705078125, -1.204864501953125, -1.08245849609375, -0.960052490234375, -0.837646484375, -0.715240478515625, -0.59283447265625, -0.470428466796875, -0.3480224609375, -0.225616455078125, -0.10321044921875, 0.019195556640625, 0.1416015625, 0.264007568359375, 0.38641357421875, 0.508819580078125, 0.6312255859375, 0.753631591796875, 0.87603759765625, 0.998443603515625, 1.120849609375, 1.243255615234375, 1.36566162109375, 1.488067626953125, 1.6104736328125, 1.732879638671875, 1.85528564453125, 1.977691650390625, 2.10009765625, 2.222503662109375, 2.34490966796875, 2.467315673828125, 2.5897216796875, 2.712127685546875, 2.83453369140625, 2.956939697265625, 3.079345703125, 3.201751708984375, 3.32415771484375, 3.446563720703125, 3.5689697265625, 3.691375732421875, 3.81378173828125, 3.936187744140625, 4.05859375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 3.0, 6.0, 5.0, 2.0, 7.0, 11.0, 9.0, 10.0, 13.0, 21.0, 19.0, 14.0, 15.0, 25.0, 22.0, 22.0, 32.0, 24.0, 32.0, 32.0, 40.0, 32.0, 45.0, 40.0, 1058.0, 41.0, 48.0, 33.0, 38.0, 39.0, 40.0, 26.0, 31.0, 29.0, 24.0, 26.0, 14.0, 21.0, 22.0, 15.0, 12.0, 6.0, 10.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.21875, -47.43994140625, -45.6611328125, -43.88232421875, -42.103515625, -40.32470703125, -38.5458984375, -36.76708984375, -34.98828125, -33.20947265625, -31.4306640625, -29.65185546875, -27.873046875, -26.09423828125, -24.3154296875, -22.53662109375, -20.7578125, -18.97900390625, -17.2001953125, -15.42138671875, -13.642578125, -11.86376953125, -10.0849609375, -8.30615234375, -6.52734375, -4.74853515625, -2.9697265625, -1.19091796875, 0.587890625, 2.36669921875, 4.1455078125, 5.92431640625, 7.703125, 9.48193359375, 11.2607421875, 13.03955078125, 14.818359375, 16.59716796875, 18.3759765625, 20.15478515625, 21.93359375, 23.71240234375, 25.4912109375, 27.27001953125, 29.048828125, 30.82763671875, 32.6064453125, 34.38525390625, 36.1640625, 37.94287109375, 39.7216796875, 41.50048828125, 43.279296875, 45.05810546875, 46.8369140625, 48.61572265625, 50.39453125, 52.17333984375, 53.9521484375, 55.73095703125, 57.509765625, 59.28857421875, 61.0673828125, 62.84619140625, 64.625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 11.0, 13.0, 26.0, 41.0, 37.0, 69.0, 110.0, 134.0, 227.0, 356.0, 517.0, 752.0, 1245.0, 1772.0, 2649.0, 4060.0, 6284.0, 9548.0, 14919.0, 23960.0, 38361.0, 65521.0, 127258.0, 1308172.0, 229706.0, 108486.0, 58704.0, 34500.0, 21250.0, 13319.0, 8897.0, 5564.0, 3639.0, 2376.0, 1590.0, 1070.0, 681.0, 443.0, 297.0, 211.0, 113.0, 80.0, 67.0, 37.0, 24.0, 14.0, 9.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.396484375, -3.286529541015625, -3.17657470703125, -3.066619873046875, -2.9566650390625, -2.846710205078125, -2.73675537109375, -2.626800537109375, -2.516845703125, -2.406890869140625, -2.29693603515625, -2.186981201171875, -2.0770263671875, -1.967071533203125, -1.85711669921875, -1.747161865234375, -1.63720703125, -1.527252197265625, -1.41729736328125, -1.307342529296875, -1.1973876953125, -1.087432861328125, -0.97747802734375, -0.867523193359375, -0.757568359375, -0.647613525390625, -0.53765869140625, -0.427703857421875, -0.3177490234375, -0.207794189453125, -0.09783935546875, 0.012115478515625, 0.1220703125, 0.232025146484375, 0.34197998046875, 0.451934814453125, 0.5618896484375, 0.671844482421875, 0.78179931640625, 0.891754150390625, 1.001708984375, 1.111663818359375, 1.22161865234375, 1.331573486328125, 1.4415283203125, 1.551483154296875, 1.66143798828125, 1.771392822265625, 1.88134765625, 1.991302490234375, 2.10125732421875, 2.211212158203125, 2.3211669921875, 2.431121826171875, 2.54107666015625, 2.651031494140625, 2.760986328125, 2.870941162109375, 2.98089599609375, 3.090850830078125, 3.2008056640625, 3.310760498046875, 3.42071533203125, 3.530670166015625, 3.640625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 3.0, 10.0, 18.0, 10.0, 24.0, 25.0, 16.0, 31.0, 26.0, 42.0, 45.0, 50.0, 32.0, 45.0, 45.0, 40.0, 42.0, 34.0, 58.0, 40.0, 38.0, 28.0, 32.0, 32.0, 27.0, 29.0, 30.0, 16.0, 22.0, 16.0, 12.0, 15.0, 9.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0004935264587402344, -0.00047782063484191895, -0.0004621148109436035, -0.0004464089870452881, -0.00043070316314697266, -0.0004149973392486572, -0.0003992915153503418, -0.00038358569145202637, -0.00036787986755371094, -0.0003521740436553955, -0.0003364682197570801, -0.00032076239585876465, -0.0003050565719604492, -0.0002893507480621338, -0.00027364492416381836, -0.00025793910026550293, -0.0002422332763671875, -0.00022652745246887207, -0.00021082162857055664, -0.0001951158046722412, -0.00017940998077392578, -0.00016370415687561035, -0.00014799833297729492, -0.0001322925090789795, -0.00011658668518066406, -0.00010088086128234863, -8.51750373840332e-05, -6.946921348571777e-05, -5.3763389587402344e-05, -3.8057565689086914e-05, -2.2351741790771484e-05, -6.645917892456055e-06, 9.059906005859375e-06, 2.4765729904174805e-05, 4.0471553802490234e-05, 5.6177377700805664e-05, 7.18832015991211e-05, 8.758902549743652e-05, 0.00010329484939575195, 0.00011900067329406738, 0.0001347064971923828, 0.00015041232109069824, 0.00016611814498901367, 0.0001818239688873291, 0.00019752979278564453, 0.00021323561668395996, 0.0002289414405822754, 0.0002446472644805908, 0.00026035308837890625, 0.0002760589122772217, 0.0002917647361755371, 0.00030747056007385254, 0.00032317638397216797, 0.0003388822078704834, 0.00035458803176879883, 0.00037029385566711426, 0.0003859996795654297, 0.0004017055034637451, 0.00041741132736206055, 0.000433117151260376, 0.0004488229751586914, 0.00046452879905700684, 0.00048023462295532227, 0.0004959404468536377, 0.0005116462707519531]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 10.0, 8.0, 9.0, 12.0, 18.0, 26.0, 28.0, 41.0, 41.0, 57.0, 91.0, 125.0, 171.0, 234.0, 315.0, 560.0, 886.0, 1599.0, 3460.0, 8241.0, 22448.0, 67098.0, 188054.0, 339966.0, 256686.0, 102110.0, 33995.0, 12239.0, 4699.0, 2182.0, 1136.0, 634.0, 396.0, 260.0, 188.0, 143.0, 103.0, 71.0, 53.0, 41.0, 29.0, 23.0, 18.0, 16.0, 8.0, 7.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027332305908203125, -0.002644181251525879, -0.0025551319122314453, -0.0024660825729370117, -0.002377033233642578, -0.0022879838943481445, -0.002198934555053711, -0.0021098852157592773, -0.0020208358764648438, -0.0019317865371704102, -0.0018427371978759766, -0.001753687858581543, -0.0016646385192871094, -0.0015755891799926758, -0.0014865398406982422, -0.0013974905014038086, -0.001308441162109375, -0.0012193918228149414, -0.0011303424835205078, -0.0010412931442260742, -0.0009522438049316406, -0.000863194465637207, -0.0007741451263427734, -0.0006850957870483398, -0.0005960464477539062, -0.0005069971084594727, -0.00041794776916503906, -0.00032889842987060547, -0.00023984909057617188, -0.00015079975128173828, -6.175041198730469e-05, 2.7298927307128906e-05, 0.0001163482666015625, 0.0002053976058959961, 0.0002944469451904297, 0.0003834962844848633, 0.0004725456237792969, 0.0005615949630737305, 0.0006506443023681641, 0.0007396936416625977, 0.0008287429809570312, 0.0009177923202514648, 0.0010068416595458984, 0.001095890998840332, 0.0011849403381347656, 0.0012739896774291992, 0.0013630390167236328, 0.0014520883560180664, 0.0015411376953125, 0.0016301870346069336, 0.0017192363739013672, 0.0018082857131958008, 0.0018973350524902344, 0.001986384391784668, 0.0020754337310791016, 0.002164483070373535, 0.0022535324096679688, 0.0023425817489624023, 0.002431631088256836, 0.0025206804275512695, 0.002609729766845703, 0.0026987791061401367, 0.0027878284454345703, 0.002876877784729004, 0.0029659271240234375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 14.0, 12.0, 39.0, 59.0, 94.0, 111.0, 139.0, 122.0, 124.0, 102.0, 84.0, 37.0, 26.0, 15.0, 11.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00046734235365875065, -0.00044212109060026705, -0.00041689982754178345, -0.00039167856448329985, -0.00036645730142481625, -0.0003412360674701631, -0.0003160148044116795, -0.0002907935413531959, -0.0002655722782947123, -0.0002403510152362287, -0.0002151297521777451, -0.0001899084891192615, -0.0001646872260607779, -0.00013946597755420953, -0.00011424471449572593, -8.902345143724233e-05, -6.38021738268435e-05, -3.85809107683599e-05, -1.3359651347855106e-05, 1.1861608072649688e-05, 3.708287113113329e-05, 6.230412691365927e-05, 8.752538997214288e-05, 0.00011274665303062648, 0.00013796791608911008, 0.00016318917914759368, 0.00018841044220607728, 0.00021363169071264565, 0.00023885295377112925, 0.00026407421682961285, 0.00028929547988809645, 0.00031451674294658005, 0.0003397380351088941, 0.0003649592981673777, 0.0003901805612258613, 0.0004154018242843449, 0.0004406230873428285, 0.0004658443504013121, 0.0004910656134597957, 0.0005162868765182793, 0.0005415081395767629, 0.0005667294026352465, 0.0005919506656937301, 0.0006171719287522137, 0.0006423931918106973, 0.0006676144548691809, 0.0006928357179276645, 0.0007180569809861481, 0.0007432781858369708, 0.0007684994488954544, 0.000793720711953938, 0.0008189419750124216, 0.0008441632380709052, 0.0008693845011293888, 0.0008946057641878724, 0.000919827027246356, 0.0009450482903048396, 0.0009702695533633232, 0.0009954908164218068, 0.0010207120794802904, 0.001045933342538774, 0.0010711546055972576, 0.0010963758686557412, 0.0011215971317142248, 0.0011468183947727084]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 8.0, 5.0, 7.0, 6.0, 1.0, 4.0, 7.0, 12.0, 8.0, 20.0, 13.0, 17.0, 16.0, 22.0, 24.0, 24.0, 24.0, 31.0, 27.0, 36.0, 32.0, 41.0, 33.0, 32.0, 43.0, 37.0, 43.0, 50.0, 43.0, 40.0, 30.0, 34.0, 30.0, 17.0, 25.0, 26.0, 18.0, 22.0, 16.0, 22.0, 13.0, 10.0, 9.0, 8.0, 8.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002949833869934082, -0.0002853376790881157, -0.0002756919711828232, -0.00026604626327753067, -0.00025640055537223816, -0.00024675484746694565, -0.00023710913956165314, -0.00022746343165636063, -0.00021781772375106812, -0.0002081720158457756, -0.0001985263079404831, -0.00018888060003519058, -0.00017923489212989807, -0.00016958918422460556, -0.00015994347631931305, -0.00015029776841402054, -0.00014065206050872803, -0.00013100635260343552, -0.000121360644698143, -0.0001117149367928505, -0.00010206922888755798, -9.242352098226547e-05, -8.277781307697296e-05, -7.313210517168045e-05, -6.348639726638794e-05, -5.384068936109543e-05, -4.419498145580292e-05, -3.4549273550510406e-05, -2.4903565645217896e-05, -1.5257857739925385e-05, -5.6121498346328735e-06, 4.0335580706596375e-06, 1.3679265975952148e-05, 2.332497388124466e-05, 3.297068178653717e-05, 4.261638969182968e-05, 5.226209759712219e-05, 6.19078055024147e-05, 7.155351340770721e-05, 8.119922131299973e-05, 9.084492921829224e-05, 0.00010049063712358475, 0.00011013634502887726, 0.00011978205293416977, 0.00012942776083946228, 0.0001390734687447548, 0.0001487191766500473, 0.0001583648845553398, 0.00016801059246063232, 0.00017765630036592484, 0.00018730200827121735, 0.00019694771617650986, 0.00020659342408180237, 0.00021623913198709488, 0.0002258848398923874, 0.0002355305477976799, 0.0002451762557029724, 0.0002548219636082649, 0.00026446767151355743, 0.00027411337941884995, 0.00028375908732414246, 0.00029340479522943497, 0.0003030505031347275, 0.00031269621104002, 0.0003223419189453125]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 6.0, 11.0, 9.0, 13.0, 11.0, 16.0, 24.0, 18.0, 22.0, 29.0, 28.0, 26.0, 34.0, 44.0, 34.0, 47.0, 49.0, 51.0, 41.0, 44.0, 48.0, 38.0, 40.0, 41.0, 19.0, 41.0, 33.0, 26.0, 23.0, 22.0, 15.0, 16.0, 5.0, 10.0, 17.0, 10.0, 7.0, 4.0, 6.0, 3.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-87.125, -84.1845703125, -81.244140625, -78.3037109375, -75.36328125, -72.4228515625, -69.482421875, -66.5419921875, -63.6015625, -60.6611328125, -57.720703125, -54.7802734375, -51.83984375, -48.8994140625, -45.958984375, -43.0185546875, -40.078125, -37.1376953125, -34.197265625, -31.2568359375, -28.31640625, -25.3759765625, -22.435546875, -19.4951171875, -16.5546875, -13.6142578125, -10.673828125, -7.7333984375, -4.79296875, -1.8525390625, 1.087890625, 4.0283203125, 6.96875, 9.9091796875, 12.849609375, 15.7900390625, 18.73046875, 21.6708984375, 24.611328125, 27.5517578125, 30.4921875, 33.4326171875, 36.373046875, 39.3134765625, 42.25390625, 45.1943359375, 48.134765625, 51.0751953125, 54.015625, 56.9560546875, 59.896484375, 62.8369140625, 65.77734375, 68.7177734375, 71.658203125, 74.5986328125, 77.5390625, 80.4794921875, 83.419921875, 86.3603515625, 89.30078125, 92.2412109375, 95.181640625, 98.1220703125, 101.0625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 7.0, 6.0, 2.0, 8.0, 18.0, 22.0, 25.0, 36.0, 58.0, 82.0, 80.0, 135.0, 191.0, 281.0, 478.0, 755.0, 1285.0, 2256.0, 4677.0, 11005.0, 33286.0, 135993.0, 493711.0, 271055.0, 61380.0, 17627.0, 6669.0, 3098.0, 1650.0, 952.0, 545.0, 344.0, 250.0, 167.0, 124.0, 81.0, 51.0, 39.0, 32.0, 28.0, 17.0, 8.0, 9.0, 6.0, 14.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.953125, -15.41650390625, -14.8798828125, -14.34326171875, -13.806640625, -13.27001953125, -12.7333984375, -12.19677734375, -11.66015625, -11.12353515625, -10.5869140625, -10.05029296875, -9.513671875, -8.97705078125, -8.4404296875, -7.90380859375, -7.3671875, -6.83056640625, -6.2939453125, -5.75732421875, -5.220703125, -4.68408203125, -4.1474609375, -3.61083984375, -3.07421875, -2.53759765625, -2.0009765625, -1.46435546875, -0.927734375, -0.39111328125, 0.1455078125, 0.68212890625, 1.21875, 1.75537109375, 2.2919921875, 2.82861328125, 3.365234375, 3.90185546875, 4.4384765625, 4.97509765625, 5.51171875, 6.04833984375, 6.5849609375, 7.12158203125, 7.658203125, 8.19482421875, 8.7314453125, 9.26806640625, 9.8046875, 10.34130859375, 10.8779296875, 11.41455078125, 11.951171875, 12.48779296875, 13.0244140625, 13.56103515625, 14.09765625, 14.63427734375, 15.1708984375, 15.70751953125, 16.244140625, 16.78076171875, 17.3173828125, 17.85400390625, 18.390625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 7.0, 8.0, 21.0, 17.0, 22.0, 33.0, 60.0, 55.0, 72.0, 72.0, 99.0, 2116.0, 77.0, 65.0, 66.0, 64.0, 41.0, 33.0, 24.0, 31.0, 15.0, 13.0, 4.0, 8.0, 3.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-279.75, -272.44140625, -265.1328125, -257.82421875, -250.515625, -243.20703125, -235.8984375, -228.58984375, -221.28125, -213.97265625, -206.6640625, -199.35546875, -192.046875, -184.73828125, -177.4296875, -170.12109375, -162.8125, -155.50390625, -148.1953125, -140.88671875, -133.578125, -126.26953125, -118.9609375, -111.65234375, -104.34375, -97.03515625, -89.7265625, -82.41796875, -75.109375, -67.80078125, -60.4921875, -53.18359375, -45.875, -38.56640625, -31.2578125, -23.94921875, -16.640625, -9.33203125, -2.0234375, 5.28515625, 12.59375, 19.90234375, 27.2109375, 34.51953125, 41.828125, 49.13671875, 56.4453125, 63.75390625, 71.0625, 78.37109375, 85.6796875, 92.98828125, 100.296875, 107.60546875, 114.9140625, 122.22265625, 129.53125, 136.83984375, 144.1484375, 151.45703125, 158.765625, 166.07421875, 173.3828125, 180.69140625, 188.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 7.0, 4.0, 6.0, 8.0, 15.0, 20.0, 31.0, 44.0, 67.0, 113.0, 175.0, 346.0, 596.0, 1348.0, 5420.0, 99722.0, 2995712.0, 36332.0, 3500.0, 1026.0, 496.0, 296.0, 140.0, 100.0, 56.0, 41.0, 26.0, 11.0, 11.0, 12.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.5, -41.91064453125, -40.3212890625, -38.73193359375, -37.142578125, -35.55322265625, -33.9638671875, -32.37451171875, -30.78515625, -29.19580078125, -27.6064453125, -26.01708984375, -24.427734375, -22.83837890625, -21.2490234375, -19.65966796875, -18.0703125, -16.48095703125, -14.8916015625, -13.30224609375, -11.712890625, -10.12353515625, -8.5341796875, -6.94482421875, -5.35546875, -3.76611328125, -2.1767578125, -0.58740234375, 1.001953125, 2.59130859375, 4.1806640625, 5.77001953125, 7.359375, 8.94873046875, 10.5380859375, 12.12744140625, 13.716796875, 15.30615234375, 16.8955078125, 18.48486328125, 20.07421875, 21.66357421875, 23.2529296875, 24.84228515625, 26.431640625, 28.02099609375, 29.6103515625, 31.19970703125, 32.7890625, 34.37841796875, 35.9677734375, 37.55712890625, 39.146484375, 40.73583984375, 42.3251953125, 43.91455078125, 45.50390625, 47.09326171875, 48.6826171875, 50.27197265625, 51.861328125, 53.45068359375, 55.0400390625, 56.62939453125, 58.21875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 11.0, 17.0, 43.0, 75.0, 149.0, 249.0, 203.0, 123.0, 55.0, 34.0, 12.0, 9.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-339.62835693359375, -329.2735290527344, -318.9186706542969, -308.5638427734375, -298.208984375, -287.8541564941406, -277.49932861328125, -267.14447021484375, -256.7896423339844, -246.43479919433594, -236.0799560546875, -225.72512817382812, -215.3702850341797, -205.01544189453125, -194.66061401367188, -184.30577087402344, -173.950927734375, -163.59608459472656, -153.24124145507812, -142.88641357421875, -132.5315704345703, -122.17672729492188, -111.82189178466797, -101.46705627441406, -91.11221313476562, -80.75736999511719, -70.40253448486328, -60.04769515991211, -49.69285583496094, -39.338016510009766, -28.983177185058594, -18.628341674804688, -8.273529052734375, 2.081310272216797, 12.436149597167969, 22.79098892211914, 33.14582824707031, 43.500667572021484, 53.855506896972656, 64.21034240722656, 74.565185546875, 84.92002868652344, 95.27486419677734, 105.62969970703125, 115.98454284667969, 126.33938598632812, 136.6942138671875, 147.04905700683594, 157.40390014648438, 167.7587432861328, 178.11358642578125, 188.46841430664062, 198.82325744628906, 209.1781005859375, 219.53292846679688, 229.8877716064453, 240.24261474609375, 250.5974578857422, 260.9523010253906, 271.30712890625, 281.6619873046875, 292.0168151855469, 302.37164306640625, 312.72650146484375, 323.0813293457031]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 3.0, 7.0, 4.0, 3.0, 10.0, 7.0, 4.0, 13.0, 19.0, 14.0, 19.0, 24.0, 25.0, 36.0, 27.0, 25.0, 39.0, 33.0, 56.0, 46.0, 34.0, 38.0, 44.0, 41.0, 46.0, 44.0, 32.0, 43.0, 40.0, 32.0, 33.0, 27.0, 23.0, 25.0, 16.0, 17.0, 16.0, 8.0, 9.0, 6.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-201.41018676757812, -195.13650512695312, -188.86282348632812, -182.58914184570312, -176.31546020507812, -170.04176330566406, -163.76808166503906, -157.49440002441406, -151.22071838378906, -144.94703674316406, -138.67335510253906, -132.39967346191406, -126.12598419189453, -119.85230255126953, -113.57861328125, -107.304931640625, -101.03125, -94.757568359375, -88.48388671875, -82.21019744873047, -75.93651580810547, -69.66283416748047, -63.3891487121582, -57.11546325683594, -50.84178161621094, -44.56809997558594, -38.29441452026367, -32.020729064941406, -25.747047424316406, -19.473363876342773, -13.19968032836914, -6.925994873046875, -0.652313232421875, 5.621370315551758, 11.89505386352539, 18.168737411499023, 24.442420959472656, 30.71610450744629, 36.98978805541992, 43.26347351074219, 49.53715515136719, 55.81083679199219, 62.08452224731445, 68.35820770263672, 74.63188934326172, 80.90557098388672, 87.17926025390625, 93.45294189453125, 99.72662353515625, 106.00030517578125, 112.27398681640625, 118.54767608642578, 124.82135772705078, 131.0950469970703, 137.3687286376953, 143.6424102783203, 149.9160919189453, 156.1897735595703, 162.4634552001953, 168.7371368408203, 175.01083374023438, 181.28451538085938, 187.55819702148438, 193.83187866210938, 200.10556030273438]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 0.0, 7.0, 5.0, 4.0, 8.0, 11.0, 15.0, 20.0, 22.0, 22.0, 33.0, 52.0, 75.0, 70.0, 120.0, 145.0, 188.0, 241.0, 283.0, 380.0, 448.0, 559.0, 637.0, 1128.0, 1040575.0, 701.0, 565.0, 454.0, 398.0, 288.0, 251.0, 220.0, 158.0, 99.0, 79.0, 63.0, 44.0, 48.0, 30.0, 20.0, 25.0, 11.0, 11.0, 8.0, 6.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-49.380435943603516, -47.73820495605469, -46.09597396850586, -44.45374298095703, -42.8115119934082, -41.169281005859375, -39.52705001831055, -37.88481903076172, -36.24258804321289, -34.60035705566406, -32.958126068115234, -31.315895080566406, -29.673664093017578, -28.03143310546875, -26.389202117919922, -24.746971130371094, -23.1047420501709, -21.46251106262207, -19.820280075073242, -18.178049087524414, -16.535818099975586, -14.893588066101074, -13.251357078552246, -11.609126091003418, -9.96689510345459, -8.324664115905762, -6.682433128356934, -5.040202617645264, -3.3979716300964355, -1.7557411193847656, -0.1135101318359375, 1.5287208557128906, 3.1709518432617188, 4.813182830810547, 6.455413818359375, 8.097644805908203, 9.739875793457031, 11.382105827331543, 13.024336814880371, 14.6665678024292, 16.308799743652344, 17.951030731201172, 19.59326171875, 21.235492706298828, 22.877723693847656, 24.519954681396484, 26.162185668945312, 27.80441665649414, 29.446645736694336, 31.088876724243164, 32.73110580444336, 34.37333679199219, 36.015567779541016, 37.657798767089844, 39.30002975463867, 40.9422607421875, 42.58449172973633, 44.226722717285156, 45.868953704833984, 47.51118469238281, 49.15341567993164, 50.79564666748047, 52.4378776550293, 54.080108642578125, 55.72233963012695]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 7.0, 3.0, 2.0, 3.0, 7.0, 14.0, 15.0, 24.0, 74.0, 288.0, 51462280.0, 298.0, 50.0, 23.0, 24.0, 12.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2568.0, -2403.10009765625, -2238.2001953125, -2073.30029296875, -1908.4005126953125, -1743.5006103515625, -1578.600830078125, -1413.700927734375, -1248.801025390625, -1083.901123046875, -919.0012817382812, -754.1014404296875, -589.2015380859375, -424.3016357421875, -259.40179443359375, -94.501953125, 70.39794921875, 235.29782104492188, 400.19769287109375, 565.0975341796875, 729.9974365234375, 894.8973388671875, 1059.797119140625, 1224.697021484375, 1389.596923828125, 1554.496826171875, 1719.396728515625, 1884.2965087890625, 2049.1962890625, 2214.09619140625, 2378.99609375, 2543.89599609375, 2708.79541015625, 2873.6953125, 3038.59521484375, 3203.4951171875, 3368.39501953125, 3533.294921875, 3698.194580078125, 3863.094482421875, 4027.994384765625, 4192.89404296875, 4357.7939453125, 4522.69384765625, 4687.59375, 4852.49365234375, 5017.3935546875, 5182.29345703125, 5347.193359375, 5512.09326171875, 5676.9931640625, 5841.89306640625, 6006.79296875, 6171.69287109375, 6336.5927734375, 6501.4921875, 6666.392578125, 6831.29248046875, 6996.1923828125, 7161.09228515625, 7325.9921875, 7490.89208984375, 7655.7919921875, 7820.69140625, 7985.59130859375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [9.0, 3.0, 0.0, 3.0, 8.0, 20.0, 42.0, 61.0, 92.0, 98.0, 156.0, 232.0, 373.0, 540.0, 790.0, 1067.0, 1498.0, 2161.0, 3107.0, 4157.0, 5866.0, 8563.0, 12360.0, 17325.0, 26125.0, 39110.0, 58637.0, 91794.0, 149725.0, 255222.0, 500801.0, 3939410.0, 497942.0, 253704.0, 146811.0, 91612.0, 58772.0, 39122.0, 25829.0, 17824.0, 12184.0, 8411.0, 5857.0, 4050.0, 2880.0, 2151.0, 1439.0, 1054.0, 755.0, 553.0, 387.0, 215.0, 159.0, 132.0, 68.0, 78.0, 49.0, 24.0, 8.0, 9.0, 9.0, 6.0, 1.0, 6.0], "bins": [-1.3447265625, -1.302032470703125, -1.25933837890625, -1.216644287109375, -1.1739501953125, -1.131256103515625, -1.08856201171875, -1.045867919921875, -1.003173828125, -0.960479736328125, -0.91778564453125, -0.875091552734375, -0.8323974609375, -0.789703369140625, -0.74700927734375, -0.704315185546875, -0.66162109375, -0.618927001953125, -0.57623291015625, -0.533538818359375, -0.4908447265625, -0.448150634765625, -0.40545654296875, -0.362762451171875, -0.320068359375, -0.277374267578125, -0.23468017578125, -0.191986083984375, -0.1492919921875, -0.106597900390625, -0.06390380859375, -0.021209716796875, 0.021484375, 0.064178466796875, 0.10687255859375, 0.149566650390625, 0.1922607421875, 0.234954833984375, 0.27764892578125, 0.320343017578125, 0.363037109375, 0.405731201171875, 0.44842529296875, 0.491119384765625, 0.5338134765625, 0.576507568359375, 0.61920166015625, 0.661895751953125, 0.70458984375, 0.747283935546875, 0.78997802734375, 0.832672119140625, 0.8753662109375, 0.918060302734375, 0.96075439453125, 1.003448486328125, 1.046142578125, 1.088836669921875, 1.13153076171875, 1.174224853515625, 1.2169189453125, 1.259613037109375, 1.30230712890625, 1.345001220703125, 1.3876953125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 1.0, 6.0, 5.0, 5.0, 7.0, 9.0, 8.0, 16.0, 14.0, 20.0, 22.0, 19.0, 26.0, 34.0, 18.0, 36.0, 45.0, 33.0, 36.0, 48.0, 49.0, 1054.0, 50.0, 41.0, 39.0, 36.0, 45.0, 33.0, 33.0, 37.0, 25.0, 19.0, 24.0, 21.0, 25.0, 11.0, 17.0, 11.0, 7.0, 7.0, 9.0, 7.0, 2.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.0, -22.29296875, -21.5859375, -20.87890625, -20.171875, -19.46484375, -18.7578125, -18.05078125, -17.34375, -16.63671875, -15.9296875, -15.22265625, -14.515625, -13.80859375, -13.1015625, -12.39453125, -11.6875, -10.98046875, -10.2734375, -9.56640625, -8.859375, -8.15234375, -7.4453125, -6.73828125, -6.03125, -5.32421875, -4.6171875, -3.91015625, -3.203125, -2.49609375, -1.7890625, -1.08203125, -0.375, 0.33203125, 1.0390625, 1.74609375, 2.453125, 3.16015625, 3.8671875, 4.57421875, 5.28125, 5.98828125, 6.6953125, 7.40234375, 8.109375, 8.81640625, 9.5234375, 10.23046875, 10.9375, 11.64453125, 12.3515625, 13.05859375, 13.765625, 14.47265625, 15.1796875, 15.88671875, 16.59375, 17.30078125, 18.0078125, 18.71484375, 19.421875, 20.12890625, 20.8359375, 21.54296875, 22.25]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 8.0, 6.0, 6.0, 17.0, 25.0, 24.0, 49.0, 74.0, 96.0, 109.0, 165.0, 259.0, 384.0, 518.0, 724.0, 1070.0, 1528.0, 2226.0, 3326.0, 4649.0, 6787.0, 10025.0, 14587.0, 20897.0, 31261.0, 46163.0, 70353.0, 108496.0, 177839.0, 313748.0, 611387.0, 3827831.0, 417721.0, 225964.0, 135131.0, 84914.0, 55650.0, 36910.0, 25409.0, 16985.0, 11619.0, 8133.0, 5565.0, 3896.0, 2694.0, 1931.0, 1304.0, 920.0, 622.0, 419.0, 308.0, 228.0, 144.0, 113.0, 80.0, 66.0, 36.0, 14.0, 16.0, 11.0, 9.0, 3.0], "bins": [-1.4609375, -1.416961669921875, -1.37298583984375, -1.329010009765625, -1.2850341796875, -1.241058349609375, -1.19708251953125, -1.153106689453125, -1.109130859375, -1.065155029296875, -1.02117919921875, -0.977203369140625, -0.9332275390625, -0.889251708984375, -0.84527587890625, -0.801300048828125, -0.75732421875, -0.713348388671875, -0.66937255859375, -0.625396728515625, -0.5814208984375, -0.537445068359375, -0.49346923828125, -0.449493408203125, -0.405517578125, -0.361541748046875, -0.31756591796875, -0.273590087890625, -0.2296142578125, -0.185638427734375, -0.14166259765625, -0.097686767578125, -0.0537109375, -0.009735107421875, 0.03424072265625, 0.078216552734375, 0.1221923828125, 0.166168212890625, 0.21014404296875, 0.254119873046875, 0.298095703125, 0.342071533203125, 0.38604736328125, 0.430023193359375, 0.4739990234375, 0.517974853515625, 0.56195068359375, 0.605926513671875, 0.64990234375, 0.693878173828125, 0.73785400390625, 0.781829833984375, 0.8258056640625, 0.869781494140625, 0.91375732421875, 0.957733154296875, 1.001708984375, 1.045684814453125, 1.08966064453125, 1.133636474609375, 1.1776123046875, 1.221588134765625, 1.26556396484375, 1.309539794921875, 1.353515625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 1.0, 2.0, 8.0, 8.0, 10.0, 11.0, 15.0, 8.0, 16.0, 17.0, 19.0, 18.0, 21.0, 30.0, 25.0, 25.0, 36.0, 31.0, 41.0, 40.0, 42.0, 41.0, 85.0, 987.0, 45.0, 45.0, 39.0, 30.0, 25.0, 29.0, 44.0, 19.0, 35.0, 22.0, 21.0, 17.0, 18.0, 17.0, 16.0, 10.0, 12.0, 4.0, 8.0, 5.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.078125, -16.565185546875, -16.05224609375, -15.539306640625, -15.0263671875, -14.513427734375, -14.00048828125, -13.487548828125, -12.974609375, -12.461669921875, -11.94873046875, -11.435791015625, -10.9228515625, -10.409912109375, -9.89697265625, -9.384033203125, -8.87109375, -8.358154296875, -7.84521484375, -7.332275390625, -6.8193359375, -6.306396484375, -5.79345703125, -5.280517578125, -4.767578125, -4.254638671875, -3.74169921875, -3.228759765625, -2.7158203125, -2.202880859375, -1.68994140625, -1.177001953125, -0.6640625, -0.151123046875, 0.36181640625, 0.874755859375, 1.3876953125, 1.900634765625, 2.41357421875, 2.926513671875, 3.439453125, 3.952392578125, 4.46533203125, 4.978271484375, 5.4912109375, 6.004150390625, 6.51708984375, 7.030029296875, 7.54296875, 8.055908203125, 8.56884765625, 9.081787109375, 9.5947265625, 10.107666015625, 10.62060546875, 11.133544921875, 11.646484375, 12.159423828125, 12.67236328125, 13.185302734375, 13.6982421875, 14.211181640625, 14.72412109375, 15.237060546875, 15.75]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [8.0, 7.0, 2.0, 8.0, 10.0, 13.0, 10.0, 7.0, 10.0, 20.0, 17.0, 19.0, 22.0, 20.0, 30.0, 34.0, 68.0, 79.0, 144.0, 241.0, 304.0, 525.0, 871.0, 1360.0, 2214.0, 3877.0, 6865.0, 11873.0, 22667.0, 45434.0, 111911.0, 5774046.0, 178898.0, 64242.0, 29447.0, 15442.0, 8565.0, 4766.0, 2884.0, 1502.0, 1028.0, 649.0, 466.0, 279.0, 163.0, 98.0, 67.0, 51.0, 32.0, 33.0, 8.0, 21.0, 8.0, 19.0, 13.0, 7.0, 12.0, 6.0, 11.0, 5.0, 6.0, 3.0, 3.0, 6.0], "bins": [-4.6328125, -4.4866943359375, -4.340576171875, -4.1944580078125, -4.04833984375, -3.9022216796875, -3.756103515625, -3.6099853515625, -3.4638671875, -3.3177490234375, -3.171630859375, -3.0255126953125, -2.87939453125, -2.7332763671875, -2.587158203125, -2.4410400390625, -2.294921875, -2.1488037109375, -2.002685546875, -1.8565673828125, -1.71044921875, -1.5643310546875, -1.418212890625, -1.2720947265625, -1.1259765625, -0.9798583984375, -0.833740234375, -0.6876220703125, -0.54150390625, -0.3953857421875, -0.249267578125, -0.1031494140625, 0.04296875, 0.1890869140625, 0.335205078125, 0.4813232421875, 0.62744140625, 0.7735595703125, 0.919677734375, 1.0657958984375, 1.2119140625, 1.3580322265625, 1.504150390625, 1.6502685546875, 1.79638671875, 1.9425048828125, 2.088623046875, 2.2347412109375, 2.380859375, 2.5269775390625, 2.673095703125, 2.8192138671875, 2.96533203125, 3.1114501953125, 3.257568359375, 3.4036865234375, 3.5498046875, 3.6959228515625, 3.842041015625, 3.9881591796875, 4.13427734375, 4.2803955078125, 4.426513671875, 4.5726318359375, 4.71875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 2.0, 4.0, 8.0, 7.0, 6.0, 10.0, 9.0, 11.0, 19.0, 13.0, 22.0, 20.0, 21.0, 18.0, 28.0, 26.0, 27.0, 30.0, 38.0, 32.0, 29.0, 37.0, 51.0, 948.0, 143.0, 33.0, 35.0, 37.0, 30.0, 27.0, 26.0, 30.0, 30.0, 25.0, 21.0, 29.0, 22.0, 18.0, 15.0, 14.0, 8.0, 6.0, 9.0, 3.0, 9.0, 6.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0], "bins": [-12.0390625, -11.6590576171875, -11.279052734375, -10.8990478515625, -10.51904296875, -10.1390380859375, -9.759033203125, -9.3790283203125, -8.9990234375, -8.6190185546875, -8.239013671875, -7.8590087890625, -7.47900390625, -7.0989990234375, -6.718994140625, -6.3389892578125, -5.958984375, -5.5789794921875, -5.198974609375, -4.8189697265625, -4.43896484375, -4.0589599609375, -3.678955078125, -3.2989501953125, -2.9189453125, -2.5389404296875, -2.158935546875, -1.7789306640625, -1.39892578125, -1.0189208984375, -0.638916015625, -0.2589111328125, 0.12109375, 0.5010986328125, 0.881103515625, 1.2611083984375, 1.64111328125, 2.0211181640625, 2.401123046875, 2.7811279296875, 3.1611328125, 3.5411376953125, 3.921142578125, 4.3011474609375, 4.68115234375, 5.0611572265625, 5.441162109375, 5.8211669921875, 6.201171875, 6.5811767578125, 6.961181640625, 7.3411865234375, 7.72119140625, 8.1011962890625, 8.481201171875, 8.8612060546875, 9.2412109375, 9.6212158203125, 10.001220703125, 10.3812255859375, 10.76123046875, 11.1412353515625, 11.521240234375, 11.9012451171875, 12.28125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 5.0, 17.0, 31.0, 32.0, 45.0, 92.0, 185.0, 264.0, 131.0, 63.0, 36.0, 34.0, 14.0, 8.0, 5.0, 11.0, 5.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.67357635498047, -36.34067153930664, -35.00776672363281, -33.674861907958984, -32.341957092285156, -31.009052276611328, -29.676145553588867, -28.34324073791504, -27.01033592224121, -25.677431106567383, -24.344526290893555, -23.011621475219727, -21.678714752197266, -20.345809936523438, -19.01290512084961, -17.68000030517578, -16.347095489501953, -15.014190673828125, -13.681285858154297, -12.348380088806152, -11.015475273132324, -9.682570457458496, -8.349664688110352, -7.016759872436523, -5.683855056762695, -4.350950241088867, -3.018044948577881, -1.6851398944854736, -0.3522348403930664, 0.9806699752807617, 2.313575267791748, 3.6464805603027344, 4.9793853759765625, 6.312290191650391, 7.645195484161377, 8.978100776672363, 10.311005592346191, 11.64391040802002, 12.976816177368164, 14.309720993041992, 15.64262580871582, 16.97553062438965, 18.308435440063477, 19.641340255737305, 20.974246978759766, 22.307151794433594, 23.640056610107422, 24.97296142578125, 26.305866241455078, 27.638771057128906, 28.971675872802734, 30.304580688476562, 31.63748550415039, 32.97039031982422, 34.30329513549805, 35.636199951171875, 36.96910858154297, 38.3020133972168, 39.634918212890625, 40.96782302856445, 42.30072784423828, 43.63363265991211, 44.96653747558594, 46.29944610595703, 47.632347106933594]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 6.0, 7.0, 6.0, 10.0, 9.0, 10.0, 14.0, 19.0, 18.0, 23.0, 16.0, 25.0, 24.0, 24.0, 38.0, 30.0, 42.0, 40.0, 35.0, 44.0, 40.0, 50.0, 45.0, 41.0, 39.0, 36.0, 37.0, 36.0, 27.0, 34.0, 23.0, 23.0, 23.0, 14.0, 14.0, 23.0, 12.0, 9.0, 6.0, 4.0, 10.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-28.157644271850586, -27.326684951782227, -26.495725631713867, -25.664766311645508, -24.833805084228516, -24.002845764160156, -23.171886444091797, -22.340927124023438, -21.509967803955078, -20.67900848388672, -19.84804916381836, -19.01708984375, -18.18613052368164, -17.35517120361328, -16.52420997619629, -15.69325065612793, -14.86229133605957, -14.031332015991211, -13.200372695922852, -12.369412422180176, -11.538453102111816, -10.707493782043457, -9.876533508300781, -9.045574188232422, -8.214614868164062, -7.383655548095703, -6.5526957511901855, -5.721735954284668, -4.890776634216309, -4.059817314147949, -3.2288575172424316, -2.397897720336914, -1.5669364929199219, -0.7359769344329834, 0.09498262405395508, 0.9259421825408936, 1.756901741027832, 2.5878610610961914, 3.418820858001709, 4.249780654907227, 5.080739974975586, 5.911699295043945, 6.742659091949463, 7.5736188888549805, 8.40457820892334, 9.2355375289917, 10.066497802734375, 10.897457122802734, 11.728416442871094, 12.559375762939453, 13.390335083007812, 14.221295356750488, 15.052254676818848, 15.883213996887207, 16.714174270629883, 17.545133590698242, 18.3760929107666, 19.20705223083496, 20.03801155090332, 20.86897087097168, 21.699932098388672, 22.53089141845703, 23.36185073852539, 24.19281005859375, 25.02376937866211]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 8.0, 9.0, 10.0, 16.0, 12.0, 16.0, 25.0, 38.0, 43.0, 57.0, 82.0, 88.0, 155.0, 177.0, 225.0, 364.0, 477.0, 714.0, 1090.0, 1698.0, 3084.0, 5890.0, 27638.0, 4113583.0, 28226.0, 4772.0, 2296.0, 1240.0, 725.0, 464.0, 313.0, 204.0, 154.0, 112.0, 78.0, 55.0, 42.0, 46.0, 17.0, 15.0, 8.0, 7.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.62548828125, -0.608795166015625, -0.59210205078125, -0.575408935546875, -0.5587158203125, -0.542022705078125, -0.52532958984375, -0.508636474609375, -0.491943359375, -0.475250244140625, -0.45855712890625, -0.441864013671875, -0.4251708984375, -0.408477783203125, -0.39178466796875, -0.375091552734375, -0.3583984375, -0.341705322265625, -0.32501220703125, -0.308319091796875, -0.2916259765625, -0.274932861328125, -0.25823974609375, -0.241546630859375, -0.224853515625, -0.208160400390625, -0.19146728515625, -0.174774169921875, -0.1580810546875, -0.141387939453125, -0.12469482421875, -0.108001708984375, -0.09130859375, -0.074615478515625, -0.05792236328125, -0.041229248046875, -0.0245361328125, -0.007843017578125, 0.00885009765625, 0.025543212890625, 0.042236328125, 0.058929443359375, 0.07562255859375, 0.092315673828125, 0.1090087890625, 0.125701904296875, 0.14239501953125, 0.159088134765625, 0.17578125, 0.192474365234375, 0.20916748046875, 0.225860595703125, 0.2425537109375, 0.259246826171875, 0.27593994140625, 0.292633056640625, 0.309326171875, 0.326019287109375, 0.34271240234375, 0.359405517578125, 0.3760986328125, 0.392791748046875, 0.40948486328125, 0.426177978515625, 0.44287109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 9.0, 5.0, 3.0, 5.0, 4.0, 6.0, 2.0, 7.0, 9.0, 9.0, 15.0, 18.0, 755.0, 54.0, 17.0, 14.0, 6.0, 9.0, 5.0, 8.0, 5.0, 1.0, 3.0, 5.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.1480541229248047, -0.14400863647460938, -0.13996315002441406, -0.13591766357421875, -0.13187217712402344, -0.12782669067382812, -0.12378120422363281, -0.1197357177734375, -0.11569023132324219, -0.11164474487304688, -0.10759925842285156, -0.10355377197265625, -0.09950828552246094, -0.09546279907226562, -0.09141731262207031, -0.087371826171875, -0.08332633972167969, -0.07928085327148438, -0.07523536682128906, -0.07118988037109375, -0.06714439392089844, -0.06309890747070312, -0.05905342102050781, -0.0550079345703125, -0.05096244812011719, -0.046916961669921875, -0.04287147521972656, -0.03882598876953125, -0.03478050231933594, -0.030735015869140625, -0.026689529418945312, -0.02264404296875, -0.018598556518554688, -0.014553070068359375, -0.010507583618164062, -0.00646209716796875, -0.0024166107177734375, 0.001628875732421875, 0.0056743621826171875, 0.0097198486328125, 0.013765335083007812, 0.017810821533203125, 0.021856307983398438, 0.02590179443359375, 0.029947280883789062, 0.033992767333984375, 0.03803825378417969, 0.042083740234375, 0.04612922668457031, 0.050174713134765625, 0.05422019958496094, 0.05826568603515625, 0.06231117248535156, 0.06635665893554688, 0.07040214538574219, 0.0744476318359375, 0.07849311828613281, 0.08253860473632812, 0.08658409118652344, 0.09062957763671875, 0.09467506408691406, 0.09872055053710938, 0.10276603698730469, 0.1068115234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 9.0, 18.0, 22.0, 26.0, 38.0, 83.0, 104.0, 121.0, 220.0, 253.0, 418.0, 581.0, 940.0, 1333.0, 2107.0, 3501.0, 6209.0, 11593.0, 25151.0, 72822.0, 3388278.0, 574302.0, 56331.0, 22173.0, 10823.0, 6047.0, 3653.0, 2284.0, 1449.0, 1073.0, 687.0, 434.0, 333.0, 220.0, 157.0, 136.0, 104.0, 64.0, 47.0, 35.0, 22.0, 18.0, 11.0, 7.0, 10.0, 9.0, 4.0, 5.0, 4.0, 0.0, 3.0], "bins": [-0.425048828125, -0.4125022888183594, -0.39995574951171875, -0.3874092102050781, -0.3748626708984375, -0.3623161315917969, -0.34976959228515625, -0.3372230529785156, -0.324676513671875, -0.3121299743652344, -0.29958343505859375, -0.2870368957519531, -0.2744903564453125, -0.2619438171386719, -0.24939727783203125, -0.23685073852539062, -0.22430419921875, -0.21175765991210938, -0.19921112060546875, -0.18666458129882812, -0.1741180419921875, -0.16157150268554688, -0.14902496337890625, -0.13647842407226562, -0.123931884765625, -0.11138534545898438, -0.09883880615234375, -0.08629226684570312, -0.0737457275390625, -0.061199188232421875, -0.04865264892578125, -0.036106109619140625, -0.0235595703125, -0.011013031005859375, 0.00153350830078125, 0.014080047607421875, 0.0266265869140625, 0.039173126220703125, 0.05171966552734375, 0.06426620483398438, 0.076812744140625, 0.08935928344726562, 0.10190582275390625, 0.11445236206054688, 0.1269989013671875, 0.13954544067382812, 0.15209197998046875, 0.16463851928710938, 0.17718505859375, 0.18973159790039062, 0.20227813720703125, 0.21482467651367188, 0.2273712158203125, 0.23991775512695312, 0.25246429443359375, 0.2650108337402344, 0.277557373046875, 0.2901039123535156, 0.30265045166015625, 0.3151969909667969, 0.3277435302734375, 0.3402900695800781, 0.35283660888671875, 0.3653831481933594, 0.3779296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 1.0, 3.0, 9.0, 5.0, 7.0, 13.0, 21.0, 23.0, 20.0, 29.0, 39.0, 112.0, 430.0, 2283.0, 626.0, 160.0, 71.0, 37.0, 35.0, 32.0, 13.0, 13.0, 12.0, 10.0, 11.0, 10.0, 7.0, 3.0, 1.0, 11.0, 2.0, 2.0, 3.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1884765625, -0.1816539764404297, -0.17483139038085938, -0.16800880432128906, -0.16118621826171875, -0.15436363220214844, -0.14754104614257812, -0.1407184600830078, -0.1338958740234375, -0.1270732879638672, -0.12025070190429688, -0.11342811584472656, -0.10660552978515625, -0.09978294372558594, -0.09296035766601562, -0.08613777160644531, -0.079315185546875, -0.07249259948730469, -0.06567001342773438, -0.05884742736816406, -0.05202484130859375, -0.04520225524902344, -0.038379669189453125, -0.03155708312988281, -0.0247344970703125, -0.017911911010742188, -0.011089324951171875, -0.0042667388916015625, 0.00255584716796875, 0.009378433227539062, 0.016201019287109375, 0.023023605346679688, 0.02984619140625, 0.03666877746582031, 0.043491363525390625, 0.05031394958496094, 0.05713653564453125, 0.06395912170410156, 0.07078170776367188, 0.07760429382324219, 0.0844268798828125, 0.09124946594238281, 0.09807205200195312, 0.10489463806152344, 0.11171722412109375, 0.11853981018066406, 0.12536239624023438, 0.1321849822998047, 0.139007568359375, 0.1458301544189453, 0.15265274047851562, 0.15947532653808594, 0.16629791259765625, 0.17312049865722656, 0.17994308471679688, 0.1867656707763672, 0.1935882568359375, 0.2004108428955078, 0.20723342895507812, 0.21405601501464844, 0.22087860107421875, 0.22770118713378906, 0.23452377319335938, 0.2413463592529297, 0.2481689453125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 7.0, 9.0, 14.0, 30.0, 49.0, 85.0, 222.0, 227.0, 124.0, 64.0, 46.0, 26.0, 17.0, 16.0, 12.0, 9.0, 7.0, 9.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0187275409698486, -0.9822201132774353, -0.9457127451896667, -0.9092053174972534, -0.8726978898048401, -0.8361904621124268, -0.7996830940246582, -0.7631756663322449, -0.7266682386398315, -0.6901608109474182, -0.6536534428596497, -0.6171460151672363, -0.580638587474823, -0.5441311597824097, -0.5076237916946411, -0.4711163640022278, -0.43460899591445923, -0.3981015980243683, -0.36159417033195496, -0.325086772441864, -0.2885793447494507, -0.25207194685935974, -0.2155645489692688, -0.17905712127685547, -0.14254972338676453, -0.10604231059551239, -0.06953490525484085, -0.03302749991416931, 0.0034799128770828247, 0.03998732566833496, 0.0764947235584259, 0.11300215125083923, 0.14950954914093018, 0.1860169619321823, 0.22252437472343445, 0.2590317726135254, 0.2955392003059387, 0.33204659819602966, 0.3685539960861206, 0.40506142377853394, 0.4415688216686249, 0.4780762195587158, 0.5145836472511292, 0.5510910749435425, 0.587598443031311, 0.6241058707237244, 0.6606132984161377, 0.6971206665039062, 0.7336280941963196, 0.7701355218887329, 0.8066428899765015, 0.8431503176689148, 0.8796577453613281, 0.9161651134490967, 0.95267254114151, 0.9891799688339233, 1.025687336921692, 1.0621947050094604, 1.0987021923065186, 1.135209560394287, 1.1717169284820557, 1.2082244157791138, 1.2447317838668823, 1.2812392711639404, 1.317746639251709]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 10.0, 20.0, 13.0, 14.0, 31.0, 37.0, 56.0, 54.0, 59.0, 37.0, 65.0, 69.0, 73.0, 69.0, 64.0, 57.0, 49.0, 50.0, 31.0, 31.0, 21.0, 23.0, 15.0, 10.0, 10.0, 5.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0996553897857666, -1.0632859468460083, -1.02691650390625, -0.9905471205711365, -0.954177737236023, -0.9178082942962646, -0.8814388513565063, -0.845069408416748, -0.8087000250816345, -0.7723305821418762, -0.7359611988067627, -0.6995917558670044, -0.6632223129272461, -0.6268529295921326, -0.5904834866523743, -0.5541141033172607, -0.5177446603775024, -0.48137524724006653, -0.4450058341026306, -0.4086363911628723, -0.3722669780254364, -0.3358975648880005, -0.2995281219482422, -0.2631587088108063, -0.22678929567337036, -0.19041988253593445, -0.15405045449733734, -0.11768103390932083, -0.08131161332130432, -0.04494220018386841, -0.008572772145271301, 0.027796655893325806, 0.06416606903076172, 0.10053548961877823, 0.13690491020679474, 0.17327433824539185, 0.20964375138282776, 0.24601316452026367, 0.282382607460022, 0.3187520205974579, 0.3551214337348938, 0.3914908468723297, 0.4278602600097656, 0.4642297029495239, 0.5005991458892822, 0.5369685292243958, 0.573337972164154, 0.6097073554992676, 0.6460767984390259, 0.6824462413787842, 0.7188156247138977, 0.755185067653656, 0.7915544509887695, 0.8279238939285278, 0.8642933368682861, 0.9006627798080444, 0.937032163143158, 0.9734016060829163, 1.0097709894180298, 1.046140432357788, 1.0825098752975464, 1.1188793182373047, 1.1552486419677734, 1.1916180849075317, 1.22798752784729]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 10.0, 18.0, 19.0, 51.0, 49.0, 65.0, 107.0, 133.0, 223.0, 319.0, 429.0, 642.0, 965.0, 1328.0, 2040.0, 3214.0, 5136.0, 8326.0, 15401.0, 44936.0, 885077.0, 42349.0, 15157.0, 8375.0, 4991.0, 3049.0, 1954.0, 1309.0, 924.0, 635.0, 415.0, 273.0, 190.0, 121.0, 81.0, 60.0, 44.0, 38.0, 22.0, 12.0, 14.0, 13.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.60302734375, -0.5818557739257812, -0.5606842041015625, -0.5395126342773438, -0.518341064453125, -0.49716949462890625, -0.4759979248046875, -0.45482635498046875, -0.43365478515625, -0.41248321533203125, -0.3913116455078125, -0.37014007568359375, -0.348968505859375, -0.32779693603515625, -0.3066253662109375, -0.28545379638671875, -0.2642822265625, -0.24311065673828125, -0.2219390869140625, -0.20076751708984375, -0.179595947265625, -0.15842437744140625, -0.1372528076171875, -0.11608123779296875, -0.09490966796875, -0.07373809814453125, -0.0525665283203125, -0.03139495849609375, -0.010223388671875, 0.01094818115234375, 0.0321197509765625, 0.05329132080078125, 0.074462890625, 0.09563446044921875, 0.1168060302734375, 0.13797760009765625, 0.159149169921875, 0.18032073974609375, 0.2014923095703125, 0.22266387939453125, 0.24383544921875, 0.26500701904296875, 0.2861785888671875, 0.30735015869140625, 0.328521728515625, 0.34969329833984375, 0.3708648681640625, 0.39203643798828125, 0.4132080078125, 0.43437957763671875, 0.4555511474609375, 0.47672271728515625, 0.497894287109375, 0.5190658569335938, 0.5402374267578125, 0.5614089965820312, 0.58258056640625, 0.6037521362304688, 0.6249237060546875, 0.6460952758789062, 0.667266845703125, 0.6884384155273438, 0.7096099853515625, 0.7307815551757812, 0.751953125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 2.0, 9.0, 4.0, 4.0, 4.0, 1.0, 6.0, 6.0, 12.0, 10.0, 39.0, 318.0, 428.0, 55.0, 15.0, 14.0, 12.0, 5.0, 4.0, 7.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 5.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.15380859375, -0.14994525909423828, -0.14608192443847656, -0.14221858978271484, -0.13835525512695312, -0.1344919204711914, -0.1306285858154297, -0.12676525115966797, -0.12290191650390625, -0.11903858184814453, -0.11517524719238281, -0.1113119125366211, -0.10744857788085938, -0.10358524322509766, -0.09972190856933594, -0.09585857391357422, -0.0919952392578125, -0.08813190460205078, -0.08426856994628906, -0.08040523529052734, -0.07654190063476562, -0.0726785659790039, -0.06881523132324219, -0.06495189666748047, -0.06108856201171875, -0.05722522735595703, -0.05336189270019531, -0.049498558044433594, -0.045635223388671875, -0.041771888732910156, -0.03790855407714844, -0.03404521942138672, -0.030181884765625, -0.02631855010986328, -0.022455215454101562, -0.018591880798339844, -0.014728546142578125, -0.010865211486816406, -0.0070018768310546875, -0.0031385421752929688, 0.00072479248046875, 0.004588127136230469, 0.008451461791992188, 0.012314796447753906, 0.016178131103515625, 0.020041465759277344, 0.023904800415039062, 0.02776813507080078, 0.0316314697265625, 0.03549480438232422, 0.03935813903808594, 0.043221473693847656, 0.047084808349609375, 0.050948143005371094, 0.05481147766113281, 0.05867481231689453, 0.06253814697265625, 0.06640148162841797, 0.07026481628417969, 0.0741281509399414, 0.07799148559570312, 0.08185482025146484, 0.08571815490722656, 0.08958148956298828, 0.09344482421875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 1.0, 5.0, 6.0, 8.0, 11.0, 19.0, 21.0, 28.0, 34.0, 62.0, 88.0, 133.0, 214.0, 352.0, 714.0, 1338.0, 3046.0, 7345.0, 19267.0, 54446.0, 195812.0, 551143.0, 143722.0, 43531.0, 15774.0, 6144.0, 2600.0, 1202.0, 620.0, 297.0, 201.0, 113.0, 80.0, 54.0, 30.0, 25.0, 21.0, 19.0, 7.0, 7.0, 2.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.671875, -0.65289306640625, -0.6339111328125, -0.61492919921875, -0.595947265625, -0.57696533203125, -0.5579833984375, -0.53900146484375, -0.52001953125, -0.50103759765625, -0.4820556640625, -0.46307373046875, -0.444091796875, -0.42510986328125, -0.4061279296875, -0.38714599609375, -0.3681640625, -0.34918212890625, -0.3302001953125, -0.31121826171875, -0.292236328125, -0.27325439453125, -0.2542724609375, -0.23529052734375, -0.21630859375, -0.19732666015625, -0.1783447265625, -0.15936279296875, -0.140380859375, -0.12139892578125, -0.1024169921875, -0.08343505859375, -0.064453125, -0.04547119140625, -0.0264892578125, -0.00750732421875, 0.011474609375, 0.03045654296875, 0.0494384765625, 0.06842041015625, 0.08740234375, 0.10638427734375, 0.1253662109375, 0.14434814453125, 0.163330078125, 0.18231201171875, 0.2012939453125, 0.22027587890625, 0.2392578125, 0.25823974609375, 0.2772216796875, 0.29620361328125, 0.315185546875, 0.33416748046875, 0.3531494140625, 0.37213134765625, 0.39111328125, 0.41009521484375, 0.4290771484375, 0.44805908203125, 0.467041015625, 0.48602294921875, 0.5050048828125, 0.52398681640625, 0.54296875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 5.0, 12.0, 10.0, 10.0, 13.0, 17.0, 21.0, 20.0, 29.0, 29.0, 29.0, 41.0, 32.0, 38.0, 43.0, 51.0, 40.0, 46.0, 43.0, 41.0, 50.0, 33.0, 54.0, 28.0, 29.0, 33.0, 24.0, 36.0, 23.0, 27.0, 17.0, 19.0, 9.0, 8.0, 11.0, 7.0, 6.0, 5.0, 2.0, 0.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.439453125, -0.4242706298828125, -0.409088134765625, -0.3939056396484375, -0.37872314453125, -0.3635406494140625, -0.348358154296875, -0.3331756591796875, -0.3179931640625, -0.3028106689453125, -0.287628173828125, -0.2724456787109375, -0.25726318359375, -0.2420806884765625, -0.226898193359375, -0.2117156982421875, -0.196533203125, -0.1813507080078125, -0.166168212890625, -0.1509857177734375, -0.13580322265625, -0.1206207275390625, -0.105438232421875, -0.0902557373046875, -0.0750732421875, -0.0598907470703125, -0.044708251953125, -0.0295257568359375, -0.01434326171875, 0.0008392333984375, 0.016021728515625, 0.0312042236328125, 0.04638671875, 0.0615692138671875, 0.076751708984375, 0.0919342041015625, 0.10711669921875, 0.1222991943359375, 0.137481689453125, 0.1526641845703125, 0.1678466796875, 0.1830291748046875, 0.198211669921875, 0.2133941650390625, 0.22857666015625, 0.2437591552734375, 0.258941650390625, 0.2741241455078125, 0.289306640625, 0.3044891357421875, 0.319671630859375, 0.3348541259765625, 0.35003662109375, 0.3652191162109375, 0.380401611328125, 0.3955841064453125, 0.4107666015625, 0.4259490966796875, 0.441131591796875, 0.4563140869140625, 0.47149658203125, 0.4866790771484375, 0.501861572265625, 0.5170440673828125, 0.5322265625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 13.0, 14.0, 14.0, 25.0, 25.0, 38.0, 56.0, 90.0, 134.0, 246.0, 359.0, 652.0, 1212.0, 2802.0, 6950.0, 22211.0, 109762.0, 742497.0, 123888.0, 24141.0, 7475.0, 2900.0, 1362.0, 681.0, 345.0, 213.0, 149.0, 94.0, 47.0, 51.0, 23.0, 23.0, 9.0, 11.0, 5.0, 16.0, 3.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0243682861328125, -0.023701190948486328, -0.023034095764160156, -0.022367000579833984, -0.021699905395507812, -0.02103281021118164, -0.02036571502685547, -0.019698619842529297, -0.019031524658203125, -0.018364429473876953, -0.01769733428955078, -0.01703023910522461, -0.016363143920898438, -0.015696048736572266, -0.015028953552246094, -0.014361858367919922, -0.01369476318359375, -0.013027667999267578, -0.012360572814941406, -0.011693477630615234, -0.011026382446289062, -0.01035928726196289, -0.009692192077636719, -0.009025096893310547, -0.008358001708984375, -0.007690906524658203, -0.007023811340332031, -0.006356716156005859, -0.0056896209716796875, -0.005022525787353516, -0.004355430603027344, -0.003688335418701172, -0.003021240234375, -0.002354145050048828, -0.0016870498657226562, -0.0010199546813964844, -0.0003528594970703125, 0.0003142356872558594, 0.0009813308715820312, 0.0016484260559082031, 0.002315521240234375, 0.002982616424560547, 0.0036497116088867188, 0.004316806793212891, 0.0049839019775390625, 0.005650997161865234, 0.006318092346191406, 0.006985187530517578, 0.00765228271484375, 0.008319377899169922, 0.008986473083496094, 0.009653568267822266, 0.010320663452148438, 0.01098775863647461, 0.011654853820800781, 0.012321949005126953, 0.012989044189453125, 0.013656139373779297, 0.014323234558105469, 0.01499032974243164, 0.015657424926757812, 0.016324520111083984, 0.016991615295410156, 0.017658710479736328, 0.0183258056640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 8.0, 1.0, 9.0, 9.0, 7.0, 16.0, 18.0, 30.0, 16.0, 50.0, 50.0, 56.0, 77.0, 65.0, 80.0, 72.0, 69.0, 53.0, 63.0, 58.0, 44.0, 40.0, 34.0, 18.0, 16.0, 7.0, 13.0, 5.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2782554626464844e-06, -3.1618401408195496e-06, -3.0454248189926147e-06, -2.92900949716568e-06, -2.812594175338745e-06, -2.6961788535118103e-06, -2.5797635316848755e-06, -2.4633482098579407e-06, -2.346932888031006e-06, -2.230517566204071e-06, -2.1141022443771362e-06, -1.9976869225502014e-06, -1.8812716007232666e-06, -1.7648562788963318e-06, -1.648440957069397e-06, -1.5320256352424622e-06, -1.4156103134155273e-06, -1.2991949915885925e-06, -1.1827796697616577e-06, -1.066364347934723e-06, -9.499490261077881e-07, -8.335337042808533e-07, -7.171183824539185e-07, -6.007030606269836e-07, -4.842877388000488e-07, -3.67872416973114e-07, -2.514570951461792e-07, -1.3504177331924438e-07, -1.862645149230957e-08, 9.778887033462524e-08, 2.1420419216156006e-07, 3.3061951398849487e-07, 4.470348358154297e-07, 5.634501576423645e-07, 6.798654794692993e-07, 7.962808012962341e-07, 9.126961231231689e-07, 1.0291114449501038e-06, 1.1455267667770386e-06, 1.2619420886039734e-06, 1.3783574104309082e-06, 1.494772732257843e-06, 1.6111880540847778e-06, 1.7276033759117126e-06, 1.8440186977386475e-06, 1.9604340195655823e-06, 2.076849341392517e-06, 2.193264663219452e-06, 2.3096799850463867e-06, 2.4260953068733215e-06, 2.5425106287002563e-06, 2.658925950527191e-06, 2.775341272354126e-06, 2.891756594181061e-06, 3.0081719160079956e-06, 3.1245872378349304e-06, 3.2410025596618652e-06, 3.3574178814888e-06, 3.473833203315735e-06, 3.5902485251426697e-06, 3.7066638469696045e-06, 3.823079168796539e-06, 3.939494490623474e-06, 4.055909812450409e-06, 4.172325134277344e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 6.0, 11.0, 10.0, 10.0, 15.0, 33.0, 52.0, 85.0, 147.0, 254.0, 460.0, 1093.0, 2515.0, 6621.0, 20596.0, 77921.0, 552256.0, 309006.0, 53654.0, 15027.0, 4966.0, 1962.0, 884.0, 426.0, 197.0, 127.0, 66.0, 48.0, 40.0, 16.0, 20.0, 8.0, 6.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0224609375, -0.021851778030395508, -0.021242618560791016, -0.020633459091186523, -0.02002429962158203, -0.01941514015197754, -0.018805980682373047, -0.018196821212768555, -0.017587661743164062, -0.01697850227355957, -0.016369342803955078, -0.015760183334350586, -0.015151023864746094, -0.014541864395141602, -0.01393270492553711, -0.013323545455932617, -0.012714385986328125, -0.012105226516723633, -0.01149606704711914, -0.010886907577514648, -0.010277748107910156, -0.009668588638305664, -0.009059429168701172, -0.00845026969909668, -0.007841110229492188, -0.007231950759887695, -0.006622791290283203, -0.006013631820678711, -0.005404472351074219, -0.0047953128814697266, -0.004186153411865234, -0.003576993942260742, -0.00296783447265625, -0.002358675003051758, -0.0017495155334472656, -0.0011403560638427734, -0.0005311965942382812, 7.796287536621094e-05, 0.0006871223449707031, 0.0012962818145751953, 0.0019054412841796875, 0.0025146007537841797, 0.003123760223388672, 0.003732919692993164, 0.004342079162597656, 0.0049512386322021484, 0.005560398101806641, 0.006169557571411133, 0.006778717041015625, 0.007387876510620117, 0.00799703598022461, 0.008606195449829102, 0.009215354919433594, 0.009824514389038086, 0.010433673858642578, 0.01104283332824707, 0.011651992797851562, 0.012261152267456055, 0.012870311737060547, 0.013479471206665039, 0.014088630676269531, 0.014697790145874023, 0.015306949615478516, 0.015916109085083008, 0.0165252685546875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 8.0, 4.0, 9.0, 11.0, 12.0, 18.0, 24.0, 29.0, 27.0, 26.0, 40.0, 48.0, 42.0, 51.0, 75.0, 65.0, 58.0, 64.0, 57.0, 58.0, 59.0, 44.0, 40.0, 16.0, 23.0, 24.0, 21.0, 10.0, 7.0, 5.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01316070556640625, -0.012675881385803223, -0.012191057205200195, -0.011706233024597168, -0.01122140884399414, -0.010736584663391113, -0.010251760482788086, -0.009766936302185059, -0.009282112121582031, -0.008797287940979004, -0.008312463760375977, -0.00782763957977295, -0.007342815399169922, -0.0068579912185668945, -0.006373167037963867, -0.00588834285736084, -0.0054035186767578125, -0.004918694496154785, -0.004433870315551758, -0.0039490461349487305, -0.003464221954345703, -0.0029793977737426758, -0.0024945735931396484, -0.002009749412536621, -0.0015249252319335938, -0.0010401010513305664, -0.0005552768707275391, -7.045269012451172e-05, 0.0004143714904785156, 0.000899195671081543, 0.0013840198516845703, 0.0018688440322875977, 0.002353668212890625, 0.0028384923934936523, 0.0033233165740966797, 0.003808140754699707, 0.004292964935302734, 0.004777789115905762, 0.005262613296508789, 0.005747437477111816, 0.006232261657714844, 0.006717085838317871, 0.0072019100189208984, 0.007686734199523926, 0.008171558380126953, 0.00865638256072998, 0.009141206741333008, 0.009626030921936035, 0.010110855102539062, 0.01059567928314209, 0.011080503463745117, 0.011565327644348145, 0.012050151824951172, 0.0125349760055542, 0.013019800186157227, 0.013504624366760254, 0.013989448547363281, 0.014474272727966309, 0.014959096908569336, 0.015443921089172363, 0.01592874526977539, 0.016413569450378418, 0.016898393630981445, 0.017383217811584473, 0.0178680419921875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 12.0, 11.0, 19.0, 29.0, 61.0, 142.0, 370.0, 183.0, 77.0, 40.0, 19.0, 11.0, 7.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.148697853088379, -5.907928466796875, -5.667159080505371, -5.426389694213867, -5.185619831085205, -4.944850444793701, -4.704081058502197, -4.463311672210693, -4.222541809082031, -3.9817724227905273, -3.7410027980804443, -3.5002334117889404, -3.2594637870788574, -3.0186944007873535, -2.7779250144958496, -2.5371556282043457, -2.296386241912842, -2.055616855621338, -1.8148472309112549, -1.574077844619751, -1.3333083391189575, -1.092538833618164, -0.8517694473266602, -0.6109999418258667, -0.37023043632507324, -0.12946096062660217, 0.1113085150718689, 0.3520779609680176, 0.592847466468811, 0.8336169719696045, 1.0743863582611084, 1.3151558637619019, 1.5559253692626953, 1.7966948747634888, 2.0374643802642822, 2.278233766555786, 2.519003391265869, 2.759772777557373, 3.000542163848877, 3.241311550140381, 3.482081174850464, 3.7228505611419678, 3.963620185852051, 4.204389572143555, 4.445158958435059, 4.6859283447265625, 4.926697731018066, 5.1674675941467285, 5.408236980438232, 5.649006366729736, 5.88977575302124, 6.130545616149902, 6.371315002441406, 6.61208438873291, 6.852853775024414, 7.093623161315918, 7.334392547607422, 7.575161933898926, 7.81593132019043, 8.056700706481934, 8.297470092773438, 8.538240432739258, 8.779008865356445, 9.019779205322266, 9.26054859161377]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 11.0, 8.0, 9.0, 18.0, 27.0, 41.0, 91.0, 114.0, 169.0, 143.0, 117.0, 82.0, 51.0, 28.0, 14.0, 13.0, 7.0, 4.0, 1.0, 5.0, 8.0, 3.0, 5.0, 1.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.467884063720703, -9.162485122680664, -8.857086181640625, -8.551687240600586, -8.246288299560547, -7.940889835357666, -7.635491371154785, -7.330092430114746, -7.024693489074707, -6.719294548034668, -6.413895606994629, -6.108497142791748, -5.803098201751709, -5.49769926071167, -5.192300796508789, -4.88690185546875, -4.581502914428711, -4.276103973388672, -3.970705270767212, -3.665306568145752, -3.359907627105713, -3.054508686065674, -2.749109983444214, -2.443711280822754, -2.138312339782715, -1.8329135179519653, -1.5275146961212158, -1.2221158742904663, -0.9167170524597168, -0.6113182306289673, -0.3059194087982178, -0.0005207061767578125, 0.30487823486328125, 0.6102770566940308, 0.9156758785247803, 1.2210747003555298, 1.5264735221862793, 1.8318723440170288, 2.1372711658477783, 2.4426698684692383, 2.7480688095092773, 3.0534677505493164, 3.3588664531707764, 3.6642651557922363, 3.9696640968322754, 4.2750630378723145, 4.580461502075195, 4.885860443115234, 5.191259384155273, 5.4966583251953125, 5.802057266235352, 6.107455730438232, 6.4128546714782715, 6.7182536125183105, 7.023652076721191, 7.3290510177612305, 7.6344499588012695, 7.939848899841309, 8.245247840881348, 8.550646781921387, 8.85604476928711, 9.161443710327148, 9.466842651367188, 9.772241592407227, 10.077640533447266]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 4.0, 5.0, 7.0, 11.0, 14.0, 21.0, 24.0, 25.0, 24.0, 44.0, 56.0, 67.0, 93.0, 136.0, 189.0, 257.0, 318.0, 431.0, 609.0, 816.0, 1249.0, 1923.0, 2855.0, 4768.0, 8545.0, 19651.0, 172897.0, 3927011.0, 29892.0, 9775.0, 4937.0, 2762.0, 1662.0, 1013.0, 647.0, 443.0, 335.0, 224.0, 165.0, 109.0, 62.0, 52.0, 39.0, 24.0, 20.0, 12.0, 14.0, 14.0, 9.0, 7.0, 6.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-1.35546875, -1.316864013671875, -1.27825927734375, -1.239654541015625, -1.2010498046875, -1.162445068359375, -1.12384033203125, -1.085235595703125, -1.046630859375, -1.008026123046875, -0.96942138671875, -0.930816650390625, -0.8922119140625, -0.853607177734375, -0.81500244140625, -0.776397705078125, -0.73779296875, -0.699188232421875, -0.66058349609375, -0.621978759765625, -0.5833740234375, -0.544769287109375, -0.50616455078125, -0.467559814453125, -0.428955078125, -0.390350341796875, -0.35174560546875, -0.313140869140625, -0.2745361328125, -0.235931396484375, -0.19732666015625, -0.158721923828125, -0.1201171875, -0.081512451171875, -0.04290771484375, -0.004302978515625, 0.0343017578125, 0.072906494140625, 0.11151123046875, 0.150115966796875, 0.188720703125, 0.227325439453125, 0.26593017578125, 0.304534912109375, 0.3431396484375, 0.381744384765625, 0.42034912109375, 0.458953857421875, 0.49755859375, 0.536163330078125, 0.57476806640625, 0.613372802734375, 0.6519775390625, 0.690582275390625, 0.72918701171875, 0.767791748046875, 0.806396484375, 0.845001220703125, 0.88360595703125, 0.922210693359375, 0.9608154296875, 0.999420166015625, 1.03802490234375, 1.076629638671875, 1.115234375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 9.0, 3.0, 3.0, 4.0, 6.0, 6.0, 11.0, 15.0, 9.0, 24.0, 42.0, 150.0, 256.0, 217.0, 98.0, 45.0, 22.0, 7.0, 10.0, 11.0, 4.0, 9.0, 6.0, 3.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09521484375, -0.09254169464111328, -0.08986854553222656, -0.08719539642333984, -0.08452224731445312, -0.0818490982055664, -0.07917594909667969, -0.07650279998779297, -0.07382965087890625, -0.07115650177001953, -0.06848335266113281, -0.0658102035522461, -0.06313705444335938, -0.060463905334472656, -0.05779075622558594, -0.05511760711669922, -0.0524444580078125, -0.04977130889892578, -0.04709815979003906, -0.044425010681152344, -0.041751861572265625, -0.039078712463378906, -0.03640556335449219, -0.03373241424560547, -0.03105926513671875, -0.02838611602783203, -0.025712966918945312, -0.023039817810058594, -0.020366668701171875, -0.017693519592285156, -0.015020370483398438, -0.012347221374511719, -0.009674072265625, -0.007000923156738281, -0.0043277740478515625, -0.0016546249389648438, 0.001018524169921875, 0.0036916732788085938, 0.0063648223876953125, 0.009037971496582031, 0.01171112060546875, 0.014384269714355469, 0.017057418823242188, 0.019730567932128906, 0.022403717041015625, 0.025076866149902344, 0.027750015258789062, 0.03042316436767578, 0.0330963134765625, 0.03576946258544922, 0.03844261169433594, 0.041115760803222656, 0.043788909912109375, 0.046462059020996094, 0.04913520812988281, 0.05180835723876953, 0.05448150634765625, 0.05715465545654297, 0.05982780456542969, 0.0625009536743164, 0.06517410278320312, 0.06784725189208984, 0.07052040100097656, 0.07319355010986328, 0.07586669921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 13.0, 19.0, 17.0, 21.0, 45.0, 58.0, 92.0, 151.0, 225.0, 360.0, 520.0, 949.0, 1620.0, 2880.0, 5191.0, 9880.0, 20529.0, 45989.0, 132723.0, 3675767.0, 190978.0, 56602.0, 24501.0, 11530.0, 6009.0, 3161.0, 1783.0, 1075.0, 595.0, 363.0, 217.0, 129.0, 97.0, 65.0, 35.0, 32.0, 18.0, 11.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.89990234375, -0.8731307983398438, -0.8463592529296875, -0.8195877075195312, -0.792816162109375, -0.7660446166992188, -0.7392730712890625, -0.7125015258789062, -0.68572998046875, -0.6589584350585938, -0.6321868896484375, -0.6054153442382812, -0.578643798828125, -0.5518722534179688, -0.5251007080078125, -0.49832916259765625, -0.4715576171875, -0.44478607177734375, -0.4180145263671875, -0.39124298095703125, -0.364471435546875, -0.33769989013671875, -0.3109283447265625, -0.28415679931640625, -0.25738525390625, -0.23061370849609375, -0.2038421630859375, -0.17707061767578125, -0.150299072265625, -0.12352752685546875, -0.0967559814453125, -0.06998443603515625, -0.043212890625, -0.01644134521484375, 0.0103302001953125, 0.03710174560546875, 0.063873291015625, 0.09064483642578125, 0.1174163818359375, 0.14418792724609375, 0.17095947265625, 0.19773101806640625, 0.2245025634765625, 0.25127410888671875, 0.278045654296875, 0.30481719970703125, 0.3315887451171875, 0.35836029052734375, 0.3851318359375, 0.41190338134765625, 0.4386749267578125, 0.46544647216796875, 0.492218017578125, 0.5189895629882812, 0.5457611083984375, 0.5725326538085938, 0.59930419921875, 0.6260757446289062, 0.6528472900390625, 0.6796188354492188, 0.706390380859375, 0.7331619262695312, 0.7599334716796875, 0.7867050170898438, 0.8134765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 2.0, 2.0, 12.0, 7.0, 9.0, 10.0, 12.0, 14.0, 22.0, 26.0, 22.0, 33.0, 29.0, 40.0, 48.0, 61.0, 148.0, 2879.0, 253.0, 91.0, 69.0, 47.0, 41.0, 37.0, 24.0, 30.0, 22.0, 18.0, 12.0, 9.0, 6.0, 5.0, 14.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1925048828125, -0.18725967407226562, -0.18201446533203125, -0.17676925659179688, -0.1715240478515625, -0.16627883911132812, -0.16103363037109375, -0.15578842163085938, -0.150543212890625, -0.14529800415039062, -0.14005279541015625, -0.13480758666992188, -0.1295623779296875, -0.12431716918945312, -0.11907196044921875, -0.11382675170898438, -0.10858154296875, -0.10333633422851562, -0.09809112548828125, -0.09284591674804688, -0.0876007080078125, -0.08235549926757812, -0.07711029052734375, -0.07186508178710938, -0.066619873046875, -0.061374664306640625, -0.05612945556640625, -0.050884246826171875, -0.0456390380859375, -0.040393829345703125, -0.03514862060546875, -0.029903411865234375, -0.024658203125, -0.019412994384765625, -0.01416778564453125, -0.008922576904296875, -0.0036773681640625, 0.001567840576171875, 0.00681304931640625, 0.012058258056640625, 0.017303466796875, 0.022548675537109375, 0.02779388427734375, 0.033039093017578125, 0.0382843017578125, 0.043529510498046875, 0.04877471923828125, 0.054019927978515625, 0.05926513671875, 0.06451034545898438, 0.06975555419921875, 0.07500076293945312, 0.0802459716796875, 0.08549118041992188, 0.09073638916015625, 0.09598159790039062, 0.101226806640625, 0.10647201538085938, 0.11171722412109375, 0.11696243286132812, 0.1222076416015625, 0.12745285034179688, 0.13269805908203125, 0.13794326782226562, 0.1431884765625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 9.0, 29.0, 28.0, 71.0, 123.0, 344.0, 226.0, 87.0, 43.0, 18.0, 7.0, 4.0, 8.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8802274465560913, -0.8355528712272644, -0.7908783555030823, -0.7462037801742554, -0.7015292644500732, -0.6568546891212463, -0.6121801137924194, -0.5675055980682373, -0.5228310227394104, -0.4781564772129059, -0.43348193168640137, -0.38880735635757446, -0.34413281083106995, -0.29945826530456543, -0.2547836899757385, -0.210109144449234, -0.1654345989227295, -0.12076004594564438, -0.07608549296855927, -0.031410932540893555, 0.013263612985610962, 0.05793815851211548, 0.10261273384094238, 0.1472872793674469, 0.19196182489395142, 0.23663637042045593, 0.28131091594696045, 0.32598549127578735, 0.37066003680229187, 0.4153345823287964, 0.4600091576576233, 0.5046837329864502, 0.5493581295013428, 0.5940327048301697, 0.6387072205543518, 0.6833817958831787, 0.7280563116073608, 0.7727308869361877, 0.8174054622650146, 0.8620799779891968, 0.9067545533180237, 0.9514291286468506, 0.9961036443710327, 1.0407781600952148, 1.0854527950286865, 1.1301273107528687, 1.1748018264770508, 1.2194764614105225, 1.2641509771347046, 1.3088254928588867, 1.3535001277923584, 1.3981746435165405, 1.4428491592407227, 1.4875237941741943, 1.5321983098983765, 1.5768728256225586, 1.6215474605560303, 1.6662219762802124, 1.710896611213684, 1.7555711269378662, 1.8002456426620483, 1.8449201583862305, 1.8895947933197021, 1.9342693090438843, 1.9789438247680664]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 3.0, 6.0, 12.0, 10.0, 15.0, 20.0, 24.0, 43.0, 30.0, 31.0, 37.0, 44.0, 43.0, 56.0, 71.0, 66.0, 70.0, 60.0, 63.0, 52.0, 36.0, 49.0, 32.0, 24.0, 24.0, 22.0, 14.0, 14.0, 8.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.635047972202301, -0.612790048122406, -0.590532124042511, -0.568274199962616, -0.546016275882721, -0.5237583518028259, -0.5015004277229309, -0.4792425036430359, -0.45698457956314087, -0.43472665548324585, -0.41246873140335083, -0.3902108073234558, -0.3679528832435608, -0.34569495916366577, -0.32343703508377075, -0.30117911100387573, -0.2789211869239807, -0.2566632628440857, -0.23440533876419067, -0.21214741468429565, -0.18988949060440063, -0.16763156652450562, -0.1453736424446106, -0.12311571836471558, -0.10085779428482056, -0.07859987020492554, -0.05634194612503052, -0.0340840220451355, -0.011826097965240479, 0.010431826114654541, 0.03268975019454956, 0.05494767427444458, 0.07720553874969482, 0.09946346282958984, 0.12172138690948486, 0.14397931098937988, 0.1662372350692749, 0.18849515914916992, 0.21075308322906494, 0.23301100730895996, 0.255268931388855, 0.27752685546875, 0.299784779548645, 0.32204270362854004, 0.34430062770843506, 0.3665585517883301, 0.3888164758682251, 0.4110743999481201, 0.43333232402801514, 0.45559024810791016, 0.4778481721878052, 0.5001060962677002, 0.5223640203475952, 0.5446219444274902, 0.5668798685073853, 0.5891377925872803, 0.6113957166671753, 0.6336536407470703, 0.6559115648269653, 0.6781694889068604, 0.7004274129867554, 0.7226853370666504, 0.7449432611465454, 0.7672011852264404, 0.7894591093063354]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 9.0, 4.0, 6.0, 9.0, 13.0, 17.0, 19.0, 33.0, 28.0, 44.0, 60.0, 107.0, 140.0, 202.0, 325.0, 458.0, 606.0, 923.0, 1282.0, 2216.0, 3818.0, 6957.0, 14292.0, 42975.0, 463853.0, 437865.0, 41184.0, 13888.0, 6699.0, 3533.0, 2339.0, 1517.0, 977.0, 620.0, 434.0, 300.0, 223.0, 172.0, 129.0, 87.0, 66.0, 48.0, 32.0, 23.0, 8.0, 14.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.744140625, -0.7201309204101562, -0.6961212158203125, -0.6721115112304688, -0.648101806640625, -0.6240921020507812, -0.6000823974609375, -0.5760726928710938, -0.55206298828125, -0.5280532836914062, -0.5040435791015625, -0.48003387451171875, -0.456024169921875, -0.43201446533203125, -0.4080047607421875, -0.38399505615234375, -0.3599853515625, -0.33597564697265625, -0.3119659423828125, -0.28795623779296875, -0.263946533203125, -0.23993682861328125, -0.2159271240234375, -0.19191741943359375, -0.16790771484375, -0.14389801025390625, -0.1198883056640625, -0.09587860107421875, -0.071868896484375, -0.04785919189453125, -0.0238494873046875, 0.00016021728515625, 0.024169921875, 0.04817962646484375, 0.0721893310546875, 0.09619903564453125, 0.120208740234375, 0.14421844482421875, 0.1682281494140625, 0.19223785400390625, 0.21624755859375, 0.24025726318359375, 0.2642669677734375, 0.28827667236328125, 0.312286376953125, 0.33629608154296875, 0.3603057861328125, 0.38431549072265625, 0.4083251953125, 0.43233489990234375, 0.4563446044921875, 0.48035430908203125, 0.504364013671875, 0.5283737182617188, 0.5523834228515625, 0.5763931274414062, 0.60040283203125, 0.6244125366210938, 0.6484222412109375, 0.6724319458007812, 0.696441650390625, 0.7204513549804688, 0.7444610595703125, 0.7684707641601562, 0.79248046875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 3.0, 3.0, 4.0, 5.0, 2.0, 5.0, 7.0, 7.0, 17.0, 17.0, 26.0, 57.0, 118.0, 180.0, 231.0, 118.0, 82.0, 26.0, 26.0, 13.0, 8.0, 10.0, 10.0, 7.0, 8.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1064453125, -0.10356521606445312, -0.10068511962890625, -0.09780502319335938, -0.0949249267578125, -0.09204483032226562, -0.08916473388671875, -0.08628463745117188, -0.083404541015625, -0.08052444458007812, -0.07764434814453125, -0.07476425170898438, -0.0718841552734375, -0.06900405883789062, -0.06612396240234375, -0.06324386596679688, -0.06036376953125, -0.057483673095703125, -0.05460357666015625, -0.051723480224609375, -0.0488433837890625, -0.045963287353515625, -0.04308319091796875, -0.040203094482421875, -0.037322998046875, -0.034442901611328125, -0.03156280517578125, -0.028682708740234375, -0.0258026123046875, -0.022922515869140625, -0.02004241943359375, -0.017162322998046875, -0.0142822265625, -0.011402130126953125, -0.00852203369140625, -0.005641937255859375, -0.0027618408203125, 0.000118255615234375, 0.00299835205078125, 0.005878448486328125, 0.008758544921875, 0.011638641357421875, 0.01451873779296875, 0.017398834228515625, 0.0202789306640625, 0.023159027099609375, 0.02603912353515625, 0.028919219970703125, 0.03179931640625, 0.034679412841796875, 0.03755950927734375, 0.040439605712890625, 0.0433197021484375, 0.046199798583984375, 0.04907989501953125, 0.051959991455078125, 0.054840087890625, 0.057720184326171875, 0.06060028076171875, 0.06348037719726562, 0.0663604736328125, 0.06924057006835938, 0.07212066650390625, 0.07500076293945312, 0.077880859375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 8.0, 6.0, 13.0, 20.0, 17.0, 22.0, 18.0, 35.0, 37.0, 60.0, 90.0, 119.0, 182.0, 316.0, 564.0, 929.0, 1597.0, 2666.0, 4564.0, 7967.0, 13784.0, 24911.0, 46566.0, 93699.0, 236392.0, 355478.0, 127774.0, 59512.0, 31032.0, 16887.0, 9832.0, 5612.0, 3232.0, 1780.0, 1085.0, 611.0, 390.0, 243.0, 145.0, 88.0, 79.0, 50.0, 36.0, 29.0, 18.0, 14.0, 10.0, 8.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0], "bins": [-0.37255859375, -0.3609886169433594, -0.34941864013671875, -0.3378486633300781, -0.3262786865234375, -0.3147087097167969, -0.30313873291015625, -0.2915687561035156, -0.279998779296875, -0.2684288024902344, -0.25685882568359375, -0.24528884887695312, -0.2337188720703125, -0.22214889526367188, -0.21057891845703125, -0.19900894165039062, -0.18743896484375, -0.17586898803710938, -0.16429901123046875, -0.15272903442382812, -0.1411590576171875, -0.12958908081054688, -0.11801910400390625, -0.10644912719726562, -0.094879150390625, -0.08330917358398438, -0.07173919677734375, -0.060169219970703125, -0.0485992431640625, -0.037029266357421875, -0.02545928955078125, -0.013889312744140625, -0.0023193359375, 0.009250640869140625, 0.02082061767578125, 0.032390594482421875, 0.0439605712890625, 0.055530548095703125, 0.06710052490234375, 0.07867050170898438, 0.090240478515625, 0.10181045532226562, 0.11338043212890625, 0.12495040893554688, 0.1365203857421875, 0.14809036254882812, 0.15966033935546875, 0.17123031616210938, 0.18280029296875, 0.19437026977539062, 0.20594024658203125, 0.21751022338867188, 0.2290802001953125, 0.24065017700195312, 0.25222015380859375, 0.2637901306152344, 0.275360107421875, 0.2869300842285156, 0.29850006103515625, 0.3100700378417969, 0.3216400146484375, 0.3332099914550781, 0.34477996826171875, 0.3563499450683594, 0.367919921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 5.0, 3.0, 12.0, 8.0, 6.0, 12.0, 11.0, 11.0, 13.0, 16.0, 17.0, 13.0, 20.0, 26.0, 29.0, 43.0, 30.0, 28.0, 34.0, 30.0, 33.0, 35.0, 30.0, 29.0, 34.0, 39.0, 48.0, 33.0, 27.0, 34.0, 26.0, 26.0, 25.0, 24.0, 21.0, 21.0, 15.0, 27.0, 16.0, 18.0, 14.0, 7.0, 16.0, 15.0, 2.0, 6.0, 1.0, 2.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.230224609375, -0.22295570373535156, -0.21568679809570312, -0.2084178924560547, -0.20114898681640625, -0.1938800811767578, -0.18661117553710938, -0.17934226989746094, -0.1720733642578125, -0.16480445861816406, -0.15753555297851562, -0.1502666473388672, -0.14299774169921875, -0.1357288360595703, -0.12845993041992188, -0.12119102478027344, -0.113922119140625, -0.10665321350097656, -0.09938430786132812, -0.09211540222167969, -0.08484649658203125, -0.07757759094238281, -0.07030868530273438, -0.06303977966308594, -0.0557708740234375, -0.04850196838378906, -0.041233062744140625, -0.03396415710449219, -0.02669525146484375, -0.019426345825195312, -0.012157440185546875, -0.0048885345458984375, 0.00238037109375, 0.009649276733398438, 0.016918182373046875, 0.024187088012695312, 0.03145599365234375, 0.03872489929199219, 0.045993804931640625, 0.05326271057128906, 0.0605316162109375, 0.06780052185058594, 0.07506942749023438, 0.08233833312988281, 0.08960723876953125, 0.09687614440917969, 0.10414505004882812, 0.11141395568847656, 0.118682861328125, 0.12595176696777344, 0.13322067260742188, 0.1404895782470703, 0.14775848388671875, 0.1550273895263672, 0.16229629516601562, 0.16956520080566406, 0.1768341064453125, 0.18410301208496094, 0.19137191772460938, 0.1986408233642578, 0.20590972900390625, 0.2131786346435547, 0.22044754028320312, 0.22771644592285156, 0.2349853515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 14.0, 12.0, 27.0, 44.0, 48.0, 79.0, 88.0, 133.0, 210.0, 377.0, 666.0, 1106.0, 2118.0, 4744.0, 16093.0, 961444.0, 48373.0, 6553.0, 2846.0, 1398.0, 775.0, 446.0, 322.0, 205.0, 140.0, 91.0, 40.0, 35.0, 24.0, 17.0, 24.0, 7.0, 11.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1773681640625, -0.17158889770507812, -0.16580963134765625, -0.16003036499023438, -0.1542510986328125, -0.14847183227539062, -0.14269256591796875, -0.13691329956054688, -0.131134033203125, -0.12535476684570312, -0.11957550048828125, -0.11379623413085938, -0.1080169677734375, -0.10223770141601562, -0.09645843505859375, -0.09067916870117188, -0.08489990234375, -0.07912063598632812, -0.07334136962890625, -0.06756210327148438, -0.0617828369140625, -0.056003570556640625, -0.05022430419921875, -0.044445037841796875, -0.038665771484375, -0.032886505126953125, -0.02710723876953125, -0.021327972412109375, -0.0155487060546875, -0.009769439697265625, -0.00399017333984375, 0.001789093017578125, 0.007568359375, 0.013347625732421875, 0.01912689208984375, 0.024906158447265625, 0.0306854248046875, 0.036464691162109375, 0.04224395751953125, 0.048023223876953125, 0.053802490234375, 0.059581756591796875, 0.06536102294921875, 0.07114028930664062, 0.0769195556640625, 0.08269882202148438, 0.08847808837890625, 0.09425735473632812, 0.10003662109375, 0.10581588745117188, 0.11159515380859375, 0.11737442016601562, 0.1231536865234375, 0.12893295288085938, 0.13471221923828125, 0.14049148559570312, 0.146270751953125, 0.15205001831054688, 0.15782928466796875, 0.16360855102539062, 0.1693878173828125, 0.17516708374023438, 0.18094635009765625, 0.18672561645507812, 0.1925048828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 12.0, 19.0, 102.0, 204.0, 282.0, 211.0, 102.0, 37.0, 15.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6285648345947266e-05, -2.5743618607521057e-05, -2.520158886909485e-05, -2.465955913066864e-05, -2.411752939224243e-05, -2.3575499653816223e-05, -2.3033469915390015e-05, -2.2491440176963806e-05, -2.1949410438537598e-05, -2.140738070011139e-05, -2.086535096168518e-05, -2.0323321223258972e-05, -1.9781291484832764e-05, -1.9239261746406555e-05, -1.8697232007980347e-05, -1.8155202269554138e-05, -1.761317253112793e-05, -1.707114279270172e-05, -1.6529113054275513e-05, -1.5987083315849304e-05, -1.5445053577423096e-05, -1.4903023838996887e-05, -1.4360994100570679e-05, -1.381896436214447e-05, -1.3276934623718262e-05, -1.2734904885292053e-05, -1.2192875146865845e-05, -1.1650845408439636e-05, -1.1108815670013428e-05, -1.056678593158722e-05, -1.002475619316101e-05, -9.482726454734802e-06, -8.940696716308594e-06, -8.398666977882385e-06, -7.856637239456177e-06, -7.314607501029968e-06, -6.77257776260376e-06, -6.230548024177551e-06, -5.688518285751343e-06, -5.146488547325134e-06, -4.604458808898926e-06, -4.062429070472717e-06, -3.520399332046509e-06, -2.9783695936203003e-06, -2.436339855194092e-06, -1.8943101167678833e-06, -1.3522803783416748e-06, -8.102506399154663e-07, -2.682209014892578e-07, 2.738088369369507e-07, 8.158385753631592e-07, 1.3578683137893677e-06, 1.8998980522155762e-06, 2.4419277906417847e-06, 2.983957529067993e-06, 3.5259872674942017e-06, 4.06801700592041e-06, 4.610046744346619e-06, 5.152076482772827e-06, 5.694106221199036e-06, 6.236135959625244e-06, 6.778165698051453e-06, 7.320195436477661e-06, 7.86222517490387e-06, 8.404254913330078e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 5.0, 11.0, 12.0, 15.0, 25.0, 53.0, 62.0, 111.0, 166.0, 279.0, 418.0, 717.0, 1164.0, 1904.0, 3145.0, 6778.0, 40334.0, 941227.0, 38465.0, 6294.0, 2922.0, 1719.0, 1069.0, 625.0, 380.0, 234.0, 161.0, 93.0, 49.0, 36.0, 30.0, 20.0, 15.0, 7.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12274169921875, -0.11896514892578125, -0.1151885986328125, -0.11141204833984375, -0.107635498046875, -0.10385894775390625, -0.1000823974609375, -0.09630584716796875, -0.092529296875, -0.08875274658203125, -0.0849761962890625, -0.08119964599609375, -0.077423095703125, -0.07364654541015625, -0.0698699951171875, -0.06609344482421875, -0.06231689453125, -0.05854034423828125, -0.0547637939453125, -0.05098724365234375, -0.047210693359375, -0.04343414306640625, -0.0396575927734375, -0.03588104248046875, -0.0321044921875, -0.02832794189453125, -0.0245513916015625, -0.02077484130859375, -0.016998291015625, -0.01322174072265625, -0.0094451904296875, -0.00566864013671875, -0.00189208984375, 0.00188446044921875, 0.0056610107421875, 0.00943756103515625, 0.013214111328125, 0.01699066162109375, 0.0207672119140625, 0.02454376220703125, 0.0283203125, 0.03209686279296875, 0.0358734130859375, 0.03964996337890625, 0.043426513671875, 0.04720306396484375, 0.0509796142578125, 0.05475616455078125, 0.05853271484375, 0.06230926513671875, 0.0660858154296875, 0.06986236572265625, 0.073638916015625, 0.07741546630859375, 0.0811920166015625, 0.08496856689453125, 0.0887451171875, 0.09252166748046875, 0.0962982177734375, 0.10007476806640625, 0.103851318359375, 0.10762786865234375, 0.1114044189453125, 0.11518096923828125, 0.11895751953125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 8.0, 14.0, 34.0, 55.0, 213.0, 400.0, 170.0, 45.0, 18.0, 14.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.082763671875, -0.0802145004272461, -0.07766532897949219, -0.07511615753173828, -0.07256698608398438, -0.07001781463623047, -0.06746864318847656, -0.06491947174072266, -0.06237030029296875, -0.059821128845214844, -0.05727195739746094, -0.05472278594970703, -0.052173614501953125, -0.04962444305419922, -0.04707527160644531, -0.044526100158691406, -0.0419769287109375, -0.039427757263183594, -0.03687858581542969, -0.03432941436767578, -0.031780242919921875, -0.02923107147216797, -0.026681900024414062, -0.024132728576660156, -0.02158355712890625, -0.019034385681152344, -0.016485214233398438, -0.013936042785644531, -0.011386871337890625, -0.008837699890136719, -0.0062885284423828125, -0.0037393569946289062, -0.001190185546875, 0.0013589859008789062, 0.0039081573486328125, 0.006457328796386719, 0.009006500244140625, 0.011555671691894531, 0.014104843139648438, 0.016654014587402344, 0.01920318603515625, 0.021752357482910156, 0.024301528930664062, 0.02685070037841797, 0.029399871826171875, 0.03194904327392578, 0.03449821472167969, 0.037047386169433594, 0.0395965576171875, 0.042145729064941406, 0.04469490051269531, 0.04724407196044922, 0.049793243408203125, 0.05234241485595703, 0.05489158630371094, 0.057440757751464844, 0.05998992919921875, 0.06253910064697266, 0.06508827209472656, 0.06763744354248047, 0.07018661499023438, 0.07273578643798828, 0.07528495788574219, 0.0778341293334961, 0.08038330078125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 12.0, 4.0, 11.0, 15.0, 31.0, 41.0, 78.0, 150.0, 287.0, 156.0, 66.0, 56.0, 42.0, 19.0, 13.0, 5.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.375112533569336, -4.258655548095703, -4.14219856262207, -4.025741100311279, -3.9092841148376465, -3.7928271293640137, -3.676370143890381, -3.559912919998169, -3.443455934524536, -3.3269989490509033, -3.2105417251586914, -3.0940847396850586, -2.9776275157928467, -2.861170530319214, -2.744713306427002, -2.628256320953369, -2.5117993354797363, -2.3953423500061035, -2.2788851261138916, -2.162428140640259, -2.045970916748047, -1.929513931274414, -1.8130568265914917, -1.6965997219085693, -1.5801424980163574, -1.463685393333435, -1.3472282886505127, -1.2307713031768799, -1.1143141984939575, -0.9978570938110352, -0.8813999891281128, -0.7649429440498352, -0.6484858989715576, -0.5320287942886353, -0.41557174921035767, -0.2991146445274353, -0.18265756964683533, -0.06620049476623535, 0.05025660991668701, 0.1667136549949646, 0.28317075967788696, 0.39962783455848694, 0.5160849094390869, 0.6325420141220093, 0.7489991188049316, 0.8654561638832092, 0.9819132685661316, 1.0983703136444092, 1.2148274183273315, 1.331284523010254, 1.4477416276931763, 1.5641987323760986, 1.6806557178497314, 1.7971128225326538, 1.9135699272155762, 2.030026912689209, 2.146484136581421, 2.2629411220550537, 2.3793983459472656, 2.4958553314208984, 2.6123125553131104, 2.728769540786743, 2.845226764678955, 2.961683750152588, 3.0781407356262207]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 8.0, 5.0, 6.0, 9.0, 6.0, 7.0, 18.0, 21.0, 37.0, 51.0, 59.0, 94.0, 113.0, 128.0, 107.0, 95.0, 82.0, 50.0, 34.0, 23.0, 16.0, 11.0, 7.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.094596862792969, -3.9675374031066895, -3.84047794342041, -3.7134182453155518, -3.5863587856292725, -3.459299325942993, -3.3322396278381348, -3.2051801681518555, -3.078120708465576, -2.951061248779297, -2.8240017890930176, -2.696942090988159, -2.56988263130188, -2.4428231716156006, -2.315763473510742, -2.188704013824463, -2.0616445541381836, -1.9345850944519043, -1.8075255155563354, -1.6804659366607666, -1.5534064769744873, -1.426347017288208, -1.2992874383926392, -1.1722278594970703, -1.045168399810791, -0.9181088805198669, -0.7910493612289429, -0.6639898419380188, -0.5369303226470947, -0.40987080335617065, -0.2828112840652466, -0.1557517647743225, -0.02869272232055664, 0.09836679697036743, 0.2254263162612915, 0.3524858355522156, 0.47954535484313965, 0.6066048741340637, 0.7336643934249878, 0.8607239127159119, 0.9877834320068359, 1.1148428916931152, 1.241902470588684, 1.368962049484253, 1.4960215091705322, 1.6230809688568115, 1.7501405477523804, 1.8772001266479492, 2.0042595863342285, 2.131319046020508, 2.258378505706787, 2.3854382038116455, 2.512497663497925, 2.639557123184204, 2.7666168212890625, 2.893676280975342, 3.020735740661621, 3.1477952003479004, 3.2748546600341797, 3.401914358139038, 3.5289738178253174, 3.6560332775115967, 3.783092975616455, 3.9101524353027344, 4.037211894989014]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 7.0, 3.0, 9.0, 8.0, 10.0, 12.0, 14.0, 17.0, 26.0, 28.0, 41.0, 45.0, 57.0, 86.0, 91.0, 126.0, 165.0, 287.0, 369.0, 610.0, 982.0, 1738.0, 3123.0, 7165.0, 23211.0, 3904878.0, 217974.0, 20778.0, 6069.0, 2700.0, 1401.0, 862.0, 469.0, 315.0, 176.0, 109.0, 82.0, 73.0, 46.0, 33.0, 24.0, 20.0, 17.0, 8.0, 10.0, 3.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.423828125, -2.35821533203125, -2.2926025390625, -2.22698974609375, -2.161376953125, -2.09576416015625, -2.0301513671875, -1.96453857421875, -1.89892578125, -1.83331298828125, -1.7677001953125, -1.70208740234375, -1.636474609375, -1.57086181640625, -1.5052490234375, -1.43963623046875, -1.3740234375, -1.30841064453125, -1.2427978515625, -1.17718505859375, -1.111572265625, -1.04595947265625, -0.9803466796875, -0.91473388671875, -0.84912109375, -0.78350830078125, -0.7178955078125, -0.65228271484375, -0.586669921875, -0.52105712890625, -0.4554443359375, -0.38983154296875, -0.32421875, -0.25860595703125, -0.1929931640625, -0.12738037109375, -0.061767578125, 0.00384521484375, 0.0694580078125, 0.13507080078125, 0.20068359375, 0.26629638671875, 0.3319091796875, 0.39752197265625, 0.463134765625, 0.52874755859375, 0.5943603515625, 0.65997314453125, 0.7255859375, 0.79119873046875, 0.8568115234375, 0.92242431640625, 0.988037109375, 1.05364990234375, 1.1192626953125, 1.18487548828125, 1.25048828125, 1.31610107421875, 1.3817138671875, 1.44732666015625, 1.512939453125, 1.57855224609375, 1.6441650390625, 1.70977783203125, 1.775390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 5.0, 9.0, 6.0, 15.0, 14.0, 35.0, 55.0, 120.0, 149.0, 219.0, 149.0, 99.0, 41.0, 23.0, 13.0, 7.0, 9.0, 10.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11822509765625, -0.11504650115966797, -0.11186790466308594, -0.1086893081665039, -0.10551071166992188, -0.10233211517333984, -0.09915351867675781, -0.09597492218017578, -0.09279632568359375, -0.08961772918701172, -0.08643913269042969, -0.08326053619384766, -0.08008193969726562, -0.0769033432006836, -0.07372474670410156, -0.07054615020751953, -0.0673675537109375, -0.06418895721435547, -0.06101036071777344, -0.057831764221191406, -0.054653167724609375, -0.051474571228027344, -0.04829597473144531, -0.04511737823486328, -0.04193878173828125, -0.03876018524169922, -0.03558158874511719, -0.032402992248535156, -0.029224395751953125, -0.026045799255371094, -0.022867202758789062, -0.01968860626220703, -0.016510009765625, -0.013331413269042969, -0.010152816772460938, -0.006974220275878906, -0.003795623779296875, -0.0006170272827148438, 0.0025615692138671875, 0.005740165710449219, 0.00891876220703125, 0.012097358703613281, 0.015275955200195312, 0.018454551696777344, 0.021633148193359375, 0.024811744689941406, 0.027990341186523438, 0.03116893768310547, 0.0343475341796875, 0.03752613067626953, 0.04070472717285156, 0.043883323669433594, 0.047061920166015625, 0.050240516662597656, 0.05341911315917969, 0.05659770965576172, 0.05977630615234375, 0.06295490264892578, 0.06613349914550781, 0.06931209564208984, 0.07249069213867188, 0.0756692886352539, 0.07884788513183594, 0.08202648162841797, 0.085205078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 9.0, 8.0, 8.0, 15.0, 30.0, 46.0, 72.0, 184.0, 404.0, 1055.0, 2937.0, 8376.0, 28611.0, 166204.0, 3904945.0, 58551.0, 15130.0, 4782.0, 1655.0, 642.0, 280.0, 130.0, 63.0, 43.0, 22.0, 13.0, 10.0, 12.0, 11.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.544921875, -1.486053466796875, -1.42718505859375, -1.368316650390625, -1.3094482421875, -1.250579833984375, -1.19171142578125, -1.132843017578125, -1.073974609375, -1.015106201171875, -0.95623779296875, -0.897369384765625, -0.8385009765625, -0.779632568359375, -0.72076416015625, -0.661895751953125, -0.60302734375, -0.544158935546875, -0.48529052734375, -0.426422119140625, -0.3675537109375, -0.308685302734375, -0.24981689453125, -0.190948486328125, -0.132080078125, -0.073211669921875, -0.01434326171875, 0.044525146484375, 0.1033935546875, 0.162261962890625, 0.22113037109375, 0.279998779296875, 0.3388671875, 0.397735595703125, 0.45660400390625, 0.515472412109375, 0.5743408203125, 0.633209228515625, 0.69207763671875, 0.750946044921875, 0.809814453125, 0.868682861328125, 0.92755126953125, 0.986419677734375, 1.0452880859375, 1.104156494140625, 1.16302490234375, 1.221893310546875, 1.28076171875, 1.339630126953125, 1.39849853515625, 1.457366943359375, 1.5162353515625, 1.575103759765625, 1.63397216796875, 1.692840576171875, 1.751708984375, 1.810577392578125, 1.86944580078125, 1.928314208984375, 1.9871826171875, 2.046051025390625, 2.10491943359375, 2.163787841796875, 2.22265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 12.0, 10.0, 10.0, 9.0, 13.0, 13.0, 19.0, 19.0, 28.0, 30.0, 36.0, 33.0, 57.0, 78.0, 3199.0, 200.0, 61.0, 52.0, 35.0, 26.0, 27.0, 15.0, 15.0, 12.0, 13.0, 8.0, 7.0, 3.0, 6.0, 6.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2061767578125, -0.20071983337402344, -0.19526290893554688, -0.1898059844970703, -0.18434906005859375, -0.1788921356201172, -0.17343521118164062, -0.16797828674316406, -0.1625213623046875, -0.15706443786621094, -0.15160751342773438, -0.1461505889892578, -0.14069366455078125, -0.1352367401123047, -0.12977981567382812, -0.12432289123535156, -0.118865966796875, -0.11340904235839844, -0.10795211791992188, -0.10249519348144531, -0.09703826904296875, -0.09158134460449219, -0.08612442016601562, -0.08066749572753906, -0.0752105712890625, -0.06975364685058594, -0.06429672241210938, -0.05883979797363281, -0.05338287353515625, -0.04792594909667969, -0.042469024658203125, -0.03701210021972656, -0.03155517578125, -0.026098251342773438, -0.020641326904296875, -0.015184402465820312, -0.00972747802734375, -0.0042705535888671875, 0.001186370849609375, 0.0066432952880859375, 0.0121002197265625, 0.017557144165039062, 0.023014068603515625, 0.028470993041992188, 0.03392791748046875, 0.03938484191894531, 0.044841766357421875, 0.05029869079589844, 0.055755615234375, 0.06121253967285156, 0.06666946411132812, 0.07212638854980469, 0.07758331298828125, 0.08304023742675781, 0.08849716186523438, 0.09395408630371094, 0.0994110107421875, 0.10486793518066406, 0.11032485961914062, 0.11578178405761719, 0.12123870849609375, 0.1266956329345703, 0.13215255737304688, 0.13760948181152344, 0.14306640625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 12.0, 15.0, 33.0, 53.0, 99.0, 319.0, 290.0, 102.0, 38.0, 18.0, 14.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7874802350997925, -0.7311680316925049, -0.6748558282852173, -0.6185436248779297, -0.5622314214706421, -0.5059192180633545, -0.44960707426071167, -0.3932948708534241, -0.3369826674461365, -0.2806704640388489, -0.22435827553272247, -0.16804608702659607, -0.11173388361930847, -0.055421680212020874, 0.0008904933929443359, 0.057202696800231934, 0.11351490020751953, 0.16982710361480713, 0.22613929212093353, 0.28245148062705994, 0.33876368403434753, 0.39507588744163513, 0.45138806104660034, 0.5077002644538879, 0.5640124678611755, 0.6203246712684631, 0.6766368746757507, 0.7329490184783936, 0.7892612218856812, 0.8455734252929688, 0.9018856287002563, 0.958197832107544, 1.014510154724121, 1.0708223581314087, 1.1271345615386963, 1.1834467649459839, 1.2397589683532715, 1.296071171760559, 1.3523833751678467, 1.4086954593658447, 1.4650077819824219, 1.5213199853897095, 1.577632188796997, 1.6339443922042847, 1.6902565956115723, 1.7465687990188599, 1.8028810024261475, 1.8591930866241455, 1.915505290031433, 1.9718174934387207, 2.0281295776367188, 2.084441900253296, 2.140753984451294, 2.197066307067871, 2.253378391265869, 2.3096907138824463, 2.3660027980804443, 2.4223148822784424, 2.4786272048950195, 2.5349392890930176, 2.5912516117095947, 2.6475636959075928, 2.70387601852417, 2.760188102722168, 2.816500425338745]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 3.0, 4.0, 8.0, 19.0, 13.0, 21.0, 23.0, 31.0, 48.0, 44.0, 49.0, 43.0, 73.0, 68.0, 66.0, 64.0, 75.0, 67.0, 46.0, 47.0, 27.0, 31.0, 28.0, 20.0, 15.0, 16.0, 12.0, 3.0, 10.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6607336401939392, -0.6385074853897095, -0.6162813305854797, -0.59405517578125, -0.5718289613723755, -0.5496028065681458, -0.527376651763916, -0.5051504969596863, -0.48292431235313416, -0.4606981575489044, -0.4384719729423523, -0.41624581813812256, -0.3940196633338928, -0.3717934787273407, -0.34956732392311096, -0.32734113931655884, -0.3051149845123291, -0.28288882970809937, -0.26066264510154724, -0.2384364902973175, -0.21621032059192657, -0.19398415088653564, -0.1717579960823059, -0.14953182637691498, -0.12730565667152405, -0.10507948696613312, -0.08285332471132278, -0.06062716245651245, -0.03840099275112152, -0.01617482304573059, 0.0060513317584991455, 0.028277501463890076, 0.05050373077392578, 0.07272990047931671, 0.09495606273412704, 0.11718222498893738, 0.1394083946943283, 0.16163456439971924, 0.18386071920394897, 0.2060868889093399, 0.22831305861473083, 0.25053921341896057, 0.2727653980255127, 0.29499155282974243, 0.31721770763397217, 0.3394438922405243, 0.36167004704475403, 0.38389623165130615, 0.4061223864555359, 0.4283485412597656, 0.45057472586631775, 0.4728008806705475, 0.4950270652770996, 0.5172532200813293, 0.5394793748855591, 0.5617055296897888, 0.5839316844940186, 0.6061578392982483, 0.628383994102478, 0.6506102085113525, 0.6728363633155823, 0.695062518119812, 0.7172886729240417, 0.7395148277282715, 0.761741042137146]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 7.0, 0.0, 6.0, 4.0, 2.0, 9.0, 8.0, 9.0, 17.0, 16.0, 38.0, 36.0, 66.0, 82.0, 100.0, 147.0, 242.0, 385.0, 630.0, 1014.0, 2017.0, 4185.0, 12246.0, 61019.0, 698221.0, 226432.0, 27483.0, 7340.0, 2952.0, 1523.0, 817.0, 488.0, 316.0, 214.0, 138.0, 109.0, 61.0, 50.0, 37.0, 27.0, 18.0, 20.0, 13.0, 4.0, 4.0, 3.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9482421875, -0.9174346923828125, -0.886627197265625, -0.8558197021484375, -0.82501220703125, -0.7942047119140625, -0.763397216796875, -0.7325897216796875, -0.7017822265625, -0.6709747314453125, -0.640167236328125, -0.6093597412109375, -0.57855224609375, -0.5477447509765625, -0.516937255859375, -0.4861297607421875, -0.455322265625, -0.4245147705078125, -0.393707275390625, -0.3628997802734375, -0.33209228515625, -0.3012847900390625, -0.270477294921875, -0.2396697998046875, -0.2088623046875, -0.1780548095703125, -0.147247314453125, -0.1164398193359375, -0.08563232421875, -0.0548248291015625, -0.024017333984375, 0.0067901611328125, 0.03759765625, 0.0684051513671875, 0.099212646484375, 0.1300201416015625, 0.16082763671875, 0.1916351318359375, 0.222442626953125, 0.2532501220703125, 0.2840576171875, 0.3148651123046875, 0.345672607421875, 0.3764801025390625, 0.40728759765625, 0.4380950927734375, 0.468902587890625, 0.4997100830078125, 0.530517578125, 0.5613250732421875, 0.592132568359375, 0.6229400634765625, 0.65374755859375, 0.6845550537109375, 0.715362548828125, 0.7461700439453125, 0.7769775390625, 0.8077850341796875, 0.838592529296875, 0.8694000244140625, 0.90020751953125, 0.9310150146484375, 0.961822509765625, 0.9926300048828125, 1.0234375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 9.0, 17.0, 29.0, 56.0, 81.0, 121.0, 139.0, 162.0, 137.0, 105.0, 52.0, 33.0, 17.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1044921875, -0.1017465591430664, -0.09900093078613281, -0.09625530242919922, -0.09350967407226562, -0.09076404571533203, -0.08801841735839844, -0.08527278900146484, -0.08252716064453125, -0.07978153228759766, -0.07703590393066406, -0.07429027557373047, -0.07154464721679688, -0.06879901885986328, -0.06605339050292969, -0.0633077621459961, -0.0605621337890625, -0.057816505432128906, -0.05507087707519531, -0.05232524871826172, -0.049579620361328125, -0.04683399200439453, -0.04408836364746094, -0.041342735290527344, -0.03859710693359375, -0.035851478576660156, -0.03310585021972656, -0.03036022186279297, -0.027614593505859375, -0.02486896514892578, -0.022123336791992188, -0.019377708435058594, -0.016632080078125, -0.013886451721191406, -0.011140823364257812, -0.008395195007324219, -0.005649566650390625, -0.0029039382934570312, -0.0001583099365234375, 0.0025873184204101562, 0.00533294677734375, 0.008078575134277344, 0.010824203491210938, 0.013569831848144531, 0.016315460205078125, 0.01906108856201172, 0.021806716918945312, 0.024552345275878906, 0.0272979736328125, 0.030043601989746094, 0.03278923034667969, 0.03553485870361328, 0.038280487060546875, 0.04102611541748047, 0.04377174377441406, 0.046517372131347656, 0.04926300048828125, 0.052008628845214844, 0.05475425720214844, 0.05749988555908203, 0.060245513916015625, 0.06299114227294922, 0.06573677062988281, 0.0684823989868164, 0.07122802734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 4.0, 11.0, 11.0, 18.0, 29.0, 47.0, 54.0, 87.0, 112.0, 199.0, 290.0, 406.0, 709.0, 1091.0, 1743.0, 2864.0, 4800.0, 8434.0, 14440.0, 25840.0, 48428.0, 98566.0, 260695.0, 331217.0, 120553.0, 57077.0, 30296.0, 16731.0, 9570.0, 5557.0, 3321.0, 2005.0, 1207.0, 731.0, 484.0, 302.0, 197.0, 133.0, 89.0, 63.0, 47.0, 24.0, 19.0, 12.0, 15.0, 10.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.3720703125, -0.3608360290527344, -0.34960174560546875, -0.3383674621582031, -0.3271331787109375, -0.3158988952636719, -0.30466461181640625, -0.2934303283691406, -0.282196044921875, -0.2709617614746094, -0.25972747802734375, -0.24849319458007812, -0.2372589111328125, -0.22602462768554688, -0.21479034423828125, -0.20355606079101562, -0.19232177734375, -0.18108749389648438, -0.16985321044921875, -0.15861892700195312, -0.1473846435546875, -0.13615036010742188, -0.12491607666015625, -0.11368179321289062, -0.102447509765625, -0.09121322631835938, -0.07997894287109375, -0.06874465942382812, -0.0575103759765625, -0.046276092529296875, -0.03504180908203125, -0.023807525634765625, -0.0125732421875, -0.001338958740234375, 0.00989532470703125, 0.021129608154296875, 0.0323638916015625, 0.043598175048828125, 0.05483245849609375, 0.06606674194335938, 0.077301025390625, 0.08853530883789062, 0.09976959228515625, 0.11100387573242188, 0.1222381591796875, 0.13347244262695312, 0.14470672607421875, 0.15594100952148438, 0.16717529296875, 0.17840957641601562, 0.18964385986328125, 0.20087814331054688, 0.2121124267578125, 0.22334671020507812, 0.23458099365234375, 0.24581527709960938, 0.257049560546875, 0.2682838439941406, 0.27951812744140625, 0.2907524108886719, 0.3019866943359375, 0.3132209777832031, 0.32445526123046875, 0.3356895446777344, 0.346923828125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 6.0, 2.0, 9.0, 3.0, 9.0, 13.0, 9.0, 19.0, 25.0, 22.0, 24.0, 21.0, 22.0, 36.0, 30.0, 33.0, 43.0, 27.0, 31.0, 40.0, 44.0, 47.0, 38.0, 46.0, 49.0, 40.0, 34.0, 34.0, 20.0, 30.0, 24.0, 20.0, 25.0, 24.0, 17.0, 18.0, 13.0, 13.0, 11.0, 6.0, 6.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2222900390625, -0.2153778076171875, -0.208465576171875, -0.2015533447265625, -0.19464111328125, -0.1877288818359375, -0.180816650390625, -0.1739044189453125, -0.1669921875, -0.1600799560546875, -0.153167724609375, -0.1462554931640625, -0.13934326171875, -0.1324310302734375, -0.125518798828125, -0.1186065673828125, -0.1116943359375, -0.1047821044921875, -0.097869873046875, -0.0909576416015625, -0.08404541015625, -0.0771331787109375, -0.070220947265625, -0.0633087158203125, -0.056396484375, -0.0494842529296875, -0.042572021484375, -0.0356597900390625, -0.02874755859375, -0.0218353271484375, -0.014923095703125, -0.0080108642578125, -0.0010986328125, 0.0058135986328125, 0.012725830078125, 0.0196380615234375, 0.02655029296875, 0.0334625244140625, 0.040374755859375, 0.0472869873046875, 0.05419921875, 0.0611114501953125, 0.068023681640625, 0.0749359130859375, 0.08184814453125, 0.0887603759765625, 0.095672607421875, 0.1025848388671875, 0.1094970703125, 0.1164093017578125, 0.123321533203125, 0.1302337646484375, 0.13714599609375, 0.1440582275390625, 0.150970458984375, 0.1578826904296875, 0.164794921875, 0.1717071533203125, 0.178619384765625, 0.1855316162109375, 0.19244384765625, 0.1993560791015625, 0.206268310546875, 0.2131805419921875, 0.2200927734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 7.0, 4.0, 11.0, 7.0, 9.0, 15.0, 14.0, 21.0, 23.0, 35.0, 63.0, 79.0, 97.0, 194.0, 314.0, 594.0, 1408.0, 4040.0, 14832.0, 96538.0, 827530.0, 82638.0, 13451.0, 3832.0, 1347.0, 599.0, 284.0, 181.0, 102.0, 70.0, 47.0, 42.0, 28.0, 18.0, 14.0, 13.0, 12.0, 10.0, 9.0, 5.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.2060546875, -0.1995067596435547, -0.19295883178710938, -0.18641090393066406, -0.17986297607421875, -0.17331504821777344, -0.16676712036132812, -0.1602191925048828, -0.1536712646484375, -0.1471233367919922, -0.14057540893554688, -0.13402748107910156, -0.12747955322265625, -0.12093162536621094, -0.11438369750976562, -0.10783576965332031, -0.101287841796875, -0.09473991394042969, -0.08819198608398438, -0.08164405822753906, -0.07509613037109375, -0.06854820251464844, -0.062000274658203125, -0.05545234680175781, -0.0489044189453125, -0.04235649108886719, -0.035808563232421875, -0.029260635375976562, -0.02271270751953125, -0.016164779663085938, -0.009616851806640625, -0.0030689239501953125, 0.00347900390625, 0.010026931762695312, 0.016574859619140625, 0.023122787475585938, 0.02967071533203125, 0.03621864318847656, 0.042766571044921875, 0.04931449890136719, 0.0558624267578125, 0.06241035461425781, 0.06895828247070312, 0.07550621032714844, 0.08205413818359375, 0.08860206604003906, 0.09514999389648438, 0.10169792175292969, 0.108245849609375, 0.11479377746582031, 0.12134170532226562, 0.12788963317871094, 0.13443756103515625, 0.14098548889160156, 0.14753341674804688, 0.1540813446044922, 0.1606292724609375, 0.1671772003173828, 0.17372512817382812, 0.18027305603027344, 0.18682098388671875, 0.19336891174316406, 0.19991683959960938, 0.2064647674560547, 0.2130126953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 9.0, 5.0, 9.0, 12.0, 17.0, 33.0, 65.0, 116.0, 203.0, 190.0, 132.0, 85.0, 38.0, 26.0, 16.0, 11.0, 8.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.199411392211914e-05, -2.1401792764663696e-05, -2.0809471607208252e-05, -2.0217150449752808e-05, -1.9624829292297363e-05, -1.903250813484192e-05, -1.8440186977386475e-05, -1.784786581993103e-05, -1.7255544662475586e-05, -1.666322350502014e-05, -1.6070902347564697e-05, -1.5478581190109253e-05, -1.4886260032653809e-05, -1.4293938875198364e-05, -1.370161771774292e-05, -1.3109296560287476e-05, -1.2516975402832031e-05, -1.1924654245376587e-05, -1.1332333087921143e-05, -1.0740011930465698e-05, -1.0147690773010254e-05, -9.55536961555481e-06, -8.963048458099365e-06, -8.370727300643921e-06, -7.778406143188477e-06, -7.186084985733032e-06, -6.593763828277588e-06, -6.0014426708221436e-06, -5.409121513366699e-06, -4.816800355911255e-06, -4.2244791984558105e-06, -3.632158041000366e-06, -3.039836883544922e-06, -2.4475157260894775e-06, -1.8551945686340332e-06, -1.2628734111785889e-06, -6.705522537231445e-07, -7.82310962677002e-08, 5.140900611877441e-07, 1.1064112186431885e-06, 1.6987323760986328e-06, 2.291053533554077e-06, 2.8833746910095215e-06, 3.475695848464966e-06, 4.06801700592041e-06, 4.6603381633758545e-06, 5.252659320831299e-06, 5.844980478286743e-06, 6.4373016357421875e-06, 7.029622793197632e-06, 7.621943950653076e-06, 8.21426510810852e-06, 8.806586265563965e-06, 9.39890742301941e-06, 9.991228580474854e-06, 1.0583549737930298e-05, 1.1175870895385742e-05, 1.1768192052841187e-05, 1.2360513210296631e-05, 1.2952834367752075e-05, 1.354515552520752e-05, 1.4137476682662964e-05, 1.4729797840118408e-05, 1.5322118997573853e-05, 1.5914440155029297e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 10.0, 9.0, 11.0, 17.0, 25.0, 36.0, 44.0, 68.0, 101.0, 182.0, 301.0, 626.0, 1515.0, 4149.0, 12867.0, 51499.0, 606155.0, 317699.0, 37328.0, 10051.0, 3293.0, 1280.0, 545.0, 284.0, 149.0, 82.0, 64.0, 35.0, 38.0, 28.0, 16.0, 7.0, 14.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1759033203125, -0.17055702209472656, -0.16521072387695312, -0.1598644256591797, -0.15451812744140625, -0.1491718292236328, -0.14382553100585938, -0.13847923278808594, -0.1331329345703125, -0.12778663635253906, -0.12244033813476562, -0.11709403991699219, -0.11174774169921875, -0.10640144348144531, -0.10105514526367188, -0.09570884704589844, -0.090362548828125, -0.08501625061035156, -0.07966995239257812, -0.07432365417480469, -0.06897735595703125, -0.06363105773925781, -0.058284759521484375, -0.05293846130371094, -0.0475921630859375, -0.04224586486816406, -0.036899566650390625, -0.03155326843261719, -0.02620697021484375, -0.020860671997070312, -0.015514373779296875, -0.010168075561523438, -0.00482177734375, 0.0005245208740234375, 0.005870819091796875, 0.011217117309570312, 0.01656341552734375, 0.021909713745117188, 0.027256011962890625, 0.03260231018066406, 0.0379486083984375, 0.04329490661621094, 0.048641204833984375, 0.05398750305175781, 0.05933380126953125, 0.06468009948730469, 0.07002639770507812, 0.07537269592285156, 0.080718994140625, 0.08606529235839844, 0.09141159057617188, 0.09675788879394531, 0.10210418701171875, 0.10745048522949219, 0.11279678344726562, 0.11814308166503906, 0.1234893798828125, 0.12883567810058594, 0.13418197631835938, 0.1395282745361328, 0.14487457275390625, 0.1502208709716797, 0.15556716918945312, 0.16091346740722656, 0.166259765625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 12.0, 19.0, 25.0, 22.0, 24.0, 57.0, 90.0, 128.0, 176.0, 145.0, 105.0, 66.0, 47.0, 27.0, 22.0, 12.0, 8.0, 7.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10333251953125, -0.10016822814941406, -0.09700393676757812, -0.09383964538574219, -0.09067535400390625, -0.08751106262207031, -0.08434677124023438, -0.08118247985839844, -0.0780181884765625, -0.07485389709472656, -0.07168960571289062, -0.06852531433105469, -0.06536102294921875, -0.06219673156738281, -0.059032440185546875, -0.05586814880371094, -0.052703857421875, -0.04953956604003906, -0.046375274658203125, -0.04321098327636719, -0.04004669189453125, -0.03688240051269531, -0.033718109130859375, -0.030553817749023438, -0.0273895263671875, -0.024225234985351562, -0.021060943603515625, -0.017896652221679688, -0.01473236083984375, -0.011568069458007812, -0.008403778076171875, -0.0052394866943359375, -0.0020751953125, 0.0010890960693359375, 0.004253387451171875, 0.0074176788330078125, 0.01058197021484375, 0.013746261596679688, 0.016910552978515625, 0.020074844360351562, 0.0232391357421875, 0.026403427124023438, 0.029567718505859375, 0.03273200988769531, 0.03589630126953125, 0.03906059265136719, 0.042224884033203125, 0.04538917541503906, 0.048553466796875, 0.05171775817871094, 0.054882049560546875, 0.05804634094238281, 0.06121063232421875, 0.06437492370605469, 0.06753921508789062, 0.07070350646972656, 0.0738677978515625, 0.07703208923339844, 0.08019638061523438, 0.08336067199707031, 0.08652496337890625, 0.08968925476074219, 0.09285354614257812, 0.09601783752441406, 0.09918212890625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 11.0, 25.0, 29.0, 71.0, 105.0, 320.0, 205.0, 110.0, 59.0, 23.0, 17.0, 12.0, 9.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.078115701675415, -2.9228432178497314, -2.7675704956054688, -2.612298011779785, -2.4570255279541016, -2.301752805709839, -2.1464803218841553, -1.9912077188491821, -1.835935115814209, -1.6806625127792358, -1.5253899097442627, -1.370117425918579, -1.214844822883606, -1.0595722198486328, -0.9042996764183044, -0.7490271329879761, -0.5937545299530029, -0.4384819567203522, -0.2832093834877014, -0.12793681025505066, 0.027335762977600098, 0.18260836601257324, 0.3378809094429016, 0.49315345287323, 0.6484260559082031, 0.8036986589431763, 0.9589712023735046, 1.114243745803833, 1.2695163488388062, 1.4247889518737793, 1.580061435699463, 1.735334038734436, 1.89060640335083, 2.0458788871765137, 2.2011516094207764, 2.35642409324646, 2.5116968154907227, 2.6669692993164062, 2.82224178314209, 2.9775142669677734, 3.132786989212036, 3.2880594730377197, 3.4433321952819824, 3.598604679107666, 3.7538771629333496, 3.9091498851776123, 4.064422607421875, 4.219695091247559, 4.374967575073242, 4.530240058898926, 4.685512542724609, 4.840785503387451, 4.996057987213135, 5.151330471038818, 5.306602954864502, 5.4618754386901855, 5.617148399353027, 5.772420883178711, 5.9276933670043945, 6.082966327667236, 6.23823881149292, 6.3935112953186035, 6.548783779144287, 6.704056262969971, 6.859328746795654]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 3.0, 15.0, 17.0, 16.0, 32.0, 33.0, 44.0, 57.0, 56.0, 61.0, 53.0, 64.0, 71.0, 76.0, 82.0, 59.0, 50.0, 43.0, 33.0, 24.0, 24.0, 24.0, 18.0, 12.0, 6.0, 8.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.226388454437256, -2.145380973815918, -2.06437349319458, -1.9833661317825317, -1.9023586511611938, -1.8213512897491455, -1.7403438091278076, -1.6593363285064697, -1.5783288478851318, -1.497321367263794, -1.4163140058517456, -1.3353065252304077, -1.2542990446090698, -1.1732916831970215, -1.0922842025756836, -1.0112767219543457, -0.9302693605422974, -0.8492619395256042, -0.7682544589042664, -0.6872470378875732, -0.6062395572662354, -0.5252321362495422, -0.4442247152328491, -0.36321723461151123, -0.2822098135948181, -0.2012023627758026, -0.1201949268579483, -0.039187490940093994, 0.04181995987892151, 0.12282741069793701, 0.20383483171463013, 0.284842312335968, 0.36584973335266113, 0.44685718417167664, 0.5278646349906921, 0.6088720560073853, 0.6898795366287231, 0.7708869576454163, 0.8518943786621094, 0.9329018592834473, 1.0139093399047852, 1.094916820526123, 1.1759241819381714, 1.2569316625595093, 1.3379391431808472, 1.4189465045928955, 1.4999539852142334, 1.5809614658355713, 1.6619688272476196, 1.7429763078689575, 1.8239836692810059, 1.9049911499023438, 1.9859986305236816, 2.0670061111450195, 2.1480135917663574, 2.2290210723876953, 2.310028314590454, 2.391035795211792, 2.47204327583313, 2.5530505180358887, 2.6340579986572266, 2.7150654792785645, 2.7960729598999023, 2.8770804405212402, 2.958087921142578]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 5.0, 8.0, 14.0, 25.0, 38.0, 69.0, 107.0, 243.0, 520.0, 1447.0, 6470.0, 106810.0, 4064131.0, 11380.0, 1930.0, 572.0, 240.0, 125.0, 61.0, 36.0, 16.0, 14.0, 11.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.125, -4.013946533203125, -3.90289306640625, -3.791839599609375, -3.6807861328125, -3.569732666015625, -3.45867919921875, -3.347625732421875, -3.236572265625, -3.125518798828125, -3.01446533203125, -2.903411865234375, -2.7923583984375, -2.681304931640625, -2.57025146484375, -2.459197998046875, -2.34814453125, -2.237091064453125, -2.12603759765625, -2.014984130859375, -1.9039306640625, -1.792877197265625, -1.68182373046875, -1.570770263671875, -1.459716796875, -1.348663330078125, -1.23760986328125, -1.126556396484375, -1.0155029296875, -0.904449462890625, -0.79339599609375, -0.682342529296875, -0.5712890625, -0.460235595703125, -0.34918212890625, -0.238128662109375, -0.1270751953125, -0.016021728515625, 0.09503173828125, 0.206085205078125, 0.317138671875, 0.428192138671875, 0.53924560546875, 0.650299072265625, 0.7613525390625, 0.872406005859375, 0.98345947265625, 1.094512939453125, 1.20556640625, 1.316619873046875, 1.42767333984375, 1.538726806640625, 1.6497802734375, 1.760833740234375, 1.87188720703125, 1.982940673828125, 2.093994140625, 2.205047607421875, 2.31610107421875, 2.427154541015625, 2.5382080078125, 2.649261474609375, 2.76031494140625, 2.871368408203125, 2.982421875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 7.0, 9.0, 22.0, 31.0, 42.0, 87.0, 106.0, 145.0, 150.0, 130.0, 101.0, 67.0, 32.0, 22.0, 9.0, 14.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12005615234375, -0.11682701110839844, -0.11359786987304688, -0.11036872863769531, -0.10713958740234375, -0.10391044616699219, -0.10068130493164062, -0.09745216369628906, -0.0942230224609375, -0.09099388122558594, -0.08776473999023438, -0.08453559875488281, -0.08130645751953125, -0.07807731628417969, -0.07484817504882812, -0.07161903381347656, -0.068389892578125, -0.06516075134277344, -0.061931610107421875, -0.05870246887207031, -0.05547332763671875, -0.05224418640136719, -0.049015045166015625, -0.04578590393066406, -0.0425567626953125, -0.03932762145996094, -0.036098480224609375, -0.03286933898925781, -0.02964019775390625, -0.026411056518554688, -0.023181915283203125, -0.019952774047851562, -0.0167236328125, -0.013494491577148438, -0.010265350341796875, -0.0070362091064453125, -0.00380706787109375, -0.0005779266357421875, 0.002651214599609375, 0.0058803558349609375, 0.0091094970703125, 0.012338638305664062, 0.015567779541015625, 0.018796920776367188, 0.02202606201171875, 0.025255203247070312, 0.028484344482421875, 0.03171348571777344, 0.034942626953125, 0.03817176818847656, 0.041400909423828125, 0.04463005065917969, 0.04785919189453125, 0.05108833312988281, 0.054317474365234375, 0.05754661560058594, 0.0607757568359375, 0.06400489807128906, 0.06723403930664062, 0.07046318054199219, 0.07369232177734375, 0.07692146301269531, 0.08015060424804688, 0.08337974548339844, 0.08660888671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 8.0, 14.0, 20.0, 21.0, 44.0, 48.0, 67.0, 108.0, 146.0, 220.0, 321.0, 525.0, 776.0, 1322.0, 2020.0, 3521.0, 5942.0, 10886.0, 21800.0, 52226.0, 283616.0, 3685689.0, 70165.0, 25696.0, 12512.0, 6486.0, 3777.0, 2266.0, 1463.0, 832.0, 598.0, 386.0, 245.0, 173.0, 108.0, 78.0, 50.0, 33.0, 17.0, 11.0, 12.0, 10.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.8154296875, -0.7908172607421875, -0.766204833984375, -0.7415924072265625, -0.71697998046875, -0.6923675537109375, -0.667755126953125, -0.6431427001953125, -0.6185302734375, -0.5939178466796875, -0.569305419921875, -0.5446929931640625, -0.52008056640625, -0.4954681396484375, -0.470855712890625, -0.4462432861328125, -0.421630859375, -0.3970184326171875, -0.372406005859375, -0.3477935791015625, -0.32318115234375, -0.2985687255859375, -0.273956298828125, -0.2493438720703125, -0.2247314453125, -0.2001190185546875, -0.175506591796875, -0.1508941650390625, -0.12628173828125, -0.1016693115234375, -0.077056884765625, -0.0524444580078125, -0.02783203125, -0.0032196044921875, 0.021392822265625, 0.0460052490234375, 0.07061767578125, 0.0952301025390625, 0.119842529296875, 0.1444549560546875, 0.1690673828125, 0.1936798095703125, 0.218292236328125, 0.2429046630859375, 0.26751708984375, 0.2921295166015625, 0.316741943359375, 0.3413543701171875, 0.365966796875, 0.3905792236328125, 0.415191650390625, 0.4398040771484375, 0.46441650390625, 0.4890289306640625, 0.513641357421875, 0.5382537841796875, 0.5628662109375, 0.5874786376953125, 0.612091064453125, 0.6367034912109375, 0.66131591796875, 0.6859283447265625, 0.710540771484375, 0.7351531982421875, 0.759765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 2.0, 1.0, 8.0, 4.0, 6.0, 8.0, 9.0, 9.0, 11.0, 19.0, 21.0, 28.0, 25.0, 27.0, 50.0, 71.0, 179.0, 3225.0, 112.0, 71.0, 51.0, 24.0, 21.0, 17.0, 17.0, 10.0, 10.0, 6.0, 4.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.220703125, -0.21479415893554688, -0.20888519287109375, -0.20297622680664062, -0.1970672607421875, -0.19115829467773438, -0.18524932861328125, -0.17934036254882812, -0.173431396484375, -0.16752243041992188, -0.16161346435546875, -0.15570449829101562, -0.1497955322265625, -0.14388656616210938, -0.13797760009765625, -0.13206863403320312, -0.12615966796875, -0.12025070190429688, -0.11434173583984375, -0.10843276977539062, -0.1025238037109375, -0.09661483764648438, -0.09070587158203125, -0.08479690551757812, -0.078887939453125, -0.07297897338867188, -0.06707000732421875, -0.061161041259765625, -0.0552520751953125, -0.049343109130859375, -0.04343414306640625, -0.037525177001953125, -0.0316162109375, -0.025707244873046875, -0.01979827880859375, -0.013889312744140625, -0.0079803466796875, -0.002071380615234375, 0.00383758544921875, 0.009746551513671875, 0.015655517578125, 0.021564483642578125, 0.02747344970703125, 0.033382415771484375, 0.0392913818359375, 0.045200347900390625, 0.05110931396484375, 0.057018280029296875, 0.06292724609375, 0.06883621215820312, 0.07474517822265625, 0.08065414428710938, 0.0865631103515625, 0.09247207641601562, 0.09838104248046875, 0.10429000854492188, 0.110198974609375, 0.11610794067382812, 0.12201690673828125, 0.12792587280273438, 0.1338348388671875, 0.13974380493164062, 0.14565277099609375, 0.15156173706054688, 0.157470703125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 4.0, 8.0, 7.0, 5.0, 6.0, 9.0, 9.0, 13.0, 18.0, 31.0, 22.0, 29.0, 30.0, 64.0, 98.0, 139.0, 137.0, 109.0, 63.0, 48.0, 42.0, 27.0, 14.0, 20.0, 10.0, 11.0, 5.0, 4.0, 5.0, 7.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.8397519588470459, -0.8187509179115295, -0.7977498173713684, -0.776748776435852, -0.7557476758956909, -0.7347466349601746, -0.7137455940246582, -0.6927444934844971, -0.6717434525489807, -0.6507424116134644, -0.6297413110733032, -0.6087402701377869, -0.5877391695976257, -0.5667381286621094, -0.5457370281219482, -0.5247359871864319, -0.5037349462509155, -0.4827338755130768, -0.46173280477523804, -0.4407317638397217, -0.41973069310188293, -0.3987296223640442, -0.37772855162620544, -0.3567274808883667, -0.33572638034820557, -0.3147253096103668, -0.2937242388725281, -0.2727231979370117, -0.251722127199173, -0.23072105646133423, -0.20971998572349548, -0.18871892988681793, -0.16771787405014038, -0.14671680331230164, -0.12571574747562408, -0.10471467673778534, -0.08371361345052719, -0.06271255016326904, -0.0417114794254303, -0.020710423588752747, 0.00029064714908599854, 0.021291712298989296, 0.04229277744889259, 0.06329384446144104, 0.08429490774869919, 0.10529597103595734, 0.12629704177379608, 0.14729809761047363, 0.16829916834831238, 0.18930023908615112, 0.21030129492282867, 0.23130236566066742, 0.25230342149734497, 0.2733044922351837, 0.29430556297302246, 0.3153066039085388, 0.33630770444869995, 0.3573087751865387, 0.37830984592437744, 0.3993108868598938, 0.42031195759773254, 0.4413130283355713, 0.46231409907341003, 0.4833151698112488, 0.5043162107467651]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 8.0, 15.0, 27.0, 16.0, 16.0, 33.0, 26.0, 36.0, 27.0, 45.0, 42.0, 36.0, 50.0, 51.0, 48.0, 51.0, 42.0, 45.0, 28.0, 51.0, 47.0, 35.0, 36.0, 23.0, 27.0, 31.0, 20.0, 8.0, 11.0, 11.0, 9.0, 8.0, 3.0, 9.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6068528294563293, -0.5886223316192627, -0.5703918933868408, -0.5521613955497742, -0.5339308977127075, -0.5157004594802856, -0.497469961643219, -0.47923949360847473, -0.46100902557373047, -0.4427785575389862, -0.42454808950424194, -0.4063175916671753, -0.38808712363243103, -0.36985665559768677, -0.3516261577606201, -0.33339568972587585, -0.3151652216911316, -0.29693475365638733, -0.27870428562164307, -0.2604737877845764, -0.24224331974983215, -0.2240128517150879, -0.20578236877918243, -0.18755188584327698, -0.16932141780853271, -0.15109094977378845, -0.132860466837883, -0.11462999135255814, -0.09639951586723328, -0.07816904038190842, -0.05993856489658356, -0.0417080819606781, -0.023477613925933838, -0.005247138440608978, 0.012983337044715881, 0.03121381253004074, 0.0494442880153656, 0.06767476350069046, 0.08590523898601532, 0.10413572192192078, 0.12236618995666504, 0.1405966579914093, 0.15882714092731476, 0.17705762386322021, 0.19528809189796448, 0.21351855993270874, 0.2317490428686142, 0.24997952580451965, 0.2682099938392639, 0.2864404618740082, 0.30467092990875244, 0.3229014277458191, 0.34113189578056335, 0.3593623638153076, 0.37759286165237427, 0.39582332968711853, 0.4140537977218628, 0.43228426575660706, 0.4505147337913513, 0.46874523162841797, 0.48697569966316223, 0.5052061676979065, 0.5234366655349731, 0.541667103767395, 0.5598976016044617]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 7.0, 11.0, 12.0, 25.0, 23.0, 37.0, 61.0, 75.0, 117.0, 182.0, 226.0, 423.0, 645.0, 1140.0, 2200.0, 4907.0, 15388.0, 65066.0, 530132.0, 355564.0, 50553.0, 12560.0, 4368.0, 2024.0, 1067.0, 582.0, 380.0, 236.0, 144.0, 120.0, 82.0, 44.0, 38.0, 30.0, 22.0, 19.0, 11.0, 7.0, 5.0, 3.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.79541015625, -0.7704925537109375, -0.745574951171875, -0.7206573486328125, -0.69573974609375, -0.6708221435546875, -0.645904541015625, -0.6209869384765625, -0.5960693359375, -0.5711517333984375, -0.546234130859375, -0.5213165283203125, -0.49639892578125, -0.4714813232421875, -0.446563720703125, -0.4216461181640625, -0.396728515625, -0.3718109130859375, -0.346893310546875, -0.3219757080078125, -0.29705810546875, -0.2721405029296875, -0.247222900390625, -0.2223052978515625, -0.1973876953125, -0.1724700927734375, -0.147552490234375, -0.1226348876953125, -0.09771728515625, -0.0727996826171875, -0.047882080078125, -0.0229644775390625, 0.001953125, 0.0268707275390625, 0.051788330078125, 0.0767059326171875, 0.10162353515625, 0.1265411376953125, 0.151458740234375, 0.1763763427734375, 0.2012939453125, 0.2262115478515625, 0.251129150390625, 0.2760467529296875, 0.30096435546875, 0.3258819580078125, 0.350799560546875, 0.3757171630859375, 0.400634765625, 0.4255523681640625, 0.450469970703125, 0.4753875732421875, 0.50030517578125, 0.5252227783203125, 0.550140380859375, 0.5750579833984375, 0.5999755859375, 0.6248931884765625, 0.649810791015625, 0.6747283935546875, 0.69964599609375, 0.7245635986328125, 0.749481201171875, 0.7743988037109375, 0.79931640625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 11.0, 12.0, 21.0, 47.0, 65.0, 99.0, 116.0, 126.0, 121.0, 117.0, 83.0, 74.0, 40.0, 27.0, 11.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1168212890625, -0.11373233795166016, -0.11064338684082031, -0.10755443572998047, -0.10446548461914062, -0.10137653350830078, -0.09828758239746094, -0.0951986312866211, -0.09210968017578125, -0.0890207290649414, -0.08593177795410156, -0.08284282684326172, -0.07975387573242188, -0.07666492462158203, -0.07357597351074219, -0.07048702239990234, -0.0673980712890625, -0.06430912017822266, -0.06122016906738281, -0.05813121795654297, -0.055042266845703125, -0.05195331573486328, -0.04886436462402344, -0.045775413513183594, -0.04268646240234375, -0.039597511291503906, -0.03650856018066406, -0.03341960906982422, -0.030330657958984375, -0.02724170684814453, -0.024152755737304688, -0.021063804626464844, -0.017974853515625, -0.014885902404785156, -0.011796951293945312, -0.008708000183105469, -0.005619049072265625, -0.0025300979614257812, 0.0005588531494140625, 0.0036478042602539062, 0.00673675537109375, 0.009825706481933594, 0.012914657592773438, 0.01600360870361328, 0.019092559814453125, 0.02218151092529297, 0.025270462036132812, 0.028359413146972656, 0.0314483642578125, 0.034537315368652344, 0.03762626647949219, 0.04071521759033203, 0.043804168701171875, 0.04689311981201172, 0.04998207092285156, 0.053071022033691406, 0.05615997314453125, 0.059248924255371094, 0.06233787536621094, 0.06542682647705078, 0.06851577758789062, 0.07160472869873047, 0.07469367980957031, 0.07778263092041016, 0.08087158203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 0.0, 4.0, 8.0, 6.0, 11.0, 13.0, 13.0, 31.0, 23.0, 43.0, 72.0, 112.0, 168.0, 189.0, 289.0, 469.0, 782.0, 1283.0, 2182.0, 3889.0, 7476.0, 15629.0, 34308.0, 85870.0, 295859.0, 409117.0, 109520.0, 42150.0, 18638.0, 9016.0, 4801.0, 2572.0, 1426.0, 918.0, 565.0, 363.0, 226.0, 158.0, 116.0, 76.0, 36.0, 31.0, 27.0, 20.0, 17.0, 11.0, 5.0, 8.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.42333984375, -0.4101600646972656, -0.39698028564453125, -0.3838005065917969, -0.3706207275390625, -0.3574409484863281, -0.34426116943359375, -0.3310813903808594, -0.317901611328125, -0.3047218322753906, -0.29154205322265625, -0.2783622741699219, -0.2651824951171875, -0.2520027160644531, -0.23882293701171875, -0.22564315795898438, -0.21246337890625, -0.19928359985351562, -0.18610382080078125, -0.17292404174804688, -0.1597442626953125, -0.14656448364257812, -0.13338470458984375, -0.12020492553710938, -0.107025146484375, -0.09384536743164062, -0.08066558837890625, -0.06748580932617188, -0.0543060302734375, -0.041126251220703125, -0.02794647216796875, -0.014766693115234375, -0.0015869140625, 0.011592864990234375, 0.02477264404296875, 0.037952423095703125, 0.0511322021484375, 0.06431198120117188, 0.07749176025390625, 0.09067153930664062, 0.103851318359375, 0.11703109741210938, 0.13021087646484375, 0.14339065551757812, 0.1565704345703125, 0.16975021362304688, 0.18292999267578125, 0.19610977172851562, 0.20928955078125, 0.22246932983398438, 0.23564910888671875, 0.24882888793945312, 0.2620086669921875, 0.2751884460449219, 0.28836822509765625, 0.3015480041503906, 0.314727783203125, 0.3279075622558594, 0.34108734130859375, 0.3542671203613281, 0.3674468994140625, 0.3806266784667969, 0.39380645751953125, 0.4069862365722656, 0.420166015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 10.0, 9.0, 13.0, 27.0, 27.0, 32.0, 42.0, 42.0, 52.0, 54.0, 53.0, 63.0, 59.0, 59.0, 82.0, 53.0, 54.0, 38.0, 42.0, 40.0, 22.0, 26.0, 16.0, 16.0, 20.0, 11.0, 7.0, 11.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32080078125, -0.31076812744140625, -0.3007354736328125, -0.29070281982421875, -0.280670166015625, -0.27063751220703125, -0.2606048583984375, -0.25057220458984375, -0.24053955078125, -0.23050689697265625, -0.2204742431640625, -0.21044158935546875, -0.200408935546875, -0.19037628173828125, -0.1803436279296875, -0.17031097412109375, -0.1602783203125, -0.15024566650390625, -0.1402130126953125, -0.13018035888671875, -0.120147705078125, -0.11011505126953125, -0.1000823974609375, -0.09004974365234375, -0.08001708984375, -0.06998443603515625, -0.0599517822265625, -0.04991912841796875, -0.039886474609375, -0.02985382080078125, -0.0198211669921875, -0.00978851318359375, 0.000244140625, 0.01027679443359375, 0.0203094482421875, 0.03034210205078125, 0.040374755859375, 0.05040740966796875, 0.0604400634765625, 0.07047271728515625, 0.08050537109375, 0.09053802490234375, 0.1005706787109375, 0.11060333251953125, 0.120635986328125, 0.13066864013671875, 0.1407012939453125, 0.15073394775390625, 0.1607666015625, 0.17079925537109375, 0.1808319091796875, 0.19086456298828125, 0.200897216796875, 0.21092987060546875, 0.2209625244140625, 0.23099517822265625, 0.24102783203125, 0.25106048583984375, 0.2610931396484375, 0.27112579345703125, 0.281158447265625, 0.29119110107421875, 0.3012237548828125, 0.31125640869140625, 0.3212890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 14.0, 15.0, 32.0, 43.0, 79.0, 154.0, 365.0, 1011.0, 4818.0, 67163.0, 946898.0, 23963.0, 2749.0, 653.0, 298.0, 132.0, 59.0, 45.0, 16.0, 15.0, 11.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.396240234375, -0.3827362060546875, -0.369232177734375, -0.3557281494140625, -0.34222412109375, -0.3287200927734375, -0.315216064453125, -0.3017120361328125, -0.2882080078125, -0.2747039794921875, -0.261199951171875, -0.2476959228515625, -0.23419189453125, -0.2206878662109375, -0.207183837890625, -0.1936798095703125, -0.18017578125, -0.1666717529296875, -0.153167724609375, -0.1396636962890625, -0.12615966796875, -0.1126556396484375, -0.099151611328125, -0.0856475830078125, -0.0721435546875, -0.0586395263671875, -0.045135498046875, -0.0316314697265625, -0.01812744140625, -0.0046234130859375, 0.008880615234375, 0.0223846435546875, 0.035888671875, 0.0493927001953125, 0.062896728515625, 0.0764007568359375, 0.08990478515625, 0.1034088134765625, 0.116912841796875, 0.1304168701171875, 0.1439208984375, 0.1574249267578125, 0.170928955078125, 0.1844329833984375, 0.19793701171875, 0.2114410400390625, 0.224945068359375, 0.2384490966796875, 0.251953125, 0.2654571533203125, 0.278961181640625, 0.2924652099609375, 0.30596923828125, 0.3194732666015625, 0.332977294921875, 0.3464813232421875, 0.3599853515625, 0.3734893798828125, 0.386993408203125, 0.4004974365234375, 0.41400146484375, 0.4275054931640625, 0.441009521484375, 0.4545135498046875, 0.468017578125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 9.0, 12.0, 19.0, 31.0, 90.0, 276.0, 292.0, 138.0, 55.0, 28.0, 11.0, 17.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.0411949157714844e-05, -3.947596997022629e-05, -3.853999078273773e-05, -3.7604011595249176e-05, -3.666803240776062e-05, -3.5732053220272064e-05, -3.479607403278351e-05, -3.386009484529495e-05, -3.2924115657806396e-05, -3.198813647031784e-05, -3.1052157282829285e-05, -3.011617809534073e-05, -2.9180198907852173e-05, -2.8244219720363617e-05, -2.730824053287506e-05, -2.6372261345386505e-05, -2.543628215789795e-05, -2.4500302970409393e-05, -2.3564323782920837e-05, -2.262834459543228e-05, -2.1692365407943726e-05, -2.075638622045517e-05, -1.9820407032966614e-05, -1.8884427845478058e-05, -1.7948448657989502e-05, -1.7012469470500946e-05, -1.607649028301239e-05, -1.5140511095523834e-05, -1.4204531908035278e-05, -1.3268552720546722e-05, -1.2332573533058167e-05, -1.139659434556961e-05, -1.0460615158081055e-05, -9.524635970592499e-06, -8.588656783103943e-06, -7.652677595615387e-06, -6.716698408126831e-06, -5.780719220638275e-06, -4.844740033149719e-06, -3.908760845661163e-06, -2.9727816581726074e-06, -2.0368024706840515e-06, -1.1008232831954956e-06, -1.648440957069397e-07, 7.711350917816162e-07, 1.7071142792701721e-06, 2.643093466758728e-06, 3.579072654247284e-06, 4.51505184173584e-06, 5.451031029224396e-06, 6.387010216712952e-06, 7.3229894042015076e-06, 8.258968591690063e-06, 9.19494777917862e-06, 1.0130926966667175e-05, 1.1066906154155731e-05, 1.2002885341644287e-05, 1.2938864529132843e-05, 1.3874843716621399e-05, 1.4810822904109955e-05, 1.574680209159851e-05, 1.6682781279087067e-05, 1.7618760466575623e-05, 1.855473965406418e-05, 1.9490718841552734e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 5.0, 6.0, 17.0, 20.0, 35.0, 29.0, 57.0, 73.0, 116.0, 177.0, 304.0, 486.0, 958.0, 1878.0, 4098.0, 12468.0, 63050.0, 799356.0, 135186.0, 19580.0, 5613.0, 2388.0, 1130.0, 604.0, 323.0, 203.0, 112.0, 84.0, 63.0, 43.0, 26.0, 14.0, 10.0, 12.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20556640625, -0.19886207580566406, -0.19215774536132812, -0.1854534149169922, -0.17874908447265625, -0.1720447540283203, -0.16534042358398438, -0.15863609313964844, -0.1519317626953125, -0.14522743225097656, -0.13852310180664062, -0.1318187713623047, -0.12511444091796875, -0.11841011047363281, -0.11170578002929688, -0.10500144958496094, -0.098297119140625, -0.09159278869628906, -0.08488845825195312, -0.07818412780761719, -0.07147979736328125, -0.06477546691894531, -0.058071136474609375, -0.05136680603027344, -0.0446624755859375, -0.03795814514160156, -0.031253814697265625, -0.024549484252929688, -0.01784515380859375, -0.011140823364257812, -0.004436492919921875, 0.0022678375244140625, 0.00897216796875, 0.015676498413085938, 0.022380828857421875, 0.029085159301757812, 0.03578948974609375, 0.04249382019042969, 0.049198150634765625, 0.05590248107910156, 0.0626068115234375, 0.06931114196777344, 0.07601547241210938, 0.08271980285644531, 0.08942413330078125, 0.09612846374511719, 0.10283279418945312, 0.10953712463378906, 0.116241455078125, 0.12294578552246094, 0.12965011596679688, 0.1363544464111328, 0.14305877685546875, 0.1497631072998047, 0.15646743774414062, 0.16317176818847656, 0.1698760986328125, 0.17658042907714844, 0.18328475952148438, 0.1899890899658203, 0.19669342041015625, 0.2033977508544922, 0.21010208129882812, 0.21680641174316406, 0.2235107421875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 10.0, 18.0, 24.0, 35.0, 58.0, 93.0, 161.0, 227.0, 140.0, 84.0, 45.0, 37.0, 21.0, 12.0, 5.0, 6.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.15918731689453125, -0.1548004150390625, -0.15041351318359375, -0.146026611328125, -0.14163970947265625, -0.1372528076171875, -0.13286590576171875, -0.12847900390625, -0.12409210205078125, -0.1197052001953125, -0.11531829833984375, -0.110931396484375, -0.10654449462890625, -0.1021575927734375, -0.09777069091796875, -0.0933837890625, -0.08899688720703125, -0.0846099853515625, -0.08022308349609375, -0.075836181640625, -0.07144927978515625, -0.0670623779296875, -0.06267547607421875, -0.05828857421875, -0.05390167236328125, -0.0495147705078125, -0.04512786865234375, -0.040740966796875, -0.03635406494140625, -0.0319671630859375, -0.02758026123046875, -0.023193359375, -0.01880645751953125, -0.0144195556640625, -0.01003265380859375, -0.005645751953125, -0.00125885009765625, 0.0031280517578125, 0.00751495361328125, 0.01190185546875, 0.01628875732421875, 0.0206756591796875, 0.02506256103515625, 0.029449462890625, 0.03383636474609375, 0.0382232666015625, 0.04261016845703125, 0.0469970703125, 0.05138397216796875, 0.0557708740234375, 0.06015777587890625, 0.064544677734375, 0.06893157958984375, 0.0733184814453125, 0.07770538330078125, 0.08209228515625, 0.08647918701171875, 0.0908660888671875, 0.09525299072265625, 0.099639892578125, 0.10402679443359375, 0.1084136962890625, 0.11280059814453125, 0.1171875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 10.0, 13.0, 14.0, 37.0, 53.0, 104.0, 190.0, 263.0, 139.0, 63.0, 45.0, 29.0, 6.0, 11.0, 10.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.006848096847534, -1.8968191146850586, -1.786790132522583, -1.6767610311508179, -1.5667320489883423, -1.4567030668258667, -1.3466739654541016, -1.236644983291626, -1.1266160011291504, -1.0165870189666748, -0.9065579771995544, -0.7965289354324341, -0.6864999532699585, -0.5764709711074829, -0.46644192934036255, -0.3564128875732422, -0.2463839054107666, -0.13635489344596863, -0.026325881481170654, 0.08370313048362732, 0.1937321424484253, 0.3037611246109009, 0.41379016637802124, 0.5238192081451416, 0.6338481903076172, 0.7438771724700928, 0.8539062142372131, 0.9639352560043335, 1.073964238166809, 1.1839932203292847, 1.2940223217010498, 1.4040513038635254, 1.5140800476074219, 1.6241090297698975, 1.734138011932373, 1.8441671133041382, 1.9541960954666138, 2.064225196838379, 2.1742541790008545, 2.28428316116333, 2.3943121433258057, 2.5043411254882812, 2.614370107650757, 2.7243990898132324, 2.834428310394287, 2.9444570541381836, 3.0544862747192383, 3.164515256881714, 3.2745442390441895, 3.384573221206665, 3.4946022033691406, 3.604631185531616, 3.714660167694092, 3.8246893882751465, 3.934718370437622, 4.044747352600098, 4.154776573181152, 4.264805793762207, 4.3748345375061035, 4.484863758087158, 4.594892501831055, 4.704921722412109, 4.814950466156006, 4.9249796867370605, 5.035008430480957]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 8.0, 4.0, 4.0, 11.0, 16.0, 11.0, 12.0, 12.0, 16.0, 23.0, 24.0, 16.0, 19.0, 37.0, 26.0, 33.0, 28.0, 41.0, 33.0, 45.0, 41.0, 54.0, 53.0, 36.0, 45.0, 28.0, 37.0, 36.0, 29.0, 23.0, 33.0, 20.0, 17.0, 19.0, 19.0, 16.0, 14.0, 13.0, 9.0, 13.0, 6.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.24226975440979, -1.1990463733673096, -1.1558228731155396, -1.1125993728637695, -1.069375991821289, -1.0261526107788086, -0.9829291105270386, -0.9397056698799133, -0.8964822292327881, -0.8532587885856628, -0.8100353479385376, -0.7668119072914124, -0.7235884666442871, -0.6803650259971619, -0.6371415853500366, -0.5939181447029114, -0.5506947040557861, -0.5074712634086609, -0.46424782276153564, -0.4210243821144104, -0.37780094146728516, -0.3345775008201599, -0.29135406017303467, -0.24813061952590942, -0.20490717887878418, -0.16168373823165894, -0.11846029758453369, -0.07523685693740845, -0.0320134162902832, 0.011210024356842041, 0.054433465003967285, 0.09765690565109253, 0.14088034629821777, 0.18410378694534302, 0.22732722759246826, 0.2705506682395935, 0.31377410888671875, 0.356997549533844, 0.40022099018096924, 0.4434444308280945, 0.4866678714752197, 0.529891312122345, 0.5731147527694702, 0.6163381934165955, 0.6595616340637207, 0.702785074710846, 0.7460085153579712, 0.7892319560050964, 0.8324553966522217, 0.8756788372993469, 0.9189022779464722, 0.9621257185935974, 1.0053491592407227, 1.0485725402832031, 1.0917960405349731, 1.1350195407867432, 1.1782429218292236, 1.221466302871704, 1.2646898031234741, 1.3079133033752441, 1.3511366844177246, 1.394360065460205, 1.437583565711975, 1.4808070659637451, 1.5240304470062256]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 1.0, 11.0, 10.0, 9.0, 16.0, 14.0, 32.0, 36.0, 54.0, 88.0, 128.0, 249.0, 452.0, 1005.0, 2335.0, 6942.0, 27984.0, 3997253.0, 133219.0, 16303.0, 4756.0, 1699.0, 759.0, 349.0, 202.0, 126.0, 68.0, 39.0, 42.0, 25.0, 21.0, 17.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.326171875, -1.2901611328125, -1.254150390625, -1.2181396484375, -1.18212890625, -1.1461181640625, -1.110107421875, -1.0740966796875, -1.0380859375, -1.0020751953125, -0.966064453125, -0.9300537109375, -0.89404296875, -0.8580322265625, -0.822021484375, -0.7860107421875, -0.75, -0.7139892578125, -0.677978515625, -0.6419677734375, -0.60595703125, -0.5699462890625, -0.533935546875, -0.4979248046875, -0.4619140625, -0.4259033203125, -0.389892578125, -0.3538818359375, -0.31787109375, -0.2818603515625, -0.245849609375, -0.2098388671875, -0.173828125, -0.1378173828125, -0.101806640625, -0.0657958984375, -0.02978515625, 0.0062255859375, 0.042236328125, 0.0782470703125, 0.1142578125, 0.1502685546875, 0.186279296875, 0.2222900390625, 0.25830078125, 0.2943115234375, 0.330322265625, 0.3663330078125, 0.40234375, 0.4383544921875, 0.474365234375, 0.5103759765625, 0.54638671875, 0.5823974609375, 0.618408203125, 0.6544189453125, 0.6904296875, 0.7264404296875, 0.762451171875, 0.7984619140625, 0.83447265625, 0.8704833984375, 0.906494140625, 0.9425048828125, 0.978515625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 14.0, 10.0, 25.0, 39.0, 47.0, 71.0, 77.0, 114.0, 128.0, 107.0, 91.0, 78.0, 64.0, 41.0, 38.0, 20.0, 15.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1156005859375, -0.11254310607910156, -0.10948562622070312, -0.10642814636230469, -0.10337066650390625, -0.10031318664550781, -0.09725570678710938, -0.09419822692871094, -0.0911407470703125, -0.08808326721191406, -0.08502578735351562, -0.08196830749511719, -0.07891082763671875, -0.07585334777832031, -0.07279586791992188, -0.06973838806152344, -0.066680908203125, -0.06362342834472656, -0.060565948486328125, -0.05750846862792969, -0.05445098876953125, -0.05139350891113281, -0.048336029052734375, -0.04527854919433594, -0.0422210693359375, -0.03916358947753906, -0.036106109619140625, -0.03304862976074219, -0.02999114990234375, -0.026933670043945312, -0.023876190185546875, -0.020818710327148438, -0.01776123046875, -0.014703750610351562, -0.011646270751953125, -0.008588790893554688, -0.00553131103515625, -0.0024738311767578125, 0.000583648681640625, 0.0036411285400390625, 0.0066986083984375, 0.009756088256835938, 0.012813568115234375, 0.015871047973632812, 0.01892852783203125, 0.021986007690429688, 0.025043487548828125, 0.028100967407226562, 0.031158447265625, 0.03421592712402344, 0.037273406982421875, 0.04033088684082031, 0.04338836669921875, 0.04644584655761719, 0.049503326416015625, 0.05256080627441406, 0.0556182861328125, 0.05867576599121094, 0.061733245849609375, 0.06479072570800781, 0.06784820556640625, 0.07090568542480469, 0.07396316528320312, 0.07702064514160156, 0.080078125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 5.0, 6.0, 11.0, 13.0, 24.0, 20.0, 29.0, 49.0, 65.0, 148.0, 229.0, 385.0, 832.0, 1659.0, 3799.0, 9132.0, 26004.0, 124202.0, 3920259.0, 75691.0, 19113.0, 6981.0, 2880.0, 1321.0, 621.0, 345.0, 181.0, 111.0, 53.0, 37.0, 27.0, 16.0, 5.0, 9.0, 4.0, 4.0, 2.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9306640625, -0.90435791015625, -0.8780517578125, -0.85174560546875, -0.825439453125, -0.79913330078125, -0.7728271484375, -0.74652099609375, -0.72021484375, -0.69390869140625, -0.6676025390625, -0.64129638671875, -0.614990234375, -0.58868408203125, -0.5623779296875, -0.53607177734375, -0.509765625, -0.48345947265625, -0.4571533203125, -0.43084716796875, -0.404541015625, -0.37823486328125, -0.3519287109375, -0.32562255859375, -0.29931640625, -0.27301025390625, -0.2467041015625, -0.22039794921875, -0.194091796875, -0.16778564453125, -0.1414794921875, -0.11517333984375, -0.0888671875, -0.06256103515625, -0.0362548828125, -0.00994873046875, 0.016357421875, 0.04266357421875, 0.0689697265625, 0.09527587890625, 0.12158203125, 0.14788818359375, 0.1741943359375, 0.20050048828125, 0.226806640625, 0.25311279296875, 0.2794189453125, 0.30572509765625, 0.33203125, 0.35833740234375, 0.3846435546875, 0.41094970703125, 0.437255859375, 0.46356201171875, 0.4898681640625, 0.51617431640625, 0.54248046875, 0.56878662109375, 0.5950927734375, 0.62139892578125, 0.647705078125, 0.67401123046875, 0.7003173828125, 0.72662353515625, 0.7529296875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 8.0, 11.0, 10.0, 13.0, 15.0, 19.0, 22.0, 31.0, 61.0, 94.0, 354.0, 3106.0, 115.0, 57.0, 38.0, 32.0, 24.0, 13.0, 14.0, 6.0, 10.0, 5.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.259765625, -0.25345802307128906, -0.24715042114257812, -0.2408428192138672, -0.23453521728515625, -0.2282276153564453, -0.22192001342773438, -0.21561241149902344, -0.2093048095703125, -0.20299720764160156, -0.19668960571289062, -0.1903820037841797, -0.18407440185546875, -0.1777667999267578, -0.17145919799804688, -0.16515159606933594, -0.158843994140625, -0.15253639221191406, -0.14622879028320312, -0.1399211883544922, -0.13361358642578125, -0.1273059844970703, -0.12099838256835938, -0.11469078063964844, -0.1083831787109375, -0.10207557678222656, -0.09576797485351562, -0.08946037292480469, -0.08315277099609375, -0.07684516906738281, -0.07053756713867188, -0.06422996520996094, -0.05792236328125, -0.05161476135253906, -0.045307159423828125, -0.03899955749511719, -0.03269195556640625, -0.026384353637695312, -0.020076751708984375, -0.013769149780273438, -0.0074615478515625, -0.0011539459228515625, 0.005153656005859375, 0.011461257934570312, 0.01776885986328125, 0.024076461791992188, 0.030384063720703125, 0.03669166564941406, 0.042999267578125, 0.04930686950683594, 0.055614471435546875, 0.06192207336425781, 0.06822967529296875, 0.07453727722167969, 0.08084487915039062, 0.08715248107910156, 0.0934600830078125, 0.09976768493652344, 0.10607528686523438, 0.11238288879394531, 0.11869049072265625, 0.12499809265136719, 0.13130569458007812, 0.13761329650878906, 0.1439208984375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 8.0, 19.0, 27.0, 30.0, 72.0, 127.0, 299.0, 219.0, 96.0, 50.0, 32.0, 9.0, 5.0, 6.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5345711708068848, -0.4959692656993866, -0.4573673605918884, -0.41876548528671265, -0.3801635801792145, -0.3415616750717163, -0.3029597997665405, -0.26435789465904236, -0.2257559895515442, -0.18715408444404602, -0.14855219423770905, -0.10995029658079147, -0.0713483989238739, -0.03274649381637573, 0.005855396389961243, 0.04445728659629822, 0.08305919170379639, 0.12166108936071396, 0.16026298701763153, 0.1988648772239685, 0.23746678233146667, 0.27606868743896484, 0.3146705627441406, 0.3532724678516388, 0.39187437295913696, 0.43047627806663513, 0.4690781831741333, 0.5076800584793091, 0.5462819337844849, 0.5848838686943054, 0.6234857439994812, 0.6620876789093018, 0.7006895542144775, 0.7392914295196533, 0.7778933644294739, 0.8164952397346497, 0.8550971746444702, 0.893699049949646, 0.9323009252548218, 0.9709028005599976, 1.009504795074463, 1.0481066703796387, 1.0867085456848145, 1.1253105401992798, 1.1639124155044556, 1.2025142908096313, 1.2411161661148071, 1.279718041419983, 1.3183199167251587, 1.3569217920303345, 1.3955236673355103, 1.4341256618499756, 1.4727275371551514, 1.5113294124603271, 1.549931287765503, 1.5885331630706787, 1.6271350383758545, 1.6657369136810303, 1.704338788986206, 1.7429407835006714, 1.7815426588058472, 1.820144534111023, 1.8587464094161987, 1.8973482847213745, 1.9359502792358398]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 5.0, 3.0, 9.0, 8.0, 6.0, 13.0, 13.0, 25.0, 18.0, 29.0, 28.0, 32.0, 36.0, 56.0, 61.0, 65.0, 71.0, 64.0, 62.0, 66.0, 46.0, 54.0, 48.0, 38.0, 25.0, 27.0, 27.0, 14.0, 14.0, 10.0, 11.0, 11.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3723422884941101, -0.35435330867767334, -0.33636435866355896, -0.3183753788471222, -0.3003864288330078, -0.28239744901657104, -0.2644084692001343, -0.2464195042848587, -0.22843053936958313, -0.21044157445430756, -0.19245260953903198, -0.17446362972259521, -0.15647466480731964, -0.13848569989204407, -0.1204967275261879, -0.10250775516033173, -0.08451879024505615, -0.06652982532978058, -0.04854085296392441, -0.030551884323358536, -0.012562915682792664, 0.00542604923248291, 0.02341502159833908, 0.04140399396419525, 0.059392958879470825, 0.0773819237947464, 0.09537089616060257, 0.11335986852645874, 0.13134883344173431, 0.1493377983570099, 0.16732677817344666, 0.18531574308872223, 0.2033047080039978, 0.22129367291927338, 0.23928263783454895, 0.2572716176509857, 0.2752605676651001, 0.29324954748153687, 0.31123852729797363, 0.3292275071144104, 0.3472164571285248, 0.36520543694496155, 0.3831943869590759, 0.4011833667755127, 0.41917234659194946, 0.43716129660606384, 0.4551502764225006, 0.473139226436615, 0.49112820625305176, 0.5091171860694885, 0.5271061658859253, 0.5450950860977173, 0.563084065914154, 0.5810730457305908, 0.5990620255470276, 0.6170510053634644, 0.6350399255752563, 0.6530289053916931, 0.6710178852081299, 0.6890068054199219, 0.7069957852363586, 0.7249847650527954, 0.7429737448692322, 0.760962724685669, 0.7789517045021057]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 9.0, 14.0, 8.0, 12.0, 23.0, 22.0, 41.0, 39.0, 54.0, 76.0, 88.0, 135.0, 158.0, 252.0, 401.0, 610.0, 1099.0, 2200.0, 4840.0, 11767.0, 32366.0, 107035.0, 540655.0, 252582.0, 59298.0, 19764.0, 7605.0, 3337.0, 1562.0, 830.0, 468.0, 326.0, 243.0, 150.0, 142.0, 97.0, 57.0, 48.0, 44.0, 28.0, 14.0, 16.0, 13.0, 9.0, 4.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.450927734375, -0.43627166748046875, -0.4216156005859375, -0.40695953369140625, -0.392303466796875, -0.37764739990234375, -0.3629913330078125, -0.34833526611328125, -0.33367919921875, -0.31902313232421875, -0.3043670654296875, -0.28971099853515625, -0.275054931640625, -0.26039886474609375, -0.2457427978515625, -0.23108673095703125, -0.2164306640625, -0.20177459716796875, -0.1871185302734375, -0.17246246337890625, -0.157806396484375, -0.14315032958984375, -0.1284942626953125, -0.11383819580078125, -0.09918212890625, -0.08452606201171875, -0.0698699951171875, -0.05521392822265625, -0.040557861328125, -0.02590179443359375, -0.0112457275390625, 0.00341033935546875, 0.01806640625, 0.03272247314453125, 0.0473785400390625, 0.06203460693359375, 0.076690673828125, 0.09134674072265625, 0.1060028076171875, 0.12065887451171875, 0.13531494140625, 0.14997100830078125, 0.1646270751953125, 0.17928314208984375, 0.193939208984375, 0.20859527587890625, 0.2232513427734375, 0.23790740966796875, 0.2525634765625, 0.26721954345703125, 0.2818756103515625, 0.29653167724609375, 0.311187744140625, 0.32584381103515625, 0.3404998779296875, 0.35515594482421875, 0.36981201171875, 0.38446807861328125, 0.3991241455078125, 0.41378021240234375, 0.428436279296875, 0.44309234619140625, 0.4577484130859375, 0.47240447998046875, 0.487060546875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 12.0, 17.0, 29.0, 40.0, 59.0, 61.0, 83.0, 109.0, 115.0, 107.0, 91.0, 74.0, 62.0, 44.0, 25.0, 25.0, 18.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11358642578125, -0.11065101623535156, -0.10771560668945312, -0.10478019714355469, -0.10184478759765625, -0.09890937805175781, -0.09597396850585938, -0.09303855895996094, -0.0901031494140625, -0.08716773986816406, -0.08423233032226562, -0.08129692077636719, -0.07836151123046875, -0.07542610168457031, -0.07249069213867188, -0.06955528259277344, -0.066619873046875, -0.06368446350097656, -0.060749053955078125, -0.05781364440917969, -0.05487823486328125, -0.05194282531738281, -0.049007415771484375, -0.04607200622558594, -0.0431365966796875, -0.04020118713378906, -0.037265777587890625, -0.03433036804199219, -0.03139495849609375, -0.028459548950195312, -0.025524139404296875, -0.022588729858398438, -0.0196533203125, -0.016717910766601562, -0.013782501220703125, -0.010847091674804688, -0.00791168212890625, -0.0049762725830078125, -0.002040863037109375, 0.0008945465087890625, 0.0038299560546875, 0.0067653656005859375, 0.009700775146484375, 0.012636184692382812, 0.01557159423828125, 0.018507003784179688, 0.021442413330078125, 0.024377822875976562, 0.027313232421875, 0.030248641967773438, 0.033184051513671875, 0.03611946105957031, 0.03905487060546875, 0.04199028015136719, 0.044925689697265625, 0.04786109924316406, 0.0507965087890625, 0.05373191833496094, 0.056667327880859375, 0.05960273742675781, 0.06253814697265625, 0.06547355651855469, 0.06840896606445312, 0.07134437561035156, 0.07427978515625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 12.0, 14.0, 19.0, 29.0, 33.0, 52.0, 89.0, 121.0, 222.0, 297.0, 505.0, 775.0, 1353.0, 2320.0, 3871.0, 7052.0, 12269.0, 23718.0, 47125.0, 103971.0, 305287.0, 325847.0, 109400.0, 49377.0, 24693.0, 13032.0, 7087.0, 3940.0, 2343.0, 1355.0, 866.0, 525.0, 318.0, 220.0, 128.0, 94.0, 57.0, 51.0, 34.0, 14.0, 13.0, 4.0, 5.0, 7.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.302978515625, -0.29407501220703125, -0.2851715087890625, -0.27626800537109375, -0.267364501953125, -0.25846099853515625, -0.2495574951171875, -0.24065399169921875, -0.23175048828125, -0.22284698486328125, -0.2139434814453125, -0.20503997802734375, -0.196136474609375, -0.18723297119140625, -0.1783294677734375, -0.16942596435546875, -0.1605224609375, -0.15161895751953125, -0.1427154541015625, -0.13381195068359375, -0.124908447265625, -0.11600494384765625, -0.1071014404296875, -0.09819793701171875, -0.08929443359375, -0.08039093017578125, -0.0714874267578125, -0.06258392333984375, -0.053680419921875, -0.04477691650390625, -0.0358734130859375, -0.02696990966796875, -0.01806640625, -0.00916290283203125, -0.0002593994140625, 0.00864410400390625, 0.017547607421875, 0.02645111083984375, 0.0353546142578125, 0.04425811767578125, 0.05316162109375, 0.06206512451171875, 0.0709686279296875, 0.07987213134765625, 0.088775634765625, 0.09767913818359375, 0.1065826416015625, 0.11548614501953125, 0.1243896484375, 0.13329315185546875, 0.1421966552734375, 0.15110015869140625, 0.160003662109375, 0.16890716552734375, 0.1778106689453125, 0.18671417236328125, 0.19561767578125, 0.20452117919921875, 0.2134246826171875, 0.22232818603515625, 0.231231689453125, 0.24013519287109375, 0.2490386962890625, 0.25794219970703125, 0.266845703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 9.0, 8.0, 10.0, 13.0, 18.0, 12.0, 16.0, 26.0, 19.0, 25.0, 47.0, 37.0, 40.0, 46.0, 38.0, 43.0, 41.0, 63.0, 45.0, 45.0, 41.0, 42.0, 43.0, 37.0, 32.0, 27.0, 34.0, 26.0, 22.0, 21.0, 9.0, 11.0, 10.0, 10.0, 4.0, 5.0, 7.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2301025390625, -0.2225475311279297, -0.21499252319335938, -0.20743751525878906, -0.19988250732421875, -0.19232749938964844, -0.18477249145507812, -0.1772174835205078, -0.1696624755859375, -0.1621074676513672, -0.15455245971679688, -0.14699745178222656, -0.13944244384765625, -0.13188743591308594, -0.12433242797851562, -0.11677742004394531, -0.109222412109375, -0.10166740417480469, -0.09411239624023438, -0.08655738830566406, -0.07900238037109375, -0.07144737243652344, -0.06389236450195312, -0.05633735656738281, -0.0487823486328125, -0.04122734069824219, -0.033672332763671875, -0.026117324829101562, -0.01856231689453125, -0.011007308959960938, -0.003452301025390625, 0.0041027069091796875, 0.01165771484375, 0.019212722778320312, 0.026767730712890625, 0.03432273864746094, 0.04187774658203125, 0.04943275451660156, 0.056987762451171875, 0.06454277038574219, 0.0720977783203125, 0.07965278625488281, 0.08720779418945312, 0.09476280212402344, 0.10231781005859375, 0.10987281799316406, 0.11742782592773438, 0.12498283386230469, 0.132537841796875, 0.1400928497314453, 0.14764785766601562, 0.15520286560058594, 0.16275787353515625, 0.17031288146972656, 0.17786788940429688, 0.1854228973388672, 0.1929779052734375, 0.2005329132080078, 0.20808792114257812, 0.21564292907714844, 0.22319793701171875, 0.23075294494628906, 0.23830795288085938, 0.2458629608154297, 0.25341796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 4.0, 8.0, 10.0, 15.0, 20.0, 22.0, 30.0, 41.0, 51.0, 70.0, 99.0, 148.0, 221.0, 313.0, 484.0, 907.0, 1514.0, 2962.0, 5697.0, 13565.0, 43978.0, 448415.0, 458896.0, 44533.0, 13700.0, 5943.0, 2906.0, 1513.0, 892.0, 524.0, 299.0, 219.0, 142.0, 104.0, 77.0, 49.0, 34.0, 38.0, 17.0, 18.0, 12.0, 8.0, 11.0, 4.0, 9.0, 3.0, 6.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.08392333984375, -0.08112621307373047, -0.07832908630371094, -0.0755319595336914, -0.07273483276367188, -0.06993770599365234, -0.06714057922363281, -0.06434345245361328, -0.06154632568359375, -0.05874919891357422, -0.05595207214355469, -0.053154945373535156, -0.050357818603515625, -0.047560691833496094, -0.04476356506347656, -0.04196643829345703, -0.0391693115234375, -0.03637218475341797, -0.03357505798339844, -0.030777931213378906, -0.027980804443359375, -0.025183677673339844, -0.022386550903320312, -0.01958942413330078, -0.01679229736328125, -0.013995170593261719, -0.011198043823242188, -0.008400917053222656, -0.005603790283203125, -0.0028066635131835938, -9.5367431640625e-06, 0.0027875900268554688, 0.005584716796875, 0.008381843566894531, 0.011178970336914062, 0.013976097106933594, 0.016773223876953125, 0.019570350646972656, 0.022367477416992188, 0.02516460418701172, 0.02796173095703125, 0.03075885772705078, 0.03355598449707031, 0.036353111267089844, 0.039150238037109375, 0.041947364807128906, 0.04474449157714844, 0.04754161834716797, 0.0503387451171875, 0.05313587188720703, 0.05593299865722656, 0.058730125427246094, 0.061527252197265625, 0.06432437896728516, 0.06712150573730469, 0.06991863250732422, 0.07271575927734375, 0.07551288604736328, 0.07831001281738281, 0.08110713958740234, 0.08390426635742188, 0.0867013931274414, 0.08949851989746094, 0.09229564666748047, 0.0950927734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 7.0, 12.0, 15.0, 25.0, 31.0, 79.0, 97.0, 175.0, 178.0, 141.0, 82.0, 49.0, 31.0, 22.0, 10.0, 13.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4185905456542969e-05, -1.376122236251831e-05, -1.3336539268493652e-05, -1.2911856174468994e-05, -1.2487173080444336e-05, -1.2062489986419678e-05, -1.163780689239502e-05, -1.1213123798370361e-05, -1.0788440704345703e-05, -1.0363757610321045e-05, -9.939074516296387e-06, -9.514391422271729e-06, -9.08970832824707e-06, -8.665025234222412e-06, -8.240342140197754e-06, -7.815659046173096e-06, -7.3909759521484375e-06, -6.966292858123779e-06, -6.541609764099121e-06, -6.116926670074463e-06, -5.692243576049805e-06, -5.2675604820251465e-06, -4.842877388000488e-06, -4.41819429397583e-06, -3.993511199951172e-06, -3.5688281059265137e-06, -3.1441450119018555e-06, -2.7194619178771973e-06, -2.294778823852539e-06, -1.8700957298278809e-06, -1.4454126358032227e-06, -1.0207295417785645e-06, -5.960464477539062e-07, -1.7136335372924805e-07, 2.5331974029541016e-07, 6.780028343200684e-07, 1.1026859283447266e-06, 1.5273690223693848e-06, 1.952052116394043e-06, 2.376735210418701e-06, 2.8014183044433594e-06, 3.2261013984680176e-06, 3.6507844924926758e-06, 4.075467586517334e-06, 4.500150680541992e-06, 4.92483377456665e-06, 5.349516868591309e-06, 5.774199962615967e-06, 6.198883056640625e-06, 6.623566150665283e-06, 7.048249244689941e-06, 7.4729323387146e-06, 7.897615432739258e-06, 8.322298526763916e-06, 8.746981620788574e-06, 9.171664714813232e-06, 9.59634780883789e-06, 1.0021030902862549e-05, 1.0445713996887207e-05, 1.0870397090911865e-05, 1.1295080184936523e-05, 1.1719763278961182e-05, 1.214444637298584e-05, 1.2569129467010498e-05, 1.2993812561035156e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 6.0, 8.0, 6.0, 5.0, 18.0, 30.0, 37.0, 48.0, 66.0, 91.0, 173.0, 309.0, 527.0, 1062.0, 2539.0, 6554.0, 21344.0, 119682.0, 775510.0, 92287.0, 18072.0, 5601.0, 2269.0, 1008.0, 532.0, 285.0, 163.0, 100.0, 59.0, 53.0, 30.0, 25.0, 16.0, 11.0, 9.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1199951171875, -0.11670207977294922, -0.11340904235839844, -0.11011600494384766, -0.10682296752929688, -0.1035299301147461, -0.10023689270019531, -0.09694385528564453, -0.09365081787109375, -0.09035778045654297, -0.08706474304199219, -0.0837717056274414, -0.08047866821289062, -0.07718563079833984, -0.07389259338378906, -0.07059955596923828, -0.0673065185546875, -0.06401348114013672, -0.06072044372558594, -0.057427406311035156, -0.054134368896484375, -0.050841331481933594, -0.04754829406738281, -0.04425525665283203, -0.04096221923828125, -0.03766918182373047, -0.03437614440917969, -0.031083106994628906, -0.027790069580078125, -0.024497032165527344, -0.021203994750976562, -0.01791095733642578, -0.014617919921875, -0.011324882507324219, -0.008031845092773438, -0.004738807678222656, -0.001445770263671875, 0.0018472671508789062, 0.0051403045654296875, 0.008433341979980469, 0.01172637939453125, 0.015019416809082031, 0.018312454223632812, 0.021605491638183594, 0.024898529052734375, 0.028191566467285156, 0.03148460388183594, 0.03477764129638672, 0.0380706787109375, 0.04136371612548828, 0.04465675354003906, 0.047949790954589844, 0.051242828369140625, 0.054535865783691406, 0.05782890319824219, 0.06112194061279297, 0.06441497802734375, 0.06770801544189453, 0.07100105285644531, 0.0742940902709961, 0.07758712768554688, 0.08088016510009766, 0.08417320251464844, 0.08746623992919922, 0.09075927734375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 2.0, 8.0, 11.0, 11.0, 26.0, 28.0, 47.0, 59.0, 116.0, 198.0, 172.0, 104.0, 74.0, 64.0, 24.0, 17.0, 8.0, 10.0, 11.0, 0.0, 3.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.066162109375, -0.06351947784423828, -0.06087684631347656, -0.058234214782714844, -0.055591583251953125, -0.052948951721191406, -0.05030632019042969, -0.04766368865966797, -0.04502105712890625, -0.04237842559814453, -0.03973579406738281, -0.037093162536621094, -0.034450531005859375, -0.031807899475097656, -0.029165267944335938, -0.02652263641357422, -0.0238800048828125, -0.02123737335205078, -0.018594741821289062, -0.015952110290527344, -0.013309478759765625, -0.010666847229003906, -0.008024215698242188, -0.005381584167480469, -0.00273895263671875, -9.632110595703125e-05, 0.0025463104248046875, 0.005188941955566406, 0.007831573486328125, 0.010474205017089844, 0.013116836547851562, 0.01575946807861328, 0.018402099609375, 0.02104473114013672, 0.023687362670898438, 0.026329994201660156, 0.028972625732421875, 0.031615257263183594, 0.03425788879394531, 0.03690052032470703, 0.03954315185546875, 0.04218578338623047, 0.04482841491699219, 0.047471046447753906, 0.050113677978515625, 0.052756309509277344, 0.05539894104003906, 0.05804157257080078, 0.0606842041015625, 0.06332683563232422, 0.06596946716308594, 0.06861209869384766, 0.07125473022460938, 0.0738973617553711, 0.07653999328613281, 0.07918262481689453, 0.08182525634765625, 0.08446788787841797, 0.08711051940917969, 0.0897531509399414, 0.09239578247070312, 0.09503841400146484, 0.09768104553222656, 0.10032367706298828, 0.10296630859375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 11.0, 19.0, 25.0, 30.0, 39.0, 94.0, 141.0, 221.0, 140.0, 98.0, 57.0, 30.0, 35.0, 16.0, 18.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.53851318359375, -1.459850788116455, -1.3811883926391602, -1.3025258779525757, -1.2238634824752808, -1.1452010869979858, -1.0665385723114014, -0.9878761768341064, -0.9092137813568115, -0.8305513858795166, -0.7518889307975769, -0.6732264757156372, -0.5945640802383423, -0.5159016847610474, -0.43723922967910767, -0.35857677459716797, -0.27991437911987305, -0.20125195384025574, -0.12258952856063843, -0.04392710328102112, 0.03473532199859619, 0.1133977472782135, 0.1920601725578308, 0.2707226276397705, 0.34938502311706543, 0.42804744839668274, 0.5067098736763, 0.5853723287582397, 0.6640347242355347, 0.7426971197128296, 0.8213595747947693, 0.900022029876709, 0.978684663772583, 1.057347059249878, 1.1360094547271729, 1.2146719694137573, 1.2933343648910522, 1.3719967603683472, 1.4506592750549316, 1.5293216705322266, 1.6079840660095215, 1.6866464614868164, 1.7653088569641113, 1.8439713716506958, 1.9226337671279907, 2.001296281814575, 2.07995867729187, 2.158621072769165, 2.23728346824646, 2.315945863723755, 2.39460825920105, 2.4732706546783447, 2.5519332885742188, 2.6305956840515137, 2.7092580795288086, 2.7879204750061035, 2.8665828704833984, 2.9452452659606934, 3.0239076614379883, 3.102570056915283, 3.181232452392578, 3.259895086288452, 3.338557481765747, 3.417219877243042, 3.495882272720337]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [4.0, 5.0, 4.0, 3.0, 12.0, 11.0, 12.0, 23.0, 21.0, 29.0, 32.0, 35.0, 35.0, 45.0, 43.0, 54.0, 45.0, 59.0, 68.0, 66.0, 45.0, 57.0, 47.0, 43.0, 30.0, 42.0, 36.0, 22.0, 25.0, 10.0, 13.0, 8.0, 9.0, 6.0, 6.0, 1.0, 6.0, 5.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9847045540809631, -0.9313434362411499, -0.8779823184013367, -0.8246212005615234, -0.7712600231170654, -0.7178989052772522, -0.664537787437439, -0.611176609992981, -0.5578155517578125, -0.5044544339179993, -0.45109328627586365, -0.3977321684360504, -0.3443710207939148, -0.29100990295410156, -0.23764878511428833, -0.1842876374721527, -0.1309264898300171, -0.07756535708904266, -0.024204231798648834, 0.029156893491744995, 0.08251802623271942, 0.13587915897369385, 0.18924027681350708, 0.2426014244556427, 0.29596254229545593, 0.34932366013526917, 0.4026848077774048, 0.456045925617218, 0.5094070434570312, 0.5627682209014893, 0.6161292791366577, 0.6694904565811157, 0.7228516340255737, 0.776212751865387, 0.8295738697052002, 0.8829350471496582, 0.9362961649894714, 0.9896572828292847, 1.0430183410644531, 1.0963795185089111, 1.1497406959533691, 1.2031018733978271, 1.2564629316329956, 1.3098241090774536, 1.363185167312622, 1.41654634475708, 1.469907522201538, 1.5232685804367065, 1.576629638671875, 1.629990816116333, 1.6833518743515015, 1.7367130517959595, 1.790074110031128, 1.843435287475586, 1.896796464920044, 1.9501575231552124, 2.00351881980896, 2.056879997253418, 2.110241174697876, 2.163602113723755, 2.216963291168213, 2.270324468612671, 2.323685646057129, 2.377046823501587, 2.430407762527466]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 6.0, 4.0, 3.0, 14.0, 17.0, 26.0, 33.0, 46.0, 61.0, 80.0, 138.0, 227.0, 419.0, 803.0, 1581.0, 3911.0, 11450.0, 68720.0, 4065866.0, 27904.0, 7248.0, 2776.0, 1287.0, 618.0, 356.0, 217.0, 130.0, 100.0, 76.0, 35.0, 26.0, 25.0, 13.0, 19.0, 12.0, 8.0, 7.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.830078125, -0.8072128295898438, -0.7843475341796875, -0.7614822387695312, -0.738616943359375, -0.7157516479492188, -0.6928863525390625, -0.6700210571289062, -0.64715576171875, -0.6242904663085938, -0.6014251708984375, -0.5785598754882812, -0.555694580078125, -0.5328292846679688, -0.5099639892578125, -0.48709869384765625, -0.4642333984375, -0.44136810302734375, -0.4185028076171875, -0.39563751220703125, -0.372772216796875, -0.34990692138671875, -0.3270416259765625, -0.30417633056640625, -0.28131103515625, -0.25844573974609375, -0.2355804443359375, -0.21271514892578125, -0.189849853515625, -0.16698455810546875, -0.1441192626953125, -0.12125396728515625, -0.098388671875, -0.07552337646484375, -0.0526580810546875, -0.02979278564453125, -0.006927490234375, 0.01593780517578125, 0.0388031005859375, 0.06166839599609375, 0.08453369140625, 0.10739898681640625, 0.1302642822265625, 0.15312957763671875, 0.175994873046875, 0.19886016845703125, 0.2217254638671875, 0.24459075927734375, 0.2674560546875, 0.29032135009765625, 0.3131866455078125, 0.33605194091796875, 0.358917236328125, 0.38178253173828125, 0.4046478271484375, 0.42751312255859375, 0.45037841796875, 0.47324371337890625, 0.4961090087890625, 0.5189743041992188, 0.541839599609375, 0.5647048950195312, 0.5875701904296875, 0.6104354858398438, 0.63330078125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 8.0, 12.0, 17.0, 28.0, 55.0, 44.0, 86.0, 85.0, 96.0, 101.0, 88.0, 88.0, 57.0, 70.0, 43.0, 42.0, 25.0, 17.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.1075439453125, -0.10468769073486328, -0.10183143615722656, -0.09897518157958984, -0.09611892700195312, -0.0932626724243164, -0.09040641784667969, -0.08755016326904297, -0.08469390869140625, -0.08183765411376953, -0.07898139953613281, -0.0761251449584961, -0.07326889038085938, -0.07041263580322266, -0.06755638122558594, -0.06470012664794922, -0.0618438720703125, -0.05898761749267578, -0.05613136291503906, -0.053275108337402344, -0.050418853759765625, -0.047562599182128906, -0.04470634460449219, -0.04185009002685547, -0.03899383544921875, -0.03613758087158203, -0.03328132629394531, -0.030425071716308594, -0.027568817138671875, -0.024712562561035156, -0.021856307983398438, -0.01900005340576172, -0.016143798828125, -0.013287544250488281, -0.010431289672851562, -0.007575035095214844, -0.004718780517578125, -0.0018625259399414062, 0.0009937286376953125, 0.0038499832153320312, 0.00670623779296875, 0.009562492370605469, 0.012418746948242188, 0.015275001525878906, 0.018131256103515625, 0.020987510681152344, 0.023843765258789062, 0.02670001983642578, 0.0295562744140625, 0.03241252899169922, 0.03526878356933594, 0.038125038146972656, 0.040981292724609375, 0.043837547302246094, 0.04669380187988281, 0.04955005645751953, 0.05240631103515625, 0.05526256561279297, 0.05811882019042969, 0.060975074768066406, 0.06383132934570312, 0.06668758392333984, 0.06954383850097656, 0.07240009307861328, 0.07525634765625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 5.0, 7.0, 5.0, 5.0, 19.0, 32.0, 33.0, 69.0, 80.0, 93.0, 157.0, 232.0, 317.0, 504.0, 760.0, 1157.0, 1777.0, 2741.0, 4468.0, 7831.0, 15743.0, 40808.0, 353384.0, 3675701.0, 49584.0, 17543.0, 8569.0, 4614.0, 2930.0, 1745.0, 1059.0, 780.0, 503.0, 332.0, 210.0, 147.0, 108.0, 77.0, 46.0, 33.0, 22.0, 15.0, 14.0, 5.0, 10.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.436767578125, -0.4235649108886719, -0.41036224365234375, -0.3971595764160156, -0.3839569091796875, -0.3707542419433594, -0.35755157470703125, -0.3443489074707031, -0.331146240234375, -0.3179435729980469, -0.30474090576171875, -0.2915382385253906, -0.2783355712890625, -0.2651329040527344, -0.25193023681640625, -0.23872756958007812, -0.22552490234375, -0.21232223510742188, -0.19911956787109375, -0.18591690063476562, -0.1727142333984375, -0.15951156616210938, -0.14630889892578125, -0.13310623168945312, -0.119903564453125, -0.10670089721679688, -0.09349822998046875, -0.08029556274414062, -0.0670928955078125, -0.053890228271484375, -0.04068756103515625, -0.027484893798828125, -0.0142822265625, -0.001079559326171875, 0.01212310791015625, 0.025325775146484375, 0.0385284423828125, 0.051731109619140625, 0.06493377685546875, 0.07813644409179688, 0.091339111328125, 0.10454177856445312, 0.11774444580078125, 0.13094711303710938, 0.1441497802734375, 0.15735244750976562, 0.17055511474609375, 0.18375778198242188, 0.19696044921875, 0.21016311645507812, 0.22336578369140625, 0.23656845092773438, 0.2497711181640625, 0.2629737854003906, 0.27617645263671875, 0.2893791198730469, 0.302581787109375, 0.3157844543457031, 0.32898712158203125, 0.3421897888183594, 0.3553924560546875, 0.3685951232910156, 0.38179779052734375, 0.3950004577636719, 0.408203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 5.0, 7.0, 9.0, 12.0, 10.0, 15.0, 25.0, 29.0, 62.0, 95.0, 3183.0, 379.0, 76.0, 45.0, 28.0, 15.0, 14.0, 9.0, 8.0, 5.0, 5.0, 6.0, 1.0, 6.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1673583984375, -0.1625518798828125, -0.157745361328125, -0.1529388427734375, -0.14813232421875, -0.1433258056640625, -0.138519287109375, -0.1337127685546875, -0.12890625, -0.1240997314453125, -0.119293212890625, -0.1144866943359375, -0.10968017578125, -0.1048736572265625, -0.100067138671875, -0.0952606201171875, -0.0904541015625, -0.0856475830078125, -0.080841064453125, -0.0760345458984375, -0.07122802734375, -0.0664215087890625, -0.061614990234375, -0.0568084716796875, -0.052001953125, -0.0471954345703125, -0.042388916015625, -0.0375823974609375, -0.03277587890625, -0.0279693603515625, -0.023162841796875, -0.0183563232421875, -0.0135498046875, -0.0087432861328125, -0.003936767578125, 0.0008697509765625, 0.00567626953125, 0.0104827880859375, 0.015289306640625, 0.0200958251953125, 0.02490234375, 0.0297088623046875, 0.034515380859375, 0.0393218994140625, 0.04412841796875, 0.0489349365234375, 0.053741455078125, 0.0585479736328125, 0.0633544921875, 0.0681610107421875, 0.072967529296875, 0.0777740478515625, 0.08258056640625, 0.0873870849609375, 0.092193603515625, 0.0970001220703125, 0.101806640625, 0.1066131591796875, 0.111419677734375, 0.1162261962890625, 0.12103271484375, 0.1258392333984375, 0.130645751953125, 0.1354522705078125, 0.1402587890625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 14.0, 34.0, 63.0, 182.0, 411.0, 189.0, 55.0, 27.0, 10.0, 8.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5472186803817749, -0.5000909566879272, -0.45296329259872437, -0.4058355689048767, -0.35870787501335144, -0.31158018112182617, -0.2644524574279785, -0.21732476353645325, -0.17019706964492798, -0.12306936830282211, -0.07594166696071625, -0.028813958168029785, 0.018313735723495483, 0.06544142961502075, 0.11256915330886841, 0.15969684720039368, 0.20682454109191895, 0.2539522349834442, 0.3010799288749695, 0.34820765256881714, 0.3953353464603424, 0.4424630403518677, 0.48959076404571533, 0.536718487739563, 0.5838461518287659, 0.6309738755226135, 0.6781015396118164, 0.7252292633056641, 0.7723569869995117, 0.8194846510887146, 0.8666123747825623, 0.9137400388717651, 0.9608678817749023, 1.00799560546875, 1.0551233291625977, 1.1022510528564453, 1.1493786573410034, 1.196506381034851, 1.2436341047286987, 1.2907618284225464, 1.3378894329071045, 1.3850171566009521, 1.4321448802947998, 1.4792726039886475, 1.5264002084732056, 1.5735279321670532, 1.6206556558609009, 1.6677833795547485, 1.7149111032485962, 1.7620388269424438, 1.8091665506362915, 1.8562941551208496, 1.9034218788146973, 1.950549602508545, 1.9976773262023926, 2.0448050498962402, 2.091932773590088, 2.1390604972839355, 2.186188220977783, 2.233315944671631, 2.2804436683654785, 2.327571392059326, 2.374699115753174, 2.4218266010284424, 2.46895432472229]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 4.0, 9.0, 7.0, 10.0, 13.0, 15.0, 24.0, 27.0, 36.0, 38.0, 46.0, 37.0, 53.0, 72.0, 48.0, 61.0, 51.0, 55.0, 63.0, 45.0, 42.0, 46.0, 37.0, 40.0, 30.0, 20.0, 14.0, 12.0, 12.0, 8.0, 10.0, 4.0, 0.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.5562217235565186, -0.5417782068252563, -0.5273346900939941, -0.5128911733627319, -0.49844762682914734, -0.48400411009788513, -0.4695605933666229, -0.4551170766353607, -0.4406735599040985, -0.4262300431728363, -0.4117865264415741, -0.3973429799079895, -0.3828994631767273, -0.3684559464454651, -0.3540124297142029, -0.3395689129829407, -0.32512539625167847, -0.31068187952041626, -0.29623836278915405, -0.28179484605789185, -0.26735129952430725, -0.25290778279304504, -0.23846426606178284, -0.22402074933052063, -0.20957720279693604, -0.19513368606567383, -0.18069015443325043, -0.16624663770198822, -0.151803120970726, -0.1373595893383026, -0.1229160726070404, -0.1084725558757782, -0.09402903914451599, -0.07958551496267319, -0.06514199823141098, -0.050698474049568176, -0.03625495359301567, -0.021811433136463165, -0.007367908954620361, 0.007075607776641846, 0.02151913195848465, 0.035962652415037155, 0.05040617287158966, 0.06484969705343246, 0.07929322123527527, 0.09373673796653748, 0.10818026214838028, 0.12262377887964249, 0.1370673030614853, 0.1515108197927475, 0.1659543514251709, 0.1803978681564331, 0.1948413848876953, 0.20928490161895752, 0.22372843325138092, 0.23817194998264313, 0.25261548161506653, 0.26705899834632874, 0.28150251507759094, 0.29594606161117554, 0.31038957834243774, 0.32483309507369995, 0.33927661180496216, 0.35372012853622437, 0.3681636452674866]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 2.0, 5.0, 7.0, 12.0, 19.0, 17.0, 23.0, 32.0, 51.0, 64.0, 96.0, 152.0, 232.0, 358.0, 588.0, 957.0, 1717.0, 3351.0, 7731.0, 21294.0, 65973.0, 273507.0, 515188.0, 104046.0, 32150.0, 11113.0, 4656.0, 2161.0, 1123.0, 634.0, 397.0, 274.0, 189.0, 129.0, 91.0, 66.0, 45.0, 33.0, 21.0, 12.0, 12.0, 12.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5380859375, -0.5227928161621094, -0.5074996948242188, -0.4922065734863281, -0.4769134521484375, -0.4616203308105469, -0.44632720947265625, -0.4310340881347656, -0.415740966796875, -0.4004478454589844, -0.38515472412109375, -0.3698616027832031, -0.3545684814453125, -0.3392753601074219, -0.32398223876953125, -0.3086891174316406, -0.29339599609375, -0.2781028747558594, -0.26280975341796875, -0.24751663208007812, -0.2322235107421875, -0.21693038940429688, -0.20163726806640625, -0.18634414672851562, -0.171051025390625, -0.15575790405273438, -0.14046478271484375, -0.12517166137695312, -0.1098785400390625, -0.09458541870117188, -0.07929229736328125, -0.06399917602539062, -0.0487060546875, -0.033412933349609375, -0.01811981201171875, -0.002826690673828125, 0.0124664306640625, 0.027759552001953125, 0.04305267333984375, 0.058345794677734375, 0.073638916015625, 0.08893203735351562, 0.10422515869140625, 0.11951828002929688, 0.1348114013671875, 0.15010452270507812, 0.16539764404296875, 0.18069076538085938, 0.19598388671875, 0.21127700805664062, 0.22657012939453125, 0.24186325073242188, 0.2571563720703125, 0.2724494934082031, 0.28774261474609375, 0.3030357360839844, 0.318328857421875, 0.3336219787597656, 0.34891510009765625, 0.3642082214355469, 0.3795013427734375, 0.3947944641113281, 0.41008758544921875, 0.4253807067871094, 0.440673828125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 11.0, 19.0, 26.0, 39.0, 47.0, 66.0, 80.0, 91.0, 96.0, 95.0, 89.0, 70.0, 68.0, 55.0, 43.0, 27.0, 25.0, 13.0, 11.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.11309814453125, -0.11020565032958984, -0.10731315612792969, -0.10442066192626953, -0.10152816772460938, -0.09863567352294922, -0.09574317932128906, -0.0928506851196289, -0.08995819091796875, -0.0870656967163086, -0.08417320251464844, -0.08128070831298828, -0.07838821411132812, -0.07549571990966797, -0.07260322570800781, -0.06971073150634766, -0.0668182373046875, -0.06392574310302734, -0.06103324890136719, -0.05814075469970703, -0.055248260498046875, -0.05235576629638672, -0.04946327209472656, -0.046570777893066406, -0.04367828369140625, -0.040785789489746094, -0.03789329528808594, -0.03500080108642578, -0.032108306884765625, -0.02921581268310547, -0.026323318481445312, -0.023430824279785156, -0.020538330078125, -0.017645835876464844, -0.014753341674804688, -0.011860847473144531, -0.008968353271484375, -0.006075859069824219, -0.0031833648681640625, -0.00029087066650390625, 0.00260162353515625, 0.005494117736816406, 0.008386611938476562, 0.011279106140136719, 0.014171600341796875, 0.01706409454345703, 0.019956588745117188, 0.022849082946777344, 0.0257415771484375, 0.028634071350097656, 0.03152656555175781, 0.03441905975341797, 0.037311553955078125, 0.04020404815673828, 0.04309654235839844, 0.045989036560058594, 0.04888153076171875, 0.051774024963378906, 0.05466651916503906, 0.05755901336669922, 0.060451507568359375, 0.06334400177001953, 0.06623649597167969, 0.06912899017333984, 0.072021484375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 8.0, 9.0, 23.0, 37.0, 69.0, 60.0, 139.0, 239.0, 400.0, 716.0, 1369.0, 2954.0, 6681.0, 15939.0, 40657.0, 123307.0, 495505.0, 247302.0, 68824.0, 25254.0, 10227.0, 4410.0, 2113.0, 1033.0, 531.0, 279.0, 181.0, 96.0, 61.0, 46.0, 28.0, 18.0, 11.0, 11.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.460693359375, -0.44815826416015625, -0.4356231689453125, -0.42308807373046875, -0.410552978515625, -0.39801788330078125, -0.3854827880859375, -0.37294769287109375, -0.36041259765625, -0.34787750244140625, -0.3353424072265625, -0.32280731201171875, -0.310272216796875, -0.29773712158203125, -0.2852020263671875, -0.27266693115234375, -0.2601318359375, -0.24759674072265625, -0.2350616455078125, -0.22252655029296875, -0.209991455078125, -0.19745635986328125, -0.1849212646484375, -0.17238616943359375, -0.15985107421875, -0.14731597900390625, -0.1347808837890625, -0.12224578857421875, -0.109710693359375, -0.09717559814453125, -0.0846405029296875, -0.07210540771484375, -0.0595703125, -0.04703521728515625, -0.0345001220703125, -0.02196502685546875, -0.009429931640625, 0.00310516357421875, 0.0156402587890625, 0.02817535400390625, 0.04071044921875, 0.05324554443359375, 0.0657806396484375, 0.07831573486328125, 0.090850830078125, 0.10338592529296875, 0.1159210205078125, 0.12845611572265625, 0.1409912109375, 0.15352630615234375, 0.1660614013671875, 0.17859649658203125, 0.191131591796875, 0.20366668701171875, 0.2162017822265625, 0.22873687744140625, 0.24127197265625, 0.25380706787109375, 0.2663421630859375, 0.27887725830078125, 0.291412353515625, 0.30394744873046875, 0.3164825439453125, 0.32901763916015625, 0.341552734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 12.0, 16.0, 16.0, 15.0, 14.0, 24.0, 32.0, 34.0, 34.0, 37.0, 49.0, 53.0, 56.0, 50.0, 52.0, 44.0, 39.0, 47.0, 41.0, 53.0, 39.0, 47.0, 39.0, 27.0, 23.0, 16.0, 21.0, 14.0, 13.0, 11.0, 8.0, 8.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.31494140625, -0.3064117431640625, -0.297882080078125, -0.2893524169921875, -0.28082275390625, -0.2722930908203125, -0.263763427734375, -0.2552337646484375, -0.2467041015625, -0.2381744384765625, -0.229644775390625, -0.2211151123046875, -0.21258544921875, -0.2040557861328125, -0.195526123046875, -0.1869964599609375, -0.178466796875, -0.1699371337890625, -0.161407470703125, -0.1528778076171875, -0.14434814453125, -0.1358184814453125, -0.127288818359375, -0.1187591552734375, -0.1102294921875, -0.1016998291015625, -0.093170166015625, -0.0846405029296875, -0.07611083984375, -0.0675811767578125, -0.059051513671875, -0.0505218505859375, -0.0419921875, -0.0334625244140625, -0.024932861328125, -0.0164031982421875, -0.00787353515625, 0.0006561279296875, 0.009185791015625, 0.0177154541015625, 0.0262451171875, 0.0347747802734375, 0.043304443359375, 0.0518341064453125, 0.06036376953125, 0.0688934326171875, 0.077423095703125, 0.0859527587890625, 0.094482421875, 0.1030120849609375, 0.111541748046875, 0.1200714111328125, 0.12860107421875, 0.1371307373046875, 0.145660400390625, 0.1541900634765625, 0.1627197265625, 0.1712493896484375, 0.179779052734375, 0.1883087158203125, 0.19683837890625, 0.2053680419921875, 0.213897705078125, 0.2224273681640625, 0.23095703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 6.0, 14.0, 17.0, 41.0, 55.0, 150.0, 365.0, 1147.0, 5997.0, 60624.0, 919137.0, 53854.0, 5384.0, 1116.0, 354.0, 138.0, 61.0, 41.0, 22.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.143798828125, -0.13767433166503906, -0.13154983520507812, -0.1254253387451172, -0.11930084228515625, -0.11317634582519531, -0.10705184936523438, -0.10092735290527344, -0.0948028564453125, -0.08867835998535156, -0.08255386352539062, -0.07642936706542969, -0.07030487060546875, -0.06418037414550781, -0.058055877685546875, -0.05193138122558594, -0.045806884765625, -0.03968238830566406, -0.033557891845703125, -0.027433395385742188, -0.02130889892578125, -0.015184402465820312, -0.009059906005859375, -0.0029354095458984375, 0.0031890869140625, 0.009313583374023438, 0.015438079833984375, 0.021562576293945312, 0.02768707275390625, 0.03381156921386719, 0.039936065673828125, 0.04606056213378906, 0.05218505859375, 0.05830955505371094, 0.06443405151367188, 0.07055854797363281, 0.07668304443359375, 0.08280754089355469, 0.08893203735351562, 0.09505653381347656, 0.1011810302734375, 0.10730552673339844, 0.11343002319335938, 0.11955451965332031, 0.12567901611328125, 0.1318035125732422, 0.13792800903320312, 0.14405250549316406, 0.150177001953125, 0.15630149841308594, 0.16242599487304688, 0.1685504913330078, 0.17467498779296875, 0.1807994842529297, 0.18692398071289062, 0.19304847717285156, 0.1991729736328125, 0.20529747009277344, 0.21142196655273438, 0.2175464630126953, 0.22367095947265625, 0.2297954559326172, 0.23591995239257812, 0.24204444885253906, 0.2481689453125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 3.0, 4.0, 4.0, 7.0, 16.0, 24.0, 61.0, 67.0, 141.0, 171.0, 174.0, 99.0, 76.0, 37.0, 28.0, 23.0, 17.0, 7.0, 12.0, 7.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3887882232666016e-05, -1.343805342912674e-05, -1.2988224625587463e-05, -1.2538395822048187e-05, -1.2088567018508911e-05, -1.1638738214969635e-05, -1.1188909411430359e-05, -1.0739080607891083e-05, -1.0289251804351807e-05, -9.83942300081253e-06, -9.389594197273254e-06, -8.939765393733978e-06, -8.489936590194702e-06, -8.040107786655426e-06, -7.59027898311615e-06, -7.140450179576874e-06, -6.690621376037598e-06, -6.2407925724983215e-06, -5.790963768959045e-06, -5.341134965419769e-06, -4.891306161880493e-06, -4.441477358341217e-06, -3.991648554801941e-06, -3.541819751262665e-06, -3.0919909477233887e-06, -2.6421621441841125e-06, -2.1923333406448364e-06, -1.7425045371055603e-06, -1.2926757335662842e-06, -8.428469300270081e-07, -3.9301812648773193e-07, 5.681067705154419e-08, 5.066394805908203e-07, 9.564682841300964e-07, 1.4062970876693726e-06, 1.8561258912086487e-06, 2.305954694747925e-06, 2.755783498287201e-06, 3.205612301826477e-06, 3.655441105365753e-06, 4.105269908905029e-06, 4.555098712444305e-06, 5.0049275159835815e-06, 5.454756319522858e-06, 5.904585123062134e-06, 6.35441392660141e-06, 6.804242730140686e-06, 7.254071533679962e-06, 7.703900337219238e-06, 8.153729140758514e-06, 8.60355794429779e-06, 9.053386747837067e-06, 9.503215551376343e-06, 9.953044354915619e-06, 1.0402873158454895e-05, 1.0852701961994171e-05, 1.1302530765533447e-05, 1.1752359569072723e-05, 1.2202188372612e-05, 1.2652017176151276e-05, 1.3101845979690552e-05, 1.3551674783229828e-05, 1.4001503586769104e-05, 1.445133239030838e-05, 1.4901161193847656e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 6.0, 16.0, 17.0, 27.0, 23.0, 70.0, 86.0, 158.0, 238.0, 528.0, 1122.0, 2759.0, 6935.0, 21095.0, 94403.0, 718843.0, 157777.0, 29365.0, 8970.0, 3291.0, 1400.0, 632.0, 358.0, 171.0, 92.0, 60.0, 36.0, 15.0, 19.0, 11.0, 7.0, 7.0, 7.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0928955078125, -0.0901327133178711, -0.08736991882324219, -0.08460712432861328, -0.08184432983398438, -0.07908153533935547, -0.07631874084472656, -0.07355594635009766, -0.07079315185546875, -0.06803035736083984, -0.06526756286621094, -0.06250476837158203, -0.059741973876953125, -0.05697917938232422, -0.05421638488769531, -0.051453590393066406, -0.0486907958984375, -0.045928001403808594, -0.04316520690917969, -0.04040241241455078, -0.037639617919921875, -0.03487682342529297, -0.03211402893066406, -0.029351234436035156, -0.02658843994140625, -0.023825645446777344, -0.021062850952148438, -0.01830005645751953, -0.015537261962890625, -0.012774467468261719, -0.010011672973632812, -0.007248878479003906, -0.004486083984375, -0.0017232894897460938, 0.0010395050048828125, 0.0038022994995117188, 0.006565093994140625, 0.009327888488769531, 0.012090682983398438, 0.014853477478027344, 0.01761627197265625, 0.020379066467285156, 0.023141860961914062, 0.02590465545654297, 0.028667449951171875, 0.03143024444580078, 0.03419303894042969, 0.036955833435058594, 0.0397186279296875, 0.042481422424316406, 0.04524421691894531, 0.04800701141357422, 0.050769805908203125, 0.05353260040283203, 0.05629539489746094, 0.059058189392089844, 0.06182098388671875, 0.06458377838134766, 0.06734657287597656, 0.07010936737060547, 0.07287216186523438, 0.07563495635986328, 0.07839775085449219, 0.0811605453491211, 0.08392333984375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 10.0, 8.0, 18.0, 13.0, 17.0, 14.0, 23.0, 41.0, 50.0, 71.0, 89.0, 103.0, 105.0, 105.0, 91.0, 62.0, 40.0, 44.0, 16.0, 20.0, 12.0, 14.0, 9.0, 5.0, 2.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.078125, -0.07631778717041016, -0.07451057434082031, -0.07270336151123047, -0.07089614868164062, -0.06908893585205078, -0.06728172302246094, -0.0654745101928711, -0.06366729736328125, -0.061860084533691406, -0.06005287170410156, -0.05824565887451172, -0.056438446044921875, -0.05463123321533203, -0.05282402038574219, -0.051016807556152344, -0.0492095947265625, -0.047402381896972656, -0.04559516906738281, -0.04378795623779297, -0.041980743408203125, -0.04017353057861328, -0.03836631774902344, -0.036559104919433594, -0.03475189208984375, -0.032944679260253906, -0.031137466430664062, -0.02933025360107422, -0.027523040771484375, -0.02571582794189453, -0.023908615112304688, -0.022101402282714844, -0.020294189453125, -0.018486976623535156, -0.016679763793945312, -0.014872550964355469, -0.013065338134765625, -0.011258125305175781, -0.009450912475585938, -0.007643699645996094, -0.00583648681640625, -0.004029273986816406, -0.0022220611572265625, -0.00041484832763671875, 0.001392364501953125, 0.0031995773315429688, 0.0050067901611328125, 0.006814002990722656, 0.0086212158203125, 0.010428428649902344, 0.012235641479492188, 0.014042854309082031, 0.015850067138671875, 0.01765727996826172, 0.019464492797851562, 0.021271705627441406, 0.02307891845703125, 0.024886131286621094, 0.026693344116210938, 0.02850055694580078, 0.030307769775390625, 0.03211498260498047, 0.03392219543457031, 0.035729408264160156, 0.03753662109375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 5.0, 6.0, 8.0, 12.0, 12.0, 21.0, 23.0, 33.0, 38.0, 55.0, 94.0, 134.0, 162.0, 142.0, 60.0, 46.0, 33.0, 21.0, 20.0, 12.0, 13.0, 5.0, 8.0, 9.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.9020448923110962, -1.8482508659362793, -1.7944567203521729, -1.740662693977356, -1.686868667602539, -1.6330745220184326, -1.5792804956436157, -1.5254864692687988, -1.4716923236846924, -1.4178982973098755, -1.364104151725769, -1.3103101253509521, -1.2565159797668457, -1.2027219533920288, -1.148927927017212, -1.0951337814331055, -1.0413397550582886, -0.9875456690788269, -0.9337515830993652, -0.8799575567245483, -0.8261634707450867, -0.772369384765625, -0.7185753583908081, -0.6647812724113464, -0.6109871864318848, -0.5571931004524231, -0.5033990144729614, -0.44960498809814453, -0.39581090211868286, -0.3420168161392212, -0.2882227599620819, -0.23442870378494263, -0.1806347370147705, -0.12684066593647003, -0.07304659485816956, -0.01925252377986908, 0.034541547298431396, 0.08833563327789307, 0.14212968945503235, 0.19592374563217163, 0.2497178316116333, 0.30351191759109497, 0.35730597376823425, 0.41110002994537354, 0.4648941159248352, 0.5186882019042969, 0.5724822282791138, 0.6262763142585754, 0.6800704002380371, 0.7338644862174988, 0.7876585721969604, 0.8414525985717773, 0.895246684551239, 0.9490407705307007, 1.0028347969055176, 1.056628942489624, 1.110422968864441, 1.1642169952392578, 1.2180111408233643, 1.2718051671981812, 1.325599193572998, 1.3793933391571045, 1.4331873655319214, 1.4869813919067383, 1.5407755374908447]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 9.0, 7.0, 13.0, 7.0, 20.0, 21.0, 22.0, 24.0, 33.0, 39.0, 40.0, 42.0, 55.0, 57.0, 65.0, 64.0, 59.0, 77.0, 50.0, 43.0, 56.0, 41.0, 32.0, 28.0, 26.0, 17.0, 20.0, 10.0, 7.0, 12.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9438296556472778, -1.8891737461090088, -1.8345178365707397, -1.7798619270324707, -1.725205898284912, -1.6705501079559326, -1.615894079208374, -1.561238169670105, -1.506582260131836, -1.451926350593567, -1.3972704410552979, -1.3426145315170288, -1.2879586219787598, -1.2333025932312012, -1.1786466836929321, -1.123990774154663, -1.069334864616394, -1.014678955078125, -0.960023045539856, -0.9053670763969421, -0.8507111668586731, -0.796055257320404, -0.7413992881774902, -0.6867433786392212, -0.6320874691009521, -0.5774315595626831, -0.5227756500244141, -0.46811968088150024, -0.4134637713432312, -0.35880786180496216, -0.3041519224643707, -0.2494959831237793, -0.1948399543762207, -0.14018402993679047, -0.08552810549736023, -0.030872181057929993, 0.023783743381500244, 0.07843965291976929, 0.13309559226036072, 0.18775153160095215, 0.2424074411392212, 0.29706335067749023, 0.35171929001808167, 0.4063752293586731, 0.46103113889694214, 0.5156870484352112, 0.570343017578125, 0.624998927116394, 0.6796548366546631, 0.7343107461929321, 0.7889666557312012, 0.843622624874115, 0.898278534412384, 0.9529344439506531, 1.007590413093567, 1.062246322631836, 1.116902232170105, 1.171558141708374, 1.226214051246643, 1.280869960784912, 1.3355259895324707, 1.3901817798614502, 1.4448378086090088, 1.4994937181472778, 1.5541496276855469]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 3.0, 6.0, 12.0, 8.0, 14.0, 11.0, 20.0, 23.0, 32.0, 52.0, 63.0, 95.0, 151.0, 224.0, 362.0, 627.0, 1211.0, 2528.0, 5774.0, 16431.0, 63905.0, 3995244.0, 76959.0, 18755.0, 6191.0, 2444.0, 1172.0, 722.0, 423.0, 238.0, 172.0, 104.0, 74.0, 63.0, 47.0, 31.0, 24.0, 21.0, 13.0, 7.0, 6.0, 5.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.6748046875, -0.656341552734375, -0.63787841796875, -0.619415283203125, -0.6009521484375, -0.582489013671875, -0.56402587890625, -0.545562744140625, -0.527099609375, -0.508636474609375, -0.49017333984375, -0.471710205078125, -0.4532470703125, -0.434783935546875, -0.41632080078125, -0.397857666015625, -0.37939453125, -0.360931396484375, -0.34246826171875, -0.324005126953125, -0.3055419921875, -0.287078857421875, -0.26861572265625, -0.250152587890625, -0.231689453125, -0.213226318359375, -0.19476318359375, -0.176300048828125, -0.1578369140625, -0.139373779296875, -0.12091064453125, -0.102447509765625, -0.083984375, -0.065521240234375, -0.04705810546875, -0.028594970703125, -0.0101318359375, 0.008331298828125, 0.02679443359375, 0.045257568359375, 0.063720703125, 0.082183837890625, 0.10064697265625, 0.119110107421875, 0.1375732421875, 0.156036376953125, 0.17449951171875, 0.192962646484375, 0.21142578125, 0.229888916015625, 0.24835205078125, 0.266815185546875, 0.2852783203125, 0.303741455078125, 0.32220458984375, 0.340667724609375, 0.359130859375, 0.377593994140625, 0.39605712890625, 0.414520263671875, 0.4329833984375, 0.451446533203125, 0.46990966796875, 0.488372802734375, 0.5068359375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 10.0, 16.0, 26.0, 21.0, 36.0, 48.0, 65.0, 86.0, 85.0, 100.0, 88.0, 79.0, 82.0, 72.0, 49.0, 53.0, 21.0, 23.0, 13.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.10479736328125, -0.10196590423583984, -0.09913444519042969, -0.09630298614501953, -0.09347152709960938, -0.09064006805419922, -0.08780860900878906, -0.0849771499633789, -0.08214569091796875, -0.0793142318725586, -0.07648277282714844, -0.07365131378173828, -0.07081985473632812, -0.06798839569091797, -0.06515693664550781, -0.062325477600097656, -0.0594940185546875, -0.056662559509277344, -0.05383110046386719, -0.05099964141845703, -0.048168182373046875, -0.04533672332763672, -0.04250526428222656, -0.039673805236816406, -0.03684234619140625, -0.034010887145996094, -0.031179428100585938, -0.02834796905517578, -0.025516510009765625, -0.02268505096435547, -0.019853591918945312, -0.017022132873535156, -0.014190673828125, -0.011359214782714844, -0.008527755737304688, -0.005696296691894531, -0.002864837646484375, -3.337860107421875e-05, 0.0027980804443359375, 0.005629539489746094, 0.00846099853515625, 0.011292457580566406, 0.014123916625976562, 0.01695537567138672, 0.019786834716796875, 0.02261829376220703, 0.025449752807617188, 0.028281211853027344, 0.0311126708984375, 0.033944129943847656, 0.03677558898925781, 0.03960704803466797, 0.042438507080078125, 0.04526996612548828, 0.04810142517089844, 0.050932884216308594, 0.05376434326171875, 0.056595802307128906, 0.05942726135253906, 0.06225872039794922, 0.06509017944335938, 0.06792163848876953, 0.07075309753417969, 0.07358455657958984, 0.076416015625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 7.0, 4.0, 15.0, 16.0, 17.0, 51.0, 75.0, 89.0, 155.0, 231.0, 379.0, 639.0, 1045.0, 1701.0, 3211.0, 5813.0, 11465.0, 26929.0, 87188.0, 3796128.0, 187727.0, 39440.0, 15630.0, 7339.0, 3793.0, 2106.0, 1256.0, 685.0, 403.0, 282.0, 153.0, 105.0, 73.0, 42.0, 32.0, 19.0, 13.0, 5.0, 3.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.386962890625, -0.373931884765625, -0.36090087890625, -0.347869873046875, -0.3348388671875, -0.321807861328125, -0.30877685546875, -0.295745849609375, -0.28271484375, -0.269683837890625, -0.25665283203125, -0.243621826171875, -0.2305908203125, -0.217559814453125, -0.20452880859375, -0.191497802734375, -0.178466796875, -0.165435791015625, -0.15240478515625, -0.139373779296875, -0.1263427734375, -0.113311767578125, -0.10028076171875, -0.087249755859375, -0.07421875, -0.061187744140625, -0.04815673828125, -0.035125732421875, -0.0220947265625, -0.009063720703125, 0.00396728515625, 0.016998291015625, 0.030029296875, 0.043060302734375, 0.05609130859375, 0.069122314453125, 0.0821533203125, 0.095184326171875, 0.10821533203125, 0.121246337890625, 0.13427734375, 0.147308349609375, 0.16033935546875, 0.173370361328125, 0.1864013671875, 0.199432373046875, 0.21246337890625, 0.225494384765625, 0.238525390625, 0.251556396484375, 0.26458740234375, 0.277618408203125, 0.2906494140625, 0.303680419921875, 0.31671142578125, 0.329742431640625, 0.3427734375, 0.355804443359375, 0.36883544921875, 0.381866455078125, 0.3948974609375, 0.407928466796875, 0.42095947265625, 0.433990478515625, 0.447021484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 6.0, 5.0, 6.0, 4.0, 1.0, 5.0, 14.0, 4.0, 13.0, 12.0, 17.0, 17.0, 24.0, 42.0, 40.0, 73.0, 188.0, 2868.0, 410.0, 100.0, 54.0, 38.0, 30.0, 23.0, 15.0, 6.0, 12.0, 7.0, 9.0, 9.0, 6.0, 8.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16455078125, -0.1593647003173828, -0.15417861938476562, -0.14899253845214844, -0.14380645751953125, -0.13862037658691406, -0.13343429565429688, -0.1282482147216797, -0.1230621337890625, -0.11787605285644531, -0.11268997192382812, -0.10750389099121094, -0.10231781005859375, -0.09713172912597656, -0.09194564819335938, -0.08675956726074219, -0.081573486328125, -0.07638740539550781, -0.07120132446289062, -0.06601524353027344, -0.06082916259765625, -0.05564308166503906, -0.050457000732421875, -0.04527091979980469, -0.0400848388671875, -0.03489875793457031, -0.029712677001953125, -0.024526596069335938, -0.01934051513671875, -0.014154434204101562, -0.008968353271484375, -0.0037822723388671875, 0.00140380859375, 0.0065898895263671875, 0.011775970458984375, 0.016962051391601562, 0.02214813232421875, 0.027334213256835938, 0.032520294189453125, 0.03770637512207031, 0.0428924560546875, 0.04807853698730469, 0.053264617919921875, 0.05845069885253906, 0.06363677978515625, 0.06882286071777344, 0.07400894165039062, 0.07919502258300781, 0.084381103515625, 0.08956718444824219, 0.09475326538085938, 0.09993934631347656, 0.10512542724609375, 0.11031150817871094, 0.11549758911132812, 0.12068367004394531, 0.1258697509765625, 0.1310558319091797, 0.13624191284179688, 0.14142799377441406, 0.14661407470703125, 0.15180015563964844, 0.15698623657226562, 0.1621723175048828, 0.1673583984375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 11.0, 10.0, 12.0, 16.0, 29.0, 47.0, 96.0, 243.0, 277.0, 126.0, 59.0, 32.0, 27.0, 10.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3315144777297974, -1.2873767614364624, -1.2432390451431274, -1.199101209640503, -1.154963493347168, -1.110825777053833, -1.066688060760498, -1.022550344467163, -0.9784125685691833, -0.9342748522758484, -0.8901370763778687, -0.8459993600845337, -0.8018616437911987, -0.757723867893219, -0.713586151599884, -0.6694483757019043, -0.6253106594085693, -0.5811729431152344, -0.5370351672172546, -0.4928974509239197, -0.44875970482826233, -0.404621958732605, -0.36048424243927, -0.31634649634361267, -0.2722087502479553, -0.22807100415229797, -0.18393327295780182, -0.13979554176330566, -0.09565779566764832, -0.05152004957199097, -0.007382333278656006, 0.03675541281700134, 0.08089303970336914, 0.1250307857990265, 0.16916851699352264, 0.2133062481880188, 0.25744399428367615, 0.3015817403793335, 0.34571945667266846, 0.3898572027683258, 0.43399494886398315, 0.4781326949596405, 0.5222704410552979, 0.5664081573486328, 0.6105458736419678, 0.6546836495399475, 0.6988213658332825, 0.7429591417312622, 0.7870968580245972, 0.8312345743179321, 0.8753723502159119, 0.9195100665092468, 0.9636478424072266, 1.0077855587005615, 1.0519232749938965, 1.0960609912872314, 1.1401987075805664, 1.1843364238739014, 1.2284741401672363, 1.2726118564605713, 1.3167496919631958, 1.3608874082565308, 1.4050251245498657, 1.4491628408432007, 1.4933006763458252]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 11.0, 6.0, 10.0, 12.0, 23.0, 25.0, 14.0, 22.0, 34.0, 35.0, 28.0, 38.0, 45.0, 39.0, 25.0, 50.0, 35.0, 35.0, 47.0, 44.0, 46.0, 51.0, 39.0, 38.0, 38.0, 25.0, 36.0, 31.0, 16.0, 18.0, 16.0, 10.0, 11.0, 11.0, 8.0, 11.0, 4.0, 3.0, 2.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47888320684432983, -0.4641132950782776, -0.44934338331222534, -0.4345734715461731, -0.41980355978012085, -0.4050336480140686, -0.39026373624801636, -0.3754937946796417, -0.3607238829135895, -0.34595397114753723, -0.331184059381485, -0.31641414761543274, -0.3016442358493805, -0.28687429428100586, -0.2721043825149536, -0.25733447074890137, -0.24256457388401031, -0.22779466211795807, -0.21302475035190582, -0.19825482368469238, -0.18348491191864014, -0.1687150001525879, -0.15394508838653564, -0.1391751766204834, -0.12440525740385056, -0.10963534563779831, -0.09486542642116547, -0.08009551465511322, -0.06532560288906097, -0.05055568367242813, -0.035785771906375885, -0.021015852689743042, -0.006245940923690796, 0.008523973636329174, 0.023293888196349144, 0.03806380182504654, 0.052833717316389084, 0.06760363280773163, 0.08237354457378387, 0.09714346379041672, 0.11191337555646896, 0.1266832947731018, 0.14145320653915405, 0.1562231183052063, 0.17099303007125854, 0.1857629418373108, 0.20053285360336304, 0.21530278027057648, 0.23007269203662872, 0.24484260380268097, 0.2596125304698944, 0.27438244223594666, 0.2891523540019989, 0.30392226576805115, 0.3186921775341034, 0.33346208930015564, 0.3482320010662079, 0.36300191283226013, 0.3777718245983124, 0.3925417363643646, 0.40731164813041687, 0.4220815896987915, 0.43685150146484375, 0.451621413230896, 0.46639132499694824]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 9.0, 8.0, 17.0, 23.0, 27.0, 35.0, 41.0, 51.0, 76.0, 120.0, 191.0, 240.0, 362.0, 483.0, 790.0, 1238.0, 2269.0, 4908.0, 11773.0, 33847.0, 122503.0, 594584.0, 197570.0, 48147.0, 15898.0, 6307.0, 2842.0, 1469.0, 823.0, 595.0, 344.0, 251.0, 210.0, 149.0, 91.0, 77.0, 51.0, 47.0, 15.0, 22.0, 13.0, 14.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.57958984375, -0.5628623962402344, -0.5461349487304688, -0.5294075012207031, -0.5126800537109375, -0.4959526062011719, -0.47922515869140625, -0.4624977111816406, -0.445770263671875, -0.4290428161621094, -0.41231536865234375, -0.3955879211425781, -0.3788604736328125, -0.3621330261230469, -0.34540557861328125, -0.3286781311035156, -0.31195068359375, -0.2952232360839844, -0.27849578857421875, -0.2617683410644531, -0.2450408935546875, -0.22831344604492188, -0.21158599853515625, -0.19485855102539062, -0.178131103515625, -0.16140365600585938, -0.14467620849609375, -0.12794876098632812, -0.1112213134765625, -0.09449386596679688, -0.07776641845703125, -0.061038970947265625, -0.0443115234375, -0.027584075927734375, -0.01085662841796875, 0.005870819091796875, 0.0225982666015625, 0.039325714111328125, 0.05605316162109375, 0.07278060913085938, 0.089508056640625, 0.10623550415039062, 0.12296295166015625, 0.13969039916992188, 0.1564178466796875, 0.17314529418945312, 0.18987274169921875, 0.20660018920898438, 0.22332763671875, 0.24005508422851562, 0.25678253173828125, 0.2735099792480469, 0.2902374267578125, 0.3069648742675781, 0.32369232177734375, 0.3404197692871094, 0.357147216796875, 0.3738746643066406, 0.39060211181640625, 0.4073295593261719, 0.4240570068359375, 0.4407844543457031, 0.45751190185546875, 0.4742393493652344, 0.490966796875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 9.0, 14.0, 26.0, 35.0, 38.0, 51.0, 74.0, 84.0, 100.0, 108.0, 95.0, 82.0, 86.0, 51.0, 45.0, 36.0, 23.0, 14.0, 10.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.11126708984375, -0.10829734802246094, -0.10532760620117188, -0.10235786437988281, -0.09938812255859375, -0.09641838073730469, -0.09344863891601562, -0.09047889709472656, -0.0875091552734375, -0.08453941345214844, -0.08156967163085938, -0.07859992980957031, -0.07563018798828125, -0.07266044616699219, -0.06969070434570312, -0.06672096252441406, -0.063751220703125, -0.06078147888183594, -0.057811737060546875, -0.05484199523925781, -0.05187225341796875, -0.04890251159667969, -0.045932769775390625, -0.04296302795410156, -0.0399932861328125, -0.03702354431152344, -0.034053802490234375, -0.031084060668945312, -0.02811431884765625, -0.025144577026367188, -0.022174835205078125, -0.019205093383789062, -0.0162353515625, -0.013265609741210938, -0.010295867919921875, -0.0073261260986328125, -0.00435638427734375, -0.0013866424560546875, 0.001583099365234375, 0.0045528411865234375, 0.0075225830078125, 0.010492324829101562, 0.013462066650390625, 0.016431808471679688, 0.01940155029296875, 0.022371292114257812, 0.025341033935546875, 0.028310775756835938, 0.031280517578125, 0.03425025939941406, 0.037220001220703125, 0.04018974304199219, 0.04315948486328125, 0.04612922668457031, 0.049098968505859375, 0.05206871032714844, 0.0550384521484375, 0.05800819396972656, 0.060977935791015625, 0.06394767761230469, 0.06691741943359375, 0.06988716125488281, 0.07285690307617188, 0.07582664489746094, 0.07879638671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 10.0, 8.0, 6.0, 11.0, 28.0, 17.0, 48.0, 50.0, 82.0, 128.0, 201.0, 253.0, 425.0, 649.0, 1063.0, 1626.0, 2679.0, 4369.0, 7239.0, 12394.0, 21606.0, 37416.0, 69839.0, 139504.0, 339494.0, 203219.0, 91514.0, 48760.0, 27047.0, 15523.0, 9176.0, 5395.0, 3243.0, 1968.0, 1228.0, 821.0, 476.0, 329.0, 220.0, 123.0, 116.0, 78.0, 51.0, 26.0, 28.0, 17.0, 17.0, 24.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.2308349609375, -0.2241840362548828, -0.21753311157226562, -0.21088218688964844, -0.20423126220703125, -0.19758033752441406, -0.19092941284179688, -0.1842784881591797, -0.1776275634765625, -0.1709766387939453, -0.16432571411132812, -0.15767478942871094, -0.15102386474609375, -0.14437294006347656, -0.13772201538085938, -0.1310710906982422, -0.124420166015625, -0.11776924133300781, -0.11111831665039062, -0.10446739196777344, -0.09781646728515625, -0.09116554260253906, -0.08451461791992188, -0.07786369323730469, -0.0712127685546875, -0.06456184387207031, -0.057910919189453125, -0.05125999450683594, -0.04460906982421875, -0.03795814514160156, -0.031307220458984375, -0.024656295776367188, -0.01800537109375, -0.011354446411132812, -0.004703521728515625, 0.0019474029541015625, 0.00859832763671875, 0.015249252319335938, 0.021900177001953125, 0.028551101684570312, 0.0352020263671875, 0.04185295104980469, 0.048503875732421875, 0.05515480041503906, 0.06180572509765625, 0.06845664978027344, 0.07510757446289062, 0.08175849914550781, 0.088409423828125, 0.09506034851074219, 0.10171127319335938, 0.10836219787597656, 0.11501312255859375, 0.12166404724121094, 0.12831497192382812, 0.1349658966064453, 0.1416168212890625, 0.1482677459716797, 0.15491867065429688, 0.16156959533691406, 0.16822052001953125, 0.17487144470214844, 0.18152236938476562, 0.1881732940673828, 0.19482421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 4.0, 3.0, 6.0, 4.0, 8.0, 10.0, 15.0, 11.0, 14.0, 21.0, 23.0, 27.0, 23.0, 38.0, 32.0, 29.0, 39.0, 32.0, 38.0, 30.0, 44.0, 42.0, 39.0, 42.0, 35.0, 31.0, 32.0, 37.0, 42.0, 36.0, 28.0, 25.0, 31.0, 21.0, 20.0, 21.0, 9.0, 12.0, 10.0, 9.0, 12.0, 4.0, 3.0, 7.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.19287109375, -0.1863384246826172, -0.17980575561523438, -0.17327308654785156, -0.16674041748046875, -0.16020774841308594, -0.15367507934570312, -0.1471424102783203, -0.1406097412109375, -0.1340770721435547, -0.12754440307617188, -0.12101173400878906, -0.11447906494140625, -0.10794639587402344, -0.10141372680664062, -0.09488105773925781, -0.088348388671875, -0.08181571960449219, -0.07528305053710938, -0.06875038146972656, -0.06221771240234375, -0.05568504333496094, -0.049152374267578125, -0.04261970520019531, -0.0360870361328125, -0.029554367065429688, -0.023021697998046875, -0.016489028930664062, -0.00995635986328125, -0.0034236907958984375, 0.003108978271484375, 0.009641647338867188, 0.01617431640625, 0.022706985473632812, 0.029239654541015625, 0.03577232360839844, 0.04230499267578125, 0.04883766174316406, 0.055370330810546875, 0.06190299987792969, 0.0684356689453125, 0.07496833801269531, 0.08150100708007812, 0.08803367614746094, 0.09456634521484375, 0.10109901428222656, 0.10763168334960938, 0.11416435241699219, 0.120697021484375, 0.1272296905517578, 0.13376235961914062, 0.14029502868652344, 0.14682769775390625, 0.15336036682128906, 0.15989303588867188, 0.1664257049560547, 0.1729583740234375, 0.1794910430908203, 0.18602371215820312, 0.19255638122558594, 0.19908905029296875, 0.20562171936035156, 0.21215438842773438, 0.2186870574951172, 0.2252197265625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 6.0, 21.0, 22.0, 38.0, 54.0, 104.0, 165.0, 347.0, 709.0, 1591.0, 4315.0, 13584.0, 58385.0, 591348.0, 320637.0, 40658.0, 10426.0, 3491.0, 1347.0, 590.0, 324.0, 145.0, 92.0, 50.0, 40.0, 21.0, 12.0, 10.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06744384765625, -0.06518745422363281, -0.06293106079101562, -0.06067466735839844, -0.05841827392578125, -0.05616188049316406, -0.053905487060546875, -0.05164909362792969, -0.0493927001953125, -0.04713630676269531, -0.044879913330078125, -0.04262351989746094, -0.04036712646484375, -0.03811073303222656, -0.035854339599609375, -0.03359794616699219, -0.031341552734375, -0.029085159301757812, -0.026828765869140625, -0.024572372436523438, -0.02231597900390625, -0.020059585571289062, -0.017803192138671875, -0.015546798706054688, -0.0132904052734375, -0.011034011840820312, -0.008777618408203125, -0.0065212249755859375, -0.00426483154296875, -0.0020084381103515625, 0.000247955322265625, 0.0025043487548828125, 0.0047607421875, 0.0070171356201171875, 0.009273529052734375, 0.011529922485351562, 0.01378631591796875, 0.016042709350585938, 0.018299102783203125, 0.020555496215820312, 0.0228118896484375, 0.025068283081054688, 0.027324676513671875, 0.029581069946289062, 0.03183746337890625, 0.03409385681152344, 0.036350250244140625, 0.03860664367675781, 0.040863037109375, 0.04311943054199219, 0.045375823974609375, 0.04763221740722656, 0.04988861083984375, 0.05214500427246094, 0.054401397705078125, 0.05665779113769531, 0.0589141845703125, 0.06117057800292969, 0.06342697143554688, 0.06568336486816406, 0.06793975830078125, 0.07019615173339844, 0.07245254516601562, 0.07470893859863281, 0.07696533203125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 10.0, 7.0, 9.0, 21.0, 14.0, 41.0, 34.0, 59.0, 58.0, 110.0, 67.0, 126.0, 74.0, 87.0, 63.0, 69.0, 41.0, 39.0, 14.0, 21.0, 11.0, 6.0, 3.0, 0.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.185604095458984e-06, -4.975125193595886e-06, -4.764646291732788e-06, -4.55416738986969e-06, -4.343688488006592e-06, -4.133209586143494e-06, -3.9227306842803955e-06, -3.7122517824172974e-06, -3.5017728805541992e-06, -3.291293978691101e-06, -3.080815076828003e-06, -2.8703361749649048e-06, -2.6598572731018066e-06, -2.4493783712387085e-06, -2.2388994693756104e-06, -2.028420567512512e-06, -1.817941665649414e-06, -1.607462763786316e-06, -1.3969838619232178e-06, -1.1865049600601196e-06, -9.760260581970215e-07, -7.655471563339233e-07, -5.550682544708252e-07, -3.4458935260772705e-07, -1.341104507446289e-07, 7.636845111846924e-08, 2.868473529815674e-07, 4.973262548446655e-07, 7.078051567077637e-07, 9.182840585708618e-07, 1.12876296043396e-06, 1.339241862297058e-06, 1.5497207641601562e-06, 1.7601996660232544e-06, 1.9706785678863525e-06, 2.1811574697494507e-06, 2.391636371612549e-06, 2.602115273475647e-06, 2.812594175338745e-06, 3.0230730772018433e-06, 3.2335519790649414e-06, 3.4440308809280396e-06, 3.6545097827911377e-06, 3.864988684654236e-06, 4.075467586517334e-06, 4.285946488380432e-06, 4.49642539024353e-06, 4.706904292106628e-06, 4.9173831939697266e-06, 5.127862095832825e-06, 5.338340997695923e-06, 5.548819899559021e-06, 5.759298801422119e-06, 5.969777703285217e-06, 6.1802566051483154e-06, 6.3907355070114136e-06, 6.601214408874512e-06, 6.81169331073761e-06, 7.022172212600708e-06, 7.232651114463806e-06, 7.443130016326904e-06, 7.653608918190002e-06, 7.8640878200531e-06, 8.074566721916199e-06, 8.285045623779297e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 7.0, 6.0, 11.0, 14.0, 20.0, 28.0, 32.0, 52.0, 80.0, 154.0, 249.0, 385.0, 768.0, 1396.0, 2828.0, 6506.0, 19332.0, 80907.0, 609188.0, 261177.0, 43839.0, 12142.0, 4668.0, 2188.0, 1069.0, 599.0, 295.0, 185.0, 139.0, 99.0, 53.0, 33.0, 28.0, 15.0, 20.0, 10.0, 11.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0469970703125, -0.04530668258666992, -0.043616294860839844, -0.041925907135009766, -0.04023551940917969, -0.03854513168334961, -0.03685474395751953, -0.03516435623168945, -0.033473968505859375, -0.0317835807800293, -0.03009319305419922, -0.02840280532836914, -0.026712417602539062, -0.025022029876708984, -0.023331642150878906, -0.021641254425048828, -0.01995086669921875, -0.018260478973388672, -0.016570091247558594, -0.014879703521728516, -0.013189315795898438, -0.01149892807006836, -0.009808540344238281, -0.008118152618408203, -0.006427764892578125, -0.004737377166748047, -0.0030469894409179688, -0.0013566017150878906, 0.0003337860107421875, 0.0020241737365722656, 0.0037145614624023438, 0.005404949188232422, 0.0070953369140625, 0.008785724639892578, 0.010476112365722656, 0.012166500091552734, 0.013856887817382812, 0.01554727554321289, 0.01723766326904297, 0.018928050994873047, 0.020618438720703125, 0.022308826446533203, 0.02399921417236328, 0.02568960189819336, 0.027379989624023438, 0.029070377349853516, 0.030760765075683594, 0.03245115280151367, 0.03414154052734375, 0.03583192825317383, 0.037522315979003906, 0.039212703704833984, 0.04090309143066406, 0.04259347915649414, 0.04428386688232422, 0.0459742546081543, 0.047664642333984375, 0.04935503005981445, 0.05104541778564453, 0.05273580551147461, 0.05442619323730469, 0.056116580963134766, 0.057806968688964844, 0.05949735641479492, 0.061187744140625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 6.0, 2.0, 7.0, 5.0, 7.0, 11.0, 11.0, 24.0, 34.0, 46.0, 94.0, 85.0, 115.0, 131.0, 100.0, 77.0, 72.0, 61.0, 37.0, 28.0, 18.0, 13.0, 2.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.06036376953125, -0.05891275405883789, -0.05746173858642578, -0.05601072311401367, -0.05455970764160156, -0.05310869216918945, -0.051657676696777344, -0.050206661224365234, -0.048755645751953125, -0.047304630279541016, -0.045853614807128906, -0.0444025993347168, -0.04295158386230469, -0.04150056838989258, -0.04004955291748047, -0.03859853744506836, -0.03714752197265625, -0.03569650650024414, -0.03424549102783203, -0.03279447555541992, -0.03134346008300781, -0.029892444610595703, -0.028441429138183594, -0.026990413665771484, -0.025539398193359375, -0.024088382720947266, -0.022637367248535156, -0.021186351776123047, -0.019735336303710938, -0.018284320831298828, -0.01683330535888672, -0.01538228988647461, -0.0139312744140625, -0.01248025894165039, -0.011029243469238281, -0.009578227996826172, -0.008127212524414062, -0.006676197052001953, -0.005225181579589844, -0.0037741661071777344, -0.002323150634765625, -0.0008721351623535156, 0.0005788803100585938, 0.002029895782470703, 0.0034809112548828125, 0.004931926727294922, 0.006382942199707031, 0.00783395767211914, 0.00928497314453125, 0.01073598861694336, 0.012187004089355469, 0.013638019561767578, 0.015089035034179688, 0.016540050506591797, 0.017991065979003906, 0.019442081451416016, 0.020893096923828125, 0.022344112396240234, 0.023795127868652344, 0.025246143341064453, 0.026697158813476562, 0.028148174285888672, 0.02959918975830078, 0.03105020523071289, 0.032501220703125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 4.0, 8.0, 5.0, 7.0, 6.0, 8.0, 10.0, 13.0, 11.0, 28.0, 34.0, 43.0, 67.0, 95.0, 161.0, 157.0, 94.0, 54.0, 51.0, 25.0, 31.0, 17.0, 13.0, 16.0, 12.0, 7.0, 6.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.9880999326705933, -1.9384679794311523, -1.8888359069824219, -1.839203953742981, -1.78957200050354, -1.7399399280548096, -1.6903079748153687, -1.6406760215759277, -1.5910439491271973, -1.5414119958877563, -1.4917799234390259, -1.442147970199585, -1.3925158977508545, -1.3428839445114136, -1.2932519912719727, -1.2436199188232422, -1.1939879655838013, -1.1443560123443604, -1.0947239398956299, -1.045091986656189, -0.9954599738121033, -0.9458279609680176, -0.8961960077285767, -0.846563994884491, -0.7969319820404053, -0.7472999691963196, -0.6976679563522339, -0.648036003112793, -0.5984039902687073, -0.5487719774246216, -0.4991399943828583, -0.44950801134109497, -0.3998759984970093, -0.3502439856529236, -0.3006120026111603, -0.250980019569397, -0.20134800672531128, -0.15171600878238678, -0.10208401083946228, -0.052452027797698975, -0.0028200149536132812, 0.04681198298931122, 0.09644398093223572, 0.14607597887516022, 0.19570797681808472, 0.24533997476100922, 0.2949719727039337, 0.344603955745697, 0.3942359685897827, 0.4438679814338684, 0.4934999644756317, 0.543131947517395, 0.5927639603614807, 0.6423959732055664, 0.6920279264450073, 0.741659939289093, 0.7912919521331787, 0.8409239649772644, 0.8905559778213501, 0.940187931060791, 0.9898199439048767, 1.0394519567489624, 1.0890839099884033, 1.1387159824371338, 1.1883479356765747]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 7.0, 2.0, 5.0, 14.0, 17.0, 19.0, 17.0, 16.0, 27.0, 26.0, 33.0, 26.0, 31.0, 44.0, 43.0, 38.0, 49.0, 49.0, 40.0, 45.0, 44.0, 52.0, 41.0, 30.0, 35.0, 40.0, 27.0, 33.0, 29.0, 24.0, 21.0, 13.0, 8.0, 6.0, 9.0, 8.0, 3.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1409417390823364, -1.1033849716186523, -1.0658283233642578, -1.0282715559005737, -0.9907148480415344, -0.9531581401824951, -0.915601372718811, -0.8780446648597717, -0.8404879570007324, -0.8029312491416931, -0.7653745412826538, -0.7278177738189697, -0.6902610659599304, -0.6527043581008911, -0.615147590637207, -0.5775908827781677, -0.5400341749191284, -0.5024774670600891, -0.4649207293987274, -0.4273639917373657, -0.3898072838783264, -0.3522505760192871, -0.3146938383579254, -0.2771371006965637, -0.23958039283752441, -0.2020236700773239, -0.1644669473171234, -0.1269102245569229, -0.08935350179672241, -0.05179677903652191, -0.014240056276321411, 0.023316681385040283, 0.06087338924407959, 0.09843011200428009, 0.1359868347644806, 0.1735435575246811, 0.2111002802848816, 0.2486570030450821, 0.2862137258052826, 0.3237704634666443, 0.3613271713256836, 0.3988838791847229, 0.4364406168460846, 0.4739973545074463, 0.5115540623664856, 0.5491107702255249, 0.586667537689209, 0.6242242455482483, 0.6617809534072876, 0.6993376612663269, 0.7368943691253662, 0.7744511365890503, 0.8120078444480896, 0.8495645523071289, 0.887121319770813, 0.9246780276298523, 0.9622347354888916, 0.9997914433479309, 1.0373481512069702, 1.0749049186706543, 1.1124615669250488, 1.150018334388733, 1.187575101852417, 1.2251317501068115, 1.2626885175704956]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 10.0, 9.0, 13.0, 12.0, 21.0, 28.0, 37.0, 46.0, 78.0, 100.0, 167.0, 298.0, 540.0, 1052.0, 2205.0, 5686.0, 18383.0, 4016786.0, 126953.0, 13746.0, 4372.0, 1731.0, 783.0, 447.0, 248.0, 162.0, 92.0, 79.0, 55.0, 38.0, 17.0, 16.0, 14.0, 11.0, 9.0, 7.0, 9.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.89013671875, -0.8660125732421875, -0.841888427734375, -0.8177642822265625, -0.79364013671875, -0.7695159912109375, -0.745391845703125, -0.7212677001953125, -0.6971435546875, -0.6730194091796875, -0.648895263671875, -0.6247711181640625, -0.60064697265625, -0.5765228271484375, -0.552398681640625, -0.5282745361328125, -0.504150390625, -0.4800262451171875, -0.455902099609375, -0.4317779541015625, -0.40765380859375, -0.3835296630859375, -0.359405517578125, -0.3352813720703125, -0.3111572265625, -0.2870330810546875, -0.262908935546875, -0.2387847900390625, -0.21466064453125, -0.1905364990234375, -0.166412353515625, -0.1422882080078125, -0.1181640625, -0.0940399169921875, -0.069915771484375, -0.0457916259765625, -0.02166748046875, 0.0024566650390625, 0.026580810546875, 0.0507049560546875, 0.0748291015625, 0.0989532470703125, 0.123077392578125, 0.1472015380859375, 0.17132568359375, 0.1954498291015625, 0.219573974609375, 0.2436981201171875, 0.267822265625, 0.2919464111328125, 0.316070556640625, 0.3401947021484375, 0.36431884765625, 0.3884429931640625, 0.412567138671875, 0.4366912841796875, 0.4608154296875, 0.4849395751953125, 0.509063720703125, 0.5331878662109375, 0.55731201171875, 0.5814361572265625, 0.605560302734375, 0.6296844482421875, 0.65380859375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 11.0, 4.0, 10.0, 28.0, 36.0, 38.0, 49.0, 72.0, 70.0, 88.0, 96.0, 116.0, 90.0, 84.0, 63.0, 41.0, 34.0, 23.0, 16.0, 11.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.11328125, -0.1102752685546875, -0.107269287109375, -0.1042633056640625, -0.10125732421875, -0.0982513427734375, -0.095245361328125, -0.0922393798828125, -0.0892333984375, -0.0862274169921875, -0.083221435546875, -0.0802154541015625, -0.07720947265625, -0.0742034912109375, -0.071197509765625, -0.0681915283203125, -0.065185546875, -0.0621795654296875, -0.059173583984375, -0.0561676025390625, -0.05316162109375, -0.0501556396484375, -0.047149658203125, -0.0441436767578125, -0.0411376953125, -0.0381317138671875, -0.035125732421875, -0.0321197509765625, -0.02911376953125, -0.0261077880859375, -0.023101806640625, -0.0200958251953125, -0.01708984375, -0.0140838623046875, -0.011077880859375, -0.0080718994140625, -0.00506591796875, -0.0020599365234375, 0.000946044921875, 0.0039520263671875, 0.0069580078125, 0.0099639892578125, 0.012969970703125, 0.0159759521484375, 0.01898193359375, 0.0219879150390625, 0.024993896484375, 0.0279998779296875, 0.031005859375, 0.0340118408203125, 0.037017822265625, 0.0400238037109375, 0.04302978515625, 0.0460357666015625, 0.049041748046875, 0.0520477294921875, 0.0550537109375, 0.0580596923828125, 0.061065673828125, 0.0640716552734375, 0.06707763671875, 0.0700836181640625, 0.073089599609375, 0.0760955810546875, 0.0791015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 2.0, 9.0, 15.0, 21.0, 31.0, 33.0, 54.0, 70.0, 106.0, 139.0, 195.0, 307.0, 490.0, 729.0, 1268.0, 2372.0, 5071.0, 11959.0, 33167.0, 592982.0, 3486395.0, 35345.0, 12337.0, 5165.0, 2404.0, 1273.0, 778.0, 489.0, 316.0, 204.0, 149.0, 108.0, 78.0, 57.0, 48.0, 21.0, 24.0, 19.0, 13.0, 11.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4541015625, -0.4394645690917969, -0.42482757568359375, -0.4101905822753906, -0.3955535888671875, -0.3809165954589844, -0.36627960205078125, -0.3516426086425781, -0.337005615234375, -0.3223686218261719, -0.30773162841796875, -0.2930946350097656, -0.2784576416015625, -0.2638206481933594, -0.24918365478515625, -0.23454666137695312, -0.21990966796875, -0.20527267456054688, -0.19063568115234375, -0.17599868774414062, -0.1613616943359375, -0.14672470092773438, -0.13208770751953125, -0.11745071411132812, -0.102813720703125, -0.08817672729492188, -0.07353973388671875, -0.058902740478515625, -0.0442657470703125, -0.029628753662109375, -0.01499176025390625, -0.000354766845703125, 0.0142822265625, 0.028919219970703125, 0.04355621337890625, 0.058193206787109375, 0.0728302001953125, 0.08746719360351562, 0.10210418701171875, 0.11674118041992188, 0.131378173828125, 0.14601516723632812, 0.16065216064453125, 0.17528915405273438, 0.1899261474609375, 0.20456314086914062, 0.21920013427734375, 0.23383712768554688, 0.24847412109375, 0.2631111145019531, 0.27774810791015625, 0.2923851013183594, 0.3070220947265625, 0.3216590881347656, 0.33629608154296875, 0.3509330749511719, 0.365570068359375, 0.3802070617675781, 0.39484405517578125, 0.4094810485839844, 0.4241180419921875, 0.4387550354003906, 0.45339202880859375, 0.4680290222167969, 0.482666015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 13.0, 4.0, 18.0, 12.0, 19.0, 22.0, 25.0, 45.0, 445.0, 3249.0, 92.0, 38.0, 23.0, 18.0, 11.0, 11.0, 10.0, 9.0, 6.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.220703125, -0.21404266357421875, -0.2073822021484375, -0.20072174072265625, -0.194061279296875, -0.18740081787109375, -0.1807403564453125, -0.17407989501953125, -0.16741943359375, -0.16075897216796875, -0.1540985107421875, -0.14743804931640625, -0.140777587890625, -0.13411712646484375, -0.1274566650390625, -0.12079620361328125, -0.1141357421875, -0.10747528076171875, -0.1008148193359375, -0.09415435791015625, -0.087493896484375, -0.08083343505859375, -0.0741729736328125, -0.06751251220703125, -0.06085205078125, -0.05419158935546875, -0.0475311279296875, -0.04087066650390625, -0.034210205078125, -0.02754974365234375, -0.0208892822265625, -0.01422882080078125, -0.007568359375, -0.00090789794921875, 0.0057525634765625, 0.01241302490234375, 0.019073486328125, 0.02573394775390625, 0.0323944091796875, 0.03905487060546875, 0.04571533203125, 0.05237579345703125, 0.0590362548828125, 0.06569671630859375, 0.072357177734375, 0.07901763916015625, 0.0856781005859375, 0.09233856201171875, 0.0989990234375, 0.10565948486328125, 0.1123199462890625, 0.11898040771484375, 0.125640869140625, 0.13230133056640625, 0.1389617919921875, 0.14562225341796875, 0.15228271484375, 0.15894317626953125, 0.1656036376953125, 0.17226409912109375, 0.178924560546875, 0.18558502197265625, 0.1922454833984375, 0.19890594482421875, 0.20556640625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 0.0, 6.0, 8.0, 6.0, 12.0, 10.0, 21.0, 22.0, 29.0, 38.0, 48.0, 68.0, 103.0, 166.0, 117.0, 93.0, 57.0, 39.0, 37.0, 19.0, 20.0, 14.0, 10.0, 10.0, 5.0, 9.0, 4.0, 7.0, 1.0, 4.0, 6.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48110878467559814, -0.46492162346839905, -0.44873446226119995, -0.43254727125167847, -0.41636011004447937, -0.4001729488372803, -0.3839857578277588, -0.3677985966205597, -0.3516114354133606, -0.3354242742061615, -0.3192371129989624, -0.3030499219894409, -0.2868627607822418, -0.2706755995750427, -0.25448840856552124, -0.23830124735832214, -0.22211408615112305, -0.20592692494392395, -0.18973974883556366, -0.17355257272720337, -0.15736541152000427, -0.14117825031280518, -0.12499107420444489, -0.10880390554666519, -0.0926167368888855, -0.0764295682311058, -0.06024239957332611, -0.04405523091554642, -0.027868062257766724, -0.01168089359998703, 0.004506275057792664, 0.020693443715572357, 0.03688061237335205, 0.053067781031131744, 0.06925494968891144, 0.08544211834669113, 0.10162928700447083, 0.11781645566225052, 0.1340036243200302, 0.1501908004283905, 0.1663779616355896, 0.1825651228427887, 0.198752298951149, 0.21493947505950928, 0.23112663626670837, 0.24731379747390747, 0.26350098848342896, 0.27968814969062805, 0.29587531089782715, 0.31206247210502625, 0.32824963331222534, 0.3444368243217468, 0.3606239855289459, 0.376811146736145, 0.3929983377456665, 0.4091854989528656, 0.4253726601600647, 0.4415598213672638, 0.4577469825744629, 0.4739341735839844, 0.49012133479118347, 0.5063084959983826, 0.522495687007904, 0.5386828184127808, 0.5548700094223022]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 11.0, 9.0, 6.0, 8.0, 8.0, 9.0, 18.0, 28.0, 13.0, 24.0, 30.0, 40.0, 37.0, 21.0, 39.0, 43.0, 48.0, 50.0, 37.0, 61.0, 39.0, 43.0, 38.0, 52.0, 40.0, 29.0, 33.0, 31.0, 23.0, 24.0, 26.0, 8.0, 15.0, 19.0, 13.0, 6.0, 10.0, 4.0, 6.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38308626413345337, -0.37010782957077026, -0.35712939500808716, -0.34415096044540405, -0.33117252588272095, -0.31819409132003784, -0.30521565675735474, -0.29223722219467163, -0.2792587876319885, -0.2662803530693054, -0.2533019185066223, -0.2403234839439392, -0.2273450493812561, -0.214366614818573, -0.2013881951570511, -0.18840976059436798, -0.17543134093284607, -0.16245290637016296, -0.14947447180747986, -0.13649603724479675, -0.12351761013269424, -0.11053917557001114, -0.09756074845790863, -0.08458231389522552, -0.07160387933254242, -0.058625444769859314, -0.04564701393246651, -0.0326685830950737, -0.019690148532390594, -0.006711713969707489, 0.0062667131423950195, 0.019245147705078125, 0.03222358226776123, 0.045202016830444336, 0.05818044766783714, 0.07115887850522995, 0.08413731306791306, 0.09711574763059616, 0.11009417474269867, 0.12307260930538177, 0.13605104386806488, 0.14902947843074799, 0.1620079129934311, 0.174986332654953, 0.1879647672176361, 0.2009432017803192, 0.21392163634300232, 0.22690007090568542, 0.23987850546836853, 0.25285694003105164, 0.26583537459373474, 0.27881380915641785, 0.29179224371910095, 0.30477067828178406, 0.3177490830421448, 0.3307275176048279, 0.343705952167511, 0.3566843867301941, 0.3696628212928772, 0.3826412558555603, 0.3956196904182434, 0.4085981249809265, 0.4215765595436096, 0.4345549941062927, 0.44753342866897583]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 8.0, 18.0, 15.0, 25.0, 26.0, 49.0, 51.0, 72.0, 100.0, 152.0, 212.0, 258.0, 372.0, 542.0, 843.0, 1320.0, 2525.0, 4947.0, 11253.0, 28405.0, 82188.0, 402195.0, 382182.0, 80294.0, 28005.0, 11190.0, 4908.0, 2315.0, 1366.0, 800.0, 530.0, 368.0, 288.0, 196.0, 140.0, 115.0, 66.0, 52.0, 41.0, 29.0, 23.0, 17.0, 16.0, 11.0, 7.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.44384765625, -0.4303932189941406, -0.41693878173828125, -0.4034843444824219, -0.3900299072265625, -0.3765754699707031, -0.36312103271484375, -0.3496665954589844, -0.336212158203125, -0.3227577209472656, -0.30930328369140625, -0.2958488464355469, -0.2823944091796875, -0.2689399719238281, -0.25548553466796875, -0.24203109741210938, -0.22857666015625, -0.21512222290039062, -0.20166778564453125, -0.18821334838867188, -0.1747589111328125, -0.16130447387695312, -0.14785003662109375, -0.13439559936523438, -0.120941162109375, -0.10748672485351562, -0.09403228759765625, -0.08057785034179688, -0.0671234130859375, -0.053668975830078125, -0.04021453857421875, -0.026760101318359375, -0.0133056640625, 0.000148773193359375, 0.01360321044921875, 0.027057647705078125, 0.0405120849609375, 0.053966522216796875, 0.06742095947265625, 0.08087539672851562, 0.094329833984375, 0.10778427124023438, 0.12123870849609375, 0.13469314575195312, 0.1481475830078125, 0.16160202026367188, 0.17505645751953125, 0.18851089477539062, 0.20196533203125, 0.21541976928710938, 0.22887420654296875, 0.24232864379882812, 0.2557830810546875, 0.2692375183105469, 0.28269195556640625, 0.2961463928222656, 0.309600830078125, 0.3230552673339844, 0.33650970458984375, 0.3499641418457031, 0.3634185791015625, 0.3768730163574219, 0.39032745361328125, 0.4037818908691406, 0.417236328125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 10.0, 9.0, 16.0, 29.0, 36.0, 51.0, 67.0, 57.0, 103.0, 103.0, 109.0, 90.0, 87.0, 71.0, 58.0, 34.0, 19.0, 23.0, 13.0, 3.0, 0.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11663818359375, -0.11349010467529297, -0.11034202575683594, -0.1071939468383789, -0.10404586791992188, -0.10089778900146484, -0.09774971008300781, -0.09460163116455078, -0.09145355224609375, -0.08830547332763672, -0.08515739440917969, -0.08200931549072266, -0.07886123657226562, -0.0757131576538086, -0.07256507873535156, -0.06941699981689453, -0.0662689208984375, -0.06312084197998047, -0.05997276306152344, -0.056824684143066406, -0.053676605224609375, -0.050528526306152344, -0.04738044738769531, -0.04423236846923828, -0.04108428955078125, -0.03793621063232422, -0.03478813171386719, -0.031640052795410156, -0.028491973876953125, -0.025343894958496094, -0.022195816040039062, -0.01904773712158203, -0.015899658203125, -0.012751579284667969, -0.009603500366210938, -0.006455421447753906, -0.003307342529296875, -0.00015926361083984375, 0.0029888153076171875, 0.006136894226074219, 0.00928497314453125, 0.012433052062988281, 0.015581130981445312, 0.018729209899902344, 0.021877288818359375, 0.025025367736816406, 0.028173446655273438, 0.03132152557373047, 0.0344696044921875, 0.03761768341064453, 0.04076576232910156, 0.043913841247558594, 0.047061920166015625, 0.050209999084472656, 0.05335807800292969, 0.05650615692138672, 0.05965423583984375, 0.06280231475830078, 0.06595039367675781, 0.06909847259521484, 0.07224655151367188, 0.0753946304321289, 0.07854270935058594, 0.08169078826904297, 0.0848388671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 8.0, 8.0, 18.0, 16.0, 31.0, 51.0, 73.0, 107.0, 144.0, 218.0, 320.0, 477.0, 839.0, 1227.0, 1987.0, 3297.0, 5563.0, 9432.0, 16254.0, 29132.0, 56064.0, 125555.0, 385737.0, 232877.0, 83866.0, 41499.0, 22296.0, 12577.0, 7412.0, 4378.0, 2549.0, 1603.0, 1032.0, 655.0, 402.0, 252.0, 193.0, 121.0, 95.0, 57.0, 35.0, 37.0, 10.0, 16.0, 9.0, 4.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1956787109375, -0.18951988220214844, -0.18336105346679688, -0.1772022247314453, -0.17104339599609375, -0.1648845672607422, -0.15872573852539062, -0.15256690979003906, -0.1464080810546875, -0.14024925231933594, -0.13409042358398438, -0.1279315948486328, -0.12177276611328125, -0.11561393737792969, -0.10945510864257812, -0.10329627990722656, -0.097137451171875, -0.09097862243652344, -0.08481979370117188, -0.07866096496582031, -0.07250213623046875, -0.06634330749511719, -0.060184478759765625, -0.05402565002441406, -0.0478668212890625, -0.04170799255371094, -0.035549163818359375, -0.029390335083007812, -0.02323150634765625, -0.017072677612304688, -0.010913848876953125, -0.0047550201416015625, 0.00140380859375, 0.0075626373291015625, 0.013721466064453125, 0.019880294799804688, 0.02603912353515625, 0.03219795227050781, 0.038356781005859375, 0.04451560974121094, 0.0506744384765625, 0.05683326721191406, 0.06299209594726562, 0.06915092468261719, 0.07530975341796875, 0.08146858215332031, 0.08762741088867188, 0.09378623962402344, 0.099945068359375, 0.10610389709472656, 0.11226272583007812, 0.11842155456542969, 0.12458038330078125, 0.1307392120361328, 0.13689804077148438, 0.14305686950683594, 0.1492156982421875, 0.15537452697753906, 0.16153335571289062, 0.1676921844482422, 0.17385101318359375, 0.1800098419189453, 0.18616867065429688, 0.19232749938964844, 0.198486328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 9.0, 11.0, 11.0, 10.0, 18.0, 19.0, 22.0, 18.0, 27.0, 25.0, 33.0, 32.0, 43.0, 45.0, 48.0, 47.0, 54.0, 42.0, 50.0, 47.0, 50.0, 42.0, 29.0, 37.0, 26.0, 32.0, 25.0, 26.0, 19.0, 11.0, 19.0, 17.0, 10.0, 12.0, 12.0, 7.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2115478515625, -0.2050762176513672, -0.19860458374023438, -0.19213294982910156, -0.18566131591796875, -0.17918968200683594, -0.17271804809570312, -0.1662464141845703, -0.1597747802734375, -0.1533031463623047, -0.14683151245117188, -0.14035987854003906, -0.13388824462890625, -0.12741661071777344, -0.12094497680664062, -0.11447334289550781, -0.108001708984375, -0.10153007507324219, -0.09505844116210938, -0.08858680725097656, -0.08211517333984375, -0.07564353942871094, -0.06917190551757812, -0.06270027160644531, -0.0562286376953125, -0.04975700378417969, -0.043285369873046875, -0.03681373596191406, -0.03034210205078125, -0.023870468139648438, -0.017398834228515625, -0.010927200317382812, -0.00445556640625, 0.0020160675048828125, 0.008487701416015625, 0.014959335327148438, 0.02143096923828125, 0.027902603149414062, 0.034374237060546875, 0.04084587097167969, 0.0473175048828125, 0.05378913879394531, 0.060260772705078125, 0.06673240661621094, 0.07320404052734375, 0.07967567443847656, 0.08614730834960938, 0.09261894226074219, 0.099090576171875, 0.10556221008300781, 0.11203384399414062, 0.11850547790527344, 0.12497711181640625, 0.13144874572753906, 0.13792037963867188, 0.1443920135498047, 0.1508636474609375, 0.1573352813720703, 0.16380691528320312, 0.17027854919433594, 0.17675018310546875, 0.18322181701660156, 0.18969345092773438, 0.1961650848388672, 0.20263671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 8.0, 9.0, 14.0, 17.0, 18.0, 47.0, 53.0, 98.0, 175.0, 369.0, 773.0, 1688.0, 4085.0, 11037.0, 37848.0, 257268.0, 646772.0, 62468.0, 16096.0, 5524.0, 2161.0, 1003.0, 469.0, 222.0, 133.0, 67.0, 43.0, 24.0, 12.0, 11.0, 10.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.08331298828125, -0.0812387466430664, -0.07916450500488281, -0.07709026336669922, -0.07501602172851562, -0.07294178009033203, -0.07086753845214844, -0.06879329681396484, -0.06671905517578125, -0.06464481353759766, -0.06257057189941406, -0.06049633026123047, -0.058422088623046875, -0.05634784698486328, -0.05427360534667969, -0.052199363708496094, -0.0501251220703125, -0.048050880432128906, -0.04597663879394531, -0.04390239715576172, -0.041828155517578125, -0.03975391387939453, -0.03767967224121094, -0.035605430603027344, -0.03353118896484375, -0.031456947326660156, -0.029382705688476562, -0.02730846405029297, -0.025234222412109375, -0.02315998077392578, -0.021085739135742188, -0.019011497497558594, -0.016937255859375, -0.014863014221191406, -0.012788772583007812, -0.010714530944824219, -0.008640289306640625, -0.006566047668457031, -0.0044918060302734375, -0.0024175643920898438, -0.00034332275390625, 0.0017309188842773438, 0.0038051605224609375, 0.005879402160644531, 0.007953643798828125, 0.010027885437011719, 0.012102127075195312, 0.014176368713378906, 0.0162506103515625, 0.018324851989746094, 0.020399093627929688, 0.02247333526611328, 0.024547576904296875, 0.02662181854248047, 0.028696060180664062, 0.030770301818847656, 0.03284454345703125, 0.034918785095214844, 0.03699302673339844, 0.03906726837158203, 0.041141510009765625, 0.04321575164794922, 0.04528999328613281, 0.047364234924316406, 0.0494384765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 5.0, 7.0, 7.0, 20.0, 15.0, 19.0, 39.0, 52.0, 50.0, 63.0, 70.0, 117.0, 88.0, 76.0, 77.0, 64.0, 63.0, 52.0, 33.0, 26.0, 12.0, 14.0, 11.0, 4.0, 6.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.702278137207031e-06, -8.501112461090088e-06, -8.299946784973145e-06, -8.098781108856201e-06, -7.897615432739258e-06, -7.696449756622314e-06, -7.495284080505371e-06, -7.294118404388428e-06, -7.092952728271484e-06, -6.891787052154541e-06, -6.690621376037598e-06, -6.489455699920654e-06, -6.288290023803711e-06, -6.087124347686768e-06, -5.885958671569824e-06, -5.684792995452881e-06, -5.4836273193359375e-06, -5.282461643218994e-06, -5.081295967102051e-06, -4.880130290985107e-06, -4.678964614868164e-06, -4.477798938751221e-06, -4.276633262634277e-06, -4.075467586517334e-06, -3.874301910400391e-06, -3.6731362342834473e-06, -3.471970558166504e-06, -3.2708048820495605e-06, -3.069639205932617e-06, -2.868473529815674e-06, -2.6673078536987305e-06, -2.466142177581787e-06, -2.2649765014648438e-06, -2.0638108253479004e-06, -1.862645149230957e-06, -1.6614794731140137e-06, -1.4603137969970703e-06, -1.259148120880127e-06, -1.0579824447631836e-06, -8.568167686462402e-07, -6.556510925292969e-07, -4.544854164123535e-07, -2.5331974029541016e-07, -5.21540641784668e-08, 1.4901161193847656e-07, 3.501772880554199e-07, 5.513429641723633e-07, 7.525086402893066e-07, 9.5367431640625e-07, 1.1548399925231934e-06, 1.3560056686401367e-06, 1.55717134475708e-06, 1.7583370208740234e-06, 1.959502696990967e-06, 2.16066837310791e-06, 2.3618340492248535e-06, 2.562999725341797e-06, 2.7641654014587402e-06, 2.9653310775756836e-06, 3.166496753692627e-06, 3.3676624298095703e-06, 3.5688281059265137e-06, 3.769993782043457e-06, 3.9711594581604e-06, 4.172325134277344e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 6.0, 5.0, 11.0, 5.0, 13.0, 27.0, 34.0, 52.0, 83.0, 105.0, 236.0, 346.0, 622.0, 1166.0, 2049.0, 4172.0, 8755.0, 20381.0, 58581.0, 313890.0, 511457.0, 79848.0, 25617.0, 10594.0, 4956.0, 2427.0, 1386.0, 684.0, 396.0, 265.0, 144.0, 67.0, 58.0, 39.0, 36.0, 20.0, 9.0, 8.0, 3.0, 5.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.039093017578125, -0.037795066833496094, -0.03649711608886719, -0.03519916534423828, -0.033901214599609375, -0.03260326385498047, -0.03130531311035156, -0.030007362365722656, -0.02870941162109375, -0.027411460876464844, -0.026113510131835938, -0.02481555938720703, -0.023517608642578125, -0.02221965789794922, -0.020921707153320312, -0.019623756408691406, -0.0183258056640625, -0.017027854919433594, -0.015729904174804688, -0.014431953430175781, -0.013134002685546875, -0.011836051940917969, -0.010538101196289062, -0.009240150451660156, -0.00794219970703125, -0.006644248962402344, -0.0053462982177734375, -0.004048347473144531, -0.002750396728515625, -0.0014524459838867188, -0.0001544952392578125, 0.0011434555053710938, 0.00244140625, 0.0037393569946289062, 0.0050373077392578125, 0.006335258483886719, 0.007633209228515625, 0.008931159973144531, 0.010229110717773438, 0.011527061462402344, 0.01282501220703125, 0.014122962951660156, 0.015420913696289062, 0.01671886444091797, 0.018016815185546875, 0.01931476593017578, 0.020612716674804688, 0.021910667419433594, 0.0232086181640625, 0.024506568908691406, 0.025804519653320312, 0.02710247039794922, 0.028400421142578125, 0.02969837188720703, 0.030996322631835938, 0.032294273376464844, 0.03359222412109375, 0.034890174865722656, 0.03618812561035156, 0.03748607635498047, 0.038784027099609375, 0.04008197784423828, 0.04137992858886719, 0.042677879333496094, 0.043975830078125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 4.0, 10.0, 8.0, 8.0, 20.0, 14.0, 22.0, 23.0, 29.0, 41.0, 68.0, 74.0, 84.0, 87.0, 111.0, 93.0, 75.0, 43.0, 38.0, 26.0, 24.0, 24.0, 16.0, 12.0, 10.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0294189453125, -0.028286457061767578, -0.027153968811035156, -0.026021480560302734, -0.024888992309570312, -0.02375650405883789, -0.02262401580810547, -0.021491527557373047, -0.020359039306640625, -0.019226551055908203, -0.01809406280517578, -0.01696157455444336, -0.015829086303710938, -0.014696598052978516, -0.013564109802246094, -0.012431621551513672, -0.01129913330078125, -0.010166645050048828, -0.009034156799316406, -0.007901668548583984, -0.0067691802978515625, -0.005636692047119141, -0.004504203796386719, -0.003371715545654297, -0.002239227294921875, -0.0011067390441894531, 2.574920654296875e-05, 0.0011582374572753906, 0.0022907257080078125, 0.0034232139587402344, 0.004555702209472656, 0.005688190460205078, 0.0068206787109375, 0.007953166961669922, 0.009085655212402344, 0.010218143463134766, 0.011350631713867188, 0.01248311996459961, 0.013615608215332031, 0.014748096466064453, 0.015880584716796875, 0.017013072967529297, 0.01814556121826172, 0.01927804946899414, 0.020410537719726562, 0.021543025970458984, 0.022675514221191406, 0.023808002471923828, 0.02494049072265625, 0.026072978973388672, 0.027205467224121094, 0.028337955474853516, 0.029470443725585938, 0.03060293197631836, 0.03173542022705078, 0.0328679084777832, 0.034000396728515625, 0.03513288497924805, 0.03626537322998047, 0.03739786148071289, 0.03853034973144531, 0.039662837982177734, 0.040795326232910156, 0.04192781448364258, 0.043060302734375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 7.0, 3.0, 13.0, 17.0, 21.0, 34.0, 68.0, 87.0, 254.0, 231.0, 118.0, 53.0, 30.0, 23.0, 18.0, 6.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1582906246185303, -2.0753467082977295, -1.9924027919769287, -1.9094587564468384, -1.8265148401260376, -1.7435709238052368, -1.6606268882751465, -1.5776829719543457, -1.494739055633545, -1.4117951393127441, -1.3288512229919434, -1.245907187461853, -1.1629632711410522, -1.0800193548202515, -0.9970753788948059, -0.9141314029693604, -0.8311874866485596, -0.7482435703277588, -0.6652995944023132, -0.5823556184768677, -0.4994117021560669, -0.4164677560329437, -0.33352380990982056, -0.250579833984375, -0.16763591766357422, -0.08469197154045105, -0.0017480254173278809, 0.08119592070579529, 0.16413986682891846, 0.24708381295204163, 0.3300277590751648, 0.41297173500061035, 0.49591541290283203, 0.5788593292236328, 0.6618033051490784, 0.7447472810745239, 0.8276911973953247, 0.9106351137161255, 0.993579089641571, 1.0765230655670166, 1.1594669818878174, 1.2424108982086182, 1.325354814529419, 1.4082988500595093, 1.49124276638031, 1.5741866827011108, 1.6571307182312012, 1.740074634552002, 1.8230185508728027, 1.9059624671936035, 1.9889063835144043, 2.071850299835205, 2.154794216156006, 2.2377383708953857, 2.3206822872161865, 2.4036262035369873, 2.486570119857788, 2.569514036178589, 2.6524579524993896, 2.7354018688201904, 2.8183460235595703, 2.901289939880371, 2.984233856201172, 3.0671777725219727, 3.1501216888427734]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 5.0, 6.0, 2.0, 5.0, 6.0, 8.0, 13.0, 11.0, 13.0, 15.0, 19.0, 23.0, 31.0, 26.0, 30.0, 39.0, 28.0, 26.0, 43.0, 27.0, 34.0, 46.0, 46.0, 35.0, 36.0, 37.0, 42.0, 29.0, 41.0, 24.0, 42.0, 27.0, 26.0, 22.0, 23.0, 18.0, 13.0, 8.0, 10.0, 11.0, 8.0, 7.0, 10.0, 9.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.9556266665458679, -0.9249462485313416, -0.8942658305168152, -0.8635854125022888, -0.8329049944877625, -0.8022245764732361, -0.7715440988540649, -0.7408636808395386, -0.7101832628250122, -0.6795028448104858, -0.6488224267959595, -0.6181420087814331, -0.5874615907669067, -0.5567811727523804, -0.526100754737854, -0.49542030692100525, -0.46473991870880127, -0.4340595006942749, -0.40337908267974854, -0.37269866466522217, -0.3420182466506958, -0.31133782863616943, -0.2806573808193207, -0.2499769628047943, -0.21929654479026794, -0.18861612677574158, -0.1579357087612152, -0.12725527584552765, -0.09657485783100128, -0.06589443981647491, -0.035214006900787354, -0.004533588886260986, 0.026146769523620605, 0.05682719126343727, 0.08750761300325394, 0.1181880384683609, 0.14886845648288727, 0.17954887449741364, 0.2102293074131012, 0.24090972542762756, 0.27159014344215393, 0.3022705614566803, 0.33295097947120667, 0.3636314272880554, 0.3943118453025818, 0.42499226331710815, 0.4556726813316345, 0.4863530993461609, 0.5170335173606873, 0.5477139353752136, 0.57839435338974, 0.6090747714042664, 0.6397551894187927, 0.6704356074333191, 0.7011160850524902, 0.7317965030670166, 0.762476921081543, 0.7931573390960693, 0.8238377571105957, 0.8545181751251221, 0.8851985931396484, 0.9158790111541748, 0.9465594291687012, 0.9772398471832275, 1.007920265197754]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 4.0, 6.0, 11.0, 6.0, 4.0, 12.0, 21.0, 18.0, 31.0, 27.0, 42.0, 71.0, 97.0, 128.0, 225.0, 325.0, 619.0, 1103.0, 2045.0, 4119.0, 9761.0, 38029.0, 4064050.0, 52418.0, 11487.0, 4384.0, 2251.0, 1175.0, 672.0, 375.0, 230.0, 124.0, 88.0, 72.0, 43.0, 35.0, 25.0, 35.0, 25.0, 18.0, 15.0, 10.0, 10.0, 11.0, 6.0, 8.0, 3.0, 2.0, 3.0], "bins": [-0.68603515625, -0.6677780151367188, -0.6495208740234375, -0.6312637329101562, -0.613006591796875, -0.5947494506835938, -0.5764923095703125, -0.5582351684570312, -0.53997802734375, -0.5217208862304688, -0.5034637451171875, -0.48520660400390625, -0.466949462890625, -0.44869232177734375, -0.4304351806640625, -0.41217803955078125, -0.3939208984375, -0.37566375732421875, -0.3574066162109375, -0.33914947509765625, -0.320892333984375, -0.30263519287109375, -0.2843780517578125, -0.26612091064453125, -0.24786376953125, -0.22960662841796875, -0.2113494873046875, -0.19309234619140625, -0.174835205078125, -0.15657806396484375, -0.1383209228515625, -0.12006378173828125, -0.101806640625, -0.08354949951171875, -0.0652923583984375, -0.04703521728515625, -0.028778076171875, -0.01052093505859375, 0.0077362060546875, 0.02599334716796875, 0.04425048828125, 0.06250762939453125, 0.0807647705078125, 0.09902191162109375, 0.117279052734375, 0.13553619384765625, 0.1537933349609375, 0.17205047607421875, 0.1903076171875, 0.20856475830078125, 0.2268218994140625, 0.24507904052734375, 0.263336181640625, 0.28159332275390625, 0.2998504638671875, 0.31810760498046875, 0.33636474609375, 0.35462188720703125, 0.3728790283203125, 0.39113616943359375, 0.409393310546875, 0.42765045166015625, 0.4459075927734375, 0.46416473388671875, 0.482421875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 3.0, 7.0, 11.0, 18.0, 33.0, 32.0, 67.0, 62.0, 87.0, 89.0, 94.0, 118.0, 97.0, 70.0, 59.0, 53.0, 34.0, 26.0, 14.0, 11.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12127685546875, -0.11797618865966797, -0.11467552185058594, -0.1113748550415039, -0.10807418823242188, -0.10477352142333984, -0.10147285461425781, -0.09817218780517578, -0.09487152099609375, -0.09157085418701172, -0.08827018737792969, -0.08496952056884766, -0.08166885375976562, -0.0783681869506836, -0.07506752014160156, -0.07176685333251953, -0.0684661865234375, -0.06516551971435547, -0.06186485290527344, -0.058564186096191406, -0.055263519287109375, -0.051962852478027344, -0.04866218566894531, -0.04536151885986328, -0.04206085205078125, -0.03876018524169922, -0.03545951843261719, -0.032158851623535156, -0.028858184814453125, -0.025557518005371094, -0.022256851196289062, -0.01895618438720703, -0.015655517578125, -0.012354850769042969, -0.009054183959960938, -0.005753517150878906, -0.002452850341796875, 0.0008478164672851562, 0.0041484832763671875, 0.007449150085449219, 0.01074981689453125, 0.014050483703613281, 0.017351150512695312, 0.020651817321777344, 0.023952484130859375, 0.027253150939941406, 0.030553817749023438, 0.03385448455810547, 0.0371551513671875, 0.04045581817626953, 0.04375648498535156, 0.047057151794433594, 0.050357818603515625, 0.053658485412597656, 0.05695915222167969, 0.06025981903076172, 0.06356048583984375, 0.06686115264892578, 0.07016181945800781, 0.07346248626708984, 0.07676315307617188, 0.0800638198852539, 0.08336448669433594, 0.08666515350341797, 0.0899658203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 9.0, 17.0, 27.0, 27.0, 34.0, 63.0, 106.0, 134.0, 228.0, 380.0, 577.0, 992.0, 1673.0, 2827.0, 5491.0, 11341.0, 27312.0, 115777.0, 3918845.0, 67554.0, 21029.0, 9135.0, 4690.0, 2425.0, 1383.0, 831.0, 455.0, 325.0, 220.0, 117.0, 87.0, 51.0, 29.0, 29.0, 16.0, 12.0, 10.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38916015625, -0.3763427734375, -0.363525390625, -0.3507080078125, -0.337890625, -0.3250732421875, -0.312255859375, -0.2994384765625, -0.28662109375, -0.2738037109375, -0.260986328125, -0.2481689453125, -0.2353515625, -0.2225341796875, -0.209716796875, -0.1968994140625, -0.18408203125, -0.1712646484375, -0.158447265625, -0.1456298828125, -0.1328125, -0.1199951171875, -0.107177734375, -0.0943603515625, -0.08154296875, -0.0687255859375, -0.055908203125, -0.0430908203125, -0.0302734375, -0.0174560546875, -0.004638671875, 0.0081787109375, 0.02099609375, 0.0338134765625, 0.046630859375, 0.0594482421875, 0.072265625, 0.0850830078125, 0.097900390625, 0.1107177734375, 0.12353515625, 0.1363525390625, 0.149169921875, 0.1619873046875, 0.1748046875, 0.1876220703125, 0.200439453125, 0.2132568359375, 0.22607421875, 0.2388916015625, 0.251708984375, 0.2645263671875, 0.27734375, 0.2901611328125, 0.302978515625, 0.3157958984375, 0.32861328125, 0.3414306640625, 0.354248046875, 0.3670654296875, 0.3798828125, 0.3927001953125, 0.405517578125, 0.4183349609375, 0.43115234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 8.0, 7.0, 6.0, 9.0, 8.0, 16.0, 14.0, 25.0, 34.0, 60.0, 361.0, 3183.0, 136.0, 46.0, 36.0, 21.0, 21.0, 18.0, 13.0, 10.0, 7.0, 3.0, 3.0, 0.0, 3.0, 7.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2379150390625, -0.23170089721679688, -0.22548675537109375, -0.21927261352539062, -0.2130584716796875, -0.20684432983398438, -0.20063018798828125, -0.19441604614257812, -0.188201904296875, -0.18198776245117188, -0.17577362060546875, -0.16955947875976562, -0.1633453369140625, -0.15713119506835938, -0.15091705322265625, -0.14470291137695312, -0.13848876953125, -0.13227462768554688, -0.12606048583984375, -0.11984634399414062, -0.1136322021484375, -0.10741806030273438, -0.10120391845703125, -0.09498977661132812, -0.088775634765625, -0.08256149291992188, -0.07634735107421875, -0.07013320922851562, -0.0639190673828125, -0.057704925537109375, -0.05149078369140625, -0.045276641845703125, -0.0390625, -0.032848358154296875, -0.02663421630859375, -0.020420074462890625, -0.0142059326171875, -0.007991790771484375, -0.00177764892578125, 0.004436492919921875, 0.010650634765625, 0.016864776611328125, 0.02307891845703125, 0.029293060302734375, 0.0355072021484375, 0.041721343994140625, 0.04793548583984375, 0.054149627685546875, 0.06036376953125, 0.06657791137695312, 0.07279205322265625, 0.07900619506835938, 0.0852203369140625, 0.09143447875976562, 0.09764862060546875, 0.10386276245117188, 0.110076904296875, 0.11629104614257812, 0.12250518798828125, 0.12871932983398438, 0.1349334716796875, 0.14114761352539062, 0.14736175537109375, 0.15357589721679688, 0.1597900390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 16.0, 23.0, 40.0, 108.0, 422.0, 282.0, 72.0, 25.0, 11.0, 9.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7051247358322144, -0.6251776218414307, -0.5452304482460022, -0.4652833044528961, -0.38533616065979004, -0.30538901686668396, -0.22544187307357788, -0.14549469947814941, -0.06554758548736572, 0.014399558305740356, 0.09434670209884644, 0.17429384589195251, 0.2542409896850586, 0.3341881334781647, 0.41413527727127075, 0.4940824508666992, 0.5740295648574829, 0.6539766788482666, 0.7339238524436951, 0.8138710260391235, 0.8938181400299072, 0.9737652540206909, 1.0537123680114746, 1.1336596012115479, 1.2136067152023315, 1.2935538291931152, 1.3735010623931885, 1.4534481763839722, 1.5333952903747559, 1.6133424043655396, 1.6932895183563232, 1.7732367515563965, 1.8531837463378906, 1.9331308603286743, 2.013077974319458, 2.0930252075195312, 2.1729722023010254, 2.2529194355010986, 2.332866668701172, 2.412813663482666, 2.4927608966827393, 2.5727081298828125, 2.6526551246643066, 2.73260235786438, 2.812549591064453, 2.8924965858459473, 2.9724438190460205, 3.0523910522460938, 3.132338047027588, 3.212285280227661, 3.2922322750091553, 3.3721795082092285, 3.4521265029907227, 3.532073736190796, 3.612020969390869, 3.6919679641723633, 3.7719151973724365, 3.8518624305725098, 3.931809425354004, 4.011756420135498, 4.09170389175415, 4.1716508865356445, 4.251597881317139, 4.331545352935791, 4.411492347717285]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 11.0, 12.0, 20.0, 23.0, 25.0, 42.0, 47.0, 43.0, 51.0, 56.0, 80.0, 65.0, 64.0, 58.0, 59.0, 65.0, 57.0, 61.0, 37.0, 27.0, 18.0, 20.0, 12.0, 18.0, 12.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5814276337623596, -0.5576751232147217, -0.5339226126670837, -0.5101701021194458, -0.48641759157180786, -0.4626650810241699, -0.438912570476532, -0.41516005992889404, -0.3914075493812561, -0.36765503883361816, -0.3439025282859802, -0.3201500177383423, -0.29639750719070435, -0.2726449966430664, -0.24889250099658966, -0.22513999044895172, -0.20138749480247498, -0.17763498425483704, -0.1538824737071991, -0.13012996315956116, -0.10637746006250381, -0.08262494951486588, -0.05887244641780853, -0.03511993587017059, -0.011367425322532654, 0.012385083362460136, 0.03613759204745293, 0.05989009886980057, 0.08364260941743851, 0.10739511996507645, 0.1311476230621338, 0.15490013360977173, 0.17865264415740967, 0.2024051547050476, 0.22615766525268555, 0.2499101758003235, 0.2736626863479614, 0.29741519689559937, 0.3211677074432373, 0.34492021799087524, 0.3686727285385132, 0.3924252390861511, 0.41617774963378906, 0.439930260181427, 0.46368277072906494, 0.4874352812767029, 0.5111877918243408, 0.5349403023719788, 0.5586928129196167, 0.5824453234672546, 0.6061978340148926, 0.6299503445625305, 0.6537028551101685, 0.6774553656578064, 0.7012078762054443, 0.7249603867530823, 0.7487128376960754, 0.7724653482437134, 0.7962178587913513, 0.8199703693389893, 0.8437228798866272, 0.8674753904342651, 0.8912279009819031, 0.914980411529541, 0.938732922077179]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 7.0, 11.0, 14.0, 7.0, 11.0, 26.0, 37.0, 45.0, 69.0, 83.0, 123.0, 161.0, 262.0, 330.0, 466.0, 808.0, 1315.0, 2577.0, 5478.0, 13709.0, 39025.0, 138789.0, 601019.0, 170481.0, 45070.0, 15699.0, 6205.0, 2714.0, 1428.0, 813.0, 531.0, 345.0, 260.0, 196.0, 131.0, 81.0, 65.0, 59.0, 27.0, 25.0, 15.0, 10.0, 9.0, 8.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.42626953125, -0.412322998046875, -0.39837646484375, -0.384429931640625, -0.3704833984375, -0.356536865234375, -0.34259033203125, -0.328643798828125, -0.314697265625, -0.300750732421875, -0.28680419921875, -0.272857666015625, -0.2589111328125, -0.244964599609375, -0.23101806640625, -0.217071533203125, -0.203125, -0.189178466796875, -0.17523193359375, -0.161285400390625, -0.1473388671875, -0.133392333984375, -0.11944580078125, -0.105499267578125, -0.091552734375, -0.077606201171875, -0.06365966796875, -0.049713134765625, -0.0357666015625, -0.021820068359375, -0.00787353515625, 0.006072998046875, 0.02001953125, 0.033966064453125, 0.04791259765625, 0.061859130859375, 0.0758056640625, 0.089752197265625, 0.10369873046875, 0.117645263671875, 0.131591796875, 0.145538330078125, 0.15948486328125, 0.173431396484375, 0.1873779296875, 0.201324462890625, 0.21527099609375, 0.229217529296875, 0.2431640625, 0.257110595703125, 0.27105712890625, 0.285003662109375, 0.2989501953125, 0.312896728515625, 0.32684326171875, 0.340789794921875, 0.354736328125, 0.368682861328125, 0.38262939453125, 0.396575927734375, 0.4105224609375, 0.424468994140625, 0.43841552734375, 0.452362060546875, 0.46630859375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 7.0, 7.0, 13.0, 25.0, 28.0, 53.0, 63.0, 68.0, 104.0, 103.0, 101.0, 110.0, 75.0, 67.0, 53.0, 41.0, 26.0, 26.0, 9.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.11956787109375, -0.11626815795898438, -0.11296844482421875, -0.10966873168945312, -0.1063690185546875, -0.10306930541992188, -0.09976959228515625, -0.09646987915039062, -0.093170166015625, -0.08987045288085938, -0.08657073974609375, -0.08327102661132812, -0.0799713134765625, -0.07667160034179688, -0.07337188720703125, -0.07007217407226562, -0.0667724609375, -0.06347274780273438, -0.06017303466796875, -0.056873321533203125, -0.0535736083984375, -0.050273895263671875, -0.04697418212890625, -0.043674468994140625, -0.040374755859375, -0.037075042724609375, -0.03377532958984375, -0.030475616455078125, -0.0271759033203125, -0.023876190185546875, -0.02057647705078125, -0.017276763916015625, -0.01397705078125, -0.010677337646484375, -0.00737762451171875, -0.004077911376953125, -0.0007781982421875, 0.002521514892578125, 0.00582122802734375, 0.009120941162109375, 0.012420654296875, 0.015720367431640625, 0.01902008056640625, 0.022319793701171875, 0.0256195068359375, 0.028919219970703125, 0.03221893310546875, 0.035518646240234375, 0.038818359375, 0.042118072509765625, 0.04541778564453125, 0.048717498779296875, 0.0520172119140625, 0.055316925048828125, 0.05861663818359375, 0.061916351318359375, 0.065216064453125, 0.06851577758789062, 0.07181549072265625, 0.07511520385742188, 0.0784149169921875, 0.08171463012695312, 0.08501434326171875, 0.08831405639648438, 0.09161376953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 6.0, 3.0, 4.0, 7.0, 9.0, 12.0, 30.0, 41.0, 51.0, 57.0, 117.0, 138.0, 209.0, 278.0, 437.0, 640.0, 1001.0, 1559.0, 2381.0, 3860.0, 6147.0, 10154.0, 16943.0, 29864.0, 55003.0, 111045.0, 306611.0, 277021.0, 103402.0, 51471.0, 28266.0, 16244.0, 9625.0, 5752.0, 3533.0, 2300.0, 1521.0, 893.0, 625.0, 433.0, 257.0, 177.0, 130.0, 100.0, 53.0, 38.0, 36.0, 27.0, 17.0, 14.0, 14.0, 5.0, 1.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1695556640625, -0.1640777587890625, -0.158599853515625, -0.1531219482421875, -0.14764404296875, -0.1421661376953125, -0.136688232421875, -0.1312103271484375, -0.125732421875, -0.1202545166015625, -0.114776611328125, -0.1092987060546875, -0.10382080078125, -0.0983428955078125, -0.092864990234375, -0.0873870849609375, -0.0819091796875, -0.0764312744140625, -0.070953369140625, -0.0654754638671875, -0.05999755859375, -0.0545196533203125, -0.049041748046875, -0.0435638427734375, -0.0380859375, -0.0326080322265625, -0.027130126953125, -0.0216522216796875, -0.01617431640625, -0.0106964111328125, -0.005218505859375, 0.0002593994140625, 0.0057373046875, 0.0112152099609375, 0.016693115234375, 0.0221710205078125, 0.02764892578125, 0.0331268310546875, 0.038604736328125, 0.0440826416015625, 0.049560546875, 0.0550384521484375, 0.060516357421875, 0.0659942626953125, 0.07147216796875, 0.0769500732421875, 0.082427978515625, 0.0879058837890625, 0.0933837890625, 0.0988616943359375, 0.104339599609375, 0.1098175048828125, 0.11529541015625, 0.1207733154296875, 0.126251220703125, 0.1317291259765625, 0.13720703125, 0.1426849365234375, 0.148162841796875, 0.1536407470703125, 0.15911865234375, 0.1645965576171875, 0.170074462890625, 0.1755523681640625, 0.1810302734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 5.0, 3.0, 3.0, 7.0, 4.0, 5.0, 10.0, 12.0, 4.0, 16.0, 13.0, 22.0, 21.0, 24.0, 34.0, 31.0, 30.0, 33.0, 32.0, 37.0, 34.0, 51.0, 43.0, 50.0, 39.0, 46.0, 41.0, 36.0, 45.0, 30.0, 45.0, 34.0, 27.0, 19.0, 21.0, 23.0, 13.0, 13.0, 14.0, 12.0, 4.0, 4.0, 7.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.214111328125, -0.20761680603027344, -0.20112228393554688, -0.1946277618408203, -0.18813323974609375, -0.1816387176513672, -0.17514419555664062, -0.16864967346191406, -0.1621551513671875, -0.15566062927246094, -0.14916610717773438, -0.1426715850830078, -0.13617706298828125, -0.1296825408935547, -0.12318801879882812, -0.11669349670410156, -0.110198974609375, -0.10370445251464844, -0.09720993041992188, -0.09071540832519531, -0.08422088623046875, -0.07772636413574219, -0.07123184204101562, -0.06473731994628906, -0.0582427978515625, -0.05174827575683594, -0.045253753662109375, -0.03875923156738281, -0.03226470947265625, -0.025770187377929688, -0.019275665283203125, -0.012781143188476562, -0.00628662109375, 0.0002079010009765625, 0.006702423095703125, 0.013196945190429688, 0.01969146728515625, 0.026185989379882812, 0.032680511474609375, 0.03917503356933594, 0.0456695556640625, 0.05216407775878906, 0.058658599853515625, 0.06515312194824219, 0.07164764404296875, 0.07814216613769531, 0.08463668823242188, 0.09113121032714844, 0.097625732421875, 0.10412025451660156, 0.11061477661132812, 0.11710929870605469, 0.12360382080078125, 0.1300983428955078, 0.13659286499023438, 0.14308738708496094, 0.1495819091796875, 0.15607643127441406, 0.16257095336914062, 0.1690654754638672, 0.17555999755859375, 0.1820545196533203, 0.18854904174804688, 0.19504356384277344, 0.2015380859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 9.0, 15.0, 17.0, 24.0, 39.0, 62.0, 82.0, 190.0, 376.0, 793.0, 2230.0, 7443.0, 38322.0, 788503.0, 185899.0, 17509.0, 4372.0, 1437.0, 559.0, 303.0, 145.0, 79.0, 44.0, 31.0, 26.0, 18.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.11456298828125, -0.1117544174194336, -0.10894584655761719, -0.10613727569580078, -0.10332870483398438, -0.10052013397216797, -0.09771156311035156, -0.09490299224853516, -0.09209442138671875, -0.08928585052490234, -0.08647727966308594, -0.08366870880126953, -0.08086013793945312, -0.07805156707763672, -0.07524299621582031, -0.0724344253540039, -0.0696258544921875, -0.0668172836303711, -0.06400871276855469, -0.06120014190673828, -0.058391571044921875, -0.05558300018310547, -0.05277442932128906, -0.049965858459472656, -0.04715728759765625, -0.044348716735839844, -0.04154014587402344, -0.03873157501220703, -0.035923004150390625, -0.03311443328857422, -0.030305862426757812, -0.027497291564941406, -0.024688720703125, -0.021880149841308594, -0.019071578979492188, -0.01626300811767578, -0.013454437255859375, -0.010645866394042969, -0.007837295532226562, -0.005028724670410156, -0.00222015380859375, 0.0005884170532226562, 0.0033969879150390625, 0.006205558776855469, 0.009014129638671875, 0.011822700500488281, 0.014631271362304688, 0.017439842224121094, 0.0202484130859375, 0.023056983947753906, 0.025865554809570312, 0.02867412567138672, 0.031482696533203125, 0.03429126739501953, 0.03709983825683594, 0.039908409118652344, 0.04271697998046875, 0.045525550842285156, 0.04833412170410156, 0.05114269256591797, 0.053951263427734375, 0.05675983428955078, 0.05956840515136719, 0.062376976013183594, 0.065185546875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 5.0, 6.0, 8.0, 8.0, 15.0, 17.0, 25.0, 51.0, 61.0, 98.0, 114.0, 99.0, 124.0, 112.0, 68.0, 55.0, 42.0, 25.0, 16.0, 15.0, 4.0, 10.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4373016357421875e-06, -6.187707185745239e-06, -5.938112735748291e-06, -5.688518285751343e-06, -5.4389238357543945e-06, -5.189329385757446e-06, -4.939734935760498e-06, -4.69014048576355e-06, -4.4405460357666016e-06, -4.190951585769653e-06, -3.941357135772705e-06, -3.691762685775757e-06, -3.4421682357788086e-06, -3.1925737857818604e-06, -2.942979335784912e-06, -2.693384885787964e-06, -2.4437904357910156e-06, -2.1941959857940674e-06, -1.944601535797119e-06, -1.695007085800171e-06, -1.4454126358032227e-06, -1.1958181858062744e-06, -9.462237358093262e-07, -6.966292858123779e-07, -4.470348358154297e-07, -1.9744038581848145e-07, 5.21540641784668e-08, 3.0174851417541504e-07, 5.513429641723633e-07, 8.009374141693115e-07, 1.0505318641662598e-06, 1.300126314163208e-06, 1.5497207641601562e-06, 1.7993152141571045e-06, 2.0489096641540527e-06, 2.298504114151001e-06, 2.5480985641479492e-06, 2.7976930141448975e-06, 3.0472874641418457e-06, 3.296881914138794e-06, 3.546476364135742e-06, 3.7960708141326904e-06, 4.045665264129639e-06, 4.295259714126587e-06, 4.544854164123535e-06, 4.794448614120483e-06, 5.044043064117432e-06, 5.29363751411438e-06, 5.543231964111328e-06, 5.792826414108276e-06, 6.042420864105225e-06, 6.292015314102173e-06, 6.541609764099121e-06, 6.791204214096069e-06, 7.040798664093018e-06, 7.290393114089966e-06, 7.539987564086914e-06, 7.789582014083862e-06, 8.03917646408081e-06, 8.288770914077759e-06, 8.538365364074707e-06, 8.787959814071655e-06, 9.037554264068604e-06, 9.287148714065552e-06, 9.5367431640625e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 3.0, 4.0, 4.0, 5.0, 8.0, 8.0, 14.0, 15.0, 25.0, 32.0, 50.0, 63.0, 104.0, 144.0, 204.0, 335.0, 479.0, 761.0, 1251.0, 2182.0, 3769.0, 7192.0, 15106.0, 36727.0, 121220.0, 568097.0, 200456.0, 50927.0, 19471.0, 8906.0, 4470.0, 2522.0, 1486.0, 903.0, 494.0, 370.0, 245.0, 141.0, 125.0, 71.0, 56.0, 39.0, 26.0, 12.0, 8.0, 6.0, 8.0, 8.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03033447265625, -0.029275894165039062, -0.028217315673828125, -0.027158737182617188, -0.02610015869140625, -0.025041580200195312, -0.023983001708984375, -0.022924423217773438, -0.0218658447265625, -0.020807266235351562, -0.019748687744140625, -0.018690109252929688, -0.01763153076171875, -0.016572952270507812, -0.015514373779296875, -0.014455795288085938, -0.013397216796875, -0.012338638305664062, -0.011280059814453125, -0.010221481323242188, -0.00916290283203125, -0.008104324340820312, -0.007045745849609375, -0.0059871673583984375, -0.0049285888671875, -0.0038700103759765625, -0.002811431884765625, -0.0017528533935546875, -0.00069427490234375, 0.0003643035888671875, 0.001422882080078125, 0.0024814605712890625, 0.0035400390625, 0.0045986175537109375, 0.005657196044921875, 0.0067157745361328125, 0.00777435302734375, 0.008832931518554688, 0.009891510009765625, 0.010950088500976562, 0.0120086669921875, 0.013067245483398438, 0.014125823974609375, 0.015184402465820312, 0.01624298095703125, 0.017301559448242188, 0.018360137939453125, 0.019418716430664062, 0.020477294921875, 0.021535873413085938, 0.022594451904296875, 0.023653030395507812, 0.02471160888671875, 0.025770187377929688, 0.026828765869140625, 0.027887344360351562, 0.0289459228515625, 0.030004501342773438, 0.031063079833984375, 0.03212165832519531, 0.03318023681640625, 0.03423881530761719, 0.035297393798828125, 0.03635597229003906, 0.03741455078125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 5.0, 8.0, 5.0, 6.0, 8.0, 25.0, 18.0, 28.0, 30.0, 45.0, 61.0, 82.0, 106.0, 103.0, 93.0, 86.0, 67.0, 47.0, 36.0, 29.0, 29.0, 15.0, 13.0, 19.0, 11.0, 1.0, 4.0, 3.0, 2.0, 0.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.043853759765625, -0.042668819427490234, -0.04148387908935547, -0.0402989387512207, -0.03911399841308594, -0.03792905807495117, -0.036744117736816406, -0.03555917739868164, -0.034374237060546875, -0.03318929672241211, -0.032004356384277344, -0.030819416046142578, -0.029634475708007812, -0.028449535369873047, -0.02726459503173828, -0.026079654693603516, -0.02489471435546875, -0.023709774017333984, -0.02252483367919922, -0.021339893341064453, -0.020154953002929688, -0.018970012664794922, -0.017785072326660156, -0.01660013198852539, -0.015415191650390625, -0.01423025131225586, -0.013045310974121094, -0.011860370635986328, -0.010675430297851562, -0.009490489959716797, -0.008305549621582031, -0.007120609283447266, -0.0059356689453125, -0.004750728607177734, -0.0035657882690429688, -0.002380847930908203, -0.0011959075927734375, -1.0967254638671875e-05, 0.0011739730834960938, 0.0023589134216308594, 0.003543853759765625, 0.004728794097900391, 0.005913734436035156, 0.007098674774169922, 0.008283615112304688, 0.009468555450439453, 0.010653495788574219, 0.011838436126708984, 0.01302337646484375, 0.014208316802978516, 0.015393257141113281, 0.016578197479248047, 0.017763137817382812, 0.018948078155517578, 0.020133018493652344, 0.02131795883178711, 0.022502899169921875, 0.02368783950805664, 0.024872779846191406, 0.026057720184326172, 0.027242660522460938, 0.028427600860595703, 0.02961254119873047, 0.030797481536865234, 0.031982421875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 0.0, 5.0, 12.0, 8.0, 13.0, 12.0, 17.0, 29.0, 52.0, 95.0, 164.0, 204.0, 140.0, 98.0, 34.0, 32.0, 20.0, 16.0, 11.0, 12.0, 12.0, 5.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2310895919799805, -1.1736921072006226, -1.116294503211975, -1.0588970184326172, -1.0014994144439697, -0.9441019296646118, -0.8867044448852539, -0.8293069005012512, -0.7719093561172485, -0.7145118117332458, -0.6571142673492432, -0.5997167825698853, -0.5423192381858826, -0.4849216938018799, -0.4275241792201996, -0.3701266646385193, -0.3127291202545166, -0.2553315758705139, -0.19793406128883362, -0.14053653180599213, -0.08313900232315063, -0.02574145793914795, 0.03165605664253235, 0.08905357122421265, 0.14645111560821533, 0.20384864509105682, 0.2612461745738983, 0.3186436891555786, 0.3760412335395813, 0.433438777923584, 0.4908362925052643, 0.5482338070869446, 0.6056313514709473, 0.66302889585495, 0.7204264402389526, 0.7778239250183105, 0.8352214694023132, 0.8926190137863159, 0.9500164985656738, 1.0074141025543213, 1.0648115873336792, 1.122209072113037, 1.1796066761016846, 1.2370041608810425, 1.2944016456604004, 1.3517992496490479, 1.4091967344284058, 1.4665942192077637, 1.5239918231964111, 1.581389307975769, 1.6387869119644165, 1.6961843967437744, 1.7535820007324219, 1.8109794855117798, 1.8683769702911377, 1.9257745742797852, 1.983172059059143, 2.040569543838501, 2.0979671478271484, 2.155364751815796, 2.2127621173858643, 2.2701597213745117, 2.327557325363159, 2.3849546909332275, 2.442352294921875]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 5.0, 2.0, 8.0, 12.0, 16.0, 10.0, 13.0, 19.0, 20.0, 22.0, 17.0, 24.0, 24.0, 30.0, 23.0, 30.0, 31.0, 39.0, 32.0, 43.0, 47.0, 35.0, 28.0, 46.0, 34.0, 50.0, 44.0, 32.0, 32.0, 18.0, 24.0, 24.0, 24.0, 24.0, 22.0, 14.0, 10.0, 11.0, 11.0, 5.0, 6.0, 11.0, 5.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.9229007363319397, -0.894628643989563, -0.8663565516471863, -0.8380844593048096, -0.8098123669624329, -0.7815402746200562, -0.7532682418823242, -0.7249960899353027, -0.6967240571975708, -0.6684519648551941, -0.6401798725128174, -0.6119077801704407, -0.583635687828064, -0.5553635954856873, -0.5270915031433105, -0.4988194406032562, -0.47054731845855713, -0.4422752261161804, -0.4140031337738037, -0.385731041431427, -0.3574589490890503, -0.3291868567466736, -0.30091479420661926, -0.27264270186424255, -0.24437060952186584, -0.21609851717948914, -0.18782642483711243, -0.1595543473958969, -0.1312822550535202, -0.1030101627111435, -0.07473808526992798, -0.04646599292755127, -0.01819390058517456, 0.01007818803191185, 0.03835027664899826, 0.06662236154079437, 0.09489445388317108, 0.12316654622554779, 0.1514386236667633, 0.17971071600914001, 0.20798280835151672, 0.23625490069389343, 0.26452699303627014, 0.29279905557632446, 0.32107114791870117, 0.3493432402610779, 0.3776153326034546, 0.4058874249458313, 0.434159517288208, 0.4624316096305847, 0.4907037019729614, 0.5189757943153381, 0.5472478866577148, 0.5755199790000916, 0.6037920713424683, 0.6320641040802002, 0.6603362560272217, 0.6886083483695984, 0.7168804407119751, 0.7451525330543518, 0.7734246253967285, 0.8016967177391052, 0.8299688100814819, 0.8582408428192139, 0.8865129351615906]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 3.0, 3.0, 10.0, 18.0, 12.0, 20.0, 33.0, 67.0, 85.0, 153.0, 345.0, 622.0, 1446.0, 4651.0, 60455.0, 4115290.0, 7483.0, 1919.0, 765.0, 409.0, 193.0, 103.0, 54.0, 46.0, 16.0, 13.0, 13.0, 5.0, 8.0, 9.0, 3.0, 5.0, 3.0, 6.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0107421875, -0.9792938232421875, -0.947845458984375, -0.9163970947265625, -0.88494873046875, -0.8535003662109375, -0.822052001953125, -0.7906036376953125, -0.7591552734375, -0.7277069091796875, -0.696258544921875, -0.6648101806640625, -0.63336181640625, -0.6019134521484375, -0.570465087890625, -0.5390167236328125, -0.507568359375, -0.4761199951171875, -0.444671630859375, -0.4132232666015625, -0.38177490234375, -0.3503265380859375, -0.318878173828125, -0.2874298095703125, -0.2559814453125, -0.2245330810546875, -0.193084716796875, -0.1616363525390625, -0.13018798828125, -0.0987396240234375, -0.067291259765625, -0.0358428955078125, -0.00439453125, 0.0270538330078125, 0.058502197265625, 0.0899505615234375, 0.12139892578125, 0.1528472900390625, 0.184295654296875, 0.2157440185546875, 0.2471923828125, 0.2786407470703125, 0.310089111328125, 0.3415374755859375, 0.37298583984375, 0.4044342041015625, 0.435882568359375, 0.4673309326171875, 0.498779296875, 0.5302276611328125, 0.561676025390625, 0.5931243896484375, 0.62457275390625, 0.6560211181640625, 0.687469482421875, 0.7189178466796875, 0.7503662109375, 0.7818145751953125, 0.813262939453125, 0.8447113037109375, 0.87615966796875, 0.9076080322265625, 0.939056396484375, 0.9705047607421875, 1.001953125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 18.0, 19.0, 31.0, 38.0, 58.0, 93.0, 86.0, 115.0, 111.0, 102.0, 74.0, 64.0, 75.0, 35.0, 25.0, 18.0, 16.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1192626953125, -0.11587810516357422, -0.11249351501464844, -0.10910892486572266, -0.10572433471679688, -0.1023397445678711, -0.09895515441894531, -0.09557056427001953, -0.09218597412109375, -0.08880138397216797, -0.08541679382324219, -0.0820322036743164, -0.07864761352539062, -0.07526302337646484, -0.07187843322753906, -0.06849384307861328, -0.0651092529296875, -0.06172466278076172, -0.05834007263183594, -0.054955482482910156, -0.051570892333984375, -0.048186302185058594, -0.04480171203613281, -0.04141712188720703, -0.03803253173828125, -0.03464794158935547, -0.03126335144042969, -0.027878761291503906, -0.024494171142578125, -0.021109580993652344, -0.017724990844726562, -0.014340400695800781, -0.010955810546875, -0.007571220397949219, -0.0041866302490234375, -0.0008020401000976562, 0.002582550048828125, 0.005967140197753906, 0.009351730346679688, 0.012736320495605469, 0.01612091064453125, 0.01950550079345703, 0.022890090942382812, 0.026274681091308594, 0.029659271240234375, 0.033043861389160156, 0.03642845153808594, 0.03981304168701172, 0.0431976318359375, 0.04658222198486328, 0.04996681213378906, 0.053351402282714844, 0.056735992431640625, 0.060120582580566406, 0.06350517272949219, 0.06688976287841797, 0.07027435302734375, 0.07365894317626953, 0.07704353332519531, 0.0804281234741211, 0.08381271362304688, 0.08719730377197266, 0.09058189392089844, 0.09396648406982422, 0.09735107421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 6.0, 4.0, 7.0, 12.0, 19.0, 14.0, 29.0, 50.0, 50.0, 81.0, 111.0, 170.0, 199.0, 266.0, 396.0, 528.0, 711.0, 1098.0, 1527.0, 2350.0, 4023.0, 6835.0, 13751.0, 32215.0, 277350.0, 3773593.0, 41755.0, 16277.0, 8094.0, 4450.0, 2719.0, 1623.0, 1168.0, 770.0, 567.0, 402.0, 295.0, 201.0, 161.0, 115.0, 79.0, 55.0, 51.0, 37.0, 22.0, 13.0, 9.0, 11.0, 5.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.246337890625, -0.23866653442382812, -0.23099517822265625, -0.22332382202148438, -0.2156524658203125, -0.20798110961914062, -0.20030975341796875, -0.19263839721679688, -0.184967041015625, -0.17729568481445312, -0.16962432861328125, -0.16195297241210938, -0.1542816162109375, -0.14661026000976562, -0.13893890380859375, -0.13126754760742188, -0.12359619140625, -0.11592483520507812, -0.10825347900390625, -0.10058212280273438, -0.0929107666015625, -0.08523941040039062, -0.07756805419921875, -0.06989669799804688, -0.062225341796875, -0.054553985595703125, -0.04688262939453125, -0.039211273193359375, -0.0315399169921875, -0.023868560791015625, -0.01619720458984375, -0.008525848388671875, -0.0008544921875, 0.006816864013671875, 0.01448822021484375, 0.022159576416015625, 0.0298309326171875, 0.037502288818359375, 0.04517364501953125, 0.052845001220703125, 0.060516357421875, 0.06818771362304688, 0.07585906982421875, 0.08353042602539062, 0.0912017822265625, 0.09887313842773438, 0.10654449462890625, 0.11421585083007812, 0.12188720703125, 0.12955856323242188, 0.13722991943359375, 0.14490127563476562, 0.1525726318359375, 0.16024398803710938, 0.16791534423828125, 0.17558670043945312, 0.183258056640625, 0.19092941284179688, 0.19860076904296875, 0.20627212524414062, 0.2139434814453125, 0.22161483764648438, 0.22928619384765625, 0.23695755004882812, 0.24462890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 7.0, 7.0, 5.0, 11.0, 11.0, 16.0, 32.0, 64.0, 494.0, 3168.0, 95.0, 34.0, 22.0, 17.0, 12.0, 11.0, 12.0, 8.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.133056640625, -0.1290416717529297, -0.12502670288085938, -0.12101173400878906, -0.11699676513671875, -0.11298179626464844, -0.10896682739257812, -0.10495185852050781, -0.1009368896484375, -0.09692192077636719, -0.09290695190429688, -0.08889198303222656, -0.08487701416015625, -0.08086204528808594, -0.07684707641601562, -0.07283210754394531, -0.068817138671875, -0.06480216979980469, -0.060787200927734375, -0.05677223205566406, -0.05275726318359375, -0.04874229431152344, -0.044727325439453125, -0.04071235656738281, -0.0366973876953125, -0.03268241882324219, -0.028667449951171875, -0.024652481079101562, -0.02063751220703125, -0.016622543334960938, -0.012607574462890625, -0.008592605590820312, -0.00457763671875, -0.0005626678466796875, 0.003452301025390625, 0.0074672698974609375, 0.01148223876953125, 0.015497207641601562, 0.019512176513671875, 0.023527145385742188, 0.0275421142578125, 0.03155708312988281, 0.035572052001953125, 0.03958702087402344, 0.04360198974609375, 0.04761695861816406, 0.051631927490234375, 0.05564689636230469, 0.059661865234375, 0.06367683410644531, 0.06769180297851562, 0.07170677185058594, 0.07572174072265625, 0.07973670959472656, 0.08375167846679688, 0.08776664733886719, 0.0917816162109375, 0.09579658508300781, 0.09981155395507812, 0.10382652282714844, 0.10784149169921875, 0.11185646057128906, 0.11587142944335938, 0.11988639831542969, 0.1239013671875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 0.0, 5.0, 6.0, 6.0, 13.0, 6.0, 13.0, 10.0, 18.0, 24.0, 38.0, 57.0, 85.0, 117.0, 151.0, 121.0, 97.0, 60.0, 43.0, 21.0, 22.0, 18.0, 16.0, 8.0, 8.0, 6.0, 5.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37012985348701477, -0.3580525815486908, -0.3459753394126892, -0.33389806747436523, -0.32182079553604126, -0.3097435534000397, -0.2976662814617157, -0.2855890393257141, -0.27351176738739014, -0.26143449544906616, -0.24935725331306458, -0.2372799813747406, -0.22520272433757782, -0.21312546730041504, -0.20104819536209106, -0.18897093832492828, -0.1768936812877655, -0.16481642425060272, -0.15273916721343994, -0.14066189527511597, -0.12858463823795319, -0.1165073812007904, -0.10443011671304703, -0.09235285222530365, -0.08027559518814087, -0.06819833815097809, -0.05612107366323471, -0.04404381290078163, -0.03196655213832855, -0.019889291375875473, -0.007812030613422394, 0.004265233874320984, 0.016342461109161377, 0.028419721871614456, 0.040496982634067535, 0.052574243396520615, 0.0646515041589737, 0.07672876119613647, 0.08880602568387985, 0.10088329017162323, 0.11296054720878601, 0.1250378042459488, 0.13711506128311157, 0.14919233322143555, 0.16126959025859833, 0.1733468472957611, 0.18542411923408508, 0.19750137627124786, 0.20957863330841064, 0.22165589034557343, 0.2337331473827362, 0.24581041932106018, 0.25788766145706177, 0.26996493339538574, 0.2820422053337097, 0.2941194772720337, 0.3061967194080353, 0.31827399134635925, 0.33035123348236084, 0.3424285054206848, 0.3545057773590088, 0.3665830194950104, 0.37866029143333435, 0.39073753356933594, 0.4028148055076599]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 4.0, 2.0, 6.0, 5.0, 5.0, 4.0, 14.0, 9.0, 19.0, 16.0, 16.0, 15.0, 21.0, 24.0, 22.0, 28.0, 26.0, 29.0, 29.0, 28.0, 40.0, 50.0, 29.0, 48.0, 40.0, 44.0, 37.0, 35.0, 36.0, 35.0, 33.0, 37.0, 37.0, 26.0, 22.0, 19.0, 21.0, 18.0, 14.0, 18.0, 10.0, 9.0, 6.0, 7.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23685616254806519, -0.22855837643146515, -0.2202605903148651, -0.21196278929710388, -0.20366500318050385, -0.1953672170639038, -0.18706943094730377, -0.17877164483070374, -0.1704738438129425, -0.16217605769634247, -0.15387827157974243, -0.1455804705619812, -0.13728268444538116, -0.12898489832878113, -0.12068711221218109, -0.11238932609558105, -0.10409153997898102, -0.09579375386238098, -0.08749596029520035, -0.07919817417860031, -0.07090038061141968, -0.06260259449481964, -0.054304808378219604, -0.04600701853632927, -0.037709228694438934, -0.0294114388525486, -0.021113650873303413, -0.012815862894058228, -0.0045180730521678925, 0.0037797167897224426, 0.01207750290632248, 0.020375292748212814, 0.02867308259010315, 0.036970872431993484, 0.04526866227388382, 0.053566448390483856, 0.06186423823237419, 0.07016202807426453, 0.07845981419086456, 0.0867576003074646, 0.09505539387464523, 0.10335317999124527, 0.1116509735584259, 0.11994875967502594, 0.12824654579162598, 0.1365443468093872, 0.14484211802482605, 0.15313991904258728, 0.16143770515918732, 0.16973549127578735, 0.1780332773923874, 0.18633106350898743, 0.19462886452674866, 0.2029266506433487, 0.21122443675994873, 0.21952222287654877, 0.2278200089931488, 0.23611779510974884, 0.24441558122634888, 0.2527133822441101, 0.26101115345954895, 0.2693089544773102, 0.277606725692749, 0.28590452671051025, 0.2942023277282715]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 11.0, 7.0, 9.0, 19.0, 22.0, 36.0, 49.0, 58.0, 90.0, 114.0, 172.0, 229.0, 404.0, 630.0, 1047.0, 1943.0, 4342.0, 10782.0, 35378.0, 156542.0, 644157.0, 140687.0, 32953.0, 10240.0, 4031.0, 1863.0, 947.0, 569.0, 368.0, 238.0, 173.0, 123.0, 85.0, 73.0, 48.0, 29.0, 21.0, 23.0, 12.0, 5.0, 10.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4342002868652344, -0.42040252685546875, -0.4066047668457031, -0.3928070068359375, -0.3790092468261719, -0.36521148681640625, -0.3514137268066406, -0.337615966796875, -0.3238182067871094, -0.31002044677734375, -0.2962226867675781, -0.2824249267578125, -0.2686271667480469, -0.25482940673828125, -0.24103164672851562, -0.22723388671875, -0.21343612670898438, -0.19963836669921875, -0.18584060668945312, -0.1720428466796875, -0.15824508666992188, -0.14444732666015625, -0.13064956665039062, -0.116851806640625, -0.10305404663085938, -0.08925628662109375, -0.07545852661132812, -0.0616607666015625, -0.047863006591796875, -0.03406524658203125, -0.020267486572265625, -0.0064697265625, 0.007328033447265625, 0.02112579345703125, 0.034923553466796875, 0.0487213134765625, 0.06251907348632812, 0.07631683349609375, 0.09011459350585938, 0.103912353515625, 0.11771011352539062, 0.13150787353515625, 0.14530563354492188, 0.1591033935546875, 0.17290115356445312, 0.18669891357421875, 0.20049667358398438, 0.21429443359375, 0.22809219360351562, 0.24188995361328125, 0.2556877136230469, 0.2694854736328125, 0.2832832336425781, 0.29708099365234375, 0.3108787536621094, 0.324676513671875, 0.3384742736816406, 0.35227203369140625, 0.3660697937011719, 0.3798675537109375, 0.3936653137207031, 0.40746307373046875, 0.4212608337402344, 0.43505859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 7.0, 8.0, 21.0, 22.0, 34.0, 57.0, 72.0, 92.0, 108.0, 124.0, 97.0, 95.0, 74.0, 66.0, 45.0, 27.0, 22.0, 16.0, 5.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1212158203125, -0.11771297454833984, -0.11421012878417969, -0.11070728302001953, -0.10720443725585938, -0.10370159149169922, -0.10019874572753906, -0.0966958999633789, -0.09319305419921875, -0.0896902084350586, -0.08618736267089844, -0.08268451690673828, -0.07918167114257812, -0.07567882537841797, -0.07217597961425781, -0.06867313385009766, -0.0651702880859375, -0.061667442321777344, -0.05816459655761719, -0.05466175079345703, -0.051158905029296875, -0.04765605926513672, -0.04415321350097656, -0.040650367736816406, -0.03714752197265625, -0.033644676208496094, -0.030141830444335938, -0.02663898468017578, -0.023136138916015625, -0.01963329315185547, -0.016130447387695312, -0.012627601623535156, -0.009124755859375, -0.005621910095214844, -0.0021190643310546875, 0.0013837814331054688, 0.004886627197265625, 0.008389472961425781, 0.011892318725585938, 0.015395164489746094, 0.01889801025390625, 0.022400856018066406, 0.025903701782226562, 0.02940654754638672, 0.032909393310546875, 0.03641223907470703, 0.03991508483886719, 0.043417930603027344, 0.0469207763671875, 0.050423622131347656, 0.05392646789550781, 0.05742931365966797, 0.060932159423828125, 0.06443500518798828, 0.06793785095214844, 0.0714406967163086, 0.07494354248046875, 0.0784463882446289, 0.08194923400878906, 0.08545207977294922, 0.08895492553710938, 0.09245777130126953, 0.09596061706542969, 0.09946346282958984, 0.10296630859375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 18.0, 9.0, 16.0, 22.0, 45.0, 66.0, 75.0, 128.0, 228.0, 334.0, 503.0, 763.0, 1219.0, 1976.0, 3300.0, 5496.0, 8668.0, 15070.0, 25352.0, 45077.0, 84151.0, 190519.0, 351078.0, 149058.0, 70922.0, 38753.0, 22242.0, 13118.0, 7865.0, 4717.0, 2893.0, 1802.0, 1158.0, 660.0, 418.0, 281.0, 198.0, 121.0, 91.0, 42.0, 35.0, 23.0, 20.0, 10.0, 5.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1541748046875, -0.1494121551513672, -0.14464950561523438, -0.13988685607910156, -0.13512420654296875, -0.13036155700683594, -0.12559890747070312, -0.12083625793457031, -0.1160736083984375, -0.11131095886230469, -0.10654830932617188, -0.10178565979003906, -0.09702301025390625, -0.09226036071777344, -0.08749771118164062, -0.08273506164550781, -0.077972412109375, -0.07320976257324219, -0.06844711303710938, -0.06368446350097656, -0.05892181396484375, -0.05415916442871094, -0.049396514892578125, -0.04463386535644531, -0.0398712158203125, -0.03510856628417969, -0.030345916748046875, -0.025583267211914062, -0.02082061767578125, -0.016057968139648438, -0.011295318603515625, -0.0065326690673828125, -0.00177001953125, 0.0029926300048828125, 0.007755279541015625, 0.012517929077148438, 0.01728057861328125, 0.022043228149414062, 0.026805877685546875, 0.03156852722167969, 0.0363311767578125, 0.04109382629394531, 0.045856475830078125, 0.05061912536621094, 0.05538177490234375, 0.06014442443847656, 0.06490707397460938, 0.06966972351074219, 0.074432373046875, 0.07919502258300781, 0.08395767211914062, 0.08872032165527344, 0.09348297119140625, 0.09824562072753906, 0.10300827026367188, 0.10777091979980469, 0.1125335693359375, 0.11729621887207031, 0.12205886840820312, 0.12682151794433594, 0.13158416748046875, 0.13634681701660156, 0.14110946655273438, 0.1458721160888672, 0.150634765625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 0.0, 4.0, 3.0, 4.0, 6.0, 3.0, 11.0, 19.0, 15.0, 16.0, 13.0, 21.0, 23.0, 22.0, 26.0, 37.0, 25.0, 48.0, 31.0, 28.0, 27.0, 39.0, 45.0, 37.0, 43.0, 29.0, 39.0, 34.0, 42.0, 29.0, 28.0, 34.0, 23.0, 24.0, 23.0, 23.0, 28.0, 21.0, 8.0, 17.0, 13.0, 10.0, 7.0, 11.0, 5.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1474609375, -0.14209747314453125, -0.1367340087890625, -0.13137054443359375, -0.126007080078125, -0.12064361572265625, -0.1152801513671875, -0.10991668701171875, -0.10455322265625, -0.09918975830078125, -0.0938262939453125, -0.08846282958984375, -0.083099365234375, -0.07773590087890625, -0.0723724365234375, -0.06700897216796875, -0.0616455078125, -0.05628204345703125, -0.0509185791015625, -0.04555511474609375, -0.040191650390625, -0.03482818603515625, -0.0294647216796875, -0.02410125732421875, -0.01873779296875, -0.01337432861328125, -0.0080108642578125, -0.00264739990234375, 0.002716064453125, 0.00807952880859375, 0.0134429931640625, 0.01880645751953125, 0.024169921875, 0.02953338623046875, 0.0348968505859375, 0.04026031494140625, 0.045623779296875, 0.05098724365234375, 0.0563507080078125, 0.06171417236328125, 0.06707763671875, 0.07244110107421875, 0.0778045654296875, 0.08316802978515625, 0.088531494140625, 0.09389495849609375, 0.0992584228515625, 0.10462188720703125, 0.1099853515625, 0.11534881591796875, 0.1207122802734375, 0.12607574462890625, 0.131439208984375, 0.13680267333984375, 0.1421661376953125, 0.14752960205078125, 0.15289306640625, 0.15825653076171875, 0.1636199951171875, 0.16898345947265625, 0.174346923828125, 0.17971038818359375, 0.1850738525390625, 0.19043731689453125, 0.19580078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 10.0, 26.0, 23.0, 48.0, 82.0, 149.0, 306.0, 480.0, 1053.0, 2079.0, 4724.0, 12009.0, 38597.0, 233361.0, 650442.0, 73064.0, 19289.0, 6969.0, 2925.0, 1392.0, 702.0, 324.0, 188.0, 117.0, 72.0, 40.0, 20.0, 12.0, 12.0, 7.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.04681396484375, -0.04558897018432617, -0.044363975524902344, -0.043138980865478516, -0.04191398620605469, -0.04068899154663086, -0.03946399688720703, -0.0382390022277832, -0.037014007568359375, -0.03578901290893555, -0.03456401824951172, -0.03333902359008789, -0.03211402893066406, -0.030889034271240234, -0.029664039611816406, -0.028439044952392578, -0.02721405029296875, -0.025989055633544922, -0.024764060974121094, -0.023539066314697266, -0.022314071655273438, -0.02108907699584961, -0.01986408233642578, -0.018639087677001953, -0.017414093017578125, -0.016189098358154297, -0.014964103698730469, -0.01373910903930664, -0.012514114379882812, -0.011289119720458984, -0.010064125061035156, -0.008839130401611328, -0.0076141357421875, -0.006389141082763672, -0.005164146423339844, -0.003939151763916016, -0.0027141571044921875, -0.0014891624450683594, -0.00026416778564453125, 0.0009608268737792969, 0.002185821533203125, 0.003410816192626953, 0.004635810852050781, 0.005860805511474609, 0.0070858001708984375, 0.008310794830322266, 0.009535789489746094, 0.010760784149169922, 0.01198577880859375, 0.013210773468017578, 0.014435768127441406, 0.015660762786865234, 0.016885757446289062, 0.01811075210571289, 0.01933574676513672, 0.020560741424560547, 0.021785736083984375, 0.023010730743408203, 0.02423572540283203, 0.02546072006225586, 0.026685714721679688, 0.027910709381103516, 0.029135704040527344, 0.030360698699951172, 0.031585693359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 2.0, 6.0, 5.0, 12.0, 13.0, 37.0, 30.0, 48.0, 76.0, 58.0, 79.0, 113.0, 89.0, 87.0, 118.0, 61.0, 55.0, 26.0, 19.0, 19.0, 11.0, 8.0, 12.0, 3.0, 4.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.649162292480469e-06, -4.448927938938141e-06, -4.248693585395813e-06, -4.048459231853485e-06, -3.848224878311157e-06, -3.6479905247688293e-06, -3.4477561712265015e-06, -3.2475218176841736e-06, -3.0472874641418457e-06, -2.847053110599518e-06, -2.64681875705719e-06, -2.446584403514862e-06, -2.246350049972534e-06, -2.0461156964302063e-06, -1.8458813428878784e-06, -1.6456469893455505e-06, -1.4454126358032227e-06, -1.2451782822608948e-06, -1.044943928718567e-06, -8.44709575176239e-07, -6.444752216339111e-07, -4.4424086809158325e-07, -2.4400651454925537e-07, -4.377216100692749e-08, 1.564621925354004e-07, 3.5669654607772827e-07, 5.569308996200562e-07, 7.57165253162384e-07, 9.57399606704712e-07, 1.1576339602470398e-06, 1.3578683137893677e-06, 1.5581026673316956e-06, 1.7583370208740234e-06, 1.9585713744163513e-06, 2.158805727958679e-06, 2.359040081501007e-06, 2.559274435043335e-06, 2.759508788585663e-06, 2.9597431421279907e-06, 3.1599774956703186e-06, 3.3602118492126465e-06, 3.5604462027549744e-06, 3.7606805562973022e-06, 3.96091490983963e-06, 4.161149263381958e-06, 4.361383616924286e-06, 4.561617970466614e-06, 4.761852324008942e-06, 4.9620866775512695e-06, 5.162321031093597e-06, 5.362555384635925e-06, 5.562789738178253e-06, 5.763024091720581e-06, 5.963258445262909e-06, 6.163492798805237e-06, 6.363727152347565e-06, 6.563961505889893e-06, 6.7641958594322205e-06, 6.964430212974548e-06, 7.164664566516876e-06, 7.364898920059204e-06, 7.565133273601532e-06, 7.76536762714386e-06, 7.965601980686188e-06, 8.165836334228516e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 12.0, 16.0, 24.0, 33.0, 52.0, 78.0, 106.0, 194.0, 362.0, 572.0, 980.0, 1889.0, 3670.0, 7988.0, 20466.0, 74317.0, 586643.0, 278711.0, 45167.0, 14518.0, 6280.0, 2938.0, 1432.0, 846.0, 508.0, 244.0, 168.0, 116.0, 63.0, 55.0, 39.0, 16.0, 13.0, 9.0, 12.0, 3.0, 8.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0294189453125, -0.028464794158935547, -0.027510643005371094, -0.02655649185180664, -0.025602340698242188, -0.024648189544677734, -0.02369403839111328, -0.022739887237548828, -0.021785736083984375, -0.020831584930419922, -0.01987743377685547, -0.018923282623291016, -0.017969131469726562, -0.01701498031616211, -0.016060829162597656, -0.015106678009033203, -0.01415252685546875, -0.013198375701904297, -0.012244224548339844, -0.01129007339477539, -0.010335922241210938, -0.009381771087646484, -0.008427619934082031, -0.007473468780517578, -0.006519317626953125, -0.005565166473388672, -0.004611015319824219, -0.0036568641662597656, -0.0027027130126953125, -0.0017485618591308594, -0.0007944107055664062, 0.00015974044799804688, 0.0011138916015625, 0.002068042755126953, 0.0030221939086914062, 0.003976345062255859, 0.0049304962158203125, 0.005884647369384766, 0.006838798522949219, 0.007792949676513672, 0.008747100830078125, 0.009701251983642578, 0.010655403137207031, 0.011609554290771484, 0.012563705444335938, 0.01351785659790039, 0.014472007751464844, 0.015426158905029297, 0.01638031005859375, 0.017334461212158203, 0.018288612365722656, 0.01924276351928711, 0.020196914672851562, 0.021151065826416016, 0.02210521697998047, 0.023059368133544922, 0.024013519287109375, 0.024967670440673828, 0.02592182159423828, 0.026875972747802734, 0.027830123901367188, 0.02878427505493164, 0.029738426208496094, 0.030692577362060547, 0.031646728515625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 10.0, 5.0, 2.0, 10.0, 13.0, 14.0, 14.0, 24.0, 37.0, 51.0, 70.0, 77.0, 102.0, 143.0, 113.0, 84.0, 82.0, 43.0, 24.0, 23.0, 9.0, 8.0, 10.0, 9.0, 7.0, 4.0, 1.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03271484375, -0.03179574012756348, -0.030876636505126953, -0.02995753288269043, -0.029038429260253906, -0.028119325637817383, -0.02720022201538086, -0.026281118392944336, -0.025362014770507812, -0.02444291114807129, -0.023523807525634766, -0.022604703903198242, -0.02168560028076172, -0.020766496658325195, -0.019847393035888672, -0.01892828941345215, -0.018009185791015625, -0.0170900821685791, -0.016170978546142578, -0.015251874923706055, -0.014332771301269531, -0.013413667678833008, -0.012494564056396484, -0.011575460433959961, -0.010656356811523438, -0.009737253189086914, -0.00881814956665039, -0.007899045944213867, -0.006979942321777344, -0.00606083869934082, -0.005141735076904297, -0.0042226314544677734, -0.00330352783203125, -0.0023844242095947266, -0.0014653205871582031, -0.0005462169647216797, 0.00037288665771484375, 0.0012919902801513672, 0.0022110939025878906, 0.003130197525024414, 0.0040493011474609375, 0.004968404769897461, 0.005887508392333984, 0.006806612014770508, 0.007725715637207031, 0.008644819259643555, 0.009563922882080078, 0.010483026504516602, 0.011402130126953125, 0.012321233749389648, 0.013240337371826172, 0.014159440994262695, 0.015078544616699219, 0.015997648239135742, 0.016916751861572266, 0.01783585548400879, 0.018754959106445312, 0.019674062728881836, 0.02059316635131836, 0.021512269973754883, 0.022431373596191406, 0.02335047721862793, 0.024269580841064453, 0.025188684463500977, 0.0261077880859375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 8.0, 9.0, 13.0, 8.0, 14.0, 20.0, 27.0, 41.0, 57.0, 70.0, 145.0, 189.0, 134.0, 84.0, 52.0, 25.0, 24.0, 21.0, 19.0, 9.0, 6.0, 3.0, 7.0, 3.0, 3.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-1.807403564453125, -1.7669123411178589, -1.7264211177825928, -1.685929775238037, -1.645438551902771, -1.6049473285675049, -1.5644559860229492, -1.523964762687683, -1.483473539352417, -1.4429823160171509, -1.4024910926818848, -1.361999750137329, -1.321508526802063, -1.2810173034667969, -1.2405259609222412, -1.200034737586975, -1.159543514251709, -1.1190522909164429, -1.0785610675811768, -1.038069725036621, -0.997578501701355, -0.9570872783660889, -0.916595995426178, -0.8761047124862671, -0.835613489151001, -0.7951222658157349, -0.754630982875824, -0.7141396999359131, -0.673648476600647, -0.6331572532653809, -0.59266597032547, -0.5521746873855591, -0.5116835832595825, -0.471192330121994, -0.4307010769844055, -0.390209823846817, -0.3497185707092285, -0.30922731757164, -0.2687360644340515, -0.228244811296463, -0.1877535581588745, -0.147262305021286, -0.10677105188369751, -0.06627979874610901, -0.025788545608520508, 0.014702707529067993, 0.055193960666656494, 0.095685213804245, 0.1361764669418335, 0.176667720079422, 0.2171589732170105, 0.257650226354599, 0.2981414794921875, 0.338632732629776, 0.3791239857673645, 0.419615238904953, 0.4601064920425415, 0.5005977153778076, 0.5410889983177185, 0.5815802812576294, 0.6220715045928955, 0.6625627279281616, 0.7030540108680725, 0.7435452938079834, 0.7840365171432495]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 8.0, 8.0, 11.0, 12.0, 15.0, 18.0, 20.0, 24.0, 29.0, 33.0, 29.0, 34.0, 35.0, 35.0, 50.0, 44.0, 40.0, 61.0, 57.0, 52.0, 55.0, 36.0, 48.0, 33.0, 25.0, 33.0, 20.0, 29.0, 17.0, 17.0, 18.0, 13.0, 4.0, 13.0, 4.0, 3.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7344107031822205, -0.705753743648529, -0.6770967245101929, -0.6484397649765015, -0.6197828054428101, -0.5911257863044739, -0.5624688267707825, -0.5338118076324463, -0.5051548480987549, -0.4764978587627411, -0.4478408694267273, -0.4191839098930359, -0.3905269205570221, -0.3618699312210083, -0.3332129716873169, -0.3045559823513031, -0.2758989930152893, -0.2472420036792755, -0.2185850292444229, -0.1899280548095703, -0.16127106547355652, -0.13261407613754272, -0.10395710170269012, -0.07530012726783752, -0.04664313793182373, -0.017986156046390533, 0.010670825839042664, 0.03932780772447586, 0.06798478960990906, 0.09664177894592285, 0.12529875338077545, 0.15395572781562805, 0.18261265754699707, 0.21126964688301086, 0.23992662131786346, 0.26858359575271606, 0.29724058508872986, 0.32589757442474365, 0.35455453395843506, 0.38321152329444885, 0.41186851263046265, 0.44052550196647644, 0.46918249130249023, 0.49783945083618164, 0.526496410369873, 0.5551534295082092, 0.5838103890419006, 0.6124674081802368, 0.6411243677139282, 0.6697813272476196, 0.6984383463859558, 0.7270953059196472, 0.7557523250579834, 0.7844092845916748, 0.8130662441253662, 0.8417232036590576, 0.8703802227973938, 0.8990371823310852, 0.9276942014694214, 0.9563511610031128, 0.9850081205368042, 1.0136651992797852, 1.0423221588134766, 1.070979118347168, 1.0996360778808594]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 10.0, 19.0, 15.0, 38.0, 56.0, 104.0, 229.0, 441.0, 1543.0, 8511.0, 4150499.0, 28415.0, 3039.0, 698.0, 272.0, 158.0, 84.0, 53.0, 38.0, 26.0, 8.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.4755859375, -1.4342803955078125, -1.392974853515625, -1.3516693115234375, -1.31036376953125, -1.2690582275390625, -1.227752685546875, -1.1864471435546875, -1.1451416015625, -1.1038360595703125, -1.062530517578125, -1.0212249755859375, -0.97991943359375, -0.9386138916015625, -0.897308349609375, -0.8560028076171875, -0.814697265625, -0.7733917236328125, -0.732086181640625, -0.6907806396484375, -0.64947509765625, -0.6081695556640625, -0.566864013671875, -0.5255584716796875, -0.4842529296875, -0.4429473876953125, -0.401641845703125, -0.3603363037109375, -0.31903076171875, -0.2777252197265625, -0.236419677734375, -0.1951141357421875, -0.15380859375, -0.1125030517578125, -0.071197509765625, -0.0298919677734375, 0.01141357421875, 0.0527191162109375, 0.094024658203125, 0.1353302001953125, 0.1766357421875, 0.2179412841796875, 0.259246826171875, 0.3005523681640625, 0.34185791015625, 0.3831634521484375, 0.424468994140625, 0.4657745361328125, 0.507080078125, 0.5483856201171875, 0.589691162109375, 0.6309967041015625, 0.67230224609375, 0.7136077880859375, 0.754913330078125, 0.7962188720703125, 0.8375244140625, 0.8788299560546875, 0.920135498046875, 0.9614410400390625, 1.00274658203125, 1.0440521240234375, 1.085357666015625, 1.1266632080078125, 1.16796875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 12.0, 13.0, 24.0, 33.0, 66.0, 72.0, 93.0, 112.0, 118.0, 116.0, 92.0, 69.0, 67.0, 42.0, 29.0, 16.0, 14.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12152099609375, -0.11789798736572266, -0.11427497863769531, -0.11065196990966797, -0.10702896118164062, -0.10340595245361328, -0.09978294372558594, -0.0961599349975586, -0.09253692626953125, -0.0889139175415039, -0.08529090881347656, -0.08166790008544922, -0.07804489135742188, -0.07442188262939453, -0.07079887390136719, -0.06717586517333984, -0.0635528564453125, -0.059929847717285156, -0.05630683898925781, -0.05268383026123047, -0.049060821533203125, -0.04543781280517578, -0.04181480407714844, -0.038191795349121094, -0.03456878662109375, -0.030945777893066406, -0.027322769165039062, -0.02369976043701172, -0.020076751708984375, -0.01645374298095703, -0.012830734252929688, -0.009207725524902344, -0.005584716796875, -0.0019617080688476562, 0.0016613006591796875, 0.005284309387207031, 0.008907318115234375, 0.012530326843261719, 0.016153335571289062, 0.019776344299316406, 0.02339935302734375, 0.027022361755371094, 0.030645370483398438, 0.03426837921142578, 0.037891387939453125, 0.04151439666748047, 0.04513740539550781, 0.048760414123535156, 0.0523834228515625, 0.056006431579589844, 0.05962944030761719, 0.06325244903564453, 0.06687545776367188, 0.07049846649169922, 0.07412147521972656, 0.0777444839477539, 0.08136749267578125, 0.0849905014038086, 0.08861351013183594, 0.09223651885986328, 0.09585952758789062, 0.09948253631591797, 0.10310554504394531, 0.10672855377197266, 0.1103515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 11.0, 5.0, 5.0, 11.0, 9.0, 19.0, 24.0, 29.0, 35.0, 61.0, 83.0, 153.0, 313.0, 691.0, 1455.0, 3308.0, 7874.0, 23063.0, 286431.0, 3827805.0, 27134.0, 8951.0, 3679.0, 1590.0, 749.0, 342.0, 148.0, 93.0, 72.0, 20.0, 29.0, 28.0, 22.0, 8.0, 7.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4697265625, -0.455078125, -0.4404296875, -0.42578125, -0.4111328125, -0.396484375, -0.3818359375, -0.3671875, -0.3525390625, -0.337890625, -0.3232421875, -0.30859375, -0.2939453125, -0.279296875, -0.2646484375, -0.25, -0.2353515625, -0.220703125, -0.2060546875, -0.19140625, -0.1767578125, -0.162109375, -0.1474609375, -0.1328125, -0.1181640625, -0.103515625, -0.0888671875, -0.07421875, -0.0595703125, -0.044921875, -0.0302734375, -0.015625, -0.0009765625, 0.013671875, 0.0283203125, 0.04296875, 0.0576171875, 0.072265625, 0.0869140625, 0.1015625, 0.1162109375, 0.130859375, 0.1455078125, 0.16015625, 0.1748046875, 0.189453125, 0.2041015625, 0.21875, 0.2333984375, 0.248046875, 0.2626953125, 0.27734375, 0.2919921875, 0.306640625, 0.3212890625, 0.3359375, 0.3505859375, 0.365234375, 0.3798828125, 0.39453125, 0.4091796875, 0.423828125, 0.4384765625, 0.453125, 0.4677734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 5.0, 3.0, 5.0, 3.0, 9.0, 6.0, 13.0, 11.0, 21.0, 28.0, 41.0, 150.0, 3514.0, 152.0, 36.0, 19.0, 11.0, 11.0, 9.0, 3.0, 7.0, 5.0, 8.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.2364501953125, -0.23125076293945312, -0.22605133056640625, -0.22085189819335938, -0.2156524658203125, -0.21045303344726562, -0.20525360107421875, -0.20005416870117188, -0.194854736328125, -0.18965530395507812, -0.18445587158203125, -0.17925643920898438, -0.1740570068359375, -0.16885757446289062, -0.16365814208984375, -0.15845870971679688, -0.15325927734375, -0.14805984497070312, -0.14286041259765625, -0.13766098022460938, -0.1324615478515625, -0.12726211547851562, -0.12206268310546875, -0.11686325073242188, -0.111663818359375, -0.10646438598632812, -0.10126495361328125, -0.09606552124023438, -0.0908660888671875, -0.08566665649414062, -0.08046722412109375, -0.07526779174804688, -0.070068359375, -0.06486892700195312, -0.05966949462890625, -0.054470062255859375, -0.0492706298828125, -0.044071197509765625, -0.03887176513671875, -0.033672332763671875, -0.028472900390625, -0.023273468017578125, -0.01807403564453125, -0.012874603271484375, -0.0076751708984375, -0.002475738525390625, 0.00272369384765625, 0.007923126220703125, 0.01312255859375, 0.018321990966796875, 0.02352142333984375, 0.028720855712890625, 0.0339202880859375, 0.039119720458984375, 0.04431915283203125, 0.049518585205078125, 0.054718017578125, 0.059917449951171875, 0.06511688232421875, 0.07031631469726562, 0.0755157470703125, 0.08071517944335938, 0.08591461181640625, 0.09111404418945312, 0.0963134765625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 20.0, 33.0, 121.0, 477.0, 306.0, 47.0, 3.0, 3.0, 1.0, 1.0], "bins": [-3.821107864379883, -3.755127429962158, -3.6891469955444336, -3.623166561126709, -3.5571861267089844, -3.4912056922912598, -3.425225257873535, -3.3592448234558105, -3.293264389038086, -3.2272839546203613, -3.1613035202026367, -3.095323085784912, -3.0293426513671875, -2.963362216949463, -2.8973817825317383, -2.8314013481140137, -2.765420913696289, -2.6994404792785645, -2.63346004486084, -2.5674796104431152, -2.5014991760253906, -2.435518741607666, -2.3695383071899414, -2.303557872772217, -2.237577199935913, -2.1715967655181885, -2.105616331100464, -2.0396358966827393, -1.9736554622650146, -1.90767502784729, -1.8416945934295654, -1.7757141590118408, -1.7097337245941162, -1.6437532901763916, -1.577772855758667, -1.5117924213409424, -1.4458119869232178, -1.3798315525054932, -1.3138511180877686, -1.247870683670044, -1.1818902492523193, -1.1159098148345947, -1.0499293804168701, -0.9839489459991455, -0.9179685115814209, -0.8519880771636963, -0.7860075831413269, -0.7200271487236023, -0.6540466547012329, -0.5880662202835083, -0.5220857858657837, -0.4561053216457367, -0.3901248872280121, -0.3241444528102875, -0.2581639885902405, -0.19218355417251587, -0.12620314955711365, -0.06022270768880844, 0.005757734179496765, 0.07173818349838257, 0.13771861791610718, 0.2036990523338318, 0.2696795165538788, 0.3356599509716034, 0.401640385389328]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 10.0, 17.0, 17.0, 25.0, 27.0, 37.0, 57.0, 53.0, 49.0, 80.0, 67.0, 71.0, 61.0, 78.0, 56.0, 59.0, 53.0, 37.0, 39.0, 25.0, 23.0, 23.0, 10.0, 11.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4907100200653076, -0.476390540599823, -0.4620710611343384, -0.44775155186653137, -0.43343207240104675, -0.41911259293556213, -0.4047931134700775, -0.3904736042022705, -0.3761541247367859, -0.36183464527130127, -0.34751516580581665, -0.33319565653800964, -0.318876177072525, -0.3045566976070404, -0.2902372181415558, -0.2759177088737488, -0.26159822940826416, -0.24727874994277954, -0.23295925557613373, -0.2186397761106491, -0.2043202817440033, -0.19000080227851868, -0.17568132281303406, -0.16136182844638824, -0.14704236388206482, -0.1327228844165802, -0.11840339004993439, -0.10408391058444977, -0.08976441621780396, -0.07544493675231934, -0.06112544983625412, -0.046805962920188904, -0.03248646855354309, -0.018166981637477875, -0.003847496584057808, 0.010471988469362259, 0.024791475385427475, 0.03911095857620239, 0.05343044549226761, 0.06774993240833282, 0.08206941932439804, 0.09638890624046326, 0.11070839315652847, 0.1250278800725937, 0.1393473595380783, 0.15366685390472412, 0.16798633337020874, 0.18230581283569336, 0.19662530720233917, 0.2109447866678238, 0.2252642810344696, 0.23958376049995422, 0.25390323996543884, 0.26822274923324585, 0.28254222869873047, 0.2968617081642151, 0.3111811876296997, 0.3255006670951843, 0.33982014656066895, 0.35413965582847595, 0.36845913529396057, 0.3827786147594452, 0.3970980942249298, 0.4114176034927368, 0.42573708295822144]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 2.0, 0.0, 4.0, 2.0, 2.0, 10.0, 5.0, 4.0, 7.0, 16.0, 27.0, 40.0, 60.0, 70.0, 115.0, 170.0, 256.0, 442.0, 711.0, 1165.0, 2406.0, 6402.0, 23481.0, 115972.0, 702981.0, 151691.0, 28799.0, 7662.0, 2696.0, 1309.0, 720.0, 440.0, 303.0, 171.0, 123.0, 99.0, 72.0, 34.0, 24.0, 24.0, 10.0, 6.0, 3.0, 4.0, 1.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.50634765625, -0.48978424072265625, -0.4732208251953125, -0.45665740966796875, -0.440093994140625, -0.42353057861328125, -0.4069671630859375, -0.39040374755859375, -0.37384033203125, -0.35727691650390625, -0.3407135009765625, -0.32415008544921875, -0.307586669921875, -0.29102325439453125, -0.2744598388671875, -0.25789642333984375, -0.2413330078125, -0.22476959228515625, -0.2082061767578125, -0.19164276123046875, -0.175079345703125, -0.15851593017578125, -0.1419525146484375, -0.12538909912109375, -0.10882568359375, -0.09226226806640625, -0.0756988525390625, -0.05913543701171875, -0.042572021484375, -0.02600860595703125, -0.0094451904296875, 0.00711822509765625, 0.023681640625, 0.04024505615234375, 0.0568084716796875, 0.07337188720703125, 0.089935302734375, 0.10649871826171875, 0.1230621337890625, 0.13962554931640625, 0.15618896484375, 0.17275238037109375, 0.1893157958984375, 0.20587921142578125, 0.222442626953125, 0.23900604248046875, 0.2555694580078125, 0.27213287353515625, 0.2886962890625, 0.30525970458984375, 0.3218231201171875, 0.33838653564453125, 0.354949951171875, 0.37151336669921875, 0.3880767822265625, 0.40464019775390625, 0.42120361328125, 0.43776702880859375, 0.4543304443359375, 0.47089385986328125, 0.487457275390625, 0.5040206909179688, 0.5205841064453125, 0.5371475219726562, 0.5537109375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 2.0, 8.0, 10.0, 18.0, 36.0, 44.0, 91.0, 89.0, 98.0, 129.0, 120.0, 99.0, 76.0, 66.0, 43.0, 29.0, 18.0, 14.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12261962890625, -0.11887264251708984, -0.11512565612792969, -0.11137866973876953, -0.10763168334960938, -0.10388469696044922, -0.10013771057128906, -0.0963907241821289, -0.09264373779296875, -0.0888967514038086, -0.08514976501464844, -0.08140277862548828, -0.07765579223632812, -0.07390880584716797, -0.07016181945800781, -0.06641483306884766, -0.0626678466796875, -0.058920860290527344, -0.05517387390136719, -0.05142688751220703, -0.047679901123046875, -0.04393291473388672, -0.04018592834472656, -0.036438941955566406, -0.03269195556640625, -0.028944969177246094, -0.025197982788085938, -0.02145099639892578, -0.017704010009765625, -0.013957023620605469, -0.010210037231445312, -0.006463050842285156, -0.002716064453125, 0.0010309219360351562, 0.0047779083251953125, 0.008524894714355469, 0.012271881103515625, 0.01601886749267578, 0.019765853881835938, 0.023512840270996094, 0.02725982666015625, 0.031006813049316406, 0.03475379943847656, 0.03850078582763672, 0.042247772216796875, 0.04599475860595703, 0.04974174499511719, 0.053488731384277344, 0.0572357177734375, 0.060982704162597656, 0.06472969055175781, 0.06847667694091797, 0.07222366333007812, 0.07597064971923828, 0.07971763610839844, 0.0834646224975586, 0.08721160888671875, 0.0909585952758789, 0.09470558166503906, 0.09845256805419922, 0.10219955444335938, 0.10594654083251953, 0.10969352722167969, 0.11344051361083984, 0.1171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 10.0, 23.0, 18.0, 28.0, 40.0, 57.0, 98.0, 126.0, 190.0, 265.0, 409.0, 649.0, 900.0, 1351.0, 2087.0, 3103.0, 5174.0, 7999.0, 13578.0, 22435.0, 39562.0, 73984.0, 166541.0, 360840.0, 172980.0, 75365.0, 40768.0, 23177.0, 13648.0, 8310.0, 5219.0, 3210.0, 2215.0, 1383.0, 934.0, 575.0, 430.0, 278.0, 177.0, 143.0, 93.0, 60.0, 39.0, 22.0, 17.0, 10.0, 13.0, 6.0, 6.0, 1.0, 2.0, 3.0, 0.0, 4.0], "bins": [-0.155029296875, -0.1504039764404297, -0.14577865600585938, -0.14115333557128906, -0.13652801513671875, -0.13190269470214844, -0.12727737426757812, -0.12265205383300781, -0.1180267333984375, -0.11340141296386719, -0.10877609252929688, -0.10415077209472656, -0.09952545166015625, -0.09490013122558594, -0.09027481079101562, -0.08564949035644531, -0.081024169921875, -0.07639884948730469, -0.07177352905273438, -0.06714820861816406, -0.06252288818359375, -0.05789756774902344, -0.053272247314453125, -0.04864692687988281, -0.0440216064453125, -0.03939628601074219, -0.034770965576171875, -0.030145645141601562, -0.02552032470703125, -0.020895004272460938, -0.016269683837890625, -0.011644363403320312, -0.00701904296875, -0.0023937225341796875, 0.002231597900390625, 0.0068569183349609375, 0.01148223876953125, 0.016107559204101562, 0.020732879638671875, 0.025358200073242188, 0.0299835205078125, 0.03460884094238281, 0.039234161376953125, 0.04385948181152344, 0.04848480224609375, 0.05311012268066406, 0.057735443115234375, 0.06236076354980469, 0.066986083984375, 0.07161140441894531, 0.07623672485351562, 0.08086204528808594, 0.08548736572265625, 0.09011268615722656, 0.09473800659179688, 0.09936332702636719, 0.1039886474609375, 0.10861396789550781, 0.11323928833007812, 0.11786460876464844, 0.12248992919921875, 0.12711524963378906, 0.13174057006835938, 0.1363658905029297, 0.1409912109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 3.0, 7.0, 16.0, 7.0, 12.0, 18.0, 16.0, 32.0, 24.0, 40.0, 41.0, 35.0, 35.0, 51.0, 51.0, 53.0, 47.0, 58.0, 52.0, 51.0, 27.0, 37.0, 38.0, 48.0, 31.0, 30.0, 27.0, 21.0, 11.0, 15.0, 14.0, 12.0, 5.0, 10.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2061767578125, -0.1992015838623047, -0.19222640991210938, -0.18525123596191406, -0.17827606201171875, -0.17130088806152344, -0.16432571411132812, -0.1573505401611328, -0.1503753662109375, -0.1434001922607422, -0.13642501831054688, -0.12944984436035156, -0.12247467041015625, -0.11549949645996094, -0.10852432250976562, -0.10154914855957031, -0.094573974609375, -0.08759880065917969, -0.08062362670898438, -0.07364845275878906, -0.06667327880859375, -0.05969810485839844, -0.052722930908203125, -0.04574775695800781, -0.0387725830078125, -0.03179740905761719, -0.024822235107421875, -0.017847061157226562, -0.01087188720703125, -0.0038967132568359375, 0.003078460693359375, 0.010053634643554688, 0.01702880859375, 0.024003982543945312, 0.030979156494140625, 0.03795433044433594, 0.04492950439453125, 0.05190467834472656, 0.058879852294921875, 0.06585502624511719, 0.0728302001953125, 0.07980537414550781, 0.08678054809570312, 0.09375572204589844, 0.10073089599609375, 0.10770606994628906, 0.11468124389648438, 0.12165641784667969, 0.128631591796875, 0.1356067657470703, 0.14258193969726562, 0.14955711364746094, 0.15653228759765625, 0.16350746154785156, 0.17048263549804688, 0.1774578094482422, 0.1844329833984375, 0.1914081573486328, 0.19838333129882812, 0.20535850524902344, 0.21233367919921875, 0.21930885314941406, 0.22628402709960938, 0.2332592010498047, 0.240234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 15.0, 17.0, 30.0, 44.0, 90.0, 155.0, 385.0, 943.0, 3158.0, 13569.0, 150836.0, 838406.0, 32483.0, 5789.0, 1555.0, 527.0, 277.0, 116.0, 52.0, 37.0, 28.0, 14.0, 10.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0888671875, -0.08592700958251953, -0.08298683166503906, -0.0800466537475586, -0.07710647583007812, -0.07416629791259766, -0.07122611999511719, -0.06828594207763672, -0.06534576416015625, -0.06240558624267578, -0.05946540832519531, -0.056525230407714844, -0.053585052490234375, -0.050644874572753906, -0.04770469665527344, -0.04476451873779297, -0.0418243408203125, -0.03888416290283203, -0.03594398498535156, -0.033003807067871094, -0.030063629150390625, -0.027123451232910156, -0.024183273315429688, -0.02124309539794922, -0.01830291748046875, -0.015362739562988281, -0.012422561645507812, -0.009482383728027344, -0.006542205810546875, -0.0036020278930664062, -0.0006618499755859375, 0.0022783279418945312, 0.005218505859375, 0.008158683776855469, 0.011098861694335938, 0.014039039611816406, 0.016979217529296875, 0.019919395446777344, 0.022859573364257812, 0.02579975128173828, 0.02873992919921875, 0.03168010711669922, 0.03462028503417969, 0.037560462951660156, 0.040500640869140625, 0.043440818786621094, 0.04638099670410156, 0.04932117462158203, 0.0522613525390625, 0.05520153045654297, 0.05814170837402344, 0.061081886291503906, 0.06402206420898438, 0.06696224212646484, 0.06990242004394531, 0.07284259796142578, 0.07578277587890625, 0.07872295379638672, 0.08166313171386719, 0.08460330963134766, 0.08754348754882812, 0.0904836654663086, 0.09342384338378906, 0.09636402130126953, 0.09930419921875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 7.0, 9.0, 19.0, 21.0, 27.0, 53.0, 51.0, 60.0, 72.0, 97.0, 86.0, 91.0, 87.0, 77.0, 53.0, 47.0, 36.0, 25.0, 19.0, 14.0, 10.0, 15.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7220458984375e-06, -5.540437996387482e-06, -5.358830094337463e-06, -5.177222192287445e-06, -4.995614290237427e-06, -4.8140063881874084e-06, -4.63239848613739e-06, -4.450790584087372e-06, -4.2691826820373535e-06, -4.087574779987335e-06, -3.905966877937317e-06, -3.7243589758872986e-06, -3.5427510738372803e-06, -3.361143171787262e-06, -3.1795352697372437e-06, -2.9979273676872253e-06, -2.816319465637207e-06, -2.6347115635871887e-06, -2.4531036615371704e-06, -2.271495759487152e-06, -2.089887857437134e-06, -1.9082799553871155e-06, -1.7266720533370972e-06, -1.5450641512870789e-06, -1.3634562492370605e-06, -1.1818483471870422e-06, -1.000240445137024e-06, -8.186325430870056e-07, -6.370246410369873e-07, -4.55416738986969e-07, -2.738088369369507e-07, -9.220093488693237e-08, 8.940696716308594e-08, 2.7101486921310425e-07, 4.5262277126312256e-07, 6.342306733131409e-07, 8.158385753631592e-07, 9.974464774131775e-07, 1.1790543794631958e-06, 1.3606622815132141e-06, 1.5422701835632324e-06, 1.7238780856132507e-06, 1.905485987663269e-06, 2.0870938897132874e-06, 2.2687017917633057e-06, 2.450309693813324e-06, 2.6319175958633423e-06, 2.8135254979133606e-06, 2.995133399963379e-06, 3.1767413020133972e-06, 3.3583492040634155e-06, 3.539957106113434e-06, 3.721565008163452e-06, 3.9031729102134705e-06, 4.084780812263489e-06, 4.266388714313507e-06, 4.447996616363525e-06, 4.629604518413544e-06, 4.811212420463562e-06, 4.99282032251358e-06, 5.174428224563599e-06, 5.356036126613617e-06, 5.537644028663635e-06, 5.7192519307136536e-06, 5.900859832763672e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 8.0, 7.0, 23.0, 25.0, 21.0, 37.0, 62.0, 91.0, 136.0, 195.0, 290.0, 456.0, 754.0, 1239.0, 2088.0, 3857.0, 7107.0, 14727.0, 34810.0, 116756.0, 620336.0, 167026.0, 42667.0, 17168.0, 8247.0, 4349.0, 2376.0, 1385.0, 800.0, 538.0, 341.0, 203.0, 128.0, 100.0, 58.0, 40.0, 29.0, 21.0, 12.0, 15.0, 5.0, 6.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03375244140625, -0.03264951705932617, -0.031546592712402344, -0.030443668365478516, -0.029340744018554688, -0.02823781967163086, -0.02713489532470703, -0.026031970977783203, -0.024929046630859375, -0.023826122283935547, -0.02272319793701172, -0.02162027359008789, -0.020517349243164062, -0.019414424896240234, -0.018311500549316406, -0.017208576202392578, -0.01610565185546875, -0.015002727508544922, -0.013899803161621094, -0.012796878814697266, -0.011693954467773438, -0.01059103012084961, -0.009488105773925781, -0.008385181427001953, -0.007282257080078125, -0.006179332733154297, -0.005076408386230469, -0.003973484039306641, -0.0028705596923828125, -0.0017676353454589844, -0.0006647109985351562, 0.0004382133483886719, 0.0015411376953125, 0.002644062042236328, 0.0037469863891601562, 0.004849910736083984, 0.0059528350830078125, 0.007055759429931641, 0.008158683776855469, 0.009261608123779297, 0.010364532470703125, 0.011467456817626953, 0.012570381164550781, 0.01367330551147461, 0.014776229858398438, 0.015879154205322266, 0.016982078552246094, 0.018085002899169922, 0.01918792724609375, 0.020290851593017578, 0.021393775939941406, 0.022496700286865234, 0.023599624633789062, 0.02470254898071289, 0.02580547332763672, 0.026908397674560547, 0.028011322021484375, 0.029114246368408203, 0.03021717071533203, 0.03132009506225586, 0.03242301940917969, 0.033525943756103516, 0.034628868103027344, 0.03573179244995117, 0.036834716796875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 9.0, 8.0, 13.0, 14.0, 19.0, 23.0, 22.0, 29.0, 44.0, 64.0, 87.0, 150.0, 146.0, 111.0, 69.0, 48.0, 30.0, 29.0, 11.0, 12.0, 15.0, 5.0, 5.0, 11.0, 3.0, 2.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047210693359375, -0.04582691192626953, -0.04444313049316406, -0.043059349060058594, -0.041675567626953125, -0.040291786193847656, -0.03890800476074219, -0.03752422332763672, -0.03614044189453125, -0.03475666046142578, -0.03337287902832031, -0.031989097595214844, -0.030605316162109375, -0.029221534729003906, -0.027837753295898438, -0.02645397186279297, -0.0250701904296875, -0.02368640899658203, -0.022302627563476562, -0.020918846130371094, -0.019535064697265625, -0.018151283264160156, -0.016767501831054688, -0.015383720397949219, -0.01399993896484375, -0.012616157531738281, -0.011232376098632812, -0.009848594665527344, -0.008464813232421875, -0.007081031799316406, -0.0056972503662109375, -0.004313468933105469, -0.0029296875, -0.0015459060668945312, -0.0001621246337890625, 0.0012216567993164062, 0.002605438232421875, 0.003989219665527344, 0.0053730010986328125, 0.006756782531738281, 0.00814056396484375, 0.009524345397949219, 0.010908126831054688, 0.012291908264160156, 0.013675689697265625, 0.015059471130371094, 0.016443252563476562, 0.01782703399658203, 0.0192108154296875, 0.02059459686279297, 0.021978378295898438, 0.023362159729003906, 0.024745941162109375, 0.026129722595214844, 0.027513504028320312, 0.02889728546142578, 0.03028106689453125, 0.03166484832763672, 0.03304862976074219, 0.034432411193847656, 0.035816192626953125, 0.037199974060058594, 0.03858375549316406, 0.03996753692626953, 0.041351318359375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 9.0, 4.0, 4.0, 8.0, 13.0, 24.0, 22.0, 26.0, 46.0, 61.0, 85.0, 122.0, 192.0, 123.0, 74.0, 64.0, 19.0, 18.0, 18.0, 15.0, 13.0, 4.0, 13.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7379820346832275, -1.6889346837997437, -1.6398872137069702, -1.5908398628234863, -1.5417925119400024, -1.4927451610565186, -1.4436976909637451, -1.3946503400802612, -1.3456029891967773, -1.2965556383132935, -1.24750816822052, -1.1984608173370361, -1.1494134664535522, -1.1003661155700684, -1.051318645477295, -1.002271294593811, -0.9532238245010376, -0.9041764140129089, -0.855129063129425, -0.8060816526412964, -0.7570343017578125, -0.7079868912696838, -0.6589394807815552, -0.6098921298980713, -0.5608447194099426, -0.511797308921814, -0.4627499580383301, -0.4137025475502014, -0.36465516686439514, -0.31560778617858887, -0.2665603756904602, -0.21751299500465393, -0.1684654951095581, -0.11941810697317123, -0.07037071883678436, -0.021323323249816895, 0.02772405743598938, 0.07677143812179565, 0.12581884860992432, 0.1748662292957306, 0.22391360998153687, 0.27296099066734314, 0.3220083713531494, 0.3710557818412781, 0.42010316252708435, 0.4691505432128906, 0.5181979537010193, 0.567245364189148, 0.6162927150726318, 0.6653401255607605, 0.7143874764442444, 0.763434886932373, 0.8124822378158569, 0.8615296483039856, 0.9105770587921143, 0.9596244096755981, 1.008671760559082, 1.057719111442566, 1.1067665815353394, 1.1558139324188232, 1.2048612833023071, 1.253908634185791, 1.3029561042785645, 1.3520034551620483, 1.4010509252548218]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 4.0, 2.0, 4.0, 6.0, 3.0, 6.0, 7.0, 9.0, 11.0, 12.0, 33.0, 24.0, 20.0, 26.0, 32.0, 26.0, 34.0, 30.0, 33.0, 39.0, 34.0, 46.0, 35.0, 38.0, 42.0, 34.0, 39.0, 50.0, 24.0, 44.0, 24.0, 37.0, 21.0, 22.0, 26.0, 21.0, 15.0, 18.0, 11.0, 9.0, 9.0, 6.0, 5.0, 3.0, 11.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.9802571535110474, -0.9491626620292664, -0.9180682301521301, -0.8869737386703491, -0.8558793067932129, -0.8247848153114319, -0.7936903238296509, -0.7625958919525146, -0.7315014004707336, -0.7004069089889526, -0.6693124771118164, -0.6382179856300354, -0.6071235537528992, -0.5760290622711182, -0.5449346303939819, -0.5138401389122009, -0.4827456772327423, -0.4516512155532837, -0.4205567538738251, -0.38946229219436646, -0.35836780071258545, -0.32727333903312683, -0.2961788773536682, -0.2650843858718872, -0.23398993909358978, -0.20289547741413116, -0.17180100083351135, -0.14070653915405273, -0.10961207002401352, -0.0785176008939743, -0.047423139214515686, -0.016328662633895874, 0.014765799045562744, 0.04586026817560196, 0.07695473730564117, 0.10804919898509979, 0.1391436755657196, 0.17023813724517822, 0.20133259892463684, 0.23242707550525665, 0.26352155208587646, 0.2946160137653351, 0.3257104754447937, 0.3568049669265747, 0.3878994286060333, 0.41899389028549194, 0.45008835196495056, 0.4811828136444092, 0.5122772455215454, 0.5433717370033264, 0.5744661688804626, 0.6055606603622437, 0.6366550922393799, 0.6677495837211609, 0.6988440752029419, 0.7299385070800781, 0.7610329985618591, 0.7921274900436401, 0.8232219219207764, 0.8543164134025574, 0.8854108452796936, 0.9165053367614746, 0.9475997686386108, 0.9786942601203918, 1.0097887516021729]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 7.0, 17.0, 13.0, 24.0, 44.0, 64.0, 96.0, 188.0, 349.0, 845.0, 2333.0, 10540.0, 4147865.0, 26152.0, 3479.0, 1122.0, 527.0, 212.0, 137.0, 84.0, 61.0, 26.0, 17.0, 13.0, 11.0, 8.0, 10.0, 3.0, 6.0, 2.0, 4.0, 0.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6328125, -0.6114883422851562, -0.5901641845703125, -0.5688400268554688, -0.547515869140625, -0.5261917114257812, -0.5048675537109375, -0.48354339599609375, -0.46221923828125, -0.44089508056640625, -0.4195709228515625, -0.39824676513671875, -0.376922607421875, -0.35559844970703125, -0.3342742919921875, -0.31295013427734375, -0.2916259765625, -0.27030181884765625, -0.2489776611328125, -0.22765350341796875, -0.206329345703125, -0.18500518798828125, -0.1636810302734375, -0.14235687255859375, -0.12103271484375, -0.09970855712890625, -0.0783843994140625, -0.05706024169921875, -0.035736083984375, -0.01441192626953125, 0.0069122314453125, 0.02823638916015625, 0.049560546875, 0.07088470458984375, 0.0922088623046875, 0.11353302001953125, 0.134857177734375, 0.15618133544921875, 0.1775054931640625, 0.19882965087890625, 0.22015380859375, 0.24147796630859375, 0.2628021240234375, 0.28412628173828125, 0.305450439453125, 0.32677459716796875, 0.3480987548828125, 0.36942291259765625, 0.3907470703125, 0.41207122802734375, 0.4333953857421875, 0.45471954345703125, 0.476043701171875, 0.49736785888671875, 0.5186920166015625, 0.5400161743164062, 0.56134033203125, 0.5826644897460938, 0.6039886474609375, 0.6253128051757812, 0.646636962890625, 0.6679611206054688, 0.6892852783203125, 0.7106094360351562, 0.73193359375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 4.0, 6.0, 9.0, 16.0, 25.0, 56.0, 73.0, 89.0, 109.0, 125.0, 117.0, 108.0, 84.0, 62.0, 42.0, 31.0, 20.0, 15.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12548828125, -0.1216745376586914, -0.11786079406738281, -0.11404705047607422, -0.11023330688476562, -0.10641956329345703, -0.10260581970214844, -0.09879207611083984, -0.09497833251953125, -0.09116458892822266, -0.08735084533691406, -0.08353710174560547, -0.07972335815429688, -0.07590961456298828, -0.07209587097167969, -0.0682821273803711, -0.0644683837890625, -0.060654640197753906, -0.05684089660644531, -0.05302715301513672, -0.049213409423828125, -0.04539966583251953, -0.04158592224121094, -0.037772178649902344, -0.03395843505859375, -0.030144691467285156, -0.026330947875976562, -0.02251720428466797, -0.018703460693359375, -0.014889717102050781, -0.011075973510742188, -0.007262229919433594, -0.003448486328125, 0.00036525726318359375, 0.0041790008544921875, 0.007992744445800781, 0.011806488037109375, 0.015620231628417969, 0.019433975219726562, 0.023247718811035156, 0.02706146240234375, 0.030875205993652344, 0.03468894958496094, 0.03850269317626953, 0.042316436767578125, 0.04613018035888672, 0.04994392395019531, 0.053757667541503906, 0.0575714111328125, 0.061385154724121094, 0.06519889831542969, 0.06901264190673828, 0.07282638549804688, 0.07664012908935547, 0.08045387268066406, 0.08426761627197266, 0.08808135986328125, 0.09189510345458984, 0.09570884704589844, 0.09952259063720703, 0.10333633422851562, 0.10715007781982422, 0.11096382141113281, 0.1147775650024414, 0.11859130859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 4.0, 9.0, 10.0, 14.0, 13.0, 26.0, 25.0, 27.0, 41.0, 48.0, 93.0, 116.0, 197.0, 301.0, 557.0, 1227.0, 3154.0, 9819.0, 61973.0, 4075842.0, 29579.0, 6588.0, 2333.0, 1002.0, 461.0, 254.0, 160.0, 109.0, 79.0, 55.0, 38.0, 34.0, 19.0, 15.0, 14.0, 13.0, 7.0, 5.0, 5.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43212890625, -0.4174041748046875, -0.402679443359375, -0.3879547119140625, -0.37322998046875, -0.3585052490234375, -0.343780517578125, -0.3290557861328125, -0.3143310546875, -0.2996063232421875, -0.284881591796875, -0.2701568603515625, -0.25543212890625, -0.2407073974609375, -0.225982666015625, -0.2112579345703125, -0.196533203125, -0.1818084716796875, -0.167083740234375, -0.1523590087890625, -0.13763427734375, -0.1229095458984375, -0.108184814453125, -0.0934600830078125, -0.0787353515625, -0.0640106201171875, -0.049285888671875, -0.0345611572265625, -0.01983642578125, -0.0051116943359375, 0.009613037109375, 0.0243377685546875, 0.0390625, 0.0537872314453125, 0.068511962890625, 0.0832366943359375, 0.09796142578125, 0.1126861572265625, 0.127410888671875, 0.1421356201171875, 0.1568603515625, 0.1715850830078125, 0.186309814453125, 0.2010345458984375, 0.21575927734375, 0.2304840087890625, 0.245208740234375, 0.2599334716796875, 0.274658203125, 0.2893829345703125, 0.304107666015625, 0.3188323974609375, 0.33355712890625, 0.3482818603515625, 0.363006591796875, 0.3777313232421875, 0.3924560546875, 0.4071807861328125, 0.421905517578125, 0.4366302490234375, 0.45135498046875, 0.4660797119140625, 0.480804443359375, 0.4955291748046875, 0.51025390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 9.0, 7.0, 9.0, 9.0, 31.0, 75.0, 3393.0, 423.0, 45.0, 30.0, 16.0, 6.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3056640625, -0.2986927032470703, -0.2917213439941406, -0.28474998474121094, -0.27777862548828125, -0.27080726623535156, -0.2638359069824219, -0.2568645477294922, -0.2498931884765625, -0.2429218292236328, -0.23595046997070312, -0.22897911071777344, -0.22200775146484375, -0.21503639221191406, -0.20806503295898438, -0.2010936737060547, -0.194122314453125, -0.1871509552001953, -0.18017959594726562, -0.17320823669433594, -0.16623687744140625, -0.15926551818847656, -0.15229415893554688, -0.1453227996826172, -0.1383514404296875, -0.1313800811767578, -0.12440872192382812, -0.11743736267089844, -0.11046600341796875, -0.10349464416503906, -0.09652328491210938, -0.08955192565917969, -0.08258056640625, -0.07560920715332031, -0.06863784790039062, -0.06166648864746094, -0.05469512939453125, -0.04772377014160156, -0.040752410888671875, -0.03378105163574219, -0.0268096923828125, -0.019838333129882812, -0.012866973876953125, -0.0058956146240234375, 0.00107574462890625, 0.008047103881835938, 0.015018463134765625, 0.021989822387695312, 0.028961181640625, 0.03593254089355469, 0.042903900146484375, 0.04987525939941406, 0.05684661865234375, 0.06381797790527344, 0.07078933715820312, 0.07776069641113281, 0.0847320556640625, 0.09170341491699219, 0.09867477416992188, 0.10564613342285156, 0.11261749267578125, 0.11958885192871094, 0.12656021118164062, 0.1335315704345703, 0.1405029296875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 0.0, 4.0, 8.0, 9.0, 17.0, 36.0, 58.0, 93.0, 250.0, 230.0, 123.0, 59.0, 37.0, 28.0, 15.0, 17.0, 7.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7120325565338135, -0.6874918341636658, -0.6629510521888733, -0.6384103298187256, -0.6138695478439331, -0.5893288254737854, -0.5647880434989929, -0.5402473211288452, -0.5157065391540527, -0.49116578698158264, -0.46662503480911255, -0.44208428263664246, -0.41754353046417236, -0.39300277829170227, -0.3684620261192322, -0.3439213037490845, -0.3193805515766144, -0.2948397994041443, -0.2702990472316742, -0.2457582950592041, -0.221217542886734, -0.19667679071426392, -0.17213605344295502, -0.14759530127048492, -0.12305454909801483, -0.09851379692554474, -0.07397304475307465, -0.04943230003118515, -0.024891547858715057, -0.0003507956862449646, 0.02418994903564453, 0.048730701208114624, 0.07327145338058472, 0.09781220555305481, 0.1223529577255249, 0.146893709897995, 0.1714344620704651, 0.19597521424293518, 0.22051595151424408, 0.24505670368671417, 0.26959747076034546, 0.29413822293281555, 0.31867897510528564, 0.34321972727775574, 0.36776047945022583, 0.3923012316226959, 0.416841983795166, 0.4413827061653137, 0.4659234583377838, 0.4904642105102539, 0.5150049328804016, 0.5395457148551941, 0.5640864372253418, 0.5886272192001343, 0.613167941570282, 0.6377087235450745, 0.6622494459152222, 0.6867901682853699, 0.7113309502601624, 0.7358716726303101, 0.7604124546051025, 0.7849531769752502, 0.8094939589500427, 0.8340346813201904, 0.8585754632949829]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 7.0, 10.0, 8.0, 16.0, 22.0, 21.0, 34.0, 30.0, 35.0, 41.0, 36.0, 43.0, 39.0, 67.0, 58.0, 59.0, 54.0, 52.0, 44.0, 43.0, 30.0, 40.0, 32.0, 27.0, 28.0, 31.0, 15.0, 17.0, 9.0, 6.0, 11.0, 2.0, 7.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.37123680114746094, -0.36039119958877563, -0.34954556822776794, -0.33869996666908264, -0.32785436511039734, -0.31700876355171204, -0.30616313219070435, -0.29531753063201904, -0.28447192907333374, -0.27362632751464844, -0.26278069615364075, -0.25193509459495544, -0.24108949303627014, -0.23024387657642365, -0.21939826011657715, -0.20855265855789185, -0.19770704209804535, -0.18686142563819885, -0.17601582407951355, -0.16517020761966705, -0.15432460606098175, -0.14347898960113525, -0.13263338804244995, -0.12178777158260345, -0.11094216257333755, -0.10009655356407166, -0.08925094455480576, -0.07840533554553986, -0.06755971908569336, -0.05671411380171776, -0.04586850106716156, -0.03502289205789566, -0.02417728304862976, -0.013331673108041286, -0.002486063167452812, 0.008359547704458237, 0.019205156713724136, 0.030050765722990036, 0.040896378457546234, 0.051741987466812134, 0.06258759647607803, 0.07343320548534393, 0.08427881449460983, 0.09512442350387573, 0.10597003996372223, 0.11681564152240753, 0.12766125798225403, 0.13850685954093933, 0.14935247600078583, 0.16019809246063232, 0.17104369401931763, 0.18188931047916412, 0.19273491203784943, 0.20358052849769592, 0.21442613005638123, 0.22527174651622772, 0.23611736297607422, 0.24696297943592072, 0.2578085958957672, 0.2686541974544525, 0.2794997990131378, 0.2903454005718231, 0.3011910319328308, 0.3120366334915161, 0.3228822350502014]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 13.0, 17.0, 18.0, 29.0, 37.0, 36.0, 75.0, 104.0, 129.0, 167.0, 252.0, 349.0, 500.0, 798.0, 1433.0, 2962.0, 7079.0, 19633.0, 70956.0, 449461.0, 396579.0, 65787.0, 18647.0, 6676.0, 2783.0, 1484.0, 851.0, 529.0, 328.0, 232.0, 165.0, 107.0, 66.0, 64.0, 55.0, 40.0, 30.0, 15.0, 17.0, 9.0, 13.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.454833984375, -0.4410400390625, -0.42724609375, -0.4134521484375, -0.399658203125, -0.3858642578125, -0.3720703125, -0.3582763671875, -0.344482421875, -0.3306884765625, -0.31689453125, -0.3031005859375, -0.289306640625, -0.2755126953125, -0.26171875, -0.2479248046875, -0.234130859375, -0.2203369140625, -0.20654296875, -0.1927490234375, -0.178955078125, -0.1651611328125, -0.1513671875, -0.1375732421875, -0.123779296875, -0.1099853515625, -0.09619140625, -0.0823974609375, -0.068603515625, -0.0548095703125, -0.041015625, -0.0272216796875, -0.013427734375, 0.0003662109375, 0.01416015625, 0.0279541015625, 0.041748046875, 0.0555419921875, 0.0693359375, 0.0831298828125, 0.096923828125, 0.1107177734375, 0.12451171875, 0.1383056640625, 0.152099609375, 0.1658935546875, 0.1796875, 0.1934814453125, 0.207275390625, 0.2210693359375, 0.23486328125, 0.2486572265625, 0.262451171875, 0.2762451171875, 0.2900390625, 0.3038330078125, 0.317626953125, 0.3314208984375, 0.34521484375, 0.3590087890625, 0.372802734375, 0.3865966796875, 0.400390625, 0.4141845703125, 0.427978515625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 0.0, 2.0, 4.0, 10.0, 8.0, 12.0, 33.0, 53.0, 70.0, 92.0, 117.0, 146.0, 105.0, 106.0, 87.0, 42.0, 45.0, 35.0, 18.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12744140625, -0.12354850769042969, -0.11965560913085938, -0.11576271057128906, -0.11186981201171875, -0.10797691345214844, -0.10408401489257812, -0.10019111633300781, -0.0962982177734375, -0.09240531921386719, -0.08851242065429688, -0.08461952209472656, -0.08072662353515625, -0.07683372497558594, -0.07294082641601562, -0.06904792785644531, -0.065155029296875, -0.06126213073730469, -0.057369232177734375, -0.05347633361816406, -0.04958343505859375, -0.04569053649902344, -0.041797637939453125, -0.03790473937988281, -0.0340118408203125, -0.030118942260742188, -0.026226043701171875, -0.022333145141601562, -0.01844024658203125, -0.014547348022460938, -0.010654449462890625, -0.0067615509033203125, -0.00286865234375, 0.0010242462158203125, 0.004917144775390625, 0.008810043334960938, 0.01270294189453125, 0.016595840454101562, 0.020488739013671875, 0.024381637573242188, 0.0282745361328125, 0.03216743469238281, 0.036060333251953125, 0.03995323181152344, 0.04384613037109375, 0.04773902893066406, 0.051631927490234375, 0.05552482604980469, 0.059417724609375, 0.06331062316894531, 0.06720352172851562, 0.07109642028808594, 0.07498931884765625, 0.07888221740722656, 0.08277511596679688, 0.08666801452636719, 0.0905609130859375, 0.09445381164550781, 0.09834671020507812, 0.10223960876464844, 0.10613250732421875, 0.11002540588378906, 0.11391830444335938, 0.11781120300292969, 0.1217041015625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 9.0, 11.0, 27.0, 28.0, 36.0, 43.0, 65.0, 97.0, 147.0, 220.0, 328.0, 465.0, 840.0, 1326.0, 2209.0, 3902.0, 7082.0, 14153.0, 30729.0, 72475.0, 215634.0, 460925.0, 137553.0, 52426.0, 23089.0, 11053.0, 5654.0, 3149.0, 1800.0, 1090.0, 644.0, 411.0, 279.0, 180.0, 125.0, 111.0, 75.0, 47.0, 35.0, 23.0, 21.0, 14.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2022705078125, -0.19581222534179688, -0.18935394287109375, -0.18289566040039062, -0.1764373779296875, -0.16997909545898438, -0.16352081298828125, -0.15706253051757812, -0.150604248046875, -0.14414596557617188, -0.13768768310546875, -0.13122940063476562, -0.1247711181640625, -0.11831283569335938, -0.11185455322265625, -0.10539627075195312, -0.09893798828125, -0.09247970581054688, -0.08602142333984375, -0.07956314086914062, -0.0731048583984375, -0.06664657592773438, -0.06018829345703125, -0.053730010986328125, -0.047271728515625, -0.040813446044921875, -0.03435516357421875, -0.027896881103515625, -0.0214385986328125, -0.014980316162109375, -0.00852203369140625, -0.002063751220703125, 0.00439453125, 0.010852813720703125, 0.01731109619140625, 0.023769378662109375, 0.0302276611328125, 0.036685943603515625, 0.04314422607421875, 0.049602508544921875, 0.056060791015625, 0.06251907348632812, 0.06897735595703125, 0.07543563842773438, 0.0818939208984375, 0.08835220336914062, 0.09481048583984375, 0.10126876831054688, 0.10772705078125, 0.11418533325195312, 0.12064361572265625, 0.12710189819335938, 0.1335601806640625, 0.14001846313476562, 0.14647674560546875, 0.15293502807617188, 0.159393310546875, 0.16585159301757812, 0.17230987548828125, 0.17876815795898438, 0.1852264404296875, 0.19168472290039062, 0.19814300537109375, 0.20460128784179688, 0.2110595703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 7.0, 17.0, 17.0, 19.0, 29.0, 38.0, 37.0, 50.0, 40.0, 41.0, 49.0, 60.0, 64.0, 58.0, 47.0, 54.0, 52.0, 63.0, 43.0, 37.0, 32.0, 25.0, 29.0, 18.0, 17.0, 11.0, 6.0, 7.0, 6.0, 7.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27099609375, -0.2633094787597656, -0.25562286376953125, -0.24793624877929688, -0.2402496337890625, -0.23256301879882812, -0.22487640380859375, -0.21718978881835938, -0.209503173828125, -0.20181655883789062, -0.19412994384765625, -0.18644332885742188, -0.1787567138671875, -0.17107009887695312, -0.16338348388671875, -0.15569686889648438, -0.14801025390625, -0.14032363891601562, -0.13263702392578125, -0.12495040893554688, -0.1172637939453125, -0.10957717895507812, -0.10189056396484375, -0.09420394897460938, -0.086517333984375, -0.07883071899414062, -0.07114410400390625, -0.06345748901367188, -0.0557708740234375, -0.048084259033203125, -0.04039764404296875, -0.032711029052734375, -0.0250244140625, -0.017337799072265625, -0.00965118408203125, -0.001964569091796875, 0.0057220458984375, 0.013408660888671875, 0.02109527587890625, 0.028781890869140625, 0.036468505859375, 0.044155120849609375, 0.05184173583984375, 0.059528350830078125, 0.0672149658203125, 0.07490158081054688, 0.08258819580078125, 0.09027481079101562, 0.09796142578125, 0.10564804077148438, 0.11333465576171875, 0.12102127075195312, 0.1287078857421875, 0.13639450073242188, 0.14408111572265625, 0.15176773071289062, 0.159454345703125, 0.16714096069335938, 0.17482757568359375, 0.18251419067382812, 0.1902008056640625, 0.19788742065429688, 0.20557403564453125, 0.21326065063476562, 0.220947265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 12.0, 17.0, 28.0, 46.0, 86.0, 139.0, 252.0, 661.0, 1681.0, 5006.0, 22533.0, 425258.0, 559286.0, 25204.0, 5309.0, 1647.0, 678.0, 343.0, 163.0, 85.0, 44.0, 23.0, 14.0, 7.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.12646484375, -0.1233053207397461, -0.12014579772949219, -0.11698627471923828, -0.11382675170898438, -0.11066722869873047, -0.10750770568847656, -0.10434818267822266, -0.10118865966796875, -0.09802913665771484, -0.09486961364746094, -0.09171009063720703, -0.08855056762695312, -0.08539104461669922, -0.08223152160644531, -0.0790719985961914, -0.0759124755859375, -0.0727529525756836, -0.06959342956542969, -0.06643390655517578, -0.06327438354492188, -0.06011486053466797, -0.05695533752441406, -0.053795814514160156, -0.05063629150390625, -0.047476768493652344, -0.04431724548339844, -0.04115772247314453, -0.037998199462890625, -0.03483867645263672, -0.03167915344238281, -0.028519630432128906, -0.025360107421875, -0.022200584411621094, -0.019041061401367188, -0.01588153839111328, -0.012722015380859375, -0.009562492370605469, -0.0064029693603515625, -0.0032434463500976562, -8.392333984375e-05, 0.0030755996704101562, 0.0062351226806640625, 0.009394645690917969, 0.012554168701171875, 0.01571369171142578, 0.018873214721679688, 0.022032737731933594, 0.0251922607421875, 0.028351783752441406, 0.03151130676269531, 0.03467082977294922, 0.037830352783203125, 0.04098987579345703, 0.04414939880371094, 0.047308921813964844, 0.05046844482421875, 0.053627967834472656, 0.05678749084472656, 0.05994701385498047, 0.06310653686523438, 0.06626605987548828, 0.06942558288574219, 0.0725851058959961, 0.07574462890625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 5.0, 7.0, 7.0, 8.0, 15.0, 21.0, 25.0, 27.0, 48.0, 57.0, 63.0, 57.0, 107.0, 96.0, 87.0, 72.0, 59.0, 75.0, 39.0, 30.0, 26.0, 18.0, 14.0, 4.0, 8.0, 6.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.212162017822266e-06, -7.020309567451477e-06, -6.8284571170806885e-06, -6.6366046667099e-06, -6.444752216339111e-06, -6.252899765968323e-06, -6.061047315597534e-06, -5.869194865226746e-06, -5.677342414855957e-06, -5.4854899644851685e-06, -5.29363751411438e-06, -5.101785063743591e-06, -4.909932613372803e-06, -4.718080163002014e-06, -4.526227712631226e-06, -4.334375262260437e-06, -4.1425228118896484e-06, -3.95067036151886e-06, -3.7588179111480713e-06, -3.5669654607772827e-06, -3.375113010406494e-06, -3.1832605600357056e-06, -2.991408109664917e-06, -2.7995556592941284e-06, -2.60770320892334e-06, -2.4158507585525513e-06, -2.2239983081817627e-06, -2.032145857810974e-06, -1.8402934074401855e-06, -1.648440957069397e-06, -1.4565885066986084e-06, -1.2647360563278198e-06, -1.0728836059570312e-06, -8.810311555862427e-07, -6.891787052154541e-07, -4.973262548446655e-07, -3.0547380447387695e-07, -1.1362135410308838e-07, 7.82310962677002e-08, 2.7008354663848877e-07, 4.6193599700927734e-07, 6.537884473800659e-07, 8.456408977508545e-07, 1.037493348121643e-06, 1.2293457984924316e-06, 1.4211982488632202e-06, 1.6130506992340088e-06, 1.8049031496047974e-06, 1.996755599975586e-06, 2.1886080503463745e-06, 2.380460500717163e-06, 2.5723129510879517e-06, 2.7641654014587402e-06, 2.956017851829529e-06, 3.1478703022003174e-06, 3.339722752571106e-06, 3.5315752029418945e-06, 3.723427653312683e-06, 3.915280103683472e-06, 4.10713255405426e-06, 4.298985004425049e-06, 4.490837454795837e-06, 4.682689905166626e-06, 4.8745423555374146e-06, 5.066394805908203e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 14.0, 16.0, 22.0, 36.0, 46.0, 81.0, 111.0, 197.0, 303.0, 516.0, 912.0, 1782.0, 3581.0, 8562.0, 26499.0, 143882.0, 719535.0, 106079.0, 22045.0, 7460.0, 3141.0, 1593.0, 876.0, 502.0, 273.0, 171.0, 106.0, 65.0, 36.0, 34.0, 24.0, 8.0, 16.0, 12.0, 8.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.063720703125, -0.06192207336425781, -0.060123443603515625, -0.05832481384277344, -0.05652618408203125, -0.05472755432128906, -0.052928924560546875, -0.05113029479980469, -0.0493316650390625, -0.04753303527832031, -0.045734405517578125, -0.04393577575683594, -0.04213714599609375, -0.04033851623535156, -0.038539886474609375, -0.03674125671386719, -0.034942626953125, -0.03314399719238281, -0.031345367431640625, -0.029546737670898438, -0.02774810791015625, -0.025949478149414062, -0.024150848388671875, -0.022352218627929688, -0.0205535888671875, -0.018754959106445312, -0.016956329345703125, -0.015157699584960938, -0.01335906982421875, -0.011560440063476562, -0.009761810302734375, -0.007963180541992188, -0.00616455078125, -0.0043659210205078125, -0.002567291259765625, -0.0007686614990234375, 0.00102996826171875, 0.0028285980224609375, 0.004627227783203125, 0.0064258575439453125, 0.0082244873046875, 0.010023117065429688, 0.011821746826171875, 0.013620376586914062, 0.01541900634765625, 0.017217636108398438, 0.019016265869140625, 0.020814895629882812, 0.022613525390625, 0.024412155151367188, 0.026210784912109375, 0.028009414672851562, 0.02980804443359375, 0.03160667419433594, 0.033405303955078125, 0.03520393371582031, 0.0370025634765625, 0.03880119323730469, 0.040599822998046875, 0.04239845275878906, 0.04419708251953125, 0.04599571228027344, 0.047794342041015625, 0.04959297180175781, 0.0513916015625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 9.0, 9.0, 6.0, 10.0, 22.0, 32.0, 49.0, 82.0, 95.0, 132.0, 152.0, 113.0, 86.0, 60.0, 38.0, 25.0, 20.0, 17.0, 13.0, 6.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.066650390625, -0.06476640701293945, -0.0628824234008789, -0.06099843978881836, -0.05911445617675781, -0.057230472564697266, -0.05534648895263672, -0.05346250534057617, -0.051578521728515625, -0.04969453811645508, -0.04781055450439453, -0.045926570892333984, -0.04404258728027344, -0.04215860366821289, -0.040274620056152344, -0.0383906364440918, -0.03650665283203125, -0.0346226692199707, -0.032738685607910156, -0.03085470199584961, -0.028970718383789062, -0.027086734771728516, -0.02520275115966797, -0.023318767547607422, -0.021434783935546875, -0.019550800323486328, -0.01766681671142578, -0.015782833099365234, -0.013898849487304688, -0.01201486587524414, -0.010130882263183594, -0.008246898651123047, -0.0063629150390625, -0.004478931427001953, -0.0025949478149414062, -0.0007109642028808594, 0.0011730194091796875, 0.0030570030212402344, 0.004940986633300781, 0.006824970245361328, 0.008708953857421875, 0.010592937469482422, 0.012476921081542969, 0.014360904693603516, 0.016244888305664062, 0.01812887191772461, 0.020012855529785156, 0.021896839141845703, 0.02378082275390625, 0.025664806365966797, 0.027548789978027344, 0.02943277359008789, 0.03131675720214844, 0.033200740814208984, 0.03508472442626953, 0.03696870803833008, 0.038852691650390625, 0.04073667526245117, 0.04262065887451172, 0.044504642486572266, 0.04638862609863281, 0.04827260971069336, 0.050156593322753906, 0.05204057693481445, 0.053924560546875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 10.0, 14.0, 16.0, 26.0, 42.0, 67.0, 139.0, 255.0, 163.0, 94.0, 48.0, 30.0, 37.0, 18.0, 7.0, 10.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.340862274169922, -2.2771995067596436, -2.213536500930786, -2.149873733520508, -2.0862107276916504, -2.022547960281372, -1.9588850736618042, -1.8952221870422363, -1.8315593004226685, -1.7678964138031006, -1.7042335271835327, -1.6405706405639648, -1.5769078731536865, -1.513244867324829, -1.4495820999145508, -1.385919213294983, -1.322256326675415, -1.2585934400558472, -1.1949305534362793, -1.1312676668167114, -1.0676047801971436, -1.0039420127868652, -0.9402791261672974, -0.8766162395477295, -0.8129533529281616, -0.7492904663085938, -0.6856275796890259, -0.6219647526741028, -0.5583018660545349, -0.49463897943496704, -0.43097612261772156, -0.3673132658004761, -0.3036501407623291, -0.23998726904392242, -0.17632439732551575, -0.11266152560710907, -0.04899865388870239, 0.014664232730865479, 0.07832708954811096, 0.14198994636535645, 0.20565283298492432, 0.2693157196044922, 0.33297857642173767, 0.39664143323898315, 0.460304319858551, 0.5239672064781189, 0.587630033493042, 0.6512929201126099, 0.7149558067321777, 0.7786186933517456, 0.8422815799713135, 0.9059444069862366, 0.9696072936058044, 1.0332701206207275, 1.0969330072402954, 1.1605958938598633, 1.2242587804794312, 1.287921667098999, 1.351584553718567, 1.4152474403381348, 1.478910207748413, 1.5425732135772705, 1.6062359809875488, 1.6698988676071167, 1.7335617542266846]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 5.0, 2.0, 7.0, 4.0, 11.0, 15.0, 16.0, 22.0, 17.0, 16.0, 24.0, 25.0, 28.0, 36.0, 30.0, 32.0, 35.0, 37.0, 44.0, 54.0, 69.0, 50.0, 50.0, 52.0, 43.0, 41.0, 33.0, 37.0, 35.0, 33.0, 23.0, 18.0, 9.0, 11.0, 8.0, 9.0, 6.0, 7.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.1003210544586182, -1.0681474208831787, -1.0359737873077393, -1.0038001537322998, -0.9716265797615051, -0.9394530057907104, -0.907279372215271, -0.8751057386398315, -0.8429321050643921, -0.8107584714889526, -0.778584897518158, -0.7464112639427185, -0.714237630367279, -0.6820640563964844, -0.6498904228210449, -0.6177167892456055, -0.5855432152748108, -0.5533695816993713, -0.5211960077285767, -0.4890223741531372, -0.45684874057769775, -0.4246751368045807, -0.3925015330314636, -0.36032789945602417, -0.3281542956829071, -0.29598069190979004, -0.2638070583343506, -0.23163345456123352, -0.19945983588695526, -0.167286217212677, -0.13511261343955994, -0.10293899476528168, -0.07076537609100342, -0.03859176114201546, -0.006418146193027496, 0.025755465030670166, 0.057929083704948425, 0.09010270237922668, 0.12227630615234375, 0.154449924826622, 0.18662354350090027, 0.21879716217517853, 0.2509707808494568, 0.28314438462257385, 0.3153179883956909, 0.34749162197113037, 0.37966522574424744, 0.4118388295173645, 0.44401246309280396, 0.476186066865921, 0.5083596706390381, 0.5405333042144775, 0.572706937789917, 0.6048805713653564, 0.6370541453361511, 0.6692277789115906, 0.7014013528823853, 0.7335749864578247, 0.7657485604286194, 0.7979221940040588, 0.8300958275794983, 0.862269401550293, 0.8944430351257324, 0.9266166687011719, 0.9587903022766113]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 17.0, 19.0, 23.0, 42.0, 63.0, 114.0, 225.0, 465.0, 1039.0, 3192.0, 4183369.0, 3535.0, 1167.0, 455.0, 229.0, 118.0, 66.0, 45.0, 26.0, 12.0, 9.0, 4.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.28515625, -1.243072509765625, -1.20098876953125, -1.158905029296875, -1.1168212890625, -1.074737548828125, -1.03265380859375, -0.990570068359375, -0.948486328125, -0.906402587890625, -0.86431884765625, -0.822235107421875, -0.7801513671875, -0.738067626953125, -0.69598388671875, -0.653900146484375, -0.61181640625, -0.569732666015625, -0.52764892578125, -0.485565185546875, -0.4434814453125, -0.401397705078125, -0.35931396484375, -0.317230224609375, -0.275146484375, -0.233062744140625, -0.19097900390625, -0.148895263671875, -0.1068115234375, -0.064727783203125, -0.02264404296875, 0.019439697265625, 0.0615234375, 0.103607177734375, 0.14569091796875, 0.187774658203125, 0.2298583984375, 0.271942138671875, 0.31402587890625, 0.356109619140625, 0.398193359375, 0.440277099609375, 0.48236083984375, 0.524444580078125, 0.5665283203125, 0.608612060546875, 0.65069580078125, 0.692779541015625, 0.73486328125, 0.776947021484375, 0.81903076171875, 0.861114501953125, 0.9031982421875, 0.945281982421875, 0.98736572265625, 1.029449462890625, 1.071533203125, 1.113616943359375, 1.15570068359375, 1.197784423828125, 1.2398681640625, 1.281951904296875, 1.32403564453125, 1.366119384765625, 1.408203125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 3.0, 5.0, 11.0, 15.0, 21.0, 49.0, 59.0, 101.0, 105.0, 125.0, 137.0, 98.0, 96.0, 64.0, 41.0, 36.0, 16.0, 9.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1292724609375, -0.1252307891845703, -0.12118911743164062, -0.11714744567871094, -0.11310577392578125, -0.10906410217285156, -0.10502243041992188, -0.10098075866699219, -0.0969390869140625, -0.09289741516113281, -0.08885574340820312, -0.08481407165527344, -0.08077239990234375, -0.07673072814941406, -0.07268905639648438, -0.06864738464355469, -0.064605712890625, -0.06056404113769531, -0.056522369384765625, -0.05248069763183594, -0.04843902587890625, -0.04439735412597656, -0.040355682373046875, -0.03631401062011719, -0.0322723388671875, -0.028230667114257812, -0.024188995361328125, -0.020147323608398438, -0.01610565185546875, -0.012063980102539062, -0.008022308349609375, -0.0039806365966796875, 6.103515625e-05, 0.0041027069091796875, 0.008144378662109375, 0.012186050415039062, 0.01622772216796875, 0.020269393920898438, 0.024311065673828125, 0.028352737426757812, 0.0323944091796875, 0.03643608093261719, 0.040477752685546875, 0.04451942443847656, 0.04856109619140625, 0.05260276794433594, 0.056644439697265625, 0.06068611145019531, 0.064727783203125, 0.06876945495605469, 0.07281112670898438, 0.07685279846191406, 0.08089447021484375, 0.08493614196777344, 0.08897781372070312, 0.09301948547363281, 0.0970611572265625, 0.10110282897949219, 0.10514450073242188, 0.10918617248535156, 0.11322784423828125, 0.11726951599121094, 0.12131118774414062, 0.1253528594970703, 0.12939453125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 9.0, 12.0, 5.0, 20.0, 23.0, 28.0, 37.0, 37.0, 58.0, 80.0, 99.0, 140.0, 200.0, 305.0, 429.0, 667.0, 1185.0, 2304.0, 8964.0, 4167699.0, 6849.0, 2020.0, 1050.0, 637.0, 408.0, 293.0, 184.0, 135.0, 110.0, 84.0, 55.0, 39.0, 30.0, 8.0, 21.0, 12.0, 10.0, 11.0, 7.0, 6.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.58056640625, -0.5620956420898438, -0.5436248779296875, -0.5251541137695312, -0.506683349609375, -0.48821258544921875, -0.4697418212890625, -0.45127105712890625, -0.43280029296875, -0.41432952880859375, -0.3958587646484375, -0.37738800048828125, -0.358917236328125, -0.34044647216796875, -0.3219757080078125, -0.30350494384765625, -0.2850341796875, -0.26656341552734375, -0.2480926513671875, -0.22962188720703125, -0.211151123046875, -0.19268035888671875, -0.1742095947265625, -0.15573883056640625, -0.13726806640625, -0.11879730224609375, -0.1003265380859375, -0.08185577392578125, -0.063385009765625, -0.04491424560546875, -0.0264434814453125, -0.00797271728515625, 0.010498046875, 0.02896881103515625, 0.0474395751953125, 0.06591033935546875, 0.084381103515625, 0.10285186767578125, 0.1213226318359375, 0.13979339599609375, 0.15826416015625, 0.17673492431640625, 0.1952056884765625, 0.21367645263671875, 0.232147216796875, 0.25061798095703125, 0.2690887451171875, 0.28755950927734375, 0.3060302734375, 0.32450103759765625, 0.3429718017578125, 0.36144256591796875, 0.379913330078125, 0.39838409423828125, 0.4168548583984375, 0.43532562255859375, 0.45379638671875, 0.47226715087890625, 0.4907379150390625, 0.5092086791992188, 0.527679443359375, 0.5461502075195312, 0.5646209716796875, 0.5830917358398438, 0.6015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 12.0, 3958.0, 87.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1385498046875, -0.1346902847290039, -0.1308307647705078, -0.12697124481201172, -0.12311172485351562, -0.11925220489501953, -0.11539268493652344, -0.11153316497802734, -0.10767364501953125, -0.10381412506103516, -0.09995460510253906, -0.09609508514404297, -0.09223556518554688, -0.08837604522705078, -0.08451652526855469, -0.0806570053100586, -0.0767974853515625, -0.0729379653930664, -0.06907844543457031, -0.06521892547607422, -0.061359405517578125, -0.05749988555908203, -0.05364036560058594, -0.049780845642089844, -0.04592132568359375, -0.042061805725097656, -0.03820228576660156, -0.03434276580810547, -0.030483245849609375, -0.02662372589111328, -0.022764205932617188, -0.018904685974121094, -0.015045166015625, -0.011185646057128906, -0.0073261260986328125, -0.0034666061401367188, 0.000392913818359375, 0.004252433776855469, 0.008111953735351562, 0.011971473693847656, 0.01583099365234375, 0.019690513610839844, 0.023550033569335938, 0.02740955352783203, 0.031269073486328125, 0.03512859344482422, 0.03898811340332031, 0.042847633361816406, 0.0467071533203125, 0.050566673278808594, 0.05442619323730469, 0.05828571319580078, 0.062145233154296875, 0.06600475311279297, 0.06986427307128906, 0.07372379302978516, 0.07758331298828125, 0.08144283294677734, 0.08530235290527344, 0.08916187286376953, 0.09302139282226562, 0.09688091278076172, 0.10074043273925781, 0.1045999526977539, 0.10845947265625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 4.0, 5.0, 5.0, 9.0, 9.0, 11.0, 12.0, 14.0, 36.0, 34.0, 48.0, 80.0, 109.0, 158.0, 154.0, 87.0, 66.0, 39.0, 35.0, 25.0, 20.0, 13.0, 9.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.192462757229805, -0.1864263415336609, -0.1803899109363556, -0.1743534952402115, -0.16831707954406738, -0.16228064894676208, -0.15624423325061798, -0.15020781755447388, -0.14417138695716858, -0.13813497126102448, -0.13209854066371918, -0.12606212496757507, -0.12002570927143097, -0.11398928612470627, -0.10795286297798157, -0.10191644728183746, -0.09588003158569336, -0.08984360843896866, -0.08380719274282455, -0.07777076959609985, -0.07173435389995575, -0.06569793075323105, -0.05966150760650635, -0.053625088185071945, -0.04758866876363754, -0.04155224934220314, -0.03551582992076874, -0.029479406774044037, -0.023442987352609634, -0.017406567931175232, -0.011370144784450531, -0.0053337253630161285, 0.0007026791572570801, 0.006739099510014057, 0.012775519862771034, 0.018811941146850586, 0.02484836056828499, 0.03088477998971939, 0.03692120313644409, 0.042957622557878494, 0.0489940419793129, 0.0550304614007473, 0.0610668808221817, 0.0671033039689064, 0.0731397271156311, 0.07917614281177521, 0.08521256595849991, 0.09124898910522461, 0.09728540480136871, 0.10332182794809341, 0.10935824364423752, 0.11539466679096222, 0.12143108248710632, 0.12746751308441162, 0.13350392878055573, 0.13954034447669983, 0.14557677507400513, 0.15161319077014923, 0.15764962136745453, 0.16368603706359863, 0.16972245275974274, 0.17575886845588684, 0.18179529905319214, 0.18783171474933624, 0.19386813044548035]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 4.0, 8.0, 9.0, 9.0, 16.0, 19.0, 18.0, 13.0, 22.0, 26.0, 30.0, 31.0, 31.0, 43.0, 37.0, 38.0, 44.0, 30.0, 57.0, 51.0, 49.0, 41.0, 46.0, 30.0, 30.0, 38.0, 31.0, 26.0, 33.0, 28.0, 16.0, 19.0, 12.0, 10.0, 11.0, 4.0, 5.0, 3.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1385878324508667, -0.1344495713710785, -0.13031132519245148, -0.12617306411266327, -0.12203481048345566, -0.11789655685424805, -0.11375829577445984, -0.10962004214525223, -0.10548178851604462, -0.101343534886837, -0.0972052812576294, -0.09306702017784119, -0.08892876654863358, -0.08479051291942596, -0.08065225183963776, -0.07651399821043015, -0.07237574458122253, -0.06823749095201492, -0.06409923732280731, -0.059960976243019104, -0.05582272261381149, -0.05168446898460388, -0.04754621163010597, -0.04340795427560806, -0.03926970064640045, -0.03513144701719284, -0.03099318966269493, -0.02685493417084217, -0.02271667867898941, -0.01857842318713665, -0.01444016769528389, -0.01030191220343113, -0.006163656711578369, -0.002025401219725609, 0.0021128542721271515, 0.006251109763979912, 0.010389365255832672, 0.014527620747685432, 0.018665876239538193, 0.022804131731390953, 0.026942387223243713, 0.031080642715096474, 0.035218898206949234, 0.039357155561447144, 0.043495409190654755, 0.047633662819862366, 0.051771920174360275, 0.055910177528858185, 0.060048431158065796, 0.06418668478727341, 0.06832493841648102, 0.07246319949626923, 0.07660145312547684, 0.08073970675468445, 0.08487796783447266, 0.08901622146368027, 0.09315447509288788, 0.09729272872209549, 0.1014309823513031, 0.10556924343109131, 0.10970749706029892, 0.11384575068950653, 0.11798401176929474, 0.12212226539850235, 0.12626051902770996]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 1.0, 5.0, 5.0, 11.0, 16.0, 23.0, 24.0, 37.0, 50.0, 50.0, 81.0, 103.0, 126.0, 172.0, 234.0, 329.0, 462.0, 663.0, 1156.0, 1952.0, 4293.0, 10126.0, 29394.0, 101441.0, 496834.0, 295268.0, 68725.0, 20856.0, 7752.0, 3359.0, 1805.0, 993.0, 672.0, 449.0, 304.0, 193.0, 140.0, 119.0, 76.0, 53.0, 52.0, 47.0, 28.0, 15.0, 10.0, 16.0, 12.0, 8.0, 5.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.364501953125, -0.3526878356933594, -0.34087371826171875, -0.3290596008300781, -0.3172454833984375, -0.3054313659667969, -0.29361724853515625, -0.2818031311035156, -0.269989013671875, -0.2581748962402344, -0.24636077880859375, -0.23454666137695312, -0.2227325439453125, -0.21091842651367188, -0.19910430908203125, -0.18729019165039062, -0.17547607421875, -0.16366195678710938, -0.15184783935546875, -0.14003372192382812, -0.1282196044921875, -0.11640548706054688, -0.10459136962890625, -0.09277725219726562, -0.080963134765625, -0.06914901733398438, -0.05733489990234375, -0.045520782470703125, -0.0337066650390625, -0.021892547607421875, -0.01007843017578125, 0.001735687255859375, 0.0135498046875, 0.025363922119140625, 0.03717803955078125, 0.048992156982421875, 0.0608062744140625, 0.07262039184570312, 0.08443450927734375, 0.09624862670898438, 0.108062744140625, 0.11987686157226562, 0.13169097900390625, 0.14350509643554688, 0.1553192138671875, 0.16713333129882812, 0.17894744873046875, 0.19076156616210938, 0.20257568359375, 0.21438980102539062, 0.22620391845703125, 0.23801803588867188, 0.2498321533203125, 0.2616462707519531, 0.27346038818359375, 0.2852745056152344, 0.297088623046875, 0.3089027404785156, 0.32071685791015625, 0.3325309753417969, 0.3443450927734375, 0.3561592102050781, 0.36797332763671875, 0.3797874450683594, 0.3916015625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 3.0, 5.0, 13.0, 16.0, 23.0, 57.0, 62.0, 91.0, 97.0, 131.0, 121.0, 109.0, 84.0, 79.0, 34.0, 34.0, 21.0, 7.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.12487602233886719, -0.12084579467773438, -0.11681556701660156, -0.11278533935546875, -0.10875511169433594, -0.10472488403320312, -0.10069465637207031, -0.0966644287109375, -0.09263420104980469, -0.08860397338867188, -0.08457374572753906, -0.08054351806640625, -0.07651329040527344, -0.07248306274414062, -0.06845283508300781, -0.064422607421875, -0.06039237976074219, -0.056362152099609375, -0.05233192443847656, -0.04830169677734375, -0.04427146911621094, -0.040241241455078125, -0.03621101379394531, -0.0321807861328125, -0.028150558471679688, -0.024120330810546875, -0.020090103149414062, -0.01605987548828125, -0.012029647827148438, -0.007999420166015625, -0.0039691925048828125, 6.103515625e-05, 0.0040912628173828125, 0.008121490478515625, 0.012151718139648438, 0.01618194580078125, 0.020212173461914062, 0.024242401123046875, 0.028272628784179688, 0.0323028564453125, 0.03633308410644531, 0.040363311767578125, 0.04439353942871094, 0.04842376708984375, 0.05245399475097656, 0.056484222412109375, 0.06051445007324219, 0.064544677734375, 0.06857490539550781, 0.07260513305664062, 0.07663536071777344, 0.08066558837890625, 0.08469581604003906, 0.08872604370117188, 0.09275627136230469, 0.0967864990234375, 0.10081672668457031, 0.10484695434570312, 0.10887718200683594, 0.11290740966796875, 0.11693763732910156, 0.12096786499023438, 0.12499809265136719, 0.1290283203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 8.0, 4.0, 21.0, 28.0, 40.0, 49.0, 89.0, 130.0, 270.0, 456.0, 891.0, 1664.0, 3119.0, 6576.0, 14363.0, 33723.0, 97978.0, 532017.0, 251343.0, 61522.0, 23656.0, 10357.0, 4952.0, 2430.0, 1255.0, 715.0, 343.0, 223.0, 114.0, 63.0, 42.0, 29.0, 20.0, 15.0, 14.0, 6.0, 5.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1964111328125, -0.1887989044189453, -0.18118667602539062, -0.17357444763183594, -0.16596221923828125, -0.15834999084472656, -0.15073776245117188, -0.1431255340576172, -0.1355133056640625, -0.1279010772705078, -0.12028884887695312, -0.11267662048339844, -0.10506439208984375, -0.09745216369628906, -0.08983993530273438, -0.08222770690917969, -0.074615478515625, -0.06700325012207031, -0.059391021728515625, -0.05177879333496094, -0.04416656494140625, -0.03655433654785156, -0.028942108154296875, -0.021329879760742188, -0.0137176513671875, -0.0061054229736328125, 0.001506805419921875, 0.009119033813476562, 0.01673126220703125, 0.024343490600585938, 0.031955718994140625, 0.03956794738769531, 0.04718017578125, 0.05479240417480469, 0.062404632568359375, 0.07001686096191406, 0.07762908935546875, 0.08524131774902344, 0.09285354614257812, 0.10046577453613281, 0.1080780029296875, 0.11569023132324219, 0.12330245971679688, 0.13091468811035156, 0.13852691650390625, 0.14613914489746094, 0.15375137329101562, 0.1613636016845703, 0.168975830078125, 0.1765880584716797, 0.18420028686523438, 0.19181251525878906, 0.19942474365234375, 0.20703697204589844, 0.21464920043945312, 0.2222614288330078, 0.2298736572265625, 0.2374858856201172, 0.24509811401367188, 0.25271034240722656, 0.26032257080078125, 0.26793479919433594, 0.2755470275878906, 0.2831592559814453, 0.290771484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 6.0, 9.0, 13.0, 15.0, 15.0, 12.0, 22.0, 23.0, 31.0, 30.0, 17.0, 39.0, 39.0, 42.0, 54.0, 51.0, 67.0, 55.0, 57.0, 55.0, 49.0, 50.0, 38.0, 35.0, 27.0, 37.0, 26.0, 20.0, 10.0, 11.0, 12.0, 9.0, 8.0, 4.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1971435546875, -0.18985557556152344, -0.18256759643554688, -0.1752796173095703, -0.16799163818359375, -0.1607036590576172, -0.15341567993164062, -0.14612770080566406, -0.1388397216796875, -0.13155174255371094, -0.12426376342773438, -0.11697578430175781, -0.10968780517578125, -0.10239982604980469, -0.09511184692382812, -0.08782386779785156, -0.080535888671875, -0.07324790954589844, -0.06595993041992188, -0.05867195129394531, -0.05138397216796875, -0.04409599304199219, -0.036808013916015625, -0.029520034790039062, -0.0222320556640625, -0.014944076538085938, -0.007656097412109375, -0.0003681182861328125, 0.00691986083984375, 0.014207839965820312, 0.021495819091796875, 0.028783798217773438, 0.03607177734375, 0.04335975646972656, 0.050647735595703125, 0.05793571472167969, 0.06522369384765625, 0.07251167297363281, 0.07979965209960938, 0.08708763122558594, 0.0943756103515625, 0.10166358947753906, 0.10895156860351562, 0.11623954772949219, 0.12352752685546875, 0.1308155059814453, 0.13810348510742188, 0.14539146423339844, 0.152679443359375, 0.15996742248535156, 0.16725540161132812, 0.1745433807373047, 0.18183135986328125, 0.1891193389892578, 0.19640731811523438, 0.20369529724121094, 0.2109832763671875, 0.21827125549316406, 0.22555923461914062, 0.2328472137451172, 0.24013519287109375, 0.2474231719970703, 0.2547111511230469, 0.26199913024902344, 0.269287109375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 8.0, 6.0, 3.0, 2.0, 7.0, 4.0, 6.0, 8.0, 5.0, 8.0, 18.0, 23.0, 33.0, 42.0, 117.0, 229.0, 597.0, 1280.0, 3625.0, 12368.0, 64366.0, 765975.0, 168906.0, 21955.0, 5618.0, 1923.0, 742.0, 319.0, 149.0, 65.0, 41.0, 17.0, 19.0, 13.0, 8.0, 13.0, 6.0, 9.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.02874755859375, -0.027811050415039062, -0.026874542236328125, -0.025938034057617188, -0.02500152587890625, -0.024065017700195312, -0.023128509521484375, -0.022192001342773438, -0.0212554931640625, -0.020318984985351562, -0.019382476806640625, -0.018445968627929688, -0.01750946044921875, -0.016572952270507812, -0.015636444091796875, -0.014699935913085938, -0.013763427734375, -0.012826919555664062, -0.011890411376953125, -0.010953903198242188, -0.01001739501953125, -0.009080886840820312, -0.008144378662109375, -0.0072078704833984375, -0.0062713623046875, -0.0053348541259765625, -0.004398345947265625, -0.0034618377685546875, -0.00252532958984375, -0.0015888214111328125, -0.000652313232421875, 0.0002841949462890625, 0.001220703125, 0.0021572113037109375, 0.003093719482421875, 0.0040302276611328125, 0.00496673583984375, 0.0059032440185546875, 0.006839752197265625, 0.0077762603759765625, 0.0087127685546875, 0.009649276733398438, 0.010585784912109375, 0.011522293090820312, 0.01245880126953125, 0.013395309448242188, 0.014331817626953125, 0.015268325805664062, 0.016204833984375, 0.017141342163085938, 0.018077850341796875, 0.019014358520507812, 0.01995086669921875, 0.020887374877929688, 0.021823883056640625, 0.022760391235351562, 0.0236968994140625, 0.024633407592773438, 0.025569915771484375, 0.026506423950195312, 0.02744293212890625, 0.028379440307617188, 0.029315948486328125, 0.030252456665039062, 0.03118896484375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 13.0, 5.0, 4.0, 13.0, 13.0, 21.0, 4.0, 31.0, 21.0, 42.0, 37.0, 22.0, 48.0, 60.0, 82.0, 67.0, 21.0, 70.0, 59.0, 65.0, 53.0, 23.0, 41.0, 28.0, 31.0, 29.0, 8.0, 21.0, 15.0, 11.0, 8.0, 3.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-3.6954879760742188e-06, -3.5883858799934387e-06, -3.4812837839126587e-06, -3.3741816878318787e-06, -3.2670795917510986e-06, -3.1599774956703186e-06, -3.0528753995895386e-06, -2.9457733035087585e-06, -2.8386712074279785e-06, -2.7315691113471985e-06, -2.6244670152664185e-06, -2.5173649191856384e-06, -2.4102628231048584e-06, -2.3031607270240784e-06, -2.1960586309432983e-06, -2.0889565348625183e-06, -1.9818544387817383e-06, -1.8747523427009583e-06, -1.7676502466201782e-06, -1.6605481505393982e-06, -1.5534460544586182e-06, -1.4463439583778381e-06, -1.339241862297058e-06, -1.232139766216278e-06, -1.125037670135498e-06, -1.017935574054718e-06, -9.10833477973938e-07, -8.03731381893158e-07, -6.966292858123779e-07, -5.895271897315979e-07, -4.824250936508179e-07, -3.7532299757003784e-07, -2.682209014892578e-07, -1.6111880540847778e-07, -5.4016709327697754e-08, 5.3085386753082275e-08, 1.601874828338623e-07, 2.6728957891464233e-07, 3.7439167499542236e-07, 4.814937710762024e-07, 5.885958671569824e-07, 6.956979632377625e-07, 8.028000593185425e-07, 9.099021553993225e-07, 1.0170042514801025e-06, 1.1241063475608826e-06, 1.2312084436416626e-06, 1.3383105397224426e-06, 1.4454126358032227e-06, 1.5525147318840027e-06, 1.6596168279647827e-06, 1.7667189240455627e-06, 1.8738210201263428e-06, 1.980923116207123e-06, 2.088025212287903e-06, 2.195127308368683e-06, 2.302229404449463e-06, 2.409331500530243e-06, 2.516433596611023e-06, 2.623535692691803e-06, 2.730637788772583e-06, 2.837739884853363e-06, 2.944841980934143e-06, 3.051944077014923e-06, 3.159046173095703e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 2.0, 8.0, 19.0, 28.0, 33.0, 46.0, 90.0, 135.0, 227.0, 401.0, 726.0, 1362.0, 2618.0, 5486.0, 12910.0, 36919.0, 158246.0, 625655.0, 145561.0, 34901.0, 12350.0, 5311.0, 2571.0, 1293.0, 695.0, 363.0, 222.0, 160.0, 87.0, 46.0, 29.0, 21.0, 9.0, 12.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0164031982421875, -0.015806198120117188, -0.015209197998046875, -0.014612197875976562, -0.01401519775390625, -0.013418197631835938, -0.012821197509765625, -0.012224197387695312, -0.011627197265625, -0.011030197143554688, -0.010433197021484375, -0.009836196899414062, -0.00923919677734375, -0.008642196655273438, -0.008045196533203125, -0.0074481964111328125, -0.0068511962890625, -0.0062541961669921875, -0.005657196044921875, -0.0050601959228515625, -0.00446319580078125, -0.0038661956787109375, -0.003269195556640625, -0.0026721954345703125, -0.0020751953125, -0.0014781951904296875, -0.000881195068359375, -0.0002841949462890625, 0.00031280517578125, 0.0009098052978515625, 0.001506805419921875, 0.0021038055419921875, 0.0027008056640625, 0.0032978057861328125, 0.003894805908203125, 0.0044918060302734375, 0.00508880615234375, 0.0056858062744140625, 0.006282806396484375, 0.0068798065185546875, 0.007476806640625, 0.008073806762695312, 0.008670806884765625, 0.009267807006835938, 0.00986480712890625, 0.010461807250976562, 0.011058807373046875, 0.011655807495117188, 0.0122528076171875, 0.012849807739257812, 0.013446807861328125, 0.014043807983398438, 0.01464080810546875, 0.015237808227539062, 0.015834808349609375, 0.016431808471679688, 0.01702880859375, 0.017625808715820312, 0.018222808837890625, 0.018819808959960938, 0.01941680908203125, 0.020013809204101562, 0.020610809326171875, 0.021207809448242188, 0.0218048095703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 5.0, 10.0, 13.0, 8.0, 7.0, 18.0, 13.0, 20.0, 18.0, 27.0, 41.0, 48.0, 56.0, 72.0, 82.0, 67.0, 66.0, 85.0, 50.0, 53.0, 48.0, 35.0, 33.0, 21.0, 32.0, 9.0, 12.0, 4.0, 12.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0176544189453125, -0.01711893081665039, -0.01658344268798828, -0.016047954559326172, -0.015512466430664062, -0.014976978302001953, -0.014441490173339844, -0.013906002044677734, -0.013370513916015625, -0.012835025787353516, -0.012299537658691406, -0.011764049530029297, -0.011228561401367188, -0.010693073272705078, -0.010157585144042969, -0.00962209701538086, -0.00908660888671875, -0.00855112075805664, -0.008015632629394531, -0.007480144500732422, -0.0069446563720703125, -0.006409168243408203, -0.005873680114746094, -0.005338191986083984, -0.004802703857421875, -0.004267215728759766, -0.0037317276000976562, -0.003196239471435547, -0.0026607513427734375, -0.002125263214111328, -0.0015897750854492188, -0.0010542869567871094, -0.000518798828125, 1.6689300537109375e-05, 0.0005521774291992188, 0.0010876655578613281, 0.0016231536865234375, 0.002158641815185547, 0.0026941299438476562, 0.0032296180725097656, 0.003765106201171875, 0.004300594329833984, 0.004836082458496094, 0.005371570587158203, 0.0059070587158203125, 0.006442546844482422, 0.006978034973144531, 0.007513523101806641, 0.00804901123046875, 0.00858449935913086, 0.009119987487792969, 0.009655475616455078, 0.010190963745117188, 0.010726451873779297, 0.011261940002441406, 0.011797428131103516, 0.012332916259765625, 0.012868404388427734, 0.013403892517089844, 0.013939380645751953, 0.014474868774414062, 0.015010356903076172, 0.015545845031738281, 0.01608133316040039, 0.0166168212890625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 14.0, 13.0, 13.0, 15.0, 22.0, 31.0, 41.0, 68.0, 100.0, 172.0, 152.0, 106.0, 79.0, 34.0, 28.0, 17.0, 17.0, 17.0, 9.0, 7.0, 4.0, 4.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5219124555587769, -1.4796202182769775, -1.4373281002044678, -1.395035982131958, -1.3527437448501587, -1.3104515075683594, -1.2681593894958496, -1.2258672714233398, -1.1835750341415405, -1.1412827968597412, -1.0989906787872314, -1.0566985607147217, -1.0144063234329224, -0.9721141457557678, -0.9298219680786133, -0.8875297904014587, -0.8452376127243042, -0.8029454350471497, -0.7606532573699951, -0.7183610796928406, -0.676068902015686, -0.6337767243385315, -0.591484546661377, -0.5491923689842224, -0.5069001913070679, -0.46460801362991333, -0.4223158359527588, -0.38002365827560425, -0.3377314805984497, -0.29543930292129517, -0.2531471252441406, -0.21085494756698608, -0.168562650680542, -0.12627047300338745, -0.08397829532623291, -0.04168611764907837, 0.0006060600280761719, 0.04289823770523071, 0.08519041538238525, 0.1274825930595398, 0.16977477073669434, 0.21206694841384888, 0.2543591260910034, 0.29665130376815796, 0.3389434814453125, 0.38123565912246704, 0.4235278367996216, 0.4658200144767761, 0.5081121921539307, 0.5504043698310852, 0.5926965475082397, 0.6349887251853943, 0.6772809028625488, 0.7195730805397034, 0.7618652582168579, 0.8041574358940125, 0.846449613571167, 0.8887417912483215, 0.9310339689254761, 0.9733261466026306, 1.0156183242797852, 1.057910442352295, 1.1002026796340942, 1.1424949169158936, 1.1847870349884033]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 7.0, 5.0, 14.0, 9.0, 12.0, 13.0, 16.0, 15.0, 25.0, 31.0, 31.0, 32.0, 35.0, 38.0, 43.0, 45.0, 42.0, 46.0, 52.0, 62.0, 45.0, 57.0, 36.0, 46.0, 22.0, 38.0, 24.0, 27.0, 15.0, 21.0, 12.0, 12.0, 14.0, 7.0, 5.0, 8.0, 4.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.0112029314041138, -0.9805951118469238, -0.9499872922897339, -0.919379472732544, -0.8887717127799988, -0.8581638932228088, -0.8275560736656189, -0.796948254108429, -0.7663404941558838, -0.7357326745986938, -0.7051248550415039, -0.674517035484314, -0.6439092755317688, -0.6133014559745789, -0.5826936364173889, -0.552085816860199, -0.521477997303009, -0.4908701777458191, -0.46026238799095154, -0.4296545684337616, -0.39904677867889404, -0.3684389591217041, -0.33783113956451416, -0.3072233200073242, -0.27661553025245667, -0.24600772559642792, -0.21539992094039917, -0.18479210138320923, -0.15418429672718048, -0.12357649207115173, -0.09296867251396179, -0.062360867857933044, -0.03175312280654907, -0.0011453144252300262, 0.02946249395608902, 0.060070306062698364, 0.09067811071872711, 0.12128591537475586, 0.1518937349319458, 0.18250153958797455, 0.2131093442440033, 0.24371714890003204, 0.2743249535560608, 0.30493277311325073, 0.3355405926704407, 0.3661483824253082, 0.39675620198249817, 0.4273639917373657, 0.45797181129455566, 0.4885796308517456, 0.5191874504089355, 0.5497952699661255, 0.5804030299186707, 0.6110108494758606, 0.6416186690330505, 0.6722264885902405, 0.7028342485427856, 0.7334420680999756, 0.7640498876571655, 0.7946577072143555, 0.8252654671669006, 0.8558732867240906, 0.8864811062812805, 0.9170889258384705, 0.9476967453956604]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 8.0, 15.0, 18.0, 39.0, 63.0, 108.0, 261.0, 782.0, 4177247.0, 14531.0, 728.0, 237.0, 80.0, 64.0, 41.0, 20.0, 13.0, 4.0, 7.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8642578125, -0.8395309448242188, -0.8148040771484375, -0.7900772094726562, -0.765350341796875, -0.7406234741210938, -0.7158966064453125, -0.6911697387695312, -0.66644287109375, -0.6417160034179688, -0.6169891357421875, -0.5922622680664062, -0.567535400390625, -0.5428085327148438, -0.5180816650390625, -0.49335479736328125, -0.4686279296875, -0.44390106201171875, -0.4191741943359375, -0.39444732666015625, -0.369720458984375, -0.34499359130859375, -0.3202667236328125, -0.29553985595703125, -0.27081298828125, -0.24608612060546875, -0.2213592529296875, -0.19663238525390625, -0.171905517578125, -0.14717864990234375, -0.1224517822265625, -0.09772491455078125, -0.072998046875, -0.04827117919921875, -0.0235443115234375, 0.00118255615234375, 0.025909423828125, 0.05063629150390625, 0.0753631591796875, 0.10009002685546875, 0.12481689453125, 0.14954376220703125, 0.1742706298828125, 0.19899749755859375, 0.223724365234375, 0.24845123291015625, 0.2731781005859375, 0.29790496826171875, 0.3226318359375, 0.34735870361328125, 0.3720855712890625, 0.39681243896484375, 0.421539306640625, 0.44626617431640625, 0.4709930419921875, 0.49571990966796875, 0.52044677734375, 0.5451736450195312, 0.5699005126953125, 0.5946273803710938, 0.619354248046875, 0.6440811157226562, 0.6688079833984375, 0.6935348510742188, 0.71826171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 1.0, 1.0, 3.0, 5.0, 12.0, 16.0, 24.0, 50.0, 61.0, 88.0, 107.0, 126.0, 132.0, 115.0, 93.0, 56.0, 40.0, 34.0, 19.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.12487602233886719, -0.12084579467773438, -0.11681556701660156, -0.11278533935546875, -0.10875511169433594, -0.10472488403320312, -0.10069465637207031, -0.0966644287109375, -0.09263420104980469, -0.08860397338867188, -0.08457374572753906, -0.08054351806640625, -0.07651329040527344, -0.07248306274414062, -0.06845283508300781, -0.064422607421875, -0.06039237976074219, -0.056362152099609375, -0.05233192443847656, -0.04830169677734375, -0.04427146911621094, -0.040241241455078125, -0.03621101379394531, -0.0321807861328125, -0.028150558471679688, -0.024120330810546875, -0.020090103149414062, -0.01605987548828125, -0.012029647827148438, -0.007999420166015625, -0.0039691925048828125, 6.103515625e-05, 0.0040912628173828125, 0.008121490478515625, 0.012151718139648438, 0.01618194580078125, 0.020212173461914062, 0.024242401123046875, 0.028272628784179688, 0.0323028564453125, 0.03633308410644531, 0.040363311767578125, 0.04439353942871094, 0.04842376708984375, 0.05245399475097656, 0.056484222412109375, 0.06051445007324219, 0.064544677734375, 0.06857490539550781, 0.07260513305664062, 0.07663536071777344, 0.08066558837890625, 0.08469581604003906, 0.08872604370117188, 0.09275627136230469, 0.0967864990234375, 0.10081672668457031, 0.10484695434570312, 0.10887718200683594, 0.11290740966796875, 0.11693763732910156, 0.12096786499023438, 0.12499809265136719, 0.1290283203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 10.0, 13.0, 7.0, 27.0, 20.0, 37.0, 41.0, 41.0, 76.0, 107.0, 148.0, 262.0, 469.0, 1872.0, 4182704.0, 6841.0, 693.0, 288.0, 192.0, 120.0, 83.0, 69.0, 35.0, 29.0, 25.0, 32.0, 8.0, 9.0, 4.0, 3.0, 7.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4326171875, -0.41754913330078125, -0.4024810791015625, -0.38741302490234375, -0.372344970703125, -0.35727691650390625, -0.3422088623046875, -0.32714080810546875, -0.31207275390625, -0.29700469970703125, -0.2819366455078125, -0.26686859130859375, -0.251800537109375, -0.23673248291015625, -0.2216644287109375, -0.20659637451171875, -0.1915283203125, -0.17646026611328125, -0.1613922119140625, -0.14632415771484375, -0.131256103515625, -0.11618804931640625, -0.1011199951171875, -0.08605194091796875, -0.07098388671875, -0.05591583251953125, -0.0408477783203125, -0.02577972412109375, -0.010711669921875, 0.00435638427734375, 0.0194244384765625, 0.03449249267578125, 0.049560546875, 0.06462860107421875, 0.0796966552734375, 0.09476470947265625, 0.109832763671875, 0.12490081787109375, 0.1399688720703125, 0.15503692626953125, 0.17010498046875, 0.18517303466796875, 0.2002410888671875, 0.21530914306640625, 0.230377197265625, 0.24544525146484375, 0.2605133056640625, 0.27558135986328125, 0.2906494140625, 0.30571746826171875, 0.3207855224609375, 0.33585357666015625, 0.350921630859375, 0.36598968505859375, 0.3810577392578125, 0.39612579345703125, 0.41119384765625, 0.42626190185546875, 0.4413299560546875, 0.45639801025390625, 0.471466064453125, 0.48653411865234375, 0.5016021728515625, 0.5166702270507812, 0.53173828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 14.0, 3991.0, 49.0, 10.0, 8.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0147552490234375, -0.013221979141235352, -0.011688709259033203, -0.010155439376831055, -0.008622169494628906, -0.007088899612426758, -0.005555629730224609, -0.004022359848022461, -0.0024890899658203125, -0.0009558200836181641, 0.0005774497985839844, 0.002110719680786133, 0.0036439895629882812, 0.00517725944519043, 0.006710529327392578, 0.008243799209594727, 0.009777069091796875, 0.011310338973999023, 0.012843608856201172, 0.01437687873840332, 0.01591014862060547, 0.017443418502807617, 0.018976688385009766, 0.020509958267211914, 0.022043228149414062, 0.02357649803161621, 0.02510976791381836, 0.026643037796020508, 0.028176307678222656, 0.029709577560424805, 0.031242847442626953, 0.0327761173248291, 0.03430938720703125, 0.0358426570892334, 0.03737592697143555, 0.038909196853637695, 0.040442466735839844, 0.04197573661804199, 0.04350900650024414, 0.04504227638244629, 0.04657554626464844, 0.048108816146850586, 0.049642086029052734, 0.05117535591125488, 0.05270862579345703, 0.05424189567565918, 0.05577516555786133, 0.05730843544006348, 0.058841705322265625, 0.06037497520446777, 0.06190824508666992, 0.06344151496887207, 0.06497478485107422, 0.06650805473327637, 0.06804132461547852, 0.06957459449768066, 0.07110786437988281, 0.07264113426208496, 0.07417440414428711, 0.07570767402648926, 0.0772409439086914, 0.07877421379089355, 0.0803074836730957, 0.08184075355529785, 0.0833740234375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 10.0, 11.0, 30.0, 75.0, 222.0, 323.0, 149.0, 93.0, 36.0, 26.0, 14.0, 9.0, 4.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10327893495559692, -0.09407509118318558, -0.08487124741077423, -0.07566741108894348, -0.06646356731653214, -0.05725972354412079, -0.04805588349699974, -0.03885204344987869, -0.029648199677467346, -0.02044435776770115, -0.011240515857934952, -0.0020366739481687546, 0.007167167961597443, 0.01637101173400879, 0.025574851781129837, 0.034778691828250885, 0.04398253560066223, 0.05318637937307358, 0.062390219420194626, 0.07159405946731567, 0.08079790323972702, 0.09000174701213837, 0.09920558333396912, 0.10840942710638046, 0.11761327087879181, 0.12681710720062256, 0.1360209584236145, 0.14522479474544525, 0.154428631067276, 0.16363248229026794, 0.1728363186120987, 0.18204015493392944, 0.191243976354599, 0.20044781267642975, 0.2096516638994217, 0.21885550022125244, 0.22805935144424438, 0.23726318776607513, 0.24646702408790588, 0.2556708753108978, 0.2648746967315674, 0.2740785479545593, 0.2832823693752289, 0.2924862205982208, 0.30169007182121277, 0.3108938932418823, 0.32009774446487427, 0.3293015956878662, 0.33850544691085815, 0.3477092981338501, 0.35691311955451965, 0.3661169707775116, 0.37532082200050354, 0.3845246434211731, 0.39372849464416504, 0.402932345867157, 0.4121361970901489, 0.42134004831314087, 0.4305438697338104, 0.43974772095680237, 0.4489515721797943, 0.45815539360046387, 0.4673592448234558, 0.47656309604644775, 0.4857669174671173]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 7.0, 3.0, 9.0, 10.0, 8.0, 17.0, 15.0, 26.0, 17.0, 23.0, 21.0, 21.0, 27.0, 27.0, 33.0, 38.0, 29.0, 38.0, 36.0, 32.0, 36.0, 28.0, 32.0, 33.0, 37.0, 37.0, 27.0, 37.0, 38.0, 22.0, 27.0, 31.0, 27.0, 21.0, 21.0, 21.0, 9.0, 17.0, 11.0, 9.0, 8.0, 6.0, 3.0, 2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0], "bins": [-0.07390576601028442, -0.07175856083631516, -0.06961135566234589, -0.06746415793895721, -0.06531695276498795, -0.06316974759101868, -0.061022546142339706, -0.058875344693660736, -0.05672813951969147, -0.0545809343457222, -0.05243373289704323, -0.05028653144836426, -0.04813932627439499, -0.04599212110042572, -0.04384491965174675, -0.04169771820306778, -0.03955051302909851, -0.03740330785512924, -0.03525610640645027, -0.0331089049577713, -0.030961699783802032, -0.028814496472477913, -0.026667293161153793, -0.024520089849829674, -0.022372886538505554, -0.020225683227181435, -0.018078479915857315, -0.015931276604533195, -0.013784073293209076, -0.011636869981884956, -0.009489666670560837, -0.007342463359236717, -0.005195260047912598, -0.003048056736588478, -0.0009008534252643585, 0.001246349886059761, 0.0033935531973838806, 0.005540756508708, 0.00768795982003212, 0.00983516313135624, 0.011982366442680359, 0.014129569754004478, 0.016276773065328598, 0.018423976376652718, 0.020571179687976837, 0.022718382999300957, 0.024865586310625076, 0.027012789621949196, 0.029159992933273315, 0.031307198107242584, 0.033454399555921555, 0.035601601004600525, 0.037748806178569794, 0.03989601135253906, 0.04204321280121803, 0.044190414249897, 0.04633761942386627, 0.04848482459783554, 0.05063202604651451, 0.05277922749519348, 0.05492643266916275, 0.05707363784313202, 0.05922083929181099, 0.06136804074048996, 0.06351524591445923]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 8.0, 3.0, 10.0, 14.0, 19.0, 20.0, 31.0, 32.0, 49.0, 55.0, 81.0, 93.0, 129.0, 145.0, 199.0, 263.0, 353.0, 534.0, 748.0, 1160.0, 2007.0, 3994.0, 8965.0, 22404.0, 63524.0, 243644.0, 525150.0, 111731.0, 36078.0, 13845.0, 5938.0, 2692.0, 1429.0, 890.0, 591.0, 398.0, 291.0, 246.0, 175.0, 135.0, 105.0, 90.0, 63.0, 69.0, 34.0, 33.0, 33.0, 20.0, 15.0, 6.0, 6.0, 5.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.29931640625, -0.29003143310546875, -0.2807464599609375, -0.27146148681640625, -0.262176513671875, -0.25289154052734375, -0.2436065673828125, -0.23432159423828125, -0.22503662109375, -0.21575164794921875, -0.2064666748046875, -0.19718170166015625, -0.187896728515625, -0.17861175537109375, -0.1693267822265625, -0.16004180908203125, -0.1507568359375, -0.14147186279296875, -0.1321868896484375, -0.12290191650390625, -0.113616943359375, -0.10433197021484375, -0.0950469970703125, -0.08576202392578125, -0.07647705078125, -0.06719207763671875, -0.0579071044921875, -0.04862213134765625, -0.039337158203125, -0.03005218505859375, -0.0207672119140625, -0.01148223876953125, -0.002197265625, 0.00708770751953125, 0.0163726806640625, 0.02565765380859375, 0.034942626953125, 0.04422760009765625, 0.0535125732421875, 0.06279754638671875, 0.07208251953125, 0.08136749267578125, 0.0906524658203125, 0.09993743896484375, 0.109222412109375, 0.11850738525390625, 0.1277923583984375, 0.13707733154296875, 0.1463623046875, 0.15564727783203125, 0.1649322509765625, 0.17421722412109375, 0.183502197265625, 0.19278717041015625, 0.2020721435546875, 0.21135711669921875, 0.22064208984375, 0.22992706298828125, 0.2392120361328125, 0.24849700927734375, 0.257781982421875, 0.26706695556640625, 0.2763519287109375, 0.28563690185546875, 0.294921875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 3.0, 5.0, 14.0, 13.0, 29.0, 41.0, 60.0, 98.0, 98.0, 117.0, 137.0, 121.0, 84.0, 63.0, 46.0, 29.0, 24.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.129150390625, -0.1251201629638672, -0.12108993530273438, -0.11705970764160156, -0.11302947998046875, -0.10899925231933594, -0.10496902465820312, -0.10093879699707031, -0.0969085693359375, -0.09287834167480469, -0.08884811401367188, -0.08481788635253906, -0.08078765869140625, -0.07675743103027344, -0.07272720336914062, -0.06869697570800781, -0.064666748046875, -0.06063652038574219, -0.056606292724609375, -0.05257606506347656, -0.04854583740234375, -0.04451560974121094, -0.040485382080078125, -0.03645515441894531, -0.0324249267578125, -0.028394699096679688, -0.024364471435546875, -0.020334243774414062, -0.01630401611328125, -0.012273788452148438, -0.008243560791015625, -0.0042133331298828125, -0.00018310546875, 0.0038471221923828125, 0.007877349853515625, 0.011907577514648438, 0.01593780517578125, 0.019968032836914062, 0.023998260498046875, 0.028028488159179688, 0.0320587158203125, 0.03608894348144531, 0.040119171142578125, 0.04414939880371094, 0.04817962646484375, 0.05220985412597656, 0.056240081787109375, 0.06027030944824219, 0.064300537109375, 0.06833076477050781, 0.07236099243164062, 0.07639122009277344, 0.08042144775390625, 0.08445167541503906, 0.08848190307617188, 0.09251213073730469, 0.0965423583984375, 0.10057258605957031, 0.10460281372070312, 0.10863304138183594, 0.11266326904296875, 0.11669349670410156, 0.12072372436523438, 0.12475395202636719, 0.1287841796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 12.0, 16.0, 20.0, 26.0, 46.0, 69.0, 129.0, 213.0, 479.0, 1128.0, 2628.0, 6024.0, 15932.0, 50312.0, 255728.0, 587996.0, 87994.0, 24554.0, 8665.0, 3630.0, 1571.0, 679.0, 285.0, 143.0, 82.0, 58.0, 38.0, 25.0, 21.0, 15.0, 5.0, 6.0, 7.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.270263671875, -0.26212310791015625, -0.2539825439453125, -0.24584197998046875, -0.237701416015625, -0.22956085205078125, -0.2214202880859375, -0.21327972412109375, -0.20513916015625, -0.19699859619140625, -0.1888580322265625, -0.18071746826171875, -0.172576904296875, -0.16443634033203125, -0.1562957763671875, -0.14815521240234375, -0.1400146484375, -0.13187408447265625, -0.1237335205078125, -0.11559295654296875, -0.107452392578125, -0.09931182861328125, -0.0911712646484375, -0.08303070068359375, -0.07489013671875, -0.06674957275390625, -0.0586090087890625, -0.05046844482421875, -0.042327880859375, -0.03418731689453125, -0.0260467529296875, -0.01790618896484375, -0.009765625, -0.00162506103515625, 0.0065155029296875, 0.01465606689453125, 0.022796630859375, 0.03093719482421875, 0.0390777587890625, 0.04721832275390625, 0.05535888671875, 0.06349945068359375, 0.0716400146484375, 0.07978057861328125, 0.087921142578125, 0.09606170654296875, 0.1042022705078125, 0.11234283447265625, 0.1204833984375, 0.12862396240234375, 0.1367645263671875, 0.14490509033203125, 0.153045654296875, 0.16118621826171875, 0.1693267822265625, 0.17746734619140625, 0.18560791015625, 0.19374847412109375, 0.2018890380859375, 0.21002960205078125, 0.218170166015625, 0.22631072998046875, 0.2344512939453125, 0.24259185791015625, 0.250732421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 4.0, 13.0, 8.0, 6.0, 13.0, 13.0, 15.0, 24.0, 24.0, 25.0, 26.0, 45.0, 53.0, 42.0, 54.0, 49.0, 54.0, 52.0, 35.0, 55.0, 40.0, 54.0, 49.0, 44.0, 32.0, 34.0, 20.0, 21.0, 18.0, 16.0, 16.0, 10.0, 13.0, 8.0, 4.0, 11.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2144775390625, -0.2080821990966797, -0.20168685913085938, -0.19529151916503906, -0.18889617919921875, -0.18250083923339844, -0.17610549926757812, -0.1697101593017578, -0.1633148193359375, -0.1569194793701172, -0.15052413940429688, -0.14412879943847656, -0.13773345947265625, -0.13133811950683594, -0.12494277954101562, -0.11854743957519531, -0.112152099609375, -0.10575675964355469, -0.09936141967773438, -0.09296607971191406, -0.08657073974609375, -0.08017539978027344, -0.07378005981445312, -0.06738471984863281, -0.0609893798828125, -0.05459403991699219, -0.048198699951171875, -0.04180335998535156, -0.03540802001953125, -0.029012680053710938, -0.022617340087890625, -0.016222000122070312, -0.00982666015625, -0.0034313201904296875, 0.002964019775390625, 0.009359359741210938, 0.01575469970703125, 0.022150039672851562, 0.028545379638671875, 0.03494071960449219, 0.0413360595703125, 0.04773139953613281, 0.054126739501953125, 0.06052207946777344, 0.06691741943359375, 0.07331275939941406, 0.07970809936523438, 0.08610343933105469, 0.092498779296875, 0.09889411926269531, 0.10528945922851562, 0.11168479919433594, 0.11808013916015625, 0.12447547912597656, 0.13087081909179688, 0.1372661590576172, 0.1436614990234375, 0.1500568389892578, 0.15645217895507812, 0.16284751892089844, 0.16924285888671875, 0.17563819885253906, 0.18203353881835938, 0.1884288787841797, 0.19482421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 6.0, 6.0, 4.0, 6.0, 10.0, 24.0, 31.0, 57.0, 94.0, 210.0, 579.0, 1652.0, 6167.0, 46207.0, 887912.0, 92973.0, 9193.0, 2184.0, 666.0, 293.0, 123.0, 66.0, 30.0, 18.0, 9.0, 6.0, 5.0, 8.0, 3.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.04730224609375, -0.046010494232177734, -0.04471874237060547, -0.0434269905090332, -0.04213523864746094, -0.04084348678588867, -0.039551734924316406, -0.03825998306274414, -0.036968231201171875, -0.03567647933959961, -0.034384727478027344, -0.03309297561645508, -0.03180122375488281, -0.030509471893310547, -0.02921772003173828, -0.027925968170166016, -0.02663421630859375, -0.025342464447021484, -0.02405071258544922, -0.022758960723876953, -0.021467208862304688, -0.020175457000732422, -0.018883705139160156, -0.01759195327758789, -0.016300201416015625, -0.01500844955444336, -0.013716697692871094, -0.012424945831298828, -0.011133193969726562, -0.009841442108154297, -0.008549690246582031, -0.007257938385009766, -0.0059661865234375, -0.004674434661865234, -0.0033826828002929688, -0.002090930938720703, -0.0007991790771484375, 0.0004925727844238281, 0.0017843246459960938, 0.0030760765075683594, 0.004367828369140625, 0.005659580230712891, 0.006951332092285156, 0.008243083953857422, 0.009534835815429688, 0.010826587677001953, 0.012118339538574219, 0.013410091400146484, 0.01470184326171875, 0.015993595123291016, 0.01728534698486328, 0.018577098846435547, 0.019868850708007812, 0.021160602569580078, 0.022452354431152344, 0.02374410629272461, 0.025035858154296875, 0.02632761001586914, 0.027619361877441406, 0.028911113739013672, 0.030202865600585938, 0.0314946174621582, 0.03278636932373047, 0.034078121185302734, 0.035369873046875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 8.0, 5.0, 4.0, 15.0, 4.0, 13.0, 10.0, 13.0, 22.0, 28.0, 19.0, 43.0, 20.0, 59.0, 58.0, 33.0, 75.0, 32.0, 78.0, 71.0, 32.0, 63.0, 25.0, 51.0, 39.0, 14.0, 45.0, 18.0, 25.0, 24.0, 4.0, 15.0, 9.0, 6.0, 12.0, 0.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.039836883544922e-06, -2.9439106583595276e-06, -2.8479844331741333e-06, -2.752058207988739e-06, -2.6561319828033447e-06, -2.5602057576179504e-06, -2.464279532432556e-06, -2.368353307247162e-06, -2.2724270820617676e-06, -2.1765008568763733e-06, -2.080574631690979e-06, -1.9846484065055847e-06, -1.8887221813201904e-06, -1.7927959561347961e-06, -1.6968697309494019e-06, -1.6009435057640076e-06, -1.5050172805786133e-06, -1.409091055393219e-06, -1.3131648302078247e-06, -1.2172386050224304e-06, -1.1213123798370361e-06, -1.0253861546516418e-06, -9.294599294662476e-07, -8.335337042808533e-07, -7.37607479095459e-07, -6.416812539100647e-07, -5.457550287246704e-07, -4.498288035392761e-07, -3.5390257835388184e-07, -2.5797635316848755e-07, -1.6205012798309326e-07, -6.612390279769897e-08, 2.9802322387695312e-08, 1.257285475730896e-07, 2.2165477275848389e-07, 3.175809979438782e-07, 4.1350722312927246e-07, 5.094334483146667e-07, 6.05359673500061e-07, 7.012858986854553e-07, 7.972121238708496e-07, 8.931383490562439e-07, 9.890645742416382e-07, 1.0849907994270325e-06, 1.1809170246124268e-06, 1.276843249797821e-06, 1.3727694749832153e-06, 1.4686957001686096e-06, 1.564621925354004e-06, 1.6605481505393982e-06, 1.7564743757247925e-06, 1.8524006009101868e-06, 1.948326826095581e-06, 2.0442530512809753e-06, 2.1401792764663696e-06, 2.236105501651764e-06, 2.332031726837158e-06, 2.4279579520225525e-06, 2.5238841772079468e-06, 2.619810402393341e-06, 2.7157366275787354e-06, 2.8116628527641296e-06, 2.907589077949524e-06, 3.0035153031349182e-06, 3.0994415283203125e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 10.0, 18.0, 19.0, 21.0, 60.0, 72.0, 167.0, 228.0, 416.0, 895.0, 2175.0, 6922.0, 37469.0, 816809.0, 161756.0, 14948.0, 3813.0, 1360.0, 614.0, 317.0, 166.0, 106.0, 81.0, 40.0, 26.0, 19.0, 9.0, 10.0, 4.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043609619140625, -0.042278289794921875, -0.04094696044921875, -0.039615631103515625, -0.0382843017578125, -0.036952972412109375, -0.03562164306640625, -0.034290313720703125, -0.032958984375, -0.031627655029296875, -0.03029632568359375, -0.028964996337890625, -0.0276336669921875, -0.026302337646484375, -0.02497100830078125, -0.023639678955078125, -0.022308349609375, -0.020977020263671875, -0.01964569091796875, -0.018314361572265625, -0.0169830322265625, -0.015651702880859375, -0.01432037353515625, -0.012989044189453125, -0.01165771484375, -0.010326385498046875, -0.00899505615234375, -0.007663726806640625, -0.0063323974609375, -0.005001068115234375, -0.00366973876953125, -0.002338409423828125, -0.001007080078125, 0.000324249267578125, 0.00165557861328125, 0.002986907958984375, 0.0043182373046875, 0.005649566650390625, 0.00698089599609375, 0.008312225341796875, 0.0096435546875, 0.010974884033203125, 0.01230621337890625, 0.013637542724609375, 0.0149688720703125, 0.016300201416015625, 0.01763153076171875, 0.018962860107421875, 0.020294189453125, 0.021625518798828125, 0.02295684814453125, 0.024288177490234375, 0.0256195068359375, 0.026950836181640625, 0.02828216552734375, 0.029613494873046875, 0.03094482421875, 0.032276153564453125, 0.03360748291015625, 0.034938812255859375, 0.0362701416015625, 0.037601470947265625, 0.03893280029296875, 0.040264129638671875, 0.041595458984375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 9.0, 9.0, 14.0, 26.0, 23.0, 51.0, 106.0, 145.0, 197.0, 151.0, 120.0, 63.0, 34.0, 15.0, 6.0, 12.0, 9.0, 4.0, 7.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0404052734375, -0.039128780364990234, -0.03785228729248047, -0.0365757942199707, -0.03529930114746094, -0.03402280807495117, -0.032746315002441406, -0.03146982192993164, -0.030193328857421875, -0.02891683578491211, -0.027640342712402344, -0.026363849639892578, -0.025087356567382812, -0.023810863494873047, -0.02253437042236328, -0.021257877349853516, -0.01998138427734375, -0.018704891204833984, -0.01742839813232422, -0.016151905059814453, -0.014875411987304688, -0.013598918914794922, -0.012322425842285156, -0.01104593276977539, -0.009769439697265625, -0.00849294662475586, -0.007216453552246094, -0.005939960479736328, -0.0046634674072265625, -0.003386974334716797, -0.0021104812622070312, -0.0008339881896972656, 0.0004425048828125, 0.0017189979553222656, 0.0029954910278320312, 0.004271984100341797, 0.0055484771728515625, 0.006824970245361328, 0.008101463317871094, 0.00937795639038086, 0.010654449462890625, 0.01193094253540039, 0.013207435607910156, 0.014483928680419922, 0.015760421752929688, 0.017036914825439453, 0.01831340789794922, 0.019589900970458984, 0.02086639404296875, 0.022142887115478516, 0.02341938018798828, 0.024695873260498047, 0.025972366333007812, 0.027248859405517578, 0.028525352478027344, 0.02980184555053711, 0.031078338623046875, 0.03235483169555664, 0.033631324768066406, 0.03490781784057617, 0.03618431091308594, 0.0374608039855957, 0.03873729705810547, 0.040013790130615234, 0.041290283203125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 1.0, 5.0, 7.0, 13.0, 10.0, 15.0, 29.0, 37.0, 57.0, 84.0, 178.0, 231.0, 109.0, 77.0, 36.0, 30.0, 31.0, 12.0, 8.0, 5.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8520621061325073, -0.8077298998832703, -0.7633976936340332, -0.7190654277801514, -0.6747332811355591, -0.6304010152816772, -0.5860688090324402, -0.5417366027832031, -0.49740439653396606, -0.453072190284729, -0.40873998403549194, -0.3644077479839325, -0.32007554173469543, -0.2757433354854584, -0.23141109943389893, -0.18707889318466187, -0.1427466869354248, -0.09841447323560715, -0.05408225953578949, -0.009750038385391235, 0.034582167863845825, 0.07891437411308289, 0.12324661016464233, 0.1675788164138794, 0.21191102266311646, 0.2562432289123535, 0.3005754351615906, 0.34490767121315, 0.3892398774623871, 0.43357208371162415, 0.4779043197631836, 0.5222365260124207, 0.5665686130523682, 0.6109008193016052, 0.6552330255508423, 0.6995652914047241, 0.7438974380493164, 0.7882297039031982, 0.8325619101524353, 0.8768941164016724, 0.9212263226509094, 0.9655585289001465, 1.0098907947540283, 1.0542229413986206, 1.0985552072525024, 1.1428873538970947, 1.1872196197509766, 1.2315518856048584, 1.2758840322494507, 1.3202162981033325, 1.3645484447479248, 1.4088807106018066, 1.453212857246399, 1.4975451231002808, 1.541877269744873, 1.5862095355987549, 1.6305418014526367, 1.6748740673065186, 1.7192062139511108, 1.7635384798049927, 1.807870626449585, 1.8522028923034668, 1.8965351581573486, 1.940867304801941, 1.9851994514465332]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 5.0, 5.0, 9.0, 8.0, 17.0, 10.0, 15.0, 12.0, 21.0, 28.0, 30.0, 46.0, 39.0, 42.0, 39.0, 45.0, 35.0, 66.0, 50.0, 49.0, 54.0, 61.0, 42.0, 38.0, 29.0, 24.0, 34.0, 27.0, 23.0, 17.0, 10.0, 20.0, 16.0, 5.0, 8.0, 2.0, 4.0, 5.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91109299659729, -0.8846433162689209, -0.858193576335907, -0.8317438960075378, -0.8052942156791687, -0.7788444757461548, -0.7523947954177856, -0.7259451150894165, -0.6994954347610474, -0.6730457544326782, -0.6465960144996643, -0.6201463341712952, -0.593696653842926, -0.5672469139099121, -0.540797233581543, -0.5143475532531738, -0.4878978431224823, -0.46144813299179077, -0.43499845266342163, -0.4085487425327301, -0.38209906220436096, -0.35564935207366943, -0.3291996717453003, -0.30274996161460876, -0.27630025148391724, -0.2498505562543869, -0.22340086102485657, -0.19695115089416504, -0.1705014705657959, -0.14405176043510437, -0.11760206520557404, -0.0911523699760437, -0.06470268964767456, -0.038252994418144226, -0.011803295463323593, 0.01464640349149704, 0.041096098721027374, 0.0675458014011383, 0.09399549663066864, 0.12044519186019897, 0.1468948870897293, 0.17334458231925964, 0.19979427754878998, 0.2262439727783203, 0.25269368290901184, 0.27914339303970337, 0.3055930733680725, 0.33204275369644165, 0.3584924638271332, 0.3849421739578247, 0.41139185428619385, 0.4378415644168854, 0.4642912447452545, 0.49074095487594604, 0.5171906352043152, 0.5436403751373291, 0.5700900554656982, 0.5965397357940674, 0.6229894757270813, 0.6494391560554504, 0.6758888363838196, 0.7023385763168335, 0.7287882566452026, 0.7552379369735718, 0.7816876173019409]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 7.0, 15.0, 20.0, 17.0, 31.0, 47.0, 90.0, 149.0, 295.0, 544.0, 1205.0, 19999.0, 4169187.0, 1308.0, 621.0, 313.0, 192.0, 115.0, 37.0, 18.0, 16.0, 7.0, 7.0, 6.0, 6.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.486572265625, -0.4718475341796875, -0.457122802734375, -0.4423980712890625, -0.42767333984375, -0.4129486083984375, -0.398223876953125, -0.3834991455078125, -0.3687744140625, -0.3540496826171875, -0.339324951171875, -0.3246002197265625, -0.30987548828125, -0.2951507568359375, -0.280426025390625, -0.2657012939453125, -0.2509765625, -0.2362518310546875, -0.221527099609375, -0.2068023681640625, -0.19207763671875, -0.1773529052734375, -0.162628173828125, -0.1479034423828125, -0.1331787109375, -0.1184539794921875, -0.103729248046875, -0.0890045166015625, -0.07427978515625, -0.0595550537109375, -0.044830322265625, -0.0301055908203125, -0.015380859375, -0.0006561279296875, 0.014068603515625, 0.0287933349609375, 0.04351806640625, 0.0582427978515625, 0.072967529296875, 0.0876922607421875, 0.1024169921875, 0.1171417236328125, 0.131866455078125, 0.1465911865234375, 0.16131591796875, 0.1760406494140625, 0.190765380859375, 0.2054901123046875, 0.22021484375, 0.2349395751953125, 0.249664306640625, 0.2643890380859375, 0.27911376953125, 0.2938385009765625, 0.308563232421875, 0.3232879638671875, 0.3380126953125, 0.3527374267578125, 0.367462158203125, 0.3821868896484375, 0.39691162109375, 0.4116363525390625, 0.426361083984375, 0.4410858154296875, 0.455810546875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 4.0, 6.0, 12.0, 15.0, 23.0, 38.0, 52.0, 97.0, 103.0, 124.0, 131.0, 118.0, 81.0, 72.0, 44.0, 37.0, 23.0, 9.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1292724609375, -0.12524795532226562, -0.12122344970703125, -0.11719894409179688, -0.1131744384765625, -0.10914993286132812, -0.10512542724609375, -0.10110092163085938, -0.097076416015625, -0.09305191040039062, -0.08902740478515625, -0.08500289916992188, -0.0809783935546875, -0.07695388793945312, -0.07292938232421875, -0.06890487670898438, -0.06488037109375, -0.060855865478515625, -0.05683135986328125, -0.052806854248046875, -0.0487823486328125, -0.044757843017578125, -0.04073333740234375, -0.036708831787109375, -0.032684326171875, -0.028659820556640625, -0.02463531494140625, -0.020610809326171875, -0.0165863037109375, -0.012561798095703125, -0.00853729248046875, -0.004512786865234375, -0.00048828125, 0.003536224365234375, 0.00756072998046875, 0.011585235595703125, 0.0156097412109375, 0.019634246826171875, 0.02365875244140625, 0.027683258056640625, 0.031707763671875, 0.035732269287109375, 0.03975677490234375, 0.043781280517578125, 0.0478057861328125, 0.051830291748046875, 0.05585479736328125, 0.059879302978515625, 0.06390380859375, 0.06792831420898438, 0.07195281982421875, 0.07597732543945312, 0.0800018310546875, 0.08402633666992188, 0.08805084228515625, 0.09207534790039062, 0.096099853515625, 0.10012435913085938, 0.10414886474609375, 0.10817337036132812, 0.1121978759765625, 0.11622238159179688, 0.12024688720703125, 0.12427139282226562, 0.1282958984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 12.0, 13.0, 18.0, 17.0, 25.0, 29.0, 39.0, 65.0, 98.0, 147.0, 225.0, 377.0, 723.0, 1471.0, 6909.0, 4178030.0, 3440.0, 1152.0, 557.0, 280.0, 190.0, 145.0, 99.0, 59.0, 44.0, 24.0, 16.0, 15.0, 8.0, 5.0, 11.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4990234375, -0.482574462890625, -0.46612548828125, -0.449676513671875, -0.4332275390625, -0.416778564453125, -0.40032958984375, -0.383880615234375, -0.367431640625, -0.350982666015625, -0.33453369140625, -0.318084716796875, -0.3016357421875, -0.285186767578125, -0.26873779296875, -0.252288818359375, -0.23583984375, -0.219390869140625, -0.20294189453125, -0.186492919921875, -0.1700439453125, -0.153594970703125, -0.13714599609375, -0.120697021484375, -0.104248046875, -0.087799072265625, -0.07135009765625, -0.054901123046875, -0.0384521484375, -0.022003173828125, -0.00555419921875, 0.010894775390625, 0.02734375, 0.043792724609375, 0.06024169921875, 0.076690673828125, 0.0931396484375, 0.109588623046875, 0.12603759765625, 0.142486572265625, 0.158935546875, 0.175384521484375, 0.19183349609375, 0.208282470703125, 0.2247314453125, 0.241180419921875, 0.25762939453125, 0.274078369140625, 0.29052734375, 0.306976318359375, 0.32342529296875, 0.339874267578125, 0.3563232421875, 0.372772216796875, 0.38922119140625, 0.405670166015625, 0.422119140625, 0.438568115234375, 0.45501708984375, 0.471466064453125, 0.4879150390625, 0.504364013671875, 0.52081298828125, 0.537261962890625, 0.5537109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 29.0, 4023.0, 16.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1251220703125, -0.12223291397094727, -0.11934375762939453, -0.1164546012878418, -0.11356544494628906, -0.11067628860473633, -0.1077871322631836, -0.10489797592163086, -0.10200881958007812, -0.09911966323852539, -0.09623050689697266, -0.09334135055541992, -0.09045219421386719, -0.08756303787231445, -0.08467388153076172, -0.08178472518920898, -0.07889556884765625, -0.07600641250610352, -0.07311725616455078, -0.07022809982299805, -0.06733894348144531, -0.06444978713989258, -0.061560630798339844, -0.05867147445678711, -0.055782318115234375, -0.05289316177368164, -0.050004005432128906, -0.04711484909057617, -0.04422569274902344, -0.0413365364074707, -0.03844738006591797, -0.035558223724365234, -0.0326690673828125, -0.029779911041259766, -0.02689075469970703, -0.024001598358154297, -0.021112442016601562, -0.018223285675048828, -0.015334129333496094, -0.01244497299194336, -0.009555816650390625, -0.006666660308837891, -0.0037775039672851562, -0.0008883476257324219, 0.0020008087158203125, 0.004889965057373047, 0.007779121398925781, 0.010668277740478516, 0.01355743408203125, 0.016446590423583984, 0.01933574676513672, 0.022224903106689453, 0.025114059448242188, 0.028003215789794922, 0.030892372131347656, 0.03378152847290039, 0.036670684814453125, 0.03955984115600586, 0.042448997497558594, 0.04533815383911133, 0.04822731018066406, 0.0511164665222168, 0.05400562286376953, 0.056894779205322266, 0.059783935546875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 8.0, 7.0, 5.0, 10.0, 13.0, 13.0, 21.0, 30.0, 54.0, 62.0, 115.0, 173.0, 193.0, 128.0, 64.0, 32.0, 26.0, 14.0, 9.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16527009010314941, -0.15843909978866577, -0.15160810947418213, -0.1447771191596985, -0.13794612884521484, -0.1311151385307312, -0.12428416311740875, -0.11745317280292511, -0.11062218248844147, -0.10379119217395782, -0.09696020185947418, -0.09012921899557114, -0.0832982286810875, -0.07646723836660385, -0.0696362555027008, -0.06280526518821716, -0.05597427487373352, -0.04914328455924988, -0.042312297970056534, -0.03548131138086319, -0.028650321066379547, -0.021819330751895905, -0.01498834416270256, -0.008157357573509216, -0.0013263672590255737, 0.00550462119281292, 0.012335609644651413, 0.019166598096489906, 0.0259975865483284, 0.03282857686281204, 0.039659563452005386, 0.04649055004119873, 0.05332154035568237, 0.060152530670166016, 0.06698352098464966, 0.0738145038485527, 0.08064549416303635, 0.08747648447751999, 0.09430746734142303, 0.10113845765590668, 0.10796944797039032, 0.11480043828487396, 0.1216314285993576, 0.12846241891384125, 0.1352933943271637, 0.14212438464164734, 0.14895537495613098, 0.15578636527061462, 0.16261735558509827, 0.1694483458995819, 0.17627933621406555, 0.1831103265285492, 0.18994131684303284, 0.19677230715751648, 0.20360328257083893, 0.21043427288532257, 0.2172652631998062, 0.22409625351428986, 0.2309272438287735, 0.23775823414325714, 0.2445892095565796, 0.25142019987106323, 0.2582511901855469, 0.2650821805000305, 0.27191317081451416]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 8.0, 13.0, 9.0, 13.0, 12.0, 20.0, 20.0, 23.0, 33.0, 31.0, 45.0, 27.0, 36.0, 26.0, 35.0, 45.0, 31.0, 31.0, 28.0, 29.0, 43.0, 43.0, 31.0, 36.0, 36.0, 35.0, 36.0, 25.0, 26.0, 23.0, 16.0, 23.0, 19.0, 18.0, 8.0, 12.0, 7.0, 9.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.0997384786605835, -0.09672235697507858, -0.09370624274015427, -0.09069012105464935, -0.08767400681972504, -0.08465788513422012, -0.08164176344871521, -0.0786256492137909, -0.07560952752828598, -0.07259340584278107, -0.06957729160785675, -0.06656116992235184, -0.06354504823684692, -0.06052893400192261, -0.057512812316417694, -0.05449669435620308, -0.051480576395988464, -0.04846445843577385, -0.045448340475559235, -0.04243221879005432, -0.039416100829839706, -0.03639998286962509, -0.03338386118412018, -0.030367743223905563, -0.02735162526369095, -0.024335507303476334, -0.02131938748061657, -0.018303267657756805, -0.01528714969754219, -0.012271030806005001, -0.009254911914467812, -0.0062387920916080475, -0.0032226741313934326, -0.00020655523985624313, 0.0028095636516809464, 0.005825682543218136, 0.008841801434755325, 0.011857920326292515, 0.014874039217829704, 0.01789015904068947, 0.020906277000904083, 0.023922394961118698, 0.026938514783978462, 0.029954634606838226, 0.03297075256705284, 0.035986870527267456, 0.03900299221277237, 0.042019110172986984, 0.0450352281332016, 0.048051346093416214, 0.05106746405363083, 0.05408358573913574, 0.05709970369935036, 0.06011582165956497, 0.06313194334506989, 0.0661480575799942, 0.06916417926549911, 0.07218030095100403, 0.07519641518592834, 0.07821253687143326, 0.08122865855693817, 0.08424477279186249, 0.0872608944773674, 0.09027701616287231, 0.09329313039779663]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 3.0, 10.0, 5.0, 17.0, 18.0, 27.0, 29.0, 42.0, 60.0, 96.0, 98.0, 146.0, 208.0, 266.0, 388.0, 567.0, 882.0, 1579.0, 3048.0, 7052.0, 19460.0, 63255.0, 313263.0, 508848.0, 86446.0, 25219.0, 8901.0, 3680.0, 1775.0, 997.0, 645.0, 436.0, 263.0, 206.0, 170.0, 122.0, 74.0, 59.0, 53.0, 37.0, 32.0, 21.0, 15.0, 10.0, 12.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.367919921875, -0.3564643859863281, -0.34500885009765625, -0.3335533142089844, -0.3220977783203125, -0.3106422424316406, -0.29918670654296875, -0.2877311706542969, -0.276275634765625, -0.2648200988769531, -0.25336456298828125, -0.24190902709960938, -0.2304534912109375, -0.21899795532226562, -0.20754241943359375, -0.19608688354492188, -0.18463134765625, -0.17317581176757812, -0.16172027587890625, -0.15026473999023438, -0.1388092041015625, -0.12735366821289062, -0.11589813232421875, -0.10444259643554688, -0.092987060546875, -0.08153152465820312, -0.07007598876953125, -0.058620452880859375, -0.0471649169921875, -0.035709381103515625, -0.02425384521484375, -0.012798309326171875, -0.0013427734375, 0.010112762451171875, 0.02156829833984375, 0.033023834228515625, 0.0444793701171875, 0.055934906005859375, 0.06739044189453125, 0.07884597778320312, 0.090301513671875, 0.10175704956054688, 0.11321258544921875, 0.12466812133789062, 0.1361236572265625, 0.14757919311523438, 0.15903472900390625, 0.17049026489257812, 0.18194580078125, 0.19340133666992188, 0.20485687255859375, 0.21631240844726562, 0.2277679443359375, 0.23922348022460938, 0.25067901611328125, 0.2621345520019531, 0.273590087890625, 0.2850456237792969, 0.29650115966796875, 0.3079566955566406, 0.3194122314453125, 0.3308677673339844, 0.34232330322265625, 0.3537788391113281, 0.365234375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 6.0, 2.0, 15.0, 13.0, 26.0, 31.0, 51.0, 81.0, 93.0, 117.0, 139.0, 125.0, 84.0, 69.0, 59.0, 39.0, 32.0, 8.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1302490234375, -0.12622451782226562, -0.12220001220703125, -0.11817550659179688, -0.1141510009765625, -0.11012649536132812, -0.10610198974609375, -0.10207748413085938, -0.098052978515625, -0.09402847290039062, -0.09000396728515625, -0.08597946166992188, -0.0819549560546875, -0.07793045043945312, -0.07390594482421875, -0.06988143920898438, -0.06585693359375, -0.061832427978515625, -0.05780792236328125, -0.053783416748046875, -0.0497589111328125, -0.045734405517578125, -0.04170989990234375, -0.037685394287109375, -0.033660888671875, -0.029636383056640625, -0.02561187744140625, -0.021587371826171875, -0.0175628662109375, -0.013538360595703125, -0.00951385498046875, -0.005489349365234375, -0.00146484375, 0.002559661865234375, 0.00658416748046875, 0.010608673095703125, 0.0146331787109375, 0.018657684326171875, 0.02268218994140625, 0.026706695556640625, 0.030731201171875, 0.034755706787109375, 0.03878021240234375, 0.042804718017578125, 0.0468292236328125, 0.050853729248046875, 0.05487823486328125, 0.058902740478515625, 0.06292724609375, 0.06695175170898438, 0.07097625732421875, 0.07500076293945312, 0.0790252685546875, 0.08304977416992188, 0.08707427978515625, 0.09109878540039062, 0.095123291015625, 0.09914779663085938, 0.10317230224609375, 0.10719680786132812, 0.1112213134765625, 0.11524581909179688, 0.11927032470703125, 0.12329483032226562, 0.1273193359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 6.0, 13.0, 5.0, 15.0, 12.0, 12.0, 22.0, 20.0, 53.0, 98.0, 200.0, 435.0, 1108.0, 2890.0, 8777.0, 33382.0, 214427.0, 696883.0, 67383.0, 15313.0, 4608.0, 1627.0, 634.0, 274.0, 131.0, 80.0, 43.0, 29.0, 13.0, 13.0, 11.0, 9.0, 7.0, 7.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.406494140625, -0.39527130126953125, -0.3840484619140625, -0.37282562255859375, -0.361602783203125, -0.35037994384765625, -0.3391571044921875, -0.32793426513671875, -0.31671142578125, -0.30548858642578125, -0.2942657470703125, -0.28304290771484375, -0.271820068359375, -0.26059722900390625, -0.2493743896484375, -0.23815155029296875, -0.2269287109375, -0.21570587158203125, -0.2044830322265625, -0.19326019287109375, -0.182037353515625, -0.17081451416015625, -0.1595916748046875, -0.14836883544921875, -0.13714599609375, -0.12592315673828125, -0.1147003173828125, -0.10347747802734375, -0.092254638671875, -0.08103179931640625, -0.0698089599609375, -0.05858612060546875, -0.04736328125, -0.03614044189453125, -0.0249176025390625, -0.01369476318359375, -0.002471923828125, 0.00875091552734375, 0.0199737548828125, 0.03119659423828125, 0.04241943359375, 0.05364227294921875, 0.0648651123046875, 0.07608795166015625, 0.087310791015625, 0.09853363037109375, 0.1097564697265625, 0.12097930908203125, 0.1322021484375, 0.14342498779296875, 0.1546478271484375, 0.16587066650390625, 0.177093505859375, 0.18831634521484375, 0.1995391845703125, 0.21076202392578125, 0.22198486328125, 0.23320770263671875, 0.2444305419921875, 0.25565338134765625, 0.266876220703125, 0.27809906005859375, 0.2893218994140625, 0.30054473876953125, 0.311767578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 8.0, 2.0, 5.0, 2.0, 7.0, 13.0, 9.0, 11.0, 13.0, 20.0, 24.0, 25.0, 23.0, 36.0, 31.0, 35.0, 31.0, 52.0, 45.0, 41.0, 59.0, 45.0, 48.0, 42.0, 37.0, 30.0, 48.0, 41.0, 30.0, 29.0, 32.0, 29.0, 24.0, 11.0, 15.0, 10.0, 7.0, 8.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1895751953125, -0.18369483947753906, -0.17781448364257812, -0.1719341278076172, -0.16605377197265625, -0.1601734161376953, -0.15429306030273438, -0.14841270446777344, -0.1425323486328125, -0.13665199279785156, -0.13077163696289062, -0.12489128112792969, -0.11901092529296875, -0.11313056945800781, -0.10725021362304688, -0.10136985778808594, -0.095489501953125, -0.08960914611816406, -0.08372879028320312, -0.07784843444824219, -0.07196807861328125, -0.06608772277832031, -0.060207366943359375, -0.05432701110839844, -0.0484466552734375, -0.04256629943847656, -0.036685943603515625, -0.030805587768554688, -0.02492523193359375, -0.019044876098632812, -0.013164520263671875, -0.0072841644287109375, -0.00140380859375, 0.0044765472412109375, 0.010356903076171875, 0.016237258911132812, 0.02211761474609375, 0.027997970581054688, 0.033878326416015625, 0.03975868225097656, 0.0456390380859375, 0.05151939392089844, 0.057399749755859375, 0.06328010559082031, 0.06916046142578125, 0.07504081726074219, 0.08092117309570312, 0.08680152893066406, 0.092681884765625, 0.09856224060058594, 0.10444259643554688, 0.11032295227050781, 0.11620330810546875, 0.12208366394042969, 0.12796401977539062, 0.13384437561035156, 0.1397247314453125, 0.14560508728027344, 0.15148544311523438, 0.1573657989501953, 0.16324615478515625, 0.1691265106201172, 0.17500686645507812, 0.18088722229003906, 0.186767578125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 10.0, 13.0, 15.0, 28.0, 48.0, 95.0, 147.0, 295.0, 831.0, 2940.0, 24686.0, 970814.0, 43025.0, 3867.0, 954.0, 367.0, 174.0, 99.0, 48.0, 31.0, 14.0, 14.0, 11.0, 4.0, 1.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06134033203125, -0.05919456481933594, -0.057048797607421875, -0.05490303039550781, -0.05275726318359375, -0.05061149597167969, -0.048465728759765625, -0.04631996154785156, -0.0441741943359375, -0.04202842712402344, -0.039882659912109375, -0.03773689270019531, -0.03559112548828125, -0.03344535827636719, -0.031299591064453125, -0.029153823852539062, -0.027008056640625, -0.024862289428710938, -0.022716522216796875, -0.020570755004882812, -0.01842498779296875, -0.016279220581054688, -0.014133453369140625, -0.011987686157226562, -0.0098419189453125, -0.0076961517333984375, -0.005550384521484375, -0.0034046173095703125, -0.00125885009765625, 0.0008869171142578125, 0.003032684326171875, 0.0051784515380859375, 0.00732421875, 0.009469985961914062, 0.011615753173828125, 0.013761520385742188, 0.01590728759765625, 0.018053054809570312, 0.020198822021484375, 0.022344589233398438, 0.0244903564453125, 0.026636123657226562, 0.028781890869140625, 0.030927658081054688, 0.03307342529296875, 0.03521919250488281, 0.037364959716796875, 0.03951072692871094, 0.041656494140625, 0.04380226135253906, 0.045948028564453125, 0.04809379577636719, 0.05023956298828125, 0.05238533020019531, 0.054531097412109375, 0.05667686462402344, 0.0588226318359375, 0.06096839904785156, 0.06311416625976562, 0.06525993347167969, 0.06740570068359375, 0.06955146789550781, 0.07169723510742188, 0.07384300231933594, 0.07598876953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 1.0, 6.0, 3.0, 11.0, 8.0, 8.0, 16.0, 22.0, 23.0, 30.0, 53.0, 51.0, 61.0, 56.0, 69.0, 63.0, 63.0, 71.0, 47.0, 55.0, 55.0, 58.0, 31.0, 41.0, 20.0, 20.0, 16.0, 10.0, 10.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.874301910400391e-06, -3.754161298274994e-06, -3.634020686149597e-06, -3.5138800740242004e-06, -3.3937394618988037e-06, -3.273598849773407e-06, -3.1534582376480103e-06, -3.0333176255226135e-06, -2.913177013397217e-06, -2.79303640127182e-06, -2.6728957891464233e-06, -2.5527551770210266e-06, -2.43261456489563e-06, -2.312473952770233e-06, -2.1923333406448364e-06, -2.0721927285194397e-06, -1.952052116394043e-06, -1.8319115042686462e-06, -1.7117708921432495e-06, -1.5916302800178528e-06, -1.471489667892456e-06, -1.3513490557670593e-06, -1.2312084436416626e-06, -1.1110678315162659e-06, -9.909272193908691e-07, -8.707866072654724e-07, -7.506459951400757e-07, -6.30505383014679e-07, -5.103647708892822e-07, -3.902241587638855e-07, -2.7008354663848877e-07, -1.4994293451309204e-07, -2.9802322387695312e-08, 9.033828973770142e-08, 2.1047890186309814e-07, 3.3061951398849487e-07, 4.507601261138916e-07, 5.709007382392883e-07, 6.910413503646851e-07, 8.111819624900818e-07, 9.313225746154785e-07, 1.0514631867408752e-06, 1.171603798866272e-06, 1.2917444109916687e-06, 1.4118850231170654e-06, 1.5320256352424622e-06, 1.6521662473678589e-06, 1.7723068594932556e-06, 1.8924474716186523e-06, 2.012588083744049e-06, 2.132728695869446e-06, 2.2528693079948425e-06, 2.3730099201202393e-06, 2.493150532245636e-06, 2.6132911443710327e-06, 2.7334317564964294e-06, 2.853572368621826e-06, 2.973712980747223e-06, 3.0938535928726196e-06, 3.2139942049980164e-06, 3.334134817123413e-06, 3.45427542924881e-06, 3.5744160413742065e-06, 3.6945566534996033e-06, 3.814697265625e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 5.0, 8.0, 10.0, 18.0, 32.0, 53.0, 79.0, 121.0, 215.0, 382.0, 918.0, 2468.0, 11176.0, 172795.0, 831081.0, 22878.0, 3995.0, 1189.0, 456.0, 278.0, 134.0, 102.0, 48.0, 37.0, 28.0, 16.0, 10.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.069091796875, -0.06723308563232422, -0.06537437438964844, -0.06351566314697266, -0.061656951904296875, -0.059798240661621094, -0.05793952941894531, -0.05608081817626953, -0.05422210693359375, -0.05236339569091797, -0.05050468444824219, -0.048645973205566406, -0.046787261962890625, -0.044928550720214844, -0.04306983947753906, -0.04121112823486328, -0.0393524169921875, -0.03749370574951172, -0.03563499450683594, -0.033776283264160156, -0.031917572021484375, -0.030058860778808594, -0.028200149536132812, -0.02634143829345703, -0.02448272705078125, -0.02262401580810547, -0.020765304565429688, -0.018906593322753906, -0.017047882080078125, -0.015189170837402344, -0.013330459594726562, -0.011471748352050781, -0.009613037109375, -0.007754325866699219, -0.0058956146240234375, -0.004036903381347656, -0.002178192138671875, -0.00031948089599609375, 0.0015392303466796875, 0.0033979415893554688, 0.00525665283203125, 0.007115364074707031, 0.008974075317382812, 0.010832786560058594, 0.012691497802734375, 0.014550209045410156, 0.016408920288085938, 0.01826763153076172, 0.0201263427734375, 0.02198505401611328, 0.023843765258789062, 0.025702476501464844, 0.027561187744140625, 0.029419898986816406, 0.03127861022949219, 0.03313732147216797, 0.03499603271484375, 0.03685474395751953, 0.03871345520019531, 0.040572166442871094, 0.042430877685546875, 0.044289588928222656, 0.04614830017089844, 0.04800701141357422, 0.04986572265625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 4.0, 11.0, 20.0, 21.0, 40.0, 52.0, 88.0, 133.0, 164.0, 181.0, 87.0, 56.0, 38.0, 28.0, 24.0, 14.0, 7.0, 5.0, 7.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.052154541015625, -0.05096173286437988, -0.049768924713134766, -0.04857611656188965, -0.04738330841064453, -0.046190500259399414, -0.0449976921081543, -0.04380488395690918, -0.04261207580566406, -0.041419267654418945, -0.04022645950317383, -0.03903365135192871, -0.037840843200683594, -0.03664803504943848, -0.03545522689819336, -0.03426241874694824, -0.033069610595703125, -0.03187680244445801, -0.03068399429321289, -0.029491186141967773, -0.028298377990722656, -0.02710556983947754, -0.025912761688232422, -0.024719953536987305, -0.023527145385742188, -0.02233433723449707, -0.021141529083251953, -0.019948720932006836, -0.01875591278076172, -0.0175631046295166, -0.016370296478271484, -0.015177488327026367, -0.01398468017578125, -0.012791872024536133, -0.011599063873291016, -0.010406255722045898, -0.009213447570800781, -0.008020639419555664, -0.006827831268310547, -0.00563502311706543, -0.0044422149658203125, -0.0032494068145751953, -0.002056598663330078, -0.0008637905120849609, 0.00032901763916015625, 0.0015218257904052734, 0.0027146339416503906, 0.003907442092895508, 0.005100250244140625, 0.006293058395385742, 0.007485866546630859, 0.008678674697875977, 0.009871482849121094, 0.011064291000366211, 0.012257099151611328, 0.013449907302856445, 0.014642715454101562, 0.01583552360534668, 0.017028331756591797, 0.018221139907836914, 0.01941394805908203, 0.02060675621032715, 0.021799564361572266, 0.022992372512817383, 0.0241851806640625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 4.0, 5.0, 10.0, 18.0, 11.0, 27.0, 34.0, 43.0, 79.0, 122.0, 150.0, 142.0, 92.0, 58.0, 44.0, 32.0, 30.0, 22.0, 14.0, 9.0, 2.0, 5.0, 5.0, 7.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0698236227035522, -1.038955807685852, -1.0080881118774414, -0.977220356464386, -0.9463526010513306, -0.9154847860336304, -0.884617030620575, -0.8537492752075195, -0.8228815197944641, -0.7920137643814087, -0.7611460089683533, -0.7302782535552979, -0.6994104385375977, -0.668542742729187, -0.6376749277114868, -0.6068071722984314, -0.575939416885376, -0.5450716614723206, -0.5142039060592651, -0.48333612084388733, -0.4524683654308319, -0.4216006100177765, -0.3907328248023987, -0.35986506938934326, -0.32899731397628784, -0.2981295585632324, -0.267261803150177, -0.2363940179347992, -0.20552626252174377, -0.17465850710868835, -0.14379073679447174, -0.11292296648025513, -0.08205515146255493, -0.051187388598918915, -0.020319625735282898, 0.010548137128353119, 0.041415899991989136, 0.07228365540504456, 0.10315142571926117, 0.13401919603347778, 0.1648869514465332, 0.19575470685958862, 0.22662247717380524, 0.25749024748802185, 0.28835800290107727, 0.3192257583141327, 0.3500935435295105, 0.3809612989425659, 0.41182905435562134, 0.44269680976867676, 0.4735645651817322, 0.5044323205947876, 0.5353001356124878, 0.5661678314208984, 0.5970356464385986, 0.627903401851654, 0.6587711572647095, 0.6896389126777649, 0.7205066680908203, 0.7513744235038757, 0.7822421789169312, 0.8131099939346313, 0.8439777493476868, 0.8748455047607422, 0.9057132601737976]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 6.0, 7.0, 2.0, 9.0, 5.0, 7.0, 13.0, 12.0, 18.0, 20.0, 23.0, 32.0, 20.0, 31.0, 31.0, 35.0, 25.0, 48.0, 41.0, 46.0, 46.0, 33.0, 52.0, 50.0, 47.0, 36.0, 34.0, 36.0, 31.0, 21.0, 26.0, 17.0, 18.0, 14.0, 18.0, 15.0, 14.0, 10.0, 6.0, 9.0, 6.0, 8.0, 8.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.674320638179779, -0.6529638171195984, -0.6316070556640625, -0.6102502346038818, -0.5888934135437012, -0.5675366520881653, -0.5461798310279846, -0.5248230695724487, -0.5034662485122681, -0.4821094572544098, -0.4607526659965515, -0.43939584493637085, -0.4180390536785126, -0.3966822624206543, -0.37532544136047363, -0.35396865010261536, -0.3326118588447571, -0.3112550675868988, -0.2898982763290405, -0.26854145526885986, -0.2471846640110016, -0.2258278727531433, -0.20447106659412384, -0.18311426043510437, -0.1617574691772461, -0.14040067791938782, -0.11904387176036835, -0.09768707305192947, -0.0763302743434906, -0.05497347563505173, -0.033616676926612854, -0.012259870767593384, 0.009096920490264893, 0.030453719198703766, 0.05181051790714264, 0.07316731661558151, 0.09452411532402039, 0.11588091403245926, 0.13723771274089813, 0.1585945188999176, 0.17995131015777588, 0.20130810141563416, 0.22266490757465363, 0.2440217137336731, 0.26537850499153137, 0.28673529624938965, 0.3080921173095703, 0.3294489085674286, 0.35080569982528687, 0.37216249108314514, 0.3935192823410034, 0.4148761034011841, 0.43623289465904236, 0.45758968591690063, 0.4789465069770813, 0.5003032684326172, 0.5216600894927979, 0.5430169105529785, 0.5643736720085144, 0.5857304930686951, 0.607087254524231, 0.6284440755844116, 0.6498008966445923, 0.671157717704773, 0.6925144791603088]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 3.0, 10.0, 16.0, 18.0, 18.0, 32.0, 36.0, 59.0, 103.0, 179.0, 390.0, 969.0, 2127.0, 6863.0, 4150832.0, 28025.0, 2545.0, 1026.0, 429.0, 253.0, 148.0, 60.0, 31.0, 25.0, 17.0, 10.0, 10.0, 8.0, 10.0, 5.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.263671875, -0.2558479309082031, -0.24802398681640625, -0.24020004272460938, -0.2323760986328125, -0.22455215454101562, -0.21672821044921875, -0.20890426635742188, -0.201080322265625, -0.19325637817382812, -0.18543243408203125, -0.17760848999023438, -0.1697845458984375, -0.16196060180664062, -0.15413665771484375, -0.14631271362304688, -0.13848876953125, -0.13066482543945312, -0.12284088134765625, -0.11501693725585938, -0.1071929931640625, -0.09936904907226562, -0.09154510498046875, -0.08372116088867188, -0.075897216796875, -0.06807327270507812, -0.06024932861328125, -0.052425384521484375, -0.0446014404296875, -0.036777496337890625, -0.02895355224609375, -0.021129608154296875, -0.0133056640625, -0.005481719970703125, 0.00234222412109375, 0.010166168212890625, 0.0179901123046875, 0.025814056396484375, 0.03363800048828125, 0.041461944580078125, 0.049285888671875, 0.057109832763671875, 0.06493377685546875, 0.07275772094726562, 0.0805816650390625, 0.08840560913085938, 0.09622955322265625, 0.10405349731445312, 0.11187744140625, 0.11970138549804688, 0.12752532958984375, 0.13534927368164062, 0.1431732177734375, 0.15099716186523438, 0.15882110595703125, 0.16664505004882812, 0.174468994140625, 0.18229293823242188, 0.19011688232421875, 0.19794082641601562, 0.2057647705078125, 0.21358871459960938, 0.22141265869140625, 0.22923660278320312, 0.237060546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 3.0, 3.0, 4.0, 12.0, 7.0, 19.0, 36.0, 46.0, 77.0, 101.0, 119.0, 139.0, 122.0, 104.0, 68.0, 54.0, 43.0, 24.0, 11.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.130615234375, -0.12659263610839844, -0.12257003784179688, -0.11854743957519531, -0.11452484130859375, -0.11050224304199219, -0.10647964477539062, -0.10245704650878906, -0.0984344482421875, -0.09441184997558594, -0.09038925170898438, -0.08636665344238281, -0.08234405517578125, -0.07832145690917969, -0.07429885864257812, -0.07027626037597656, -0.066253662109375, -0.06223106384277344, -0.058208465576171875, -0.05418586730957031, -0.05016326904296875, -0.04614067077636719, -0.042118072509765625, -0.03809547424316406, -0.0340728759765625, -0.030050277709960938, -0.026027679443359375, -0.022005081176757812, -0.01798248291015625, -0.013959884643554688, -0.009937286376953125, -0.0059146881103515625, -0.00189208984375, 0.0021305084228515625, 0.006153106689453125, 0.010175704956054688, 0.01419830322265625, 0.018220901489257812, 0.022243499755859375, 0.026266098022460938, 0.0302886962890625, 0.03431129455566406, 0.038333892822265625, 0.04235649108886719, 0.04637908935546875, 0.05040168762207031, 0.054424285888671875, 0.05844688415527344, 0.062469482421875, 0.06649208068847656, 0.07051467895507812, 0.07453727722167969, 0.07855987548828125, 0.08258247375488281, 0.08660507202148438, 0.09062767028808594, 0.0946502685546875, 0.09867286682128906, 0.10269546508789062, 0.10671806335449219, 0.11074066162109375, 0.11476325988769531, 0.11878585815429688, 0.12280845642089844, 0.1268310546875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 10.0, 20.0, 20.0, 36.0, 56.0, 88.0, 189.0, 338.0, 672.0, 1549.0, 5280.0, 3891082.0, 287645.0, 4510.0, 1449.0, 620.0, 310.0, 171.0, 88.0, 60.0, 26.0, 18.0, 13.0, 12.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275634765625, -0.26458740234375, -0.2535400390625, -0.24249267578125, -0.2314453125, -0.22039794921875, -0.2093505859375, -0.19830322265625, -0.187255859375, -0.17620849609375, -0.1651611328125, -0.15411376953125, -0.14306640625, -0.13201904296875, -0.1209716796875, -0.10992431640625, -0.098876953125, -0.08782958984375, -0.0767822265625, -0.06573486328125, -0.0546875, -0.04364013671875, -0.0325927734375, -0.02154541015625, -0.010498046875, 0.00054931640625, 0.0115966796875, 0.02264404296875, 0.03369140625, 0.04473876953125, 0.0557861328125, 0.06683349609375, 0.077880859375, 0.08892822265625, 0.0999755859375, 0.11102294921875, 0.1220703125, 0.13311767578125, 0.1441650390625, 0.15521240234375, 0.166259765625, 0.17730712890625, 0.1883544921875, 0.19940185546875, 0.21044921875, 0.22149658203125, 0.2325439453125, 0.24359130859375, 0.254638671875, 0.26568603515625, 0.2767333984375, 0.28778076171875, 0.298828125, 0.30987548828125, 0.3209228515625, 0.33197021484375, 0.343017578125, 0.35406494140625, 0.3651123046875, 0.37615966796875, 0.38720703125, 0.39825439453125, 0.4093017578125, 0.42034912109375, 0.431396484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 53.0, 985.0, 2929.0, 59.0, 13.0, 6.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06329345703125, -0.0606689453125, -0.05804443359375, -0.055419921875, -0.05279541015625, -0.0501708984375, -0.04754638671875, -0.044921875, -0.04229736328125, -0.0396728515625, -0.03704833984375, -0.034423828125, -0.03179931640625, -0.0291748046875, -0.02655029296875, -0.02392578125, -0.02130126953125, -0.0186767578125, -0.01605224609375, -0.013427734375, -0.01080322265625, -0.0081787109375, -0.00555419921875, -0.0029296875, -0.00030517578125, 0.0023193359375, 0.00494384765625, 0.007568359375, 0.01019287109375, 0.0128173828125, 0.01544189453125, 0.01806640625, 0.02069091796875, 0.0233154296875, 0.02593994140625, 0.028564453125, 0.03118896484375, 0.0338134765625, 0.03643798828125, 0.0390625, 0.04168701171875, 0.0443115234375, 0.04693603515625, 0.049560546875, 0.05218505859375, 0.0548095703125, 0.05743408203125, 0.06005859375, 0.06268310546875, 0.0653076171875, 0.06793212890625, 0.070556640625, 0.07318115234375, 0.0758056640625, 0.07843017578125, 0.0810546875, 0.08367919921875, 0.0863037109375, 0.08892822265625, 0.091552734375, 0.09417724609375, 0.0968017578125, 0.09942626953125, 0.10205078125, 0.10467529296875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 5.0, 4.0, 9.0, 16.0, 18.0, 22.0, 26.0, 28.0, 42.0, 53.0, 64.0, 78.0, 94.0, 118.0, 93.0, 76.0, 44.0, 55.0, 45.0, 29.0, 16.0, 14.0, 8.0, 6.0, 9.0, 6.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.14416152238845825, -0.13914696872234344, -0.13413240015506744, -0.12911784648895264, -0.12410327792167664, -0.11908872425556183, -0.11407416313886642, -0.10905960202217102, -0.10404504090547562, -0.09903047978878021, -0.09401591867208481, -0.0890013575553894, -0.0839868038892746, -0.0789722353219986, -0.07395768165588379, -0.06894312053918839, -0.06392855942249298, -0.05891399830579758, -0.05389943718910217, -0.04888487979769707, -0.04387031868100166, -0.03885575756430626, -0.033841200172901154, -0.02882663905620575, -0.023812077939510345, -0.01879751682281494, -0.013782957568764687, -0.008768397383391857, -0.0037538371980190277, 0.0012607239186763763, 0.006275283172726631, 0.011289842426776886, 0.01630440354347229, 0.021318964660167694, 0.02633352391421795, 0.031348083168268204, 0.03636264428496361, 0.04137720540165901, 0.04639176279306412, 0.05140632390975952, 0.056420885026454926, 0.06143544614315033, 0.06645000725984573, 0.07146456837654114, 0.07647912204265594, 0.08149369060993195, 0.08650824427604675, 0.09152280539274216, 0.09653736650943756, 0.10155192762613297, 0.10656648874282837, 0.11158104985952377, 0.11659561097621918, 0.12161016464233398, 0.12662473320960999, 0.1316392868757248, 0.1366538405418396, 0.1416683942079544, 0.1466829627752304, 0.15169751644134521, 0.15671208500862122, 0.16172663867473602, 0.16674120724201202, 0.17175576090812683, 0.17677032947540283]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 9.0, 12.0, 14.0, 11.0, 12.0, 22.0, 28.0, 23.0, 33.0, 29.0, 34.0, 42.0, 27.0, 35.0, 54.0, 53.0, 47.0, 50.0, 42.0, 42.0, 32.0, 36.0, 35.0, 38.0, 31.0, 26.0, 21.0, 26.0, 20.0, 16.0, 21.0, 13.0, 13.0, 15.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.12792688608169556, -0.12437430769205093, -0.12082173675298691, -0.11726915836334229, -0.11371658742427826, -0.11016400903463364, -0.10661143064498901, -0.10305885970592499, -0.09950628131628036, -0.09595370292663574, -0.09240113198757172, -0.0888485535979271, -0.08529597520828247, -0.08174340426921844, -0.07819082587957382, -0.0746382474899292, -0.07108567655086517, -0.06753309816122055, -0.06398052722215652, -0.0604279488325119, -0.05687537416815758, -0.05332279950380325, -0.04977022111415863, -0.046217646449804306, -0.04266507178544998, -0.03911249712109566, -0.03555992245674133, -0.03200734406709671, -0.028454769402742386, -0.02490219473838806, -0.021349618211388588, -0.017797041684389114, -0.01424446702003479, -0.010691891424357891, -0.007139315828680992, -0.003586740233004093, -3.4164637327194214e-05, 0.00351841002702713, 0.007070986554026604, 0.010623563081026077, 0.014176137745380402, 0.017728712409734726, 0.0212812889367342, 0.024833865463733673, 0.028386440128087997, 0.03193901479244232, 0.035491593182086945, 0.03904416784644127, 0.04259674251079559, 0.04614931717514992, 0.04970189183950424, 0.053254470229148865, 0.05680704489350319, 0.06035961955785751, 0.06391219794750214, 0.06746476888656616, 0.07101734727621078, 0.07456992566585541, 0.07812249660491943, 0.08167507499456406, 0.08522765338420868, 0.0887802243232727, 0.09233280271291733, 0.09588538110256195, 0.09943795204162598]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 6.0, 2.0, 5.0, 9.0, 17.0, 18.0, 27.0, 25.0, 27.0, 55.0, 57.0, 107.0, 118.0, 154.0, 257.0, 364.0, 604.0, 927.0, 1649.0, 3511.0, 8426.0, 26029.0, 111160.0, 643235.0, 191692.0, 39170.0, 11575.0, 4242.0, 1929.0, 1039.0, 635.0, 438.0, 290.0, 208.0, 153.0, 108.0, 75.0, 54.0, 53.0, 31.0, 18.0, 16.0, 14.0, 8.0, 6.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.37939453125, -0.3670158386230469, -0.35463714599609375, -0.3422584533691406, -0.3298797607421875, -0.3175010681152344, -0.30512237548828125, -0.2927436828613281, -0.280364990234375, -0.2679862976074219, -0.25560760498046875, -0.24322891235351562, -0.2308502197265625, -0.21847152709960938, -0.20609283447265625, -0.19371414184570312, -0.18133544921875, -0.16895675659179688, -0.15657806396484375, -0.14419937133789062, -0.1318206787109375, -0.11944198608398438, -0.10706329345703125, -0.09468460083007812, -0.082305908203125, -0.06992721557617188, -0.05754852294921875, -0.045169830322265625, -0.0327911376953125, -0.020412445068359375, -0.00803375244140625, 0.004344940185546875, 0.0167236328125, 0.029102325439453125, 0.04148101806640625, 0.053859710693359375, 0.0662384033203125, 0.07861709594726562, 0.09099578857421875, 0.10337448120117188, 0.115753173828125, 0.12813186645507812, 0.14051055908203125, 0.15288925170898438, 0.1652679443359375, 0.17764663696289062, 0.19002532958984375, 0.20240402221679688, 0.21478271484375, 0.22716140747070312, 0.23954010009765625, 0.2519187927246094, 0.2642974853515625, 0.2766761779785156, 0.28905487060546875, 0.3014335632324219, 0.313812255859375, 0.3261909484863281, 0.33856964111328125, 0.3509483337402344, 0.3633270263671875, 0.3757057189941406, 0.38808441162109375, 0.4004631042480469, 0.412841796875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 2.0, 12.0, 11.0, 17.0, 33.0, 48.0, 80.0, 82.0, 130.0, 128.0, 143.0, 85.0, 78.0, 53.0, 50.0, 22.0, 11.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1309814453125, -0.1269550323486328, -0.12292861938476562, -0.11890220642089844, -0.11487579345703125, -0.11084938049316406, -0.10682296752929688, -0.10279655456542969, -0.0987701416015625, -0.09474372863769531, -0.09071731567382812, -0.08669090270996094, -0.08266448974609375, -0.07863807678222656, -0.07461166381835938, -0.07058525085449219, -0.066558837890625, -0.06253242492675781, -0.058506011962890625, -0.05447959899902344, -0.05045318603515625, -0.04642677307128906, -0.042400360107421875, -0.03837394714355469, -0.0343475341796875, -0.030321121215820312, -0.026294708251953125, -0.022268295288085938, -0.01824188232421875, -0.014215469360351562, -0.010189056396484375, -0.0061626434326171875, -0.00213623046875, 0.0018901824951171875, 0.005916595458984375, 0.009943008422851562, 0.01396942138671875, 0.017995834350585938, 0.022022247314453125, 0.026048660278320312, 0.0300750732421875, 0.03410148620605469, 0.038127899169921875, 0.04215431213378906, 0.04618072509765625, 0.05020713806152344, 0.054233551025390625, 0.05825996398925781, 0.062286376953125, 0.06631278991699219, 0.07033920288085938, 0.07436561584472656, 0.07839202880859375, 0.08241844177246094, 0.08644485473632812, 0.09047126770019531, 0.0944976806640625, 0.09852409362792969, 0.10255050659179688, 0.10657691955566406, 0.11060333251953125, 0.11462974548339844, 0.11865615844726562, 0.12268257141113281, 0.126708984375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 6.0, 5.0, 9.0, 11.0, 17.0, 19.0, 24.0, 36.0, 54.0, 60.0, 105.0, 170.0, 322.0, 692.0, 1563.0, 3988.0, 11698.0, 43003.0, 265422.0, 625561.0, 69208.0, 17330.0, 5361.0, 2081.0, 864.0, 419.0, 188.0, 101.0, 69.0, 49.0, 31.0, 17.0, 11.0, 14.0, 9.0, 9.0, 6.0, 8.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.324462890625, -0.31496429443359375, -0.3054656982421875, -0.29596710205078125, -0.286468505859375, -0.27696990966796875, -0.2674713134765625, -0.25797271728515625, -0.24847412109375, -0.23897552490234375, -0.2294769287109375, -0.21997833251953125, -0.210479736328125, -0.20098114013671875, -0.1914825439453125, -0.18198394775390625, -0.1724853515625, -0.16298675537109375, -0.1534881591796875, -0.14398956298828125, -0.134490966796875, -0.12499237060546875, -0.1154937744140625, -0.10599517822265625, -0.09649658203125, -0.08699798583984375, -0.0774993896484375, -0.06800079345703125, -0.058502197265625, -0.04900360107421875, -0.0395050048828125, -0.03000640869140625, -0.0205078125, -0.01100921630859375, -0.0015106201171875, 0.00798797607421875, 0.017486572265625, 0.02698516845703125, 0.0364837646484375, 0.04598236083984375, 0.05548095703125, 0.06497955322265625, 0.0744781494140625, 0.08397674560546875, 0.093475341796875, 0.10297393798828125, 0.1124725341796875, 0.12197113037109375, 0.1314697265625, 0.14096832275390625, 0.1504669189453125, 0.15996551513671875, 0.169464111328125, 0.17896270751953125, 0.1884613037109375, 0.19795989990234375, 0.20745849609375, 0.21695709228515625, 0.2264556884765625, 0.23595428466796875, 0.245452880859375, 0.25495147705078125, 0.2644500732421875, 0.27394866943359375, 0.283447265625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 3.0, 4.0, 5.0, 7.0, 8.0, 11.0, 11.0, 19.0, 13.0, 23.0, 26.0, 27.0, 25.0, 26.0, 34.0, 50.0, 48.0, 37.0, 44.0, 46.0, 42.0, 49.0, 47.0, 47.0, 40.0, 41.0, 40.0, 37.0, 34.0, 28.0, 25.0, 18.0, 25.0, 9.0, 8.0, 7.0, 1.0, 6.0, 7.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1922607421875, -0.18677330017089844, -0.18128585815429688, -0.1757984161376953, -0.17031097412109375, -0.1648235321044922, -0.15933609008789062, -0.15384864807128906, -0.1483612060546875, -0.14287376403808594, -0.13738632202148438, -0.1318988800048828, -0.12641143798828125, -0.12092399597167969, -0.11543655395507812, -0.10994911193847656, -0.104461669921875, -0.09897422790527344, -0.09348678588867188, -0.08799934387207031, -0.08251190185546875, -0.07702445983886719, -0.07153701782226562, -0.06604957580566406, -0.0605621337890625, -0.05507469177246094, -0.049587249755859375, -0.04409980773925781, -0.03861236572265625, -0.03312492370605469, -0.027637481689453125, -0.022150039672851562, -0.01666259765625, -0.011175155639648438, -0.005687713623046875, -0.0002002716064453125, 0.00528717041015625, 0.010774612426757812, 0.016262054443359375, 0.021749496459960938, 0.0272369384765625, 0.03272438049316406, 0.038211822509765625, 0.04369926452636719, 0.04918670654296875, 0.05467414855957031, 0.060161590576171875, 0.06564903259277344, 0.071136474609375, 0.07662391662597656, 0.08211135864257812, 0.08759880065917969, 0.09308624267578125, 0.09857368469238281, 0.10406112670898438, 0.10954856872558594, 0.1150360107421875, 0.12052345275878906, 0.12601089477539062, 0.1314983367919922, 0.13698577880859375, 0.1424732208251953, 0.14796066284179688, 0.15344810485839844, 0.158935546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 11.0, 21.0, 23.0, 37.0, 47.0, 80.0, 112.0, 155.0, 236.0, 439.0, 767.0, 1911.0, 5109.0, 18052.0, 136447.0, 811830.0, 56137.0, 10907.0, 3394.0, 1354.0, 596.0, 312.0, 229.0, 105.0, 77.0, 49.0, 26.0, 13.0, 8.0, 11.0, 5.0, 5.0, 7.0, 8.0, 3.0, 1.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0271759033203125, -0.02621626853942871, -0.025256633758544922, -0.024296998977661133, -0.023337364196777344, -0.022377729415893555, -0.021418094635009766, -0.020458459854125977, -0.019498825073242188, -0.0185391902923584, -0.01757955551147461, -0.01661992073059082, -0.01566028594970703, -0.014700651168823242, -0.013741016387939453, -0.012781381607055664, -0.011821746826171875, -0.010862112045288086, -0.009902477264404297, -0.008942842483520508, -0.007983207702636719, -0.00702357292175293, -0.006063938140869141, -0.0051043033599853516, -0.0041446685791015625, -0.0031850337982177734, -0.0022253990173339844, -0.0012657642364501953, -0.00030612945556640625, 0.0006535053253173828, 0.0016131401062011719, 0.002572774887084961, 0.00353240966796875, 0.004492044448852539, 0.005451679229736328, 0.006411314010620117, 0.007370948791503906, 0.008330583572387695, 0.009290218353271484, 0.010249853134155273, 0.011209487915039062, 0.012169122695922852, 0.01312875747680664, 0.01408839225769043, 0.015048027038574219, 0.016007661819458008, 0.016967296600341797, 0.017926931381225586, 0.018886566162109375, 0.019846200942993164, 0.020805835723876953, 0.021765470504760742, 0.02272510528564453, 0.02368474006652832, 0.02464437484741211, 0.0256040096282959, 0.026563644409179688, 0.027523279190063477, 0.028482913970947266, 0.029442548751831055, 0.030402183532714844, 0.03136181831359863, 0.03232145309448242, 0.03328108787536621, 0.03424072265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 11.0, 6.0, 20.0, 22.0, 38.0, 42.0, 64.0, 93.0, 88.0, 98.0, 105.0, 92.0, 77.0, 59.0, 51.0, 41.0, 27.0, 22.0, 7.0, 20.0, 9.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.033348083496094e-06, -6.838701665401459e-06, -6.644055247306824e-06, -6.449408829212189e-06, -6.254762411117554e-06, -6.060115993022919e-06, -5.865469574928284e-06, -5.670823156833649e-06, -5.476176738739014e-06, -5.281530320644379e-06, -5.086883902549744e-06, -4.892237484455109e-06, -4.697591066360474e-06, -4.502944648265839e-06, -4.308298230171204e-06, -4.113651812076569e-06, -3.919005393981934e-06, -3.7243589758872986e-06, -3.5297125577926636e-06, -3.3350661396980286e-06, -3.1404197216033936e-06, -2.9457733035087585e-06, -2.7511268854141235e-06, -2.5564804673194885e-06, -2.3618340492248535e-06, -2.1671876311302185e-06, -1.9725412130355835e-06, -1.7778947949409485e-06, -1.5832483768463135e-06, -1.3886019587516785e-06, -1.1939555406570435e-06, -9.993091225624084e-07, -8.046627044677734e-07, -6.100162863731384e-07, -4.153698682785034e-07, -2.207234501838684e-07, -2.60770320892334e-08, 1.685693860054016e-07, 3.632158041000366e-07, 5.578622221946716e-07, 7.525086402893066e-07, 9.471550583839417e-07, 1.1418014764785767e-06, 1.3364478945732117e-06, 1.5310943126678467e-06, 1.7257407307624817e-06, 1.9203871488571167e-06, 2.1150335669517517e-06, 2.3096799850463867e-06, 2.5043264031410217e-06, 2.6989728212356567e-06, 2.8936192393302917e-06, 3.0882656574249268e-06, 3.2829120755195618e-06, 3.4775584936141968e-06, 3.6722049117088318e-06, 3.866851329803467e-06, 4.061497747898102e-06, 4.256144165992737e-06, 4.450790584087372e-06, 4.645437002182007e-06, 4.840083420276642e-06, 5.034729838371277e-06, 5.229376256465912e-06, 5.424022674560547e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 15.0, 14.0, 24.0, 44.0, 91.0, 114.0, 200.0, 434.0, 1021.0, 2661.0, 8038.0, 37280.0, 642649.0, 318004.0, 27706.0, 6415.0, 2130.0, 852.0, 413.0, 172.0, 93.0, 57.0, 42.0, 22.0, 13.0, 16.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03485107421875, -0.033759117126464844, -0.03266716003417969, -0.03157520294189453, -0.030483245849609375, -0.02939128875732422, -0.028299331665039062, -0.027207374572753906, -0.02611541748046875, -0.025023460388183594, -0.023931503295898438, -0.02283954620361328, -0.021747589111328125, -0.02065563201904297, -0.019563674926757812, -0.018471717834472656, -0.0173797607421875, -0.016287803649902344, -0.015195846557617188, -0.014103889465332031, -0.013011932373046875, -0.011919975280761719, -0.010828018188476562, -0.009736061096191406, -0.00864410400390625, -0.007552146911621094, -0.0064601898193359375, -0.005368232727050781, -0.004276275634765625, -0.0031843185424804688, -0.0020923614501953125, -0.0010004043579101562, 9.1552734375e-05, 0.0011835098266601562, 0.0022754669189453125, 0.0033674240112304688, 0.004459381103515625, 0.005551338195800781, 0.0066432952880859375, 0.007735252380371094, 0.00882720947265625, 0.009919166564941406, 0.011011123657226562, 0.012103080749511719, 0.013195037841796875, 0.014286994934082031, 0.015378952026367188, 0.016470909118652344, 0.0175628662109375, 0.018654823303222656, 0.019746780395507812, 0.02083873748779297, 0.021930694580078125, 0.02302265167236328, 0.024114608764648438, 0.025206565856933594, 0.02629852294921875, 0.027390480041503906, 0.028482437133789062, 0.02957439422607422, 0.030666351318359375, 0.03175830841064453, 0.03285026550292969, 0.033942222595214844, 0.0350341796875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 11.0, 9.0, 10.0, 13.0, 17.0, 22.0, 20.0, 34.0, 37.0, 39.0, 57.0, 58.0, 95.0, 85.0, 105.0, 83.0, 60.0, 38.0, 37.0, 33.0, 19.0, 16.0, 26.0, 17.0, 10.0, 9.0, 8.0, 2.0, 8.0, 6.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.022308349609375, -0.02170252799987793, -0.02109670639038086, -0.02049088478088379, -0.01988506317138672, -0.01927924156188965, -0.018673419952392578, -0.018067598342895508, -0.017461776733398438, -0.016855955123901367, -0.016250133514404297, -0.015644311904907227, -0.015038490295410156, -0.014432668685913086, -0.013826847076416016, -0.013221025466918945, -0.012615203857421875, -0.012009382247924805, -0.011403560638427734, -0.010797739028930664, -0.010191917419433594, -0.009586095809936523, -0.008980274200439453, -0.008374452590942383, -0.0077686309814453125, -0.007162809371948242, -0.006556987762451172, -0.0059511661529541016, -0.005345344543457031, -0.004739522933959961, -0.004133701324462891, -0.0035278797149658203, -0.00292205810546875, -0.0023162364959716797, -0.0017104148864746094, -0.001104593276977539, -0.0004987716674804688, 0.00010704994201660156, 0.0007128715515136719, 0.0013186931610107422, 0.0019245147705078125, 0.002530336380004883, 0.003136157989501953, 0.0037419795989990234, 0.004347801208496094, 0.004953622817993164, 0.005559444427490234, 0.006165266036987305, 0.006771087646484375, 0.007376909255981445, 0.007982730865478516, 0.008588552474975586, 0.009194374084472656, 0.009800195693969727, 0.010406017303466797, 0.011011838912963867, 0.011617660522460938, 0.012223482131958008, 0.012829303741455078, 0.013435125350952148, 0.014040946960449219, 0.014646768569946289, 0.01525259017944336, 0.01585841178894043, 0.0164642333984375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 4.0, 12.0, 6.0, 19.0, 18.0, 26.0, 34.0, 44.0, 60.0, 92.0, 146.0, 156.0, 99.0, 50.0, 50.0, 44.0, 25.0, 21.0, 20.0, 11.0, 9.0, 11.0, 5.0, 4.0, 2.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9857738614082336, -0.9541628360748291, -0.9225518107414246, -0.89094078540802, -0.8593297600746155, -0.8277187347412109, -0.7961076498031616, -0.7644966840744019, -0.7328855991363525, -0.701274573802948, -0.6696635484695435, -0.6380525231361389, -0.6064414978027344, -0.5748304724693298, -0.5432194471359253, -0.511608362197876, -0.4799973964691162, -0.44838637113571167, -0.41677534580230713, -0.3851643204689026, -0.35355329513549805, -0.3219422698020935, -0.2903312146663666, -0.25872018933296204, -0.2271091639995575, -0.19549813866615295, -0.1638871133327484, -0.13227607309818268, -0.10066504776477814, -0.0690540224313736, -0.03744298219680786, -0.00583195686340332, 0.025779008865356445, 0.057390037924051285, 0.08900106698274612, 0.12061209976673126, 0.1522231251001358, 0.18383415043354034, 0.21544519066810608, 0.24705621600151062, 0.27866724133491516, 0.3102782666683197, 0.34188929200172424, 0.37350034713745117, 0.4051113724708557, 0.43672239780426025, 0.4683334231376648, 0.49994444847106934, 0.5315554738044739, 0.5631664991378784, 0.594777524471283, 0.6263885498046875, 0.657999575138092, 0.6896106004714966, 0.7212216854095459, 0.7528326511383057, 0.784443736076355, 0.8160547614097595, 0.8476657867431641, 0.8792768120765686, 0.9108878374099731, 0.9424988627433777, 0.9741098880767822, 1.0057209730148315, 1.0373319387435913]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 8.0, 10.0, 8.0, 8.0, 14.0, 11.0, 16.0, 22.0, 33.0, 22.0, 33.0, 35.0, 30.0, 41.0, 53.0, 48.0, 49.0, 43.0, 53.0, 44.0, 41.0, 40.0, 43.0, 32.0, 33.0, 36.0, 31.0, 24.0, 28.0, 20.0, 17.0, 13.0, 17.0, 15.0, 8.0, 4.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7743234038352966, -0.7509793043136597, -0.7276352047920227, -0.7042911052703857, -0.680946946144104, -0.657602846622467, -0.6342587471008301, -0.6109146475791931, -0.5875705480575562, -0.5642264485359192, -0.5408823490142822, -0.5175382494926453, -0.4941941201686859, -0.47085002064704895, -0.4475058913230896, -0.42416179180145264, -0.4008176922798157, -0.3774735927581787, -0.35412949323654175, -0.3307853639125824, -0.30744126439094543, -0.28409716486930847, -0.2607530355453491, -0.23740893602371216, -0.2140648365020752, -0.19072073698043823, -0.16737662255764008, -0.14403250813484192, -0.12068840861320496, -0.0973443016409874, -0.07400019466876984, -0.05065608024597168, -0.027312040328979492, -0.003967933356761932, 0.019376173615455627, 0.04272028058767319, 0.06606438755989075, 0.0894084945321083, 0.11275260150432587, 0.13609671592712402, 0.159440815448761, 0.18278491497039795, 0.2061290293931961, 0.22947314381599426, 0.2528172433376312, 0.2761613428592682, 0.29950547218322754, 0.3228495717048645, 0.34619367122650146, 0.3695377707481384, 0.3928818702697754, 0.41622599959373474, 0.4395700991153717, 0.46291419863700867, 0.486258327960968, 0.509602427482605, 0.5329465270042419, 0.5562906265258789, 0.5796347260475159, 0.6029788255691528, 0.6263229846954346, 0.6496670842170715, 0.6730111837387085, 0.6963552832603455, 0.7196993827819824]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 9.0, 9.0, 12.0, 10.0, 15.0, 11.0, 20.0, 40.0, 36.0, 52.0, 78.0, 140.0, 215.0, 307.0, 519.0, 914.0, 1868.0, 4376.0, 15818.0, 106862.0, 3989059.0, 56743.0, 10529.0, 3480.0, 1395.0, 627.0, 324.0, 182.0, 136.0, 99.0, 89.0, 58.0, 47.0, 37.0, 36.0, 31.0, 21.0, 13.0, 13.0, 10.0, 17.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.30078125, -0.2914924621582031, -0.28220367431640625, -0.2729148864746094, -0.2636260986328125, -0.2543373107910156, -0.24504852294921875, -0.23575973510742188, -0.226470947265625, -0.21718215942382812, -0.20789337158203125, -0.19860458374023438, -0.1893157958984375, -0.18002700805664062, -0.17073822021484375, -0.16144943237304688, -0.15216064453125, -0.14287185668945312, -0.13358306884765625, -0.12429428100585938, -0.1150054931640625, -0.10571670532226562, -0.09642791748046875, -0.08713912963867188, -0.077850341796875, -0.06856155395507812, -0.05927276611328125, -0.049983978271484375, -0.0406951904296875, -0.031406402587890625, -0.02211761474609375, -0.012828826904296875, -0.0035400390625, 0.005748748779296875, 0.01503753662109375, 0.024326324462890625, 0.0336151123046875, 0.042903900146484375, 0.05219268798828125, 0.061481475830078125, 0.070770263671875, 0.08005905151367188, 0.08934783935546875, 0.09863662719726562, 0.1079254150390625, 0.11721420288085938, 0.12650299072265625, 0.13579177856445312, 0.14508056640625, 0.15436935424804688, 0.16365814208984375, 0.17294692993164062, 0.1822357177734375, 0.19152450561523438, 0.20081329345703125, 0.21010208129882812, 0.219390869140625, 0.22867965698242188, 0.23796844482421875, 0.24725723266601562, 0.2565460205078125, 0.2658348083496094, 0.27512359619140625, 0.2844123840332031, 0.293701171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 1.0, 3.0, 3.0, 7.0, 12.0, 14.0, 25.0, 44.0, 67.0, 91.0, 118.0, 143.0, 133.0, 106.0, 90.0, 58.0, 42.0, 20.0, 14.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.1275768280029297, -0.12356185913085938, -0.11954689025878906, -0.11553192138671875, -0.11151695251464844, -0.10750198364257812, -0.10348701477050781, -0.0994720458984375, -0.09545707702636719, -0.09144210815429688, -0.08742713928222656, -0.08341217041015625, -0.07939720153808594, -0.07538223266601562, -0.07136726379394531, -0.067352294921875, -0.06333732604980469, -0.059322357177734375, -0.05530738830566406, -0.05129241943359375, -0.04727745056152344, -0.043262481689453125, -0.03924751281738281, -0.0352325439453125, -0.031217575073242188, -0.027202606201171875, -0.023187637329101562, -0.01917266845703125, -0.015157699584960938, -0.011142730712890625, -0.0071277618408203125, -0.00311279296875, 0.0009021759033203125, 0.004917144775390625, 0.008932113647460938, 0.01294708251953125, 0.016962051391601562, 0.020977020263671875, 0.024991989135742188, 0.0290069580078125, 0.03302192687988281, 0.037036895751953125, 0.04105186462402344, 0.04506683349609375, 0.04908180236816406, 0.053096771240234375, 0.05711174011230469, 0.061126708984375, 0.06514167785644531, 0.06915664672851562, 0.07317161560058594, 0.07718658447265625, 0.08120155334472656, 0.08521652221679688, 0.08923149108886719, 0.0932464599609375, 0.09726142883300781, 0.10127639770507812, 0.10529136657714844, 0.10930633544921875, 0.11332130432128906, 0.11733627319335938, 0.12135124206542969, 0.1253662109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 9.0, 15.0, 26.0, 35.0, 61.0, 81.0, 181.0, 430.0, 1235.0, 4393.0, 26051.0, 3948949.0, 195436.0, 13113.0, 2723.0, 870.0, 325.0, 129.0, 90.0, 46.0, 30.0, 14.0, 17.0, 9.0, 2.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.485595703125, -0.4687461853027344, -0.45189666748046875, -0.4350471496582031, -0.4181976318359375, -0.4013481140136719, -0.38449859619140625, -0.3676490783691406, -0.350799560546875, -0.3339500427246094, -0.31710052490234375, -0.3002510070800781, -0.2834014892578125, -0.2665519714355469, -0.24970245361328125, -0.23285293579101562, -0.21600341796875, -0.19915390014648438, -0.18230438232421875, -0.16545486450195312, -0.1486053466796875, -0.13175582885742188, -0.11490631103515625, -0.09805679321289062, -0.081207275390625, -0.06435775756835938, -0.04750823974609375, -0.030658721923828125, -0.0138092041015625, 0.003040313720703125, 0.01988983154296875, 0.036739349365234375, 0.0535888671875, 0.07043838500976562, 0.08728790283203125, 0.10413742065429688, 0.1209869384765625, 0.13783645629882812, 0.15468597412109375, 0.17153549194335938, 0.188385009765625, 0.20523452758789062, 0.22208404541015625, 0.23893356323242188, 0.2557830810546875, 0.2726325988769531, 0.28948211669921875, 0.3063316345214844, 0.32318115234375, 0.3400306701660156, 0.35688018798828125, 0.3737297058105469, 0.3905792236328125, 0.4074287414550781, 0.42427825927734375, 0.4411277770996094, 0.457977294921875, 0.4748268127441406, 0.49167633056640625, 0.5085258483886719, 0.5253753662109375, 0.5422248840332031, 0.5590744018554688, 0.5759239196777344, 0.5927734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 15.0, 19.0, 16.0, 56.0, 64.0, 237.0, 2442.0, 899.0, 130.0, 54.0, 37.0, 25.0, 26.0, 10.0, 12.0, 8.0, 8.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.2962150573730469, -0.28554534912109375, -0.2748756408691406, -0.2642059326171875, -0.2535362243652344, -0.24286651611328125, -0.23219680786132812, -0.221527099609375, -0.21085739135742188, -0.20018768310546875, -0.18951797485351562, -0.1788482666015625, -0.16817855834960938, -0.15750885009765625, -0.14683914184570312, -0.13616943359375, -0.12549972534179688, -0.11483001708984375, -0.10416030883789062, -0.0934906005859375, -0.08282089233398438, -0.07215118408203125, -0.061481475830078125, -0.050811767578125, -0.040142059326171875, -0.02947235107421875, -0.018802642822265625, -0.0081329345703125, 0.002536773681640625, 0.01320648193359375, 0.023876190185546875, 0.0345458984375, 0.045215606689453125, 0.05588531494140625, 0.06655502319335938, 0.0772247314453125, 0.08789443969726562, 0.09856414794921875, 0.10923385620117188, 0.119903564453125, 0.13057327270507812, 0.14124298095703125, 0.15191268920898438, 0.1625823974609375, 0.17325210571289062, 0.18392181396484375, 0.19459152221679688, 0.20526123046875, 0.21593093872070312, 0.22660064697265625, 0.23727035522460938, 0.2479400634765625, 0.2586097717285156, 0.26927947998046875, 0.2799491882324219, 0.290618896484375, 0.3012886047363281, 0.31195831298828125, 0.3226280212402344, 0.3332977294921875, 0.3439674377441406, 0.35463714599609375, 0.3653068542480469, 0.3759765625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 6.0, 2.0, 3.0, 4.0, 5.0, 14.0, 12.0, 11.0, 16.0, 19.0, 31.0, 29.0, 57.0, 73.0, 98.0, 100.0, 96.0, 85.0, 83.0, 42.0, 32.0, 36.0, 20.0, 26.0, 19.0, 9.0, 12.0, 9.0, 2.0, 7.0, 6.0, 4.0, 5.0, 10.0, 5.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8373650312423706, -0.8077936172485352, -0.7782222628593445, -0.7486509084701538, -0.7190794944763184, -0.6895080804824829, -0.6599367260932922, -0.6303653717041016, -0.6007939577102661, -0.5712225437164307, -0.54165118932724, -0.5120798349380493, -0.48250842094421387, -0.4529370367527008, -0.42336565256118774, -0.3937942683696747, -0.3642228841781616, -0.33465149998664856, -0.3050801157951355, -0.27550873160362244, -0.24593734741210938, -0.2163659632205963, -0.18679457902908325, -0.1572231948375702, -0.12765181064605713, -0.09808042645454407, -0.068509042263031, -0.038937658071517944, -0.009366273880004883, 0.02020511031150818, 0.04977649450302124, 0.0793478786945343, 0.10891926288604736, 0.13849064707756042, 0.1680620312690735, 0.19763341546058655, 0.2272047996520996, 0.25677618384361267, 0.28634756803512573, 0.3159189522266388, 0.34549033641815186, 0.3750617206096649, 0.404633104801178, 0.43420448899269104, 0.4637758731842041, 0.49334725737571716, 0.5229186415672302, 0.5524899959564209, 0.5820614099502563, 0.6116328239440918, 0.6412041783332825, 0.6707755327224731, 0.7003469467163086, 0.729918360710144, 0.7594897150993347, 0.7890610694885254, 0.8186324834823608, 0.8482038974761963, 0.877775251865387, 0.9073466062545776, 0.9369180202484131, 0.9664894342422485, 0.9960607886314392, 1.0256321430206299, 1.0552035570144653]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 9.0, 12.0, 16.0, 13.0, 20.0, 26.0, 25.0, 23.0, 34.0, 30.0, 44.0, 45.0, 54.0, 51.0, 56.0, 50.0, 50.0, 45.0, 48.0, 45.0, 30.0, 24.0, 31.0, 28.0, 27.0, 29.0, 29.0, 24.0, 22.0, 8.0, 12.0, 9.0, 6.0, 6.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.9891502261161804, -0.9606451392173767, -0.932140052318573, -0.9036349654197693, -0.8751299381256104, -0.8466248512268066, -0.8181197643280029, -0.7896146774291992, -0.7611095905303955, -0.7326045036315918, -0.7040994167327881, -0.6755943298339844, -0.6470892429351807, -0.618584156036377, -0.590079128742218, -0.5615740418434143, -0.5330689549446106, -0.5045638680458069, -0.4760587811470032, -0.44755372405052185, -0.41904863715171814, -0.39054355025291443, -0.3620384931564331, -0.3335334062576294, -0.3050283193588257, -0.276523232460022, -0.24801816046237946, -0.21951308846473694, -0.19100800156593323, -0.16250291466712952, -0.133997842669487, -0.10549277067184448, -0.076987624168396, -0.04848254472017288, -0.019977465271949768, 0.008527614176273346, 0.03703269362449646, 0.06553778052330017, 0.09404285252094269, 0.1225479245185852, 0.15105301141738892, 0.17955809831619263, 0.20806317031383514, 0.23656824231147766, 0.26507332921028137, 0.2935784161090851, 0.3220834732055664, 0.3505885601043701, 0.37909364700317383, 0.40759873390197754, 0.43610382080078125, 0.4646088778972626, 0.4931139647960663, 0.5216190814971924, 0.5501241087913513, 0.578629195690155, 0.6071342825889587, 0.6356393694877625, 0.6641444563865662, 0.6926495432853699, 0.7211545705795288, 0.7496596574783325, 0.7781647443771362, 0.8066698312759399, 0.8351749181747437]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 13.0, 8.0, 14.0, 13.0, 21.0, 25.0, 41.0, 61.0, 70.0, 88.0, 102.0, 160.0, 206.0, 289.0, 403.0, 614.0, 1026.0, 1929.0, 4037.0, 10413.0, 33085.0, 139426.0, 660004.0, 143033.0, 33689.0, 10472.0, 4072.0, 1916.0, 1123.0, 656.0, 465.0, 316.0, 182.0, 140.0, 124.0, 84.0, 68.0, 40.0, 30.0, 33.0, 18.0, 17.0, 10.0, 11.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.383056640625, -0.3708992004394531, -0.35874176025390625, -0.3465843200683594, -0.3344268798828125, -0.3222694396972656, -0.31011199951171875, -0.2979545593261719, -0.285797119140625, -0.2736396789550781, -0.26148223876953125, -0.24932479858398438, -0.2371673583984375, -0.22500991821289062, -0.21285247802734375, -0.20069503784179688, -0.18853759765625, -0.17638015747070312, -0.16422271728515625, -0.15206527709960938, -0.1399078369140625, -0.12775039672851562, -0.11559295654296875, -0.10343551635742188, -0.091278076171875, -0.07912063598632812, -0.06696319580078125, -0.054805755615234375, -0.0426483154296875, -0.030490875244140625, -0.01833343505859375, -0.006175994873046875, 0.0059814453125, 0.018138885498046875, 0.03029632568359375, 0.042453765869140625, 0.0546112060546875, 0.06676864624023438, 0.07892608642578125, 0.09108352661132812, 0.103240966796875, 0.11539840698242188, 0.12755584716796875, 0.13971328735351562, 0.1518707275390625, 0.16402816772460938, 0.17618560791015625, 0.18834304809570312, 0.20050048828125, 0.21265792846679688, 0.22481536865234375, 0.23697280883789062, 0.2491302490234375, 0.2612876892089844, 0.27344512939453125, 0.2856025695800781, 0.297760009765625, 0.3099174499511719, 0.32207489013671875, 0.3342323303222656, 0.3463897705078125, 0.3585472106933594, 0.37070465087890625, 0.3828620910644531, 0.39501953125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 2.0, 1.0, 13.0, 8.0, 19.0, 25.0, 44.0, 69.0, 95.0, 104.0, 150.0, 135.0, 106.0, 76.0, 69.0, 35.0, 27.0, 10.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1326904296875, -0.12863540649414062, -0.12458038330078125, -0.12052536010742188, -0.1164703369140625, -0.11241531372070312, -0.10836029052734375, -0.10430526733398438, -0.100250244140625, -0.09619522094726562, -0.09214019775390625, -0.08808517456054688, -0.0840301513671875, -0.07997512817382812, -0.07592010498046875, -0.07186508178710938, -0.06781005859375, -0.06375503540039062, -0.05970001220703125, -0.055644989013671875, -0.0515899658203125, -0.047534942626953125, -0.04347991943359375, -0.039424896240234375, -0.035369873046875, -0.031314849853515625, -0.02725982666015625, -0.023204803466796875, -0.0191497802734375, -0.015094757080078125, -0.01103973388671875, -0.006984710693359375, -0.0029296875, 0.001125335693359375, 0.00518035888671875, 0.009235382080078125, 0.0132904052734375, 0.017345428466796875, 0.02140045166015625, 0.025455474853515625, 0.029510498046875, 0.033565521240234375, 0.03762054443359375, 0.041675567626953125, 0.0457305908203125, 0.049785614013671875, 0.05384063720703125, 0.057895660400390625, 0.06195068359375, 0.06600570678710938, 0.07006072998046875, 0.07411575317382812, 0.0781707763671875, 0.08222579956054688, 0.08628082275390625, 0.09033584594726562, 0.094390869140625, 0.09844589233398438, 0.10250091552734375, 0.10655593872070312, 0.1106109619140625, 0.11466598510742188, 0.11872100830078125, 0.12277603149414062, 0.1268310546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 5.0, 3.0, 6.0, 9.0, 16.0, 12.0, 21.0, 26.0, 30.0, 49.0, 98.0, 142.0, 251.0, 481.0, 1057.0, 2542.0, 6943.0, 22419.0, 103818.0, 750558.0, 122475.0, 24935.0, 7527.0, 2754.0, 1177.0, 526.0, 255.0, 146.0, 73.0, 59.0, 36.0, 33.0, 15.0, 15.0, 4.0, 8.0, 5.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.38671875, -0.37445831298828125, -0.3621978759765625, -0.34993743896484375, -0.337677001953125, -0.32541656494140625, -0.3131561279296875, -0.30089569091796875, -0.28863525390625, -0.27637481689453125, -0.2641143798828125, -0.25185394287109375, -0.239593505859375, -0.22733306884765625, -0.2150726318359375, -0.20281219482421875, -0.1905517578125, -0.17829132080078125, -0.1660308837890625, -0.15377044677734375, -0.141510009765625, -0.12924957275390625, -0.1169891357421875, -0.10472869873046875, -0.09246826171875, -0.08020782470703125, -0.0679473876953125, -0.05568695068359375, -0.043426513671875, -0.03116607666015625, -0.0189056396484375, -0.00664520263671875, 0.005615234375, 0.01787567138671875, 0.0301361083984375, 0.04239654541015625, 0.054656982421875, 0.06691741943359375, 0.0791778564453125, 0.09143829345703125, 0.10369873046875, 0.11595916748046875, 0.1282196044921875, 0.14048004150390625, 0.152740478515625, 0.16500091552734375, 0.1772613525390625, 0.18952178955078125, 0.2017822265625, 0.21404266357421875, 0.2263031005859375, 0.23856353759765625, 0.250823974609375, 0.26308441162109375, 0.2753448486328125, 0.28760528564453125, 0.29986572265625, 0.31212615966796875, 0.3243865966796875, 0.33664703369140625, 0.348907470703125, 0.36116790771484375, 0.3734283447265625, 0.38568878173828125, 0.39794921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 15.0, 10.0, 12.0, 20.0, 11.0, 16.0, 19.0, 32.0, 22.0, 30.0, 44.0, 44.0, 49.0, 69.0, 44.0, 40.0, 61.0, 41.0, 45.0, 46.0, 42.0, 38.0, 35.0, 36.0, 27.0, 28.0, 16.0, 17.0, 20.0, 14.0, 5.0, 4.0, 10.0, 4.0, 8.0, 3.0, 7.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.20703125, -0.20044326782226562, -0.19385528564453125, -0.18726730346679688, -0.1806793212890625, -0.17409133911132812, -0.16750335693359375, -0.16091537475585938, -0.154327392578125, -0.14773941040039062, -0.14115142822265625, -0.13456344604492188, -0.1279754638671875, -0.12138748168945312, -0.11479949951171875, -0.10821151733398438, -0.10162353515625, -0.09503555297851562, -0.08844757080078125, -0.08185958862304688, -0.0752716064453125, -0.06868362426757812, -0.06209564208984375, -0.055507659912109375, -0.048919677734375, -0.042331695556640625, -0.03574371337890625, -0.029155731201171875, -0.0225677490234375, -0.015979766845703125, -0.00939178466796875, -0.002803802490234375, 0.0037841796875, 0.010372161865234375, 0.01696014404296875, 0.023548126220703125, 0.0301361083984375, 0.036724090576171875, 0.04331207275390625, 0.049900054931640625, 0.056488037109375, 0.06307601928710938, 0.06966400146484375, 0.07625198364257812, 0.0828399658203125, 0.08942794799804688, 0.09601593017578125, 0.10260391235351562, 0.10919189453125, 0.11577987670898438, 0.12236785888671875, 0.12895584106445312, 0.1355438232421875, 0.14213180541992188, 0.14871978759765625, 0.15530776977539062, 0.161895751953125, 0.16848373413085938, 0.17507171630859375, 0.18165969848632812, 0.1882476806640625, 0.19483566284179688, 0.20142364501953125, 0.20801162719726562, 0.214599609375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 18.0, 24.0, 19.0, 42.0, 43.0, 63.0, 73.0, 144.0, 231.0, 366.0, 685.0, 1258.0, 2647.0, 6709.0, 22903.0, 168480.0, 766309.0, 57691.0, 12462.0, 4220.0, 1862.0, 890.0, 522.0, 324.0, 188.0, 111.0, 70.0, 44.0, 33.0, 32.0, 31.0, 13.0, 14.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.02490234375, -0.02410602569580078, -0.023309707641601562, -0.022513389587402344, -0.021717071533203125, -0.020920753479003906, -0.020124435424804688, -0.01932811737060547, -0.01853179931640625, -0.01773548126220703, -0.016939163208007812, -0.016142845153808594, -0.015346527099609375, -0.014550209045410156, -0.013753890991210938, -0.012957572937011719, -0.0121612548828125, -0.011364936828613281, -0.010568618774414062, -0.009772300720214844, -0.008975982666015625, -0.008179664611816406, -0.0073833465576171875, -0.006587028503417969, -0.00579071044921875, -0.004994392395019531, -0.0041980743408203125, -0.0034017562866210938, -0.002605438232421875, -0.0018091201782226562, -0.0010128021240234375, -0.00021648406982421875, 0.000579833984375, 0.0013761520385742188, 0.0021724700927734375, 0.0029687881469726562, 0.003765106201171875, 0.004561424255371094, 0.0053577423095703125, 0.006154060363769531, 0.00695037841796875, 0.007746696472167969, 0.008543014526367188, 0.009339332580566406, 0.010135650634765625, 0.010931968688964844, 0.011728286743164062, 0.012524604797363281, 0.0133209228515625, 0.014117240905761719, 0.014913558959960938, 0.015709877014160156, 0.016506195068359375, 0.017302513122558594, 0.018098831176757812, 0.01889514923095703, 0.01969146728515625, 0.02048778533935547, 0.021284103393554688, 0.022080421447753906, 0.022876739501953125, 0.023673057556152344, 0.024469375610351562, 0.02526569366455078, 0.02606201171875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 10.0, 7.0, 5.0, 13.0, 16.0, 15.0, 20.0, 34.0, 25.0, 31.0, 47.0, 60.0, 48.0, 68.0, 80.0, 66.0, 61.0, 61.0, 53.0, 46.0, 47.0, 56.0, 24.0, 24.0, 13.0, 15.0, 14.0, 11.0, 12.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7550926208496094e-06, -3.627501428127289e-06, -3.4999102354049683e-06, -3.3723190426826477e-06, -3.244727849960327e-06, -3.1171366572380066e-06, -2.989545464515686e-06, -2.8619542717933655e-06, -2.734363079071045e-06, -2.6067718863487244e-06, -2.479180693626404e-06, -2.3515895009040833e-06, -2.2239983081817627e-06, -2.096407115459442e-06, -1.9688159227371216e-06, -1.841224730014801e-06, -1.7136335372924805e-06, -1.58604234457016e-06, -1.4584511518478394e-06, -1.3308599591255188e-06, -1.2032687664031982e-06, -1.0756775736808777e-06, -9.480863809585571e-07, -8.204951882362366e-07, -6.92903995513916e-07, -5.653128027915955e-07, -4.377216100692749e-07, -3.1013041734695435e-07, -1.825392246246338e-07, -5.494803190231323e-08, 7.264316082000732e-08, 2.0023435354232788e-07, 3.2782554626464844e-07, 4.55416738986969e-07, 5.830079317092896e-07, 7.105991244316101e-07, 8.381903171539307e-07, 9.657815098762512e-07, 1.0933727025985718e-06, 1.2209638953208923e-06, 1.3485550880432129e-06, 1.4761462807655334e-06, 1.603737473487854e-06, 1.7313286662101746e-06, 1.8589198589324951e-06, 1.9865110516548157e-06, 2.1141022443771362e-06, 2.2416934370994568e-06, 2.3692846298217773e-06, 2.496875822544098e-06, 2.6244670152664185e-06, 2.752058207988739e-06, 2.8796494007110596e-06, 3.00724059343338e-06, 3.1348317861557007e-06, 3.2624229788780212e-06, 3.390014171600342e-06, 3.5176053643226624e-06, 3.645196557044983e-06, 3.7727877497673035e-06, 3.900378942489624e-06, 4.027970135211945e-06, 4.155561327934265e-06, 4.283152520656586e-06, 4.410743713378906e-06]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 7.0, 6.0, 8.0, 10.0, 16.0, 22.0, 55.0, 77.0, 136.0, 245.0, 547.0, 1021.0, 2484.0, 8040.0, 45403.0, 858822.0, 111977.0, 13366.0, 3606.0, 1377.0, 591.0, 310.0, 189.0, 93.0, 60.0, 31.0, 19.0, 15.0, 3.0, 7.0, 4.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031005859375, -0.029695987701416016, -0.02838611602783203, -0.027076244354248047, -0.025766372680664062, -0.024456501007080078, -0.023146629333496094, -0.02183675765991211, -0.020526885986328125, -0.01921701431274414, -0.017907142639160156, -0.016597270965576172, -0.015287399291992188, -0.013977527618408203, -0.012667655944824219, -0.011357784271240234, -0.01004791259765625, -0.008738040924072266, -0.007428169250488281, -0.006118297576904297, -0.0048084259033203125, -0.003498554229736328, -0.0021886825561523438, -0.0008788108825683594, 0.000431060791015625, 0.0017409324645996094, 0.0030508041381835938, 0.004360675811767578, 0.0056705474853515625, 0.006980419158935547, 0.008290290832519531, 0.009600162506103516, 0.0109100341796875, 0.012219905853271484, 0.013529777526855469, 0.014839649200439453, 0.016149520874023438, 0.017459392547607422, 0.018769264221191406, 0.02007913589477539, 0.021389007568359375, 0.02269887924194336, 0.024008750915527344, 0.025318622589111328, 0.026628494262695312, 0.027938365936279297, 0.02924823760986328, 0.030558109283447266, 0.03186798095703125, 0.033177852630615234, 0.03448772430419922, 0.0357975959777832, 0.03710746765136719, 0.03841733932495117, 0.039727210998535156, 0.04103708267211914, 0.042346954345703125, 0.04365682601928711, 0.044966697692871094, 0.04627656936645508, 0.04758644104003906, 0.04889631271362305, 0.05020618438720703, 0.051516056060791016, 0.052825927734375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 6.0, 7.0, 5.0, 15.0, 12.0, 13.0, 20.0, 26.0, 38.0, 62.0, 69.0, 83.0, 101.0, 118.0, 104.0, 76.0, 45.0, 45.0, 41.0, 21.0, 22.0, 19.0, 8.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01849365234375, -0.01781296730041504, -0.017132282257080078, -0.016451597213745117, -0.015770912170410156, -0.015090227127075195, -0.014409542083740234, -0.013728857040405273, -0.013048171997070312, -0.012367486953735352, -0.01168680191040039, -0.01100611686706543, -0.010325431823730469, -0.009644746780395508, -0.008964061737060547, -0.008283376693725586, -0.007602691650390625, -0.006922006607055664, -0.006241321563720703, -0.005560636520385742, -0.004879951477050781, -0.00419926643371582, -0.0035185813903808594, -0.0028378963470458984, -0.0021572113037109375, -0.0014765262603759766, -0.0007958412170410156, -0.00011515617370605469, 0.0005655288696289062, 0.0012462139129638672, 0.0019268989562988281, 0.002607583999633789, 0.00328826904296875, 0.003968954086303711, 0.004649639129638672, 0.005330324172973633, 0.006011009216308594, 0.006691694259643555, 0.007372379302978516, 0.008053064346313477, 0.008733749389648438, 0.009414434432983398, 0.01009511947631836, 0.01077580451965332, 0.011456489562988281, 0.012137174606323242, 0.012817859649658203, 0.013498544692993164, 0.014179229736328125, 0.014859914779663086, 0.015540599822998047, 0.016221284866333008, 0.01690196990966797, 0.01758265495300293, 0.01826333999633789, 0.01894402503967285, 0.019624710083007812, 0.020305395126342773, 0.020986080169677734, 0.021666765213012695, 0.022347450256347656, 0.023028135299682617, 0.023708820343017578, 0.02438950538635254, 0.0250701904296875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 8.0, 13.0, 10.0, 10.0, 18.0, 25.0, 31.0, 36.0, 55.0, 98.0, 172.0, 171.0, 106.0, 65.0, 39.0, 42.0, 24.0, 12.0, 17.0, 9.0, 10.0, 6.0, 7.0, 5.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3879806995391846, -1.3484047651290894, -1.3088289499282837, -1.2692530155181885, -1.2296770811080933, -1.190101146697998, -1.1505253314971924, -1.1109493970870972, -1.071373462677002, -1.0317975282669067, -0.9922216534614563, -0.9526457786560059, -0.9130698442459106, -0.8734939694404602, -0.8339180946350098, -0.7943421602249146, -0.7547663450241089, -0.7151904702186584, -0.6756145358085632, -0.6360386610031128, -0.5964627265930176, -0.5568868517875671, -0.5173109769821167, -0.47773507237434387, -0.43815916776657104, -0.3985832631587982, -0.3590073585510254, -0.31943148374557495, -0.2798555791378021, -0.2402796745300293, -0.20070378482341766, -0.16112789511680603, -0.12155210971832275, -0.08197621256113052, -0.04240031540393829, -0.0028244182467460632, 0.03675147891044617, 0.076327383518219, 0.11590327322483063, 0.15547916293144226, 0.1950550675392151, 0.23463097214698792, 0.27420687675476074, 0.3137827515602112, 0.353358656167984, 0.39293456077575684, 0.4325104355812073, 0.4720863401889801, 0.5116622447967529, 0.5512381196022034, 0.5908140540122986, 0.630389928817749, 0.6699658632278442, 0.7095417380332947, 0.7491176128387451, 0.7886935472488403, 0.8282694220542908, 0.8678452968597412, 0.9074212312698364, 0.9469971060752869, 0.9865729808807373, 1.0261489152908325, 1.0657248497009277, 1.1053006649017334, 1.1448765993118286]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 12.0, 8.0, 6.0, 12.0, 18.0, 19.0, 25.0, 25.0, 38.0, 33.0, 35.0, 48.0, 57.0, 59.0, 55.0, 72.0, 67.0, 59.0, 53.0, 53.0, 22.0, 41.0, 34.0, 28.0, 14.0, 21.0, 18.0, 14.0, 13.0, 6.0, 8.0, 7.0, 5.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.788846492767334, -0.7593479752540588, -0.7298494577407837, -0.7003509998321533, -0.6708524823188782, -0.641353964805603, -0.6118555068969727, -0.5823569893836975, -0.5528584718704224, -0.5233599543571472, -0.49386146664619446, -0.4643629789352417, -0.43486446142196655, -0.4053659439086914, -0.37586745619773865, -0.3463689684867859, -0.31687045097351074, -0.2873719334602356, -0.25787344574928284, -0.22837494313716888, -0.19887644052505493, -0.16937793791294098, -0.13987943530082703, -0.11038093268871307, -0.08088243007659912, -0.05138392746448517, -0.021885424852371216, 0.007613077759742737, 0.03711158037185669, 0.06661008298397064, 0.0961085855960846, 0.12560708820819855, 0.1551055908203125, 0.18460409343242645, 0.2141025960445404, 0.24360109865665436, 0.2730996012687683, 0.30259811878204346, 0.3320966064929962, 0.361595094203949, 0.3910936117172241, 0.42059212923049927, 0.450090616941452, 0.4795891046524048, 0.5090876221656799, 0.5385861396789551, 0.5680845975875854, 0.5975831151008606, 0.6270816326141357, 0.6565801501274109, 0.686078667640686, 0.7155771255493164, 0.7450756430625916, 0.7745741605758667, 0.8040726184844971, 0.8335711359977722, 0.8630696535110474, 0.8925681710243225, 0.9220666885375977, 0.951565146446228, 0.9810636639595032, 1.0105621814727783, 1.0400606393814087, 1.0695592164993286, 1.099057674407959]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 0.0, 4.0, 5.0, 12.0, 5.0, 12.0, 12.0, 35.0, 27.0, 42.0, 69.0, 117.0, 155.0, 280.0, 523.0, 1106.0, 2516.0, 10612.0, 316847.0, 3840547.0, 14992.0, 3618.0, 1312.0, 626.0, 287.0, 155.0, 94.0, 61.0, 41.0, 31.0, 21.0, 16.0, 26.0, 15.0, 5.0, 10.0, 6.0, 11.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.31787109375, -0.30828094482421875, -0.2986907958984375, -0.28910064697265625, -0.279510498046875, -0.26992034912109375, -0.2603302001953125, -0.25074005126953125, -0.24114990234375, -0.23155975341796875, -0.2219696044921875, -0.21237945556640625, -0.202789306640625, -0.19319915771484375, -0.1836090087890625, -0.17401885986328125, -0.1644287109375, -0.15483856201171875, -0.1452484130859375, -0.13565826416015625, -0.126068115234375, -0.11647796630859375, -0.1068878173828125, -0.09729766845703125, -0.08770751953125, -0.07811737060546875, -0.0685272216796875, -0.05893707275390625, -0.049346923828125, -0.03975677490234375, -0.0301666259765625, -0.02057647705078125, -0.010986328125, -0.00139617919921875, 0.0081939697265625, 0.01778411865234375, 0.027374267578125, 0.03696441650390625, 0.0465545654296875, 0.05614471435546875, 0.06573486328125, 0.07532501220703125, 0.0849151611328125, 0.09450531005859375, 0.104095458984375, 0.11368560791015625, 0.1232757568359375, 0.13286590576171875, 0.1424560546875, 0.15204620361328125, 0.1616363525390625, 0.17122650146484375, 0.180816650390625, 0.19040679931640625, 0.1999969482421875, 0.20958709716796875, 0.21917724609375, 0.22876739501953125, 0.2383575439453125, 0.24794769287109375, 0.257537841796875, 0.26712799072265625, 0.2767181396484375, 0.28630828857421875, 0.2958984375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 7.0, 12.0, 18.0, 25.0, 43.0, 76.0, 93.0, 119.0, 134.0, 132.0, 116.0, 70.0, 59.0, 47.0, 26.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.12756729125976562, -0.12354278564453125, -0.11951828002929688, -0.1154937744140625, -0.11146926879882812, -0.10744476318359375, -0.10342025756835938, -0.099395751953125, -0.09537124633789062, -0.09134674072265625, -0.08732223510742188, -0.0832977294921875, -0.07927322387695312, -0.07524871826171875, -0.07122421264648438, -0.06719970703125, -0.06317520141601562, -0.05915069580078125, -0.055126190185546875, -0.0511016845703125, -0.047077178955078125, -0.04305267333984375, -0.039028167724609375, -0.035003662109375, -0.030979156494140625, -0.02695465087890625, -0.022930145263671875, -0.0189056396484375, -0.014881134033203125, -0.01085662841796875, -0.006832122802734375, -0.0028076171875, 0.001216888427734375, 0.00524139404296875, 0.009265899658203125, 0.0132904052734375, 0.017314910888671875, 0.02133941650390625, 0.025363922119140625, 0.029388427734375, 0.033412933349609375, 0.03743743896484375, 0.041461944580078125, 0.0454864501953125, 0.049510955810546875, 0.05353546142578125, 0.057559967041015625, 0.06158447265625, 0.06560897827148438, 0.06963348388671875, 0.07365798950195312, 0.0776824951171875, 0.08170700073242188, 0.08573150634765625, 0.08975601196289062, 0.093780517578125, 0.09780502319335938, 0.10182952880859375, 0.10585403442382812, 0.1098785400390625, 0.11390304565429688, 0.11792755126953125, 0.12195205688476562, 0.1259765625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 7.0, 7.0, 17.0, 23.0, 35.0, 66.0, 102.0, 172.0, 316.0, 567.0, 1158.0, 2985.0, 10593.0, 157758.0, 3991929.0, 20747.0, 4710.0, 1677.0, 730.0, 294.0, 167.0, 91.0, 47.0, 28.0, 13.0, 11.0, 11.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5361328125, -0.522796630859375, -0.50946044921875, -0.496124267578125, -0.4827880859375, -0.469451904296875, -0.45611572265625, -0.442779541015625, -0.429443359375, -0.416107177734375, -0.40277099609375, -0.389434814453125, -0.3760986328125, -0.362762451171875, -0.34942626953125, -0.336090087890625, -0.32275390625, -0.309417724609375, -0.29608154296875, -0.282745361328125, -0.2694091796875, -0.256072998046875, -0.24273681640625, -0.229400634765625, -0.216064453125, -0.202728271484375, -0.18939208984375, -0.176055908203125, -0.1627197265625, -0.149383544921875, -0.13604736328125, -0.122711181640625, -0.109375, -0.096038818359375, -0.08270263671875, -0.069366455078125, -0.0560302734375, -0.042694091796875, -0.02935791015625, -0.016021728515625, -0.002685546875, 0.010650634765625, 0.02398681640625, 0.037322998046875, 0.0506591796875, 0.063995361328125, 0.07733154296875, 0.090667724609375, 0.10400390625, 0.117340087890625, 0.13067626953125, 0.144012451171875, 0.1573486328125, 0.170684814453125, 0.18402099609375, 0.197357177734375, 0.210693359375, 0.224029541015625, 0.23736572265625, 0.250701904296875, 0.2640380859375, 0.277374267578125, 0.29071044921875, 0.304046630859375, 0.3173828125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 1.0, 8.0, 12.0, 15.0, 10.0, 21.0, 52.0, 160.0, 744.0, 2431.0, 419.0, 93.0, 37.0, 11.0, 12.0, 8.0, 6.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.292724609375, -0.2862691879272461, -0.2798137664794922, -0.2733583450317383, -0.2669029235839844, -0.26044750213623047, -0.25399208068847656, -0.24753665924072266, -0.24108123779296875, -0.23462581634521484, -0.22817039489746094, -0.22171497344970703, -0.21525955200195312, -0.20880413055419922, -0.2023487091064453, -0.1958932876586914, -0.1894378662109375, -0.1829824447631836, -0.1765270233154297, -0.17007160186767578, -0.16361618041992188, -0.15716075897216797, -0.15070533752441406, -0.14424991607666016, -0.13779449462890625, -0.13133907318115234, -0.12488365173339844, -0.11842823028564453, -0.11197280883789062, -0.10551738739013672, -0.09906196594238281, -0.0926065444946289, -0.086151123046875, -0.0796957015991211, -0.07324028015136719, -0.06678485870361328, -0.060329437255859375, -0.05387401580810547, -0.04741859436035156, -0.040963172912597656, -0.03450775146484375, -0.028052330017089844, -0.021596908569335938, -0.015141487121582031, -0.008686065673828125, -0.0022306442260742188, 0.0042247772216796875, 0.010680198669433594, 0.0171356201171875, 0.023591041564941406, 0.030046463012695312, 0.03650188446044922, 0.042957305908203125, 0.04941272735595703, 0.05586814880371094, 0.062323570251464844, 0.06877899169921875, 0.07523441314697266, 0.08168983459472656, 0.08814525604248047, 0.09460067749023438, 0.10105609893798828, 0.10751152038574219, 0.1139669418334961, 0.12042236328125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 11.0, 7.0, 8.0, 17.0, 11.0, 20.0, 34.0, 44.0, 74.0, 80.0, 131.0, 148.0, 125.0, 90.0, 49.0, 34.0, 29.0, 16.0, 15.0, 12.0, 5.0, 10.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8662604093551636, -0.8405233025550842, -0.8147861957550049, -0.7890490889549255, -0.7633119821548462, -0.7375748753547668, -0.7118377685546875, -0.6861007213592529, -0.6603635549545288, -0.6346264481544495, -0.6088893413543701, -0.5831522345542908, -0.5574151277542114, -0.5316780209541321, -0.5059409141540527, -0.4802038371562958, -0.4544667601585388, -0.4287296533584595, -0.4029925465583801, -0.3772554397583008, -0.35151833295822144, -0.3257812261581421, -0.30004414916038513, -0.2743070423603058, -0.24856993556022644, -0.2228328287601471, -0.19709572196006775, -0.1713586300611496, -0.14562152326107025, -0.1198844164609909, -0.09414732456207275, -0.06841021776199341, -0.04267305135726929, -0.01693594828248024, 0.008801154792308807, 0.034538254141807556, 0.0602753609418869, 0.08601246774196625, 0.1117495596408844, 0.13748666644096375, 0.1632237732410431, 0.18896088004112244, 0.21469798684120178, 0.24043507874011993, 0.2661721706390381, 0.29190927743911743, 0.3176463842391968, 0.3433834910392761, 0.36912059783935547, 0.3948577046394348, 0.42059481143951416, 0.4463319182395935, 0.47206902503967285, 0.4978061318397522, 0.5235432386398315, 0.5492802858352661, 0.5750174522399902, 0.6007545590400696, 0.6264916658401489, 0.6522287726402283, 0.6779658794403076, 0.703702986240387, 0.7294400930404663, 0.7551771402359009, 0.7809142470359802]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 5.0, 8.0, 9.0, 10.0, 13.0, 13.0, 13.0, 20.0, 18.0, 27.0, 20.0, 29.0, 42.0, 38.0, 41.0, 40.0, 29.0, 49.0, 40.0, 34.0, 45.0, 39.0, 54.0, 53.0, 39.0, 26.0, 34.0, 22.0, 20.0, 24.0, 14.0, 27.0, 12.0, 18.0, 13.0, 13.0, 7.0, 8.0, 2.0, 7.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4660479426383972, -0.4512972831726074, -0.4365466237068176, -0.42179596424102783, -0.40704530477523804, -0.39229464530944824, -0.37754398584365845, -0.36279329657554626, -0.34804263710975647, -0.3332919776439667, -0.3185413181781769, -0.3037906587123871, -0.2890399992465973, -0.2742893099784851, -0.2595386505126953, -0.24478799104690552, -0.23003734648227692, -0.21528668701648712, -0.20053602755069733, -0.18578535318374634, -0.17103469371795654, -0.15628403425216675, -0.14153337478637695, -0.12678271532058716, -0.11203204840421677, -0.09728138893842697, -0.08253072202205658, -0.06778006255626678, -0.05302939936518669, -0.0382787361741066, -0.023528076708316803, -0.008777409791946411, 0.005973249673843384, 0.020723912864923477, 0.03547457605600357, 0.050225235521793365, 0.06497590243816376, 0.07972656190395355, 0.09447722136974335, 0.10922788828611374, 0.12397854775190353, 0.13872921466827393, 0.15347987413406372, 0.16823053359985352, 0.1829811930656433, 0.1977318525314331, 0.2124825119972229, 0.2272331863641739, 0.24198384582996368, 0.2567345201969147, 0.27148517966270447, 0.28623583912849426, 0.30098649859428406, 0.31573715806007385, 0.33048781752586365, 0.34523847699165344, 0.35998913645744324, 0.37473979592323303, 0.3894904553890228, 0.4042411148548126, 0.4189917743206024, 0.4337424635887146, 0.4484931230545044, 0.4632437825202942, 0.477994441986084]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 10.0, 6.0, 12.0, 16.0, 19.0, 23.0, 25.0, 44.0, 53.0, 77.0, 117.0, 160.0, 200.0, 346.0, 498.0, 863.0, 1603.0, 3201.0, 8333.0, 29015.0, 157193.0, 700016.0, 110813.0, 22431.0, 6988.0, 2771.0, 1422.0, 763.0, 463.0, 326.0, 216.0, 122.0, 102.0, 98.0, 48.0, 38.0, 24.0, 22.0, 21.0, 13.0, 7.0, 8.0, 8.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.435546875, -0.4216804504394531, -0.40781402587890625, -0.3939476013183594, -0.3800811767578125, -0.3662147521972656, -0.35234832763671875, -0.3384819030761719, -0.324615478515625, -0.3107490539550781, -0.29688262939453125, -0.2830162048339844, -0.2691497802734375, -0.2552833557128906, -0.24141693115234375, -0.22755050659179688, -0.21368408203125, -0.19981765747070312, -0.18595123291015625, -0.17208480834960938, -0.1582183837890625, -0.14435195922851562, -0.13048553466796875, -0.11661911010742188, -0.102752685546875, -0.08888626098632812, -0.07501983642578125, -0.061153411865234375, -0.0472869873046875, -0.033420562744140625, -0.01955413818359375, -0.005687713623046875, 0.0081787109375, 0.022045135498046875, 0.03591156005859375, 0.049777984619140625, 0.0636444091796875, 0.07751083374023438, 0.09137725830078125, 0.10524368286132812, 0.119110107421875, 0.13297653198242188, 0.14684295654296875, 0.16070938110351562, 0.1745758056640625, 0.18844223022460938, 0.20230865478515625, 0.21617507934570312, 0.23004150390625, 0.24390792846679688, 0.25777435302734375, 0.2716407775878906, 0.2855072021484375, 0.2993736267089844, 0.31324005126953125, 0.3271064758300781, 0.340972900390625, 0.3548393249511719, 0.36870574951171875, 0.3825721740722656, 0.3964385986328125, 0.4103050231933594, 0.42417144775390625, 0.4380378723144531, 0.451904296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 9.0, 10.0, 14.0, 32.0, 38.0, 78.0, 83.0, 126.0, 137.0, 127.0, 114.0, 81.0, 62.0, 42.0, 20.0, 9.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1319580078125, -0.12792587280273438, -0.12389373779296875, -0.11986160278320312, -0.1158294677734375, -0.11179733276367188, -0.10776519775390625, -0.10373306274414062, -0.099700927734375, -0.09566879272460938, -0.09163665771484375, -0.08760452270507812, -0.0835723876953125, -0.07954025268554688, -0.07550811767578125, -0.07147598266601562, -0.06744384765625, -0.06341171264648438, -0.05937957763671875, -0.055347442626953125, -0.0513153076171875, -0.047283172607421875, -0.04325103759765625, -0.039218902587890625, -0.035186767578125, -0.031154632568359375, -0.02712249755859375, -0.023090362548828125, -0.0190582275390625, -0.015026092529296875, -0.01099395751953125, -0.006961822509765625, -0.0029296875, 0.001102447509765625, 0.00513458251953125, 0.009166717529296875, 0.0131988525390625, 0.017230987548828125, 0.02126312255859375, 0.025295257568359375, 0.029327392578125, 0.033359527587890625, 0.03739166259765625, 0.041423797607421875, 0.0454559326171875, 0.049488067626953125, 0.05352020263671875, 0.057552337646484375, 0.06158447265625, 0.06561660766601562, 0.06964874267578125, 0.07368087768554688, 0.0777130126953125, 0.08174514770507812, 0.08577728271484375, 0.08980941772460938, 0.093841552734375, 0.09787368774414062, 0.10190582275390625, 0.10593795776367188, 0.1099700927734375, 0.11400222778320312, 0.11803436279296875, 0.12206649780273438, 0.1260986328125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 10.0, 14.0, 20.0, 16.0, 28.0, 30.0, 76.0, 103.0, 197.0, 419.0, 896.0, 2358.0, 6445.0, 22423.0, 107657.0, 752790.0, 119700.0, 23945.0, 7015.0, 2413.0, 993.0, 435.0, 203.0, 98.0, 77.0, 48.0, 28.0, 17.0, 21.0, 13.0, 10.0, 9.0, 7.0, 9.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.414794921875, -0.40120697021484375, -0.3876190185546875, -0.37403106689453125, -0.360443115234375, -0.34685516357421875, -0.3332672119140625, -0.31967926025390625, -0.30609130859375, -0.29250335693359375, -0.2789154052734375, -0.26532745361328125, -0.251739501953125, -0.23815155029296875, -0.2245635986328125, -0.21097564697265625, -0.1973876953125, -0.18379974365234375, -0.1702117919921875, -0.15662384033203125, -0.143035888671875, -0.12944793701171875, -0.1158599853515625, -0.10227203369140625, -0.08868408203125, -0.07509613037109375, -0.0615081787109375, -0.04792022705078125, -0.034332275390625, -0.02074432373046875, -0.0071563720703125, 0.00643157958984375, 0.02001953125, 0.03360748291015625, 0.0471954345703125, 0.06078338623046875, 0.074371337890625, 0.08795928955078125, 0.1015472412109375, 0.11513519287109375, 0.12872314453125, 0.14231109619140625, 0.1558990478515625, 0.16948699951171875, 0.183074951171875, 0.19666290283203125, 0.2102508544921875, 0.22383880615234375, 0.2374267578125, 0.25101470947265625, 0.2646026611328125, 0.27819061279296875, 0.291778564453125, 0.30536651611328125, 0.3189544677734375, 0.33254241943359375, 0.34613037109375, 0.35971832275390625, 0.3733062744140625, 0.38689422607421875, 0.400482177734375, 0.41407012939453125, 0.4276580810546875, 0.44124603271484375, 0.454833984375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 3.0, 7.0, 20.0, 12.0, 13.0, 16.0, 16.0, 29.0, 22.0, 28.0, 49.0, 40.0, 33.0, 49.0, 39.0, 47.0, 45.0, 45.0, 53.0, 52.0, 40.0, 37.0, 35.0, 33.0, 30.0, 30.0, 20.0, 30.0, 26.0, 15.0, 11.0, 9.0, 11.0, 10.0, 8.0, 11.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1834716796875, -0.17737579345703125, -0.1712799072265625, -0.16518402099609375, -0.159088134765625, -0.15299224853515625, -0.1468963623046875, -0.14080047607421875, -0.13470458984375, -0.12860870361328125, -0.1225128173828125, -0.11641693115234375, -0.110321044921875, -0.10422515869140625, -0.0981292724609375, -0.09203338623046875, -0.0859375, -0.07984161376953125, -0.0737457275390625, -0.06764984130859375, -0.061553955078125, -0.05545806884765625, -0.0493621826171875, -0.04326629638671875, -0.03717041015625, -0.03107452392578125, -0.0249786376953125, -0.01888275146484375, -0.012786865234375, -0.00669097900390625, -0.0005950927734375, 0.00550079345703125, 0.0115966796875, 0.01769256591796875, 0.0237884521484375, 0.02988433837890625, 0.035980224609375, 0.04207611083984375, 0.0481719970703125, 0.05426788330078125, 0.06036376953125, 0.06645965576171875, 0.0725555419921875, 0.07865142822265625, 0.084747314453125, 0.09084320068359375, 0.0969390869140625, 0.10303497314453125, 0.109130859375, 0.11522674560546875, 0.1213226318359375, 0.12741851806640625, 0.133514404296875, 0.13961029052734375, 0.1457061767578125, 0.15180206298828125, 0.15789794921875, 0.16399383544921875, 0.1700897216796875, 0.17618560791015625, 0.182281494140625, 0.18837738037109375, 0.1944732666015625, 0.20056915283203125, 0.2066650390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 11.0, 20.0, 18.0, 29.0, 55.0, 68.0, 83.0, 172.0, 244.0, 425.0, 708.0, 1276.0, 3074.0, 7341.0, 22827.0, 115391.0, 759033.0, 103775.0, 21156.0, 6838.0, 2898.0, 1271.0, 705.0, 420.0, 235.0, 150.0, 115.0, 66.0, 40.0, 29.0, 14.0, 13.0, 8.0, 8.0, 13.0, 10.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0281829833984375, -0.027365446090698242, -0.026547908782958984, -0.025730371475219727, -0.02491283416748047, -0.02409529685974121, -0.023277759552001953, -0.022460222244262695, -0.021642684936523438, -0.02082514762878418, -0.020007610321044922, -0.019190073013305664, -0.018372535705566406, -0.01755499839782715, -0.01673746109008789, -0.015919923782348633, -0.015102386474609375, -0.014284849166870117, -0.01346731185913086, -0.012649774551391602, -0.011832237243652344, -0.011014699935913086, -0.010197162628173828, -0.00937962532043457, -0.008562088012695312, -0.007744550704956055, -0.006927013397216797, -0.006109476089477539, -0.005291938781738281, -0.0044744014739990234, -0.0036568641662597656, -0.002839326858520508, -0.00202178955078125, -0.0012042522430419922, -0.0003867149353027344, 0.00043082237243652344, 0.0012483596801757812, 0.002065896987915039, 0.002883434295654297, 0.0037009716033935547, 0.0045185089111328125, 0.00533604621887207, 0.006153583526611328, 0.006971120834350586, 0.007788658142089844, 0.008606195449829102, 0.00942373275756836, 0.010241270065307617, 0.011058807373046875, 0.011876344680786133, 0.01269388198852539, 0.013511419296264648, 0.014328956604003906, 0.015146493911743164, 0.015964031219482422, 0.01678156852722168, 0.017599105834960938, 0.018416643142700195, 0.019234180450439453, 0.02005171775817871, 0.02086925506591797, 0.021686792373657227, 0.022504329681396484, 0.023321866989135742, 0.024139404296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 9.0, 8.0, 10.0, 20.0, 22.0, 24.0, 54.0, 51.0, 80.0, 58.0, 93.0, 119.0, 60.0, 92.0, 71.0, 41.0, 43.0, 47.0, 25.0, 12.0, 22.0, 11.0, 8.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.377696990966797e-06, -6.216578185558319e-06, -6.055459380149841e-06, -5.8943405747413635e-06, -5.733221769332886e-06, -5.572102963924408e-06, -5.41098415851593e-06, -5.249865353107452e-06, -5.088746547698975e-06, -4.927627742290497e-06, -4.766508936882019e-06, -4.605390131473541e-06, -4.4442713260650635e-06, -4.283152520656586e-06, -4.122033715248108e-06, -3.96091490983963e-06, -3.7997961044311523e-06, -3.6386772990226746e-06, -3.4775584936141968e-06, -3.316439688205719e-06, -3.155320882797241e-06, -2.9942020773887634e-06, -2.8330832719802856e-06, -2.671964466571808e-06, -2.51084566116333e-06, -2.3497268557548523e-06, -2.1886080503463745e-06, -2.0274892449378967e-06, -1.866370439529419e-06, -1.7052516341209412e-06, -1.5441328287124634e-06, -1.3830140233039856e-06, -1.2218952178955078e-06, -1.06077641248703e-06, -8.996576070785522e-07, -7.385388016700745e-07, -5.774199962615967e-07, -4.163011908531189e-07, -2.551823854446411e-07, -9.406358003616333e-08, 6.705522537231445e-08, 2.2817403078079224e-07, 3.8929283618927e-07, 5.504116415977478e-07, 7.115304470062256e-07, 8.726492524147034e-07, 1.0337680578231812e-06, 1.194886863231659e-06, 1.3560056686401367e-06, 1.5171244740486145e-06, 1.6782432794570923e-06, 1.83936208486557e-06, 2.000480890274048e-06, 2.1615996956825256e-06, 2.3227185010910034e-06, 2.483837306499481e-06, 2.644956111907959e-06, 2.8060749173164368e-06, 2.9671937227249146e-06, 3.1283125281333923e-06, 3.28943133354187e-06, 3.450550138950348e-06, 3.6116689443588257e-06, 3.7727877497673035e-06, 3.933906555175781e-06]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 9.0, 16.0, 34.0, 36.0, 69.0, 185.0, 395.0, 1147.0, 4215.0, 26291.0, 809721.0, 189029.0, 13370.0, 2611.0, 805.0, 301.0, 128.0, 71.0, 45.0, 29.0, 12.0, 4.0, 13.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06829833984375, -0.06621837615966797, -0.06413841247558594, -0.062058448791503906, -0.059978485107421875, -0.057898521423339844, -0.05581855773925781, -0.05373859405517578, -0.05165863037109375, -0.04957866668701172, -0.04749870300292969, -0.045418739318847656, -0.043338775634765625, -0.041258811950683594, -0.03917884826660156, -0.03709888458251953, -0.0350189208984375, -0.03293895721435547, -0.030858993530273438, -0.028779029846191406, -0.026699066162109375, -0.024619102478027344, -0.022539138793945312, -0.02045917510986328, -0.01837921142578125, -0.01629924774169922, -0.014219284057617188, -0.012139320373535156, -0.010059356689453125, -0.007979393005371094, -0.0058994293212890625, -0.0038194656372070312, -0.001739501953125, 0.00034046173095703125, 0.0024204254150390625, 0.004500389099121094, 0.006580352783203125, 0.008660316467285156, 0.010740280151367188, 0.012820243835449219, 0.01490020751953125, 0.01698017120361328, 0.019060134887695312, 0.021140098571777344, 0.023220062255859375, 0.025300025939941406, 0.027379989624023438, 0.02945995330810547, 0.0315399169921875, 0.03361988067626953, 0.03569984436035156, 0.037779808044433594, 0.039859771728515625, 0.041939735412597656, 0.04401969909667969, 0.04609966278076172, 0.04817962646484375, 0.05025959014892578, 0.05233955383300781, 0.054419517517089844, 0.056499481201171875, 0.058579444885253906, 0.06065940856933594, 0.06273937225341797, 0.0648193359375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 10.0, 18.0, 24.0, 30.0, 56.0, 69.0, 99.0, 135.0, 128.0, 124.0, 92.0, 58.0, 42.0, 29.0, 27.0, 17.0, 10.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035919189453125, -0.03483867645263672, -0.03375816345214844, -0.032677650451660156, -0.031597137451171875, -0.030516624450683594, -0.029436111450195312, -0.02835559844970703, -0.02727508544921875, -0.02619457244873047, -0.025114059448242188, -0.024033546447753906, -0.022953033447265625, -0.021872520446777344, -0.020792007446289062, -0.01971149444580078, -0.0186309814453125, -0.01755046844482422, -0.016469955444335938, -0.015389442443847656, -0.014308929443359375, -0.013228416442871094, -0.012147903442382812, -0.011067390441894531, -0.00998687744140625, -0.008906364440917969, -0.007825851440429688, -0.006745338439941406, -0.005664825439453125, -0.004584312438964844, -0.0035037994384765625, -0.0024232864379882812, -0.0013427734375, -0.00026226043701171875, 0.0008182525634765625, 0.0018987655639648438, 0.002979278564453125, 0.004059791564941406, 0.0051403045654296875, 0.006220817565917969, 0.00730133056640625, 0.008381843566894531, 0.009462356567382812, 0.010542869567871094, 0.011623382568359375, 0.012703895568847656, 0.013784408569335938, 0.014864921569824219, 0.0159454345703125, 0.01702594757080078, 0.018106460571289062, 0.019186973571777344, 0.020267486572265625, 0.021347999572753906, 0.022428512573242188, 0.02350902557373047, 0.02458953857421875, 0.02567005157470703, 0.026750564575195312, 0.027831077575683594, 0.028911590576171875, 0.029992103576660156, 0.031072616577148438, 0.03215312957763672, 0.033233642578125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 3.0, 9.0, 16.0, 21.0, 63.0, 138.0, 375.0, 209.0, 82.0, 38.0, 23.0, 10.0, 8.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.806081771850586, -3.722672939300537, -3.6392641067504883, -3.5558550357818604, -3.4724462032318115, -3.3890373706817627, -3.305628538131714, -3.222219467163086, -3.138810634613037, -3.0554018020629883, -2.9719929695129395, -2.8885838985443115, -2.8051750659942627, -2.721766233444214, -2.638357400894165, -2.554948329925537, -2.4715394973754883, -2.3881306648254395, -2.3047218322753906, -2.2213127613067627, -2.137903928756714, -2.054495096206665, -1.9710862636566162, -1.8876773118972778, -1.8042685985565186, -1.7208597660064697, -1.6374508142471313, -1.5540419816970825, -1.4706330299377441, -1.3872241973876953, -1.3038153648376465, -1.220406413078308, -1.1369975805282593, -1.0535887479782104, -0.9701797962188721, -0.8867709636688232, -0.8033620119094849, -0.719953179359436, -0.6365442872047424, -0.5531353950500488, -0.4697265028953552, -0.3863176107406616, -0.302908718585968, -0.2194998562335968, -0.1360909640789032, -0.052682071924209595, 0.03072679042816162, 0.11413568258285522, 0.19754457473754883, 0.28095346689224243, 0.36436235904693604, 0.44777122139930725, 0.5311801433563232, 0.6145889759063721, 0.6979978680610657, 0.7814067602157593, 0.8648156523704529, 0.9482245445251465, 1.0316333770751953, 1.1150423288345337, 1.1984511613845825, 1.281860113143921, 1.3652689456939697, 1.4486777782440186, 1.532086730003357]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 7.0, 5.0, 10.0, 6.0, 15.0, 10.0, 15.0, 24.0, 27.0, 31.0, 35.0, 47.0, 47.0, 55.0, 76.0, 81.0, 63.0, 66.0, 58.0, 62.0, 43.0, 51.0, 30.0, 25.0, 24.0, 25.0, 18.0, 11.0, 6.0, 6.0, 6.0, 9.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7111654281616211, -0.6802897453308105, -0.6494140625, -0.6185383796691895, -0.5876626968383789, -0.5567870140075684, -0.5259113311767578, -0.49503564834594727, -0.4641599655151367, -0.43328428268432617, -0.4024085998535156, -0.3715329170227051, -0.34065723419189453, -0.309781551361084, -0.27890586853027344, -0.2480301707983017, -0.21715447306632996, -0.1862787902355194, -0.15540310740470886, -0.12452741712331772, -0.09365173429250717, -0.06277604401111603, -0.03190036118030548, -0.001024678349494934, 0.029851004481315613, 0.06072668731212616, 0.0916023701429367, 0.12247806042432785, 0.153353750705719, 0.18422943353652954, 0.2151051163673401, 0.24598079919815063, 0.2768564820289612, 0.30773216485977173, 0.3386078476905823, 0.3694835305213928, 0.40035921335220337, 0.4312348961830139, 0.46211057901382446, 0.492986261844635, 0.5238619446754456, 0.5547376275062561, 0.5856133103370667, 0.6164889931678772, 0.6473646759986877, 0.6782403588294983, 0.7091160416603088, 0.7399917244911194, 0.7708674669265747, 0.8017431497573853, 0.8326188325881958, 0.8634945154190063, 0.8943701982498169, 0.9252458810806274, 0.956121563911438, 0.9869972467422485, 1.017872929573059, 1.0487486124038696, 1.0796242952346802, 1.1104999780654907, 1.1413756608963013, 1.1722513437271118, 1.2031270265579224, 1.234002709388733, 1.2648783922195435]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 3.0, 7.0, 9.0, 18.0, 11.0, 24.0, 40.0, 47.0, 77.0, 115.0, 220.0, 404.0, 768.0, 1860.0, 5796.0, 40034.0, 4093063.0, 42065.0, 6228.0, 1872.0, 680.0, 338.0, 166.0, 124.0, 71.0, 53.0, 35.0, 36.0, 32.0, 12.0, 16.0, 14.0, 7.0, 10.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.387939453125, -0.3763618469238281, -0.36478424072265625, -0.3532066345214844, -0.3416290283203125, -0.3300514221191406, -0.31847381591796875, -0.3068962097167969, -0.295318603515625, -0.2837409973144531, -0.27216339111328125, -0.2605857849121094, -0.2490081787109375, -0.23743057250976562, -0.22585296630859375, -0.21427536010742188, -0.20269775390625, -0.19112014770507812, -0.17954254150390625, -0.16796493530273438, -0.1563873291015625, -0.14480972290039062, -0.13323211669921875, -0.12165451049804688, -0.110076904296875, -0.09849929809570312, -0.08692169189453125, -0.07534408569335938, -0.0637664794921875, -0.052188873291015625, -0.04061126708984375, -0.029033660888671875, -0.0174560546875, -0.005878448486328125, 0.00569915771484375, 0.017276763916015625, 0.0288543701171875, 0.040431976318359375, 0.05200958251953125, 0.06358718872070312, 0.075164794921875, 0.08674240112304688, 0.09832000732421875, 0.10989761352539062, 0.1214752197265625, 0.13305282592773438, 0.14463043212890625, 0.15620803833007812, 0.16778564453125, 0.17936325073242188, 0.19094085693359375, 0.20251846313476562, 0.2140960693359375, 0.22567367553710938, 0.23725128173828125, 0.24882888793945312, 0.260406494140625, 0.2719841003417969, 0.28356170654296875, 0.2951393127441406, 0.3067169189453125, 0.3182945251464844, 0.32987213134765625, 0.3414497375488281, 0.35302734375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 4.0, 2.0, 5.0, 12.0, 10.0, 20.0, 37.0, 59.0, 89.0, 120.0, 134.0, 147.0, 110.0, 92.0, 68.0, 40.0, 26.0, 13.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1318359375, -0.12784385681152344, -0.12385177612304688, -0.11985969543457031, -0.11586761474609375, -0.11187553405761719, -0.10788345336914062, -0.10389137268066406, -0.0998992919921875, -0.09590721130371094, -0.09191513061523438, -0.08792304992675781, -0.08393096923828125, -0.07993888854980469, -0.07594680786132812, -0.07195472717285156, -0.067962646484375, -0.06397056579589844, -0.059978485107421875, -0.05598640441894531, -0.05199432373046875, -0.04800224304199219, -0.044010162353515625, -0.04001808166503906, -0.0360260009765625, -0.03203392028808594, -0.028041839599609375, -0.024049758911132812, -0.02005767822265625, -0.016065597534179688, -0.012073516845703125, -0.008081436157226562, -0.00408935546875, -9.72747802734375e-05, 0.003894805908203125, 0.007886886596679688, 0.01187896728515625, 0.015871047973632812, 0.019863128662109375, 0.023855209350585938, 0.0278472900390625, 0.03183937072753906, 0.035831451416015625, 0.03982353210449219, 0.04381561279296875, 0.04780769348144531, 0.051799774169921875, 0.05579185485839844, 0.059783935546875, 0.06377601623535156, 0.06776809692382812, 0.07176017761230469, 0.07575225830078125, 0.07974433898925781, 0.08373641967773438, 0.08772850036621094, 0.0917205810546875, 0.09571266174316406, 0.09970474243164062, 0.10369682312011719, 0.10768890380859375, 0.11168098449707031, 0.11567306518554688, 0.11966514587402344, 0.1236572265625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 8.0, 10.0, 17.0, 17.0, 20.0, 42.0, 81.0, 150.0, 237.0, 497.0, 1044.0, 2604.0, 7816.0, 39868.0, 4032808.0, 92489.0, 10963.0, 3152.0, 1239.0, 581.0, 281.0, 139.0, 86.0, 48.0, 33.0, 29.0, 8.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4108848571777344, -0.39867401123046875, -0.3864631652832031, -0.3742523193359375, -0.3620414733886719, -0.34983062744140625, -0.3376197814941406, -0.325408935546875, -0.3131980895996094, -0.30098724365234375, -0.2887763977050781, -0.2765655517578125, -0.2643547058105469, -0.25214385986328125, -0.23993301391601562, -0.22772216796875, -0.21551132202148438, -0.20330047607421875, -0.19108963012695312, -0.1788787841796875, -0.16666793823242188, -0.15445709228515625, -0.14224624633789062, -0.130035400390625, -0.11782455444335938, -0.10561370849609375, -0.09340286254882812, -0.0811920166015625, -0.06898117065429688, -0.05677032470703125, -0.044559478759765625, -0.0323486328125, -0.020137786865234375, -0.00792694091796875, 0.004283905029296875, 0.0164947509765625, 0.028705596923828125, 0.04091644287109375, 0.053127288818359375, 0.065338134765625, 0.07754898071289062, 0.08975982666015625, 0.10197067260742188, 0.1141815185546875, 0.12639236450195312, 0.13860321044921875, 0.15081405639648438, 0.16302490234375, 0.17523574829101562, 0.18744659423828125, 0.19965744018554688, 0.2118682861328125, 0.22407913208007812, 0.23628997802734375, 0.24850082397460938, 0.260711669921875, 0.2729225158691406, 0.28513336181640625, 0.2973442077636719, 0.3095550537109375, 0.3217658996582031, 0.33397674560546875, 0.3461875915527344, 0.3583984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 4.0, 5.0, 12.0, 6.0, 11.0, 13.0, 25.0, 31.0, 80.0, 285.0, 1371.0, 1767.0, 268.0, 61.0, 36.0, 21.0, 24.0, 9.0, 10.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2462158203125, -0.2391986846923828, -0.23218154907226562, -0.22516441345214844, -0.21814727783203125, -0.21113014221191406, -0.20411300659179688, -0.1970958709716797, -0.1900787353515625, -0.1830615997314453, -0.17604446411132812, -0.16902732849121094, -0.16201019287109375, -0.15499305725097656, -0.14797592163085938, -0.1409587860107422, -0.133941650390625, -0.1269245147705078, -0.11990737915039062, -0.11289024353027344, -0.10587310791015625, -0.09885597229003906, -0.09183883666992188, -0.08482170104980469, -0.0778045654296875, -0.07078742980957031, -0.06377029418945312, -0.05675315856933594, -0.04973602294921875, -0.04271888732910156, -0.035701751708984375, -0.028684616088867188, -0.02166748046875, -0.014650344848632812, -0.007633209228515625, -0.0006160736083984375, 0.00640106201171875, 0.013418197631835938, 0.020435333251953125, 0.027452468872070312, 0.0344696044921875, 0.04148674011230469, 0.048503875732421875, 0.05552101135253906, 0.06253814697265625, 0.06955528259277344, 0.07657241821289062, 0.08358955383300781, 0.090606689453125, 0.09762382507324219, 0.10464096069335938, 0.11165809631347656, 0.11867523193359375, 0.12569236755371094, 0.13270950317382812, 0.1397266387939453, 0.1467437744140625, 0.1537609100341797, 0.16077804565429688, 0.16779518127441406, 0.17481231689453125, 0.18182945251464844, 0.18884658813476562, 0.1958637237548828, 0.202880859375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 6.0, 5.0, 11.0, 15.0, 8.0, 17.0, 15.0, 25.0, 30.0, 46.0, 51.0, 66.0, 83.0, 114.0, 110.0, 87.0, 84.0, 52.0, 30.0, 25.0, 27.0, 19.0, 17.0, 12.0, 11.0, 6.0, 4.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7743282914161682, -0.7510244846343994, -0.7277206778526306, -0.7044168710708618, -0.6811130046844482, -0.6578091979026794, -0.6345053911209106, -0.6112015843391418, -0.587897777557373, -0.5645939707756042, -0.5412901639938354, -0.5179863572120667, -0.49468252062797546, -0.47137871384620667, -0.4480748772621155, -0.4247710704803467, -0.4014672636985779, -0.3781634569168091, -0.3548596501350403, -0.3315558135509491, -0.3082520067691803, -0.2849481999874115, -0.2616443634033203, -0.2383405566215515, -0.21503674983978271, -0.19173294305801392, -0.16842912137508392, -0.14512529969215393, -0.12182149291038513, -0.09851767867803574, -0.07521386444568634, -0.05191004276275635, -0.028606176376342773, -0.005302362143993378, 0.018001452088356018, 0.041305266320705414, 0.06460908055305481, 0.0879128947854042, 0.1112167090177536, 0.1345205307006836, 0.1578243374824524, 0.1811281442642212, 0.20443196594715118, 0.22773578763008118, 0.25103959441185, 0.2743434011936188, 0.29764723777770996, 0.32095104455947876, 0.34425485134124756, 0.36755865812301636, 0.39086246490478516, 0.41416630148887634, 0.43747010827064514, 0.46077391505241394, 0.4840777516365051, 0.5073815584182739, 0.5306853652000427, 0.5539891719818115, 0.5772929787635803, 0.6005967855453491, 0.6239006519317627, 0.6472044587135315, 0.6705082654953003, 0.6938120722770691, 0.7171158790588379]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 9.0, 10.0, 5.0, 18.0, 17.0, 13.0, 15.0, 17.0, 27.0, 25.0, 26.0, 32.0, 38.0, 32.0, 38.0, 43.0, 47.0, 44.0, 35.0, 58.0, 40.0, 49.0, 59.0, 42.0, 34.0, 43.0, 32.0, 25.0, 32.0, 15.0, 16.0, 14.0, 12.0, 11.0, 7.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.6696813702583313, -0.6511761546134949, -0.6326709389686584, -0.614165723323822, -0.5956605076789856, -0.5771552920341492, -0.5586500763893127, -0.5401449203491211, -0.5216397047042847, -0.5031344890594482, -0.4846292734146118, -0.4661240577697754, -0.44761884212493896, -0.42911362648010254, -0.4106084406375885, -0.3921032249927521, -0.37359797954559326, -0.35509276390075684, -0.3365875482559204, -0.318082332611084, -0.29957711696624756, -0.28107190132141113, -0.2625667154788971, -0.24406149983406067, -0.22555628418922424, -0.20705106854438782, -0.1885458528995514, -0.17004065215587616, -0.15153543651103973, -0.1330302208662033, -0.11452501267194748, -0.09601980447769165, -0.07751452922821045, -0.05900931730866432, -0.040504105389118195, -0.021998893469572067, -0.00349368155002594, 0.015011534094810486, 0.033516742289066315, 0.052021950483322144, 0.07052716612815857, 0.089032381772995, 0.10753758996725082, 0.12604279816150665, 0.14454801380634308, 0.1630532294511795, 0.18155843019485474, 0.20006364583969116, 0.2185688614845276, 0.237074077129364, 0.25557929277420044, 0.27408450841903687, 0.2925897240638733, 0.3110949397087097, 0.32960012555122375, 0.3481053411960602, 0.3666105568408966, 0.38511577248573303, 0.40362098813056946, 0.4221262037754059, 0.4406313896179199, 0.45913660526275635, 0.4776418209075928, 0.4961470365524292, 0.5146522521972656]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 9.0, 15.0, 15.0, 17.0, 18.0, 38.0, 29.0, 52.0, 71.0, 88.0, 107.0, 138.0, 192.0, 253.0, 347.0, 450.0, 797.0, 1257.0, 2407.0, 5327.0, 14313.0, 47405.0, 244105.0, 604921.0, 86885.0, 23244.0, 7968.0, 3281.0, 1658.0, 988.0, 580.0, 414.0, 289.0, 215.0, 164.0, 112.0, 92.0, 62.0, 49.0, 50.0, 34.0, 28.0, 18.0, 15.0, 8.0, 7.0, 4.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328369140625, -0.3175010681152344, -0.30663299560546875, -0.2957649230957031, -0.2848968505859375, -0.2740287780761719, -0.26316070556640625, -0.2522926330566406, -0.241424560546875, -0.23055648803710938, -0.21968841552734375, -0.20882034301757812, -0.1979522705078125, -0.18708419799804688, -0.17621612548828125, -0.16534805297851562, -0.15447998046875, -0.14361190795898438, -0.13274383544921875, -0.12187576293945312, -0.1110076904296875, -0.10013961791992188, -0.08927154541015625, -0.07840347290039062, -0.067535400390625, -0.056667327880859375, -0.04579925537109375, -0.034931182861328125, -0.0240631103515625, -0.013195037841796875, -0.00232696533203125, 0.008541107177734375, 0.0194091796875, 0.030277252197265625, 0.04114532470703125, 0.052013397216796875, 0.0628814697265625, 0.07374954223632812, 0.08461761474609375, 0.09548568725585938, 0.106353759765625, 0.11722183227539062, 0.12808990478515625, 0.13895797729492188, 0.1498260498046875, 0.16069412231445312, 0.17156219482421875, 0.18243026733398438, 0.19329833984375, 0.20416641235351562, 0.21503448486328125, 0.22590255737304688, 0.2367706298828125, 0.24763870239257812, 0.25850677490234375, 0.2693748474121094, 0.280242919921875, 0.2911109924316406, 0.30197906494140625, 0.3128471374511719, 0.3237152099609375, 0.3345832824707031, 0.34545135498046875, 0.3563194274902344, 0.3671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 4.0, 12.0, 8.0, 21.0, 33.0, 57.0, 86.0, 115.0, 141.0, 140.0, 109.0, 100.0, 68.0, 49.0, 28.0, 12.0, 4.0, 7.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1318359375, -0.1278533935546875, -0.123870849609375, -0.1198883056640625, -0.11590576171875, -0.1119232177734375, -0.107940673828125, -0.1039581298828125, -0.0999755859375, -0.0959930419921875, -0.092010498046875, -0.0880279541015625, -0.08404541015625, -0.0800628662109375, -0.076080322265625, -0.0720977783203125, -0.068115234375, -0.0641326904296875, -0.060150146484375, -0.0561676025390625, -0.05218505859375, -0.0482025146484375, -0.044219970703125, -0.0402374267578125, -0.0362548828125, -0.0322723388671875, -0.028289794921875, -0.0243072509765625, -0.02032470703125, -0.0163421630859375, -0.012359619140625, -0.0083770751953125, -0.00439453125, -0.0004119873046875, 0.003570556640625, 0.0075531005859375, 0.01153564453125, 0.0155181884765625, 0.019500732421875, 0.0234832763671875, 0.0274658203125, 0.0314483642578125, 0.035430908203125, 0.0394134521484375, 0.04339599609375, 0.0473785400390625, 0.051361083984375, 0.0553436279296875, 0.059326171875, 0.0633087158203125, 0.067291259765625, 0.0712738037109375, 0.07525634765625, 0.0792388916015625, 0.083221435546875, 0.0872039794921875, 0.0911865234375, 0.0951690673828125, 0.099151611328125, 0.1031341552734375, 0.10711669921875, 0.1110992431640625, 0.115081787109375, 0.1190643310546875, 0.123046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 7.0, 7.0, 15.0, 15.0, 14.0, 26.0, 47.0, 71.0, 143.0, 227.0, 438.0, 785.0, 1601.0, 3236.0, 7400.0, 18401.0, 54658.0, 292829.0, 562412.0, 68456.0, 21733.0, 8463.0, 3804.0, 1763.0, 852.0, 488.0, 230.0, 147.0, 97.0, 59.0, 41.0, 22.0, 19.0, 12.0, 9.0, 4.0, 5.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41015625, -0.39775848388671875, -0.3853607177734375, -0.37296295166015625, -0.360565185546875, -0.34816741943359375, -0.3357696533203125, -0.32337188720703125, -0.31097412109375, -0.29857635498046875, -0.2861785888671875, -0.27378082275390625, -0.261383056640625, -0.24898529052734375, -0.2365875244140625, -0.22418975830078125, -0.2117919921875, -0.19939422607421875, -0.1869964599609375, -0.17459869384765625, -0.162200927734375, -0.14980316162109375, -0.1374053955078125, -0.12500762939453125, -0.11260986328125, -0.10021209716796875, -0.0878143310546875, -0.07541656494140625, -0.063018798828125, -0.05062103271484375, -0.0382232666015625, -0.02582550048828125, -0.013427734375, -0.00102996826171875, 0.0113677978515625, 0.02376556396484375, 0.036163330078125, 0.04856109619140625, 0.0609588623046875, 0.07335662841796875, 0.08575439453125, 0.09815216064453125, 0.1105499267578125, 0.12294769287109375, 0.135345458984375, 0.14774322509765625, 0.1601409912109375, 0.17253875732421875, 0.1849365234375, 0.19733428955078125, 0.2097320556640625, 0.22212982177734375, 0.234527587890625, 0.24692535400390625, 0.2593231201171875, 0.27172088623046875, 0.28411865234375, 0.29651641845703125, 0.3089141845703125, 0.32131195068359375, 0.333709716796875, 0.34610748291015625, 0.3585052490234375, 0.37090301513671875, 0.38330078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 6.0, 7.0, 6.0, 8.0, 8.0, 8.0, 9.0, 16.0, 23.0, 30.0, 21.0, 23.0, 39.0, 59.0, 42.0, 44.0, 62.0, 56.0, 49.0, 46.0, 56.0, 58.0, 46.0, 40.0, 40.0, 28.0, 25.0, 19.0, 30.0, 20.0, 11.0, 9.0, 17.0, 7.0, 8.0, 7.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.292724609375, -0.28359222412109375, -0.2744598388671875, -0.26532745361328125, -0.256195068359375, -0.24706268310546875, -0.2379302978515625, -0.22879791259765625, -0.21966552734375, -0.21053314208984375, -0.2014007568359375, -0.19226837158203125, -0.183135986328125, -0.17400360107421875, -0.1648712158203125, -0.15573883056640625, -0.1466064453125, -0.13747406005859375, -0.1283416748046875, -0.11920928955078125, -0.110076904296875, -0.10094451904296875, -0.0918121337890625, -0.08267974853515625, -0.07354736328125, -0.06441497802734375, -0.0552825927734375, -0.04615020751953125, -0.037017822265625, -0.02788543701171875, -0.0187530517578125, -0.00962066650390625, -0.00048828125, 0.00864410400390625, 0.0177764892578125, 0.02690887451171875, 0.036041259765625, 0.04517364501953125, 0.0543060302734375, 0.06343841552734375, 0.07257080078125, 0.08170318603515625, 0.0908355712890625, 0.09996795654296875, 0.109100341796875, 0.11823272705078125, 0.1273651123046875, 0.13649749755859375, 0.1456298828125, 0.15476226806640625, 0.1638946533203125, 0.17302703857421875, 0.182159423828125, 0.19129180908203125, 0.2004241943359375, 0.20955657958984375, 0.21868896484375, 0.22782135009765625, 0.2369537353515625, 0.24608612060546875, 0.255218505859375, 0.26435089111328125, 0.2734832763671875, 0.28261566162109375, 0.291748046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 6.0, 8.0, 19.0, 20.0, 29.0, 55.0, 75.0, 133.0, 195.0, 382.0, 595.0, 1080.0, 2173.0, 4564.0, 11126.0, 33139.0, 159183.0, 708714.0, 88566.0, 22683.0, 8331.0, 3520.0, 1752.0, 931.0, 508.0, 289.0, 174.0, 106.0, 62.0, 44.0, 18.0, 21.0, 13.0, 7.0, 8.0, 8.0, 5.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.015625, -0.015126466751098633, -0.014627933502197266, -0.014129400253295898, -0.013630867004394531, -0.013132333755493164, -0.012633800506591797, -0.01213526725769043, -0.011636734008789062, -0.011138200759887695, -0.010639667510986328, -0.010141134262084961, -0.009642601013183594, -0.009144067764282227, -0.00864553451538086, -0.008147001266479492, -0.007648468017578125, -0.007149934768676758, -0.006651401519775391, -0.0061528682708740234, -0.005654335021972656, -0.005155801773071289, -0.004657268524169922, -0.004158735275268555, -0.0036602020263671875, -0.0031616687774658203, -0.002663135528564453, -0.002164602279663086, -0.0016660690307617188, -0.0011675357818603516, -0.0006690025329589844, -0.0001704692840576172, 0.00032806396484375, 0.0008265972137451172, 0.0013251304626464844, 0.0018236637115478516, 0.0023221969604492188, 0.002820730209350586, 0.003319263458251953, 0.0038177967071533203, 0.0043163299560546875, 0.004814863204956055, 0.005313396453857422, 0.005811929702758789, 0.006310462951660156, 0.0068089962005615234, 0.007307529449462891, 0.007806062698364258, 0.008304595947265625, 0.008803129196166992, 0.00930166244506836, 0.009800195693969727, 0.010298728942871094, 0.010797262191772461, 0.011295795440673828, 0.011794328689575195, 0.012292861938476562, 0.01279139518737793, 0.013289928436279297, 0.013788461685180664, 0.014286994934082031, 0.014785528182983398, 0.015284061431884766, 0.015782594680786133, 0.0162811279296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 12.0, 6.0, 10.0, 14.0, 9.0, 13.0, 28.0, 39.0, 94.0, 66.0, 70.0, 87.0, 98.0, 124.0, 80.0, 65.0, 37.0, 49.0, 36.0, 24.0, 14.0, 9.0, 4.0, 9.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.827976226806641e-06, -4.637986421585083e-06, -4.447996616363525e-06, -4.258006811141968e-06, -4.06801700592041e-06, -3.8780272006988525e-06, -3.688037395477295e-06, -3.4980475902557373e-06, -3.3080577850341797e-06, -3.118067979812622e-06, -2.9280781745910645e-06, -2.738088369369507e-06, -2.5480985641479492e-06, -2.3581087589263916e-06, -2.168118953704834e-06, -1.9781291484832764e-06, -1.7881393432617188e-06, -1.5981495380401611e-06, -1.4081597328186035e-06, -1.218169927597046e-06, -1.0281801223754883e-06, -8.381903171539307e-07, -6.48200511932373e-07, -4.5821070671081543e-07, -2.682209014892578e-07, -7.82310962677002e-08, 1.1175870895385742e-07, 3.0174851417541504e-07, 4.917383193969727e-07, 6.817281246185303e-07, 8.717179298400879e-07, 1.0617077350616455e-06, 1.2516975402832031e-06, 1.4416873455047607e-06, 1.6316771507263184e-06, 1.821666955947876e-06, 2.0116567611694336e-06, 2.201646566390991e-06, 2.391636371612549e-06, 2.5816261768341064e-06, 2.771615982055664e-06, 2.9616057872772217e-06, 3.1515955924987793e-06, 3.341585397720337e-06, 3.5315752029418945e-06, 3.721565008163452e-06, 3.91155481338501e-06, 4.101544618606567e-06, 4.291534423828125e-06, 4.481524229049683e-06, 4.67151403427124e-06, 4.861503839492798e-06, 5.0514936447143555e-06, 5.241483449935913e-06, 5.431473255157471e-06, 5.621463060379028e-06, 5.811452865600586e-06, 6.0014426708221436e-06, 6.191432476043701e-06, 6.381422281265259e-06, 6.571412086486816e-06, 6.761401891708374e-06, 6.951391696929932e-06, 7.141381502151489e-06, 7.331371307373047e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 0.0, 4.0, 9.0, 7.0, 7.0, 9.0, 19.0, 35.0, 47.0, 66.0, 164.0, 266.0, 445.0, 854.0, 1808.0, 3824.0, 9398.0, 26080.0, 113042.0, 746289.0, 105087.0, 24804.0, 8896.0, 3724.0, 1752.0, 862.0, 445.0, 241.0, 149.0, 75.0, 54.0, 31.0, 23.0, 17.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0225982666015625, -0.021880388259887695, -0.02116250991821289, -0.020444631576538086, -0.01972675323486328, -0.019008874893188477, -0.018290996551513672, -0.017573118209838867, -0.016855239868164062, -0.016137361526489258, -0.015419483184814453, -0.014701604843139648, -0.013983726501464844, -0.013265848159790039, -0.012547969818115234, -0.01183009147644043, -0.011112213134765625, -0.01039433479309082, -0.009676456451416016, -0.008958578109741211, -0.008240699768066406, -0.0075228214263916016, -0.006804943084716797, -0.006087064743041992, -0.0053691864013671875, -0.004651308059692383, -0.003933429718017578, -0.0032155513763427734, -0.0024976730346679688, -0.001779794692993164, -0.0010619163513183594, -0.0003440380096435547, 0.00037384033203125, 0.0010917186737060547, 0.0018095970153808594, 0.002527475357055664, 0.0032453536987304688, 0.0039632320404052734, 0.004681110382080078, 0.005398988723754883, 0.0061168670654296875, 0.006834745407104492, 0.007552623748779297, 0.008270502090454102, 0.008988380432128906, 0.009706258773803711, 0.010424137115478516, 0.01114201545715332, 0.011859893798828125, 0.01257777214050293, 0.013295650482177734, 0.014013528823852539, 0.014731407165527344, 0.015449285507202148, 0.016167163848876953, 0.016885042190551758, 0.017602920532226562, 0.018320798873901367, 0.019038677215576172, 0.019756555557250977, 0.02047443389892578, 0.021192312240600586, 0.02191019058227539, 0.022628068923950195, 0.023345947265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 9.0, 3.0, 3.0, 5.0, 7.0, 9.0, 9.0, 14.0, 16.0, 18.0, 17.0, 30.0, 28.0, 48.0, 67.0, 70.0, 89.0, 94.0, 78.0, 79.0, 60.0, 46.0, 36.0, 36.0, 23.0, 18.0, 17.0, 15.0, 13.0, 11.0, 7.0, 7.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0179290771484375, -0.01735997200012207, -0.01679086685180664, -0.01622176170349121, -0.01565265655517578, -0.015083551406860352, -0.014514446258544922, -0.013945341110229492, -0.013376235961914062, -0.012807130813598633, -0.012238025665283203, -0.011668920516967773, -0.011099815368652344, -0.010530710220336914, -0.009961605072021484, -0.009392499923706055, -0.008823394775390625, -0.008254289627075195, -0.007685184478759766, -0.007116079330444336, -0.006546974182128906, -0.0059778690338134766, -0.005408763885498047, -0.004839658737182617, -0.0042705535888671875, -0.003701448440551758, -0.003132343292236328, -0.0025632381439208984, -0.0019941329956054688, -0.001425027847290039, -0.0008559226989746094, -0.0002868175506591797, 0.00028228759765625, 0.0008513927459716797, 0.0014204978942871094, 0.001989603042602539, 0.0025587081909179688, 0.0031278133392333984, 0.003696918487548828, 0.004266023635864258, 0.0048351287841796875, 0.005404233932495117, 0.005973339080810547, 0.0065424442291259766, 0.007111549377441406, 0.007680654525756836, 0.008249759674072266, 0.008818864822387695, 0.009387969970703125, 0.009957075119018555, 0.010526180267333984, 0.011095285415649414, 0.011664390563964844, 0.012233495712280273, 0.012802600860595703, 0.013371706008911133, 0.013940811157226562, 0.014509916305541992, 0.015079021453857422, 0.01564812660217285, 0.01621723175048828, 0.01678633689880371, 0.01735544204711914, 0.01792454719543457, 0.01849365234375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 3.0, 9.0, 2.0, 5.0, 7.0, 14.0, 27.0, 31.0, 26.0, 39.0, 63.0, 114.0, 206.0, 156.0, 57.0, 57.0, 45.0, 25.0, 13.0, 14.0, 15.0, 13.0, 15.0, 11.0, 5.0, 2.0, 2.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2559759616851807, -1.2163389921188354, -1.1767021417617798, -1.1370651721954346, -1.097428321838379, -1.0577913522720337, -1.018154501914978, -0.9785175323486328, -0.9388806819915771, -0.8992437720298767, -0.8596068620681763, -0.8199699521064758, -0.7803330421447754, -0.740696132183075, -0.7010592222213745, -0.6614222526550293, -0.6217853426933289, -0.5821484327316284, -0.542511522769928, -0.5028746128082275, -0.4632377028465271, -0.42360079288482666, -0.38396385312080383, -0.3443269431591034, -0.30469003319740295, -0.2650531232357025, -0.22541621327400208, -0.18577928841114044, -0.14614237844944, -0.10650546848773956, -0.06686854362487793, -0.02723163366317749, 0.01240527629852295, 0.05204218998551369, 0.09167910367250443, 0.13131602108478546, 0.1709529310464859, 0.21058984100818634, 0.250226765871048, 0.2898636758327484, 0.32950058579444885, 0.3691374957561493, 0.40877440571784973, 0.44841134548187256, 0.488048255443573, 0.5276851654052734, 0.5673220753669739, 0.6069589853286743, 0.6465958952903748, 0.6862328052520752, 0.7258697152137756, 0.7655066251754761, 0.8051435351371765, 0.844780445098877, 0.8844174146652222, 0.9240542650222778, 0.963691234588623, 1.0033282041549683, 1.042965054512024, 1.0826020240783691, 1.1222388744354248, 1.16187584400177, 1.2015126943588257, 1.241149663925171, 1.2807865142822266]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 7.0, 4.0, 17.0, 16.0, 23.0, 23.0, 24.0, 21.0, 21.0, 29.0, 26.0, 30.0, 29.0, 48.0, 62.0, 74.0, 80.0, 46.0, 50.0, 29.0, 35.0, 36.0, 36.0, 34.0, 26.0, 22.0, 26.0, 20.0, 16.0, 14.0, 8.0, 5.0, 8.0, 13.0, 7.0, 2.0, 6.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0], "bins": [-1.0623339414596558, -1.033735990524292, -1.0051379203796387, -0.9765399694442749, -0.9479419589042664, -0.9193439483642578, -0.890745997428894, -0.8621479868888855, -0.833549976348877, -0.8049519658088684, -0.7763539552688599, -0.7477560043334961, -0.7191579937934875, -0.690559983253479, -0.6619620323181152, -0.6333640217781067, -0.6047660112380981, -0.5761680006980896, -0.547569990158081, -0.5189720392227173, -0.49037402868270874, -0.4617760181427002, -0.43317803740501404, -0.4045800566673279, -0.37598204612731934, -0.3473840355873108, -0.31878605484962463, -0.2901880741119385, -0.26159006357192993, -0.23299206793308258, -0.20439407229423523, -0.17579607665538788, -0.14719808101654053, -0.11860008537769318, -0.09000208973884583, -0.061404094099998474, -0.03280609846115112, -0.004208102822303772, 0.02438989281654358, 0.05298788845539093, 0.08158588409423828, 0.11018387973308563, 0.13878187537193298, 0.16737987101078033, 0.19597786664962769, 0.22457586228847504, 0.2531738579273224, 0.28177183866500854, 0.3103698492050171, 0.33896785974502563, 0.3675658404827118, 0.39616382122039795, 0.4247618317604065, 0.45335984230041504, 0.4819578230381012, 0.5105558037757874, 0.5391538143157959, 0.5677518248558044, 0.596349835395813, 0.6249477863311768, 0.6535457968711853, 0.6821438074111938, 0.7107417583465576, 0.7393397688865662, 0.7679377794265747]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 5.0, 3.0, 11.0, 12.0, 24.0, 24.0, 23.0, 34.0, 53.0, 71.0, 107.0, 154.0, 255.0, 403.0, 690.0, 1391.0, 2908.0, 7536.0, 29581.0, 275852.0, 3775183.0, 77473.0, 14125.0, 4142.0, 1707.0, 876.0, 498.0, 306.0, 223.0, 158.0, 119.0, 77.0, 54.0, 59.0, 33.0, 18.0, 29.0, 13.0, 17.0, 10.0, 4.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.35107421875, -0.3405265808105469, -0.32997894287109375, -0.3194313049316406, -0.3088836669921875, -0.2983360290527344, -0.28778839111328125, -0.2772407531738281, -0.266693115234375, -0.2561454772949219, -0.24559783935546875, -0.23505020141601562, -0.2245025634765625, -0.21395492553710938, -0.20340728759765625, -0.19285964965820312, -0.18231201171875, -0.17176437377929688, -0.16121673583984375, -0.15066909790039062, -0.1401214599609375, -0.12957382202148438, -0.11902618408203125, -0.10847854614257812, -0.097930908203125, -0.08738327026367188, -0.07683563232421875, -0.06628799438476562, -0.0557403564453125, -0.045192718505859375, -0.03464508056640625, -0.024097442626953125, -0.0135498046875, -0.003002166748046875, 0.00754547119140625, 0.018093109130859375, 0.0286407470703125, 0.039188385009765625, 0.04973602294921875, 0.060283660888671875, 0.070831298828125, 0.08137893676757812, 0.09192657470703125, 0.10247421264648438, 0.1130218505859375, 0.12356948852539062, 0.13411712646484375, 0.14466476440429688, 0.15521240234375, 0.16576004028320312, 0.17630767822265625, 0.18685531616210938, 0.1974029541015625, 0.20795059204101562, 0.21849822998046875, 0.22904586791992188, 0.239593505859375, 0.2501411437988281, 0.26068878173828125, 0.2712364196777344, 0.2817840576171875, 0.2923316955566406, 0.30287933349609375, 0.3134269714355469, 0.323974609375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 3.0, 8.0, 15.0, 18.0, 38.0, 52.0, 67.0, 114.0, 144.0, 141.0, 119.0, 87.0, 89.0, 50.0, 23.0, 12.0, 3.0, 9.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1309814453125, -0.12703609466552734, -0.12309074401855469, -0.11914539337158203, -0.11520004272460938, -0.11125469207763672, -0.10730934143066406, -0.1033639907836914, -0.09941864013671875, -0.0954732894897461, -0.09152793884277344, -0.08758258819580078, -0.08363723754882812, -0.07969188690185547, -0.07574653625488281, -0.07180118560791016, -0.0678558349609375, -0.06391048431396484, -0.05996513366699219, -0.05601978302001953, -0.052074432373046875, -0.04812908172607422, -0.04418373107910156, -0.040238380432128906, -0.03629302978515625, -0.032347679138183594, -0.028402328491210938, -0.02445697784423828, -0.020511627197265625, -0.01656627655029297, -0.012620925903320312, -0.008675575256347656, -0.004730224609375, -0.0007848739624023438, 0.0031604766845703125, 0.007105827331542969, 0.011051177978515625, 0.014996528625488281, 0.018941879272460938, 0.022887229919433594, 0.02683258056640625, 0.030777931213378906, 0.03472328186035156, 0.03866863250732422, 0.042613983154296875, 0.04655933380126953, 0.05050468444824219, 0.054450035095214844, 0.0583953857421875, 0.062340736389160156, 0.06628608703613281, 0.07023143768310547, 0.07417678833007812, 0.07812213897705078, 0.08206748962402344, 0.0860128402709961, 0.08995819091796875, 0.0939035415649414, 0.09784889221191406, 0.10179424285888672, 0.10573959350585938, 0.10968494415283203, 0.11363029479980469, 0.11757564544677734, 0.12152099609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 1.0, 9.0, 12.0, 20.0, 26.0, 48.0, 72.0, 113.0, 203.0, 401.0, 699.0, 1436.0, 3336.0, 8835.0, 29468.0, 155146.0, 3668739.0, 266149.0, 40658.0, 11529.0, 4047.0, 1640.0, 746.0, 385.0, 216.0, 125.0, 75.0, 47.0, 31.0, 18.0, 17.0, 11.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.41748046875, -0.40541839599609375, -0.3933563232421875, -0.38129425048828125, -0.369232177734375, -0.35717010498046875, -0.3451080322265625, -0.33304595947265625, -0.32098388671875, -0.30892181396484375, -0.2968597412109375, -0.28479766845703125, -0.272735595703125, -0.26067352294921875, -0.2486114501953125, -0.23654937744140625, -0.2244873046875, -0.21242523193359375, -0.2003631591796875, -0.18830108642578125, -0.176239013671875, -0.16417694091796875, -0.1521148681640625, -0.14005279541015625, -0.12799072265625, -0.11592864990234375, -0.1038665771484375, -0.09180450439453125, -0.079742431640625, -0.06768035888671875, -0.0556182861328125, -0.04355621337890625, -0.031494140625, -0.01943206787109375, -0.0073699951171875, 0.00469207763671875, 0.016754150390625, 0.02881622314453125, 0.0408782958984375, 0.05294036865234375, 0.06500244140625, 0.07706451416015625, 0.0891265869140625, 0.10118865966796875, 0.113250732421875, 0.12531280517578125, 0.1373748779296875, 0.14943695068359375, 0.1614990234375, 0.17356109619140625, 0.1856231689453125, 0.19768524169921875, 0.209747314453125, 0.22180938720703125, 0.2338714599609375, 0.24593353271484375, 0.25799560546875, 0.27005767822265625, 0.2821197509765625, 0.29418182373046875, 0.306243896484375, 0.31830596923828125, 0.3303680419921875, 0.34243011474609375, 0.3544921875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 7.0, 13.0, 10.0, 11.0, 17.0, 14.0, 34.0, 50.0, 54.0, 62.0, 110.0, 135.0, 240.0, 763.0, 1340.0, 502.0, 218.0, 124.0, 89.0, 67.0, 58.0, 37.0, 19.0, 20.0, 22.0, 16.0, 9.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.289794921875, -0.2815971374511719, -0.27339935302734375, -0.2652015686035156, -0.2570037841796875, -0.24880599975585938, -0.24060821533203125, -0.23241043090820312, -0.224212646484375, -0.21601486206054688, -0.20781707763671875, -0.19961929321289062, -0.1914215087890625, -0.18322372436523438, -0.17502593994140625, -0.16682815551757812, -0.15863037109375, -0.15043258666992188, -0.14223480224609375, -0.13403701782226562, -0.1258392333984375, -0.11764144897460938, -0.10944366455078125, -0.10124588012695312, -0.093048095703125, -0.08485031127929688, -0.07665252685546875, -0.06845474243164062, -0.0602569580078125, -0.052059173583984375, -0.04386138916015625, -0.035663604736328125, -0.0274658203125, -0.019268035888671875, -0.01107025146484375, -0.002872467041015625, 0.0053253173828125, 0.013523101806640625, 0.02172088623046875, 0.029918670654296875, 0.038116455078125, 0.046314239501953125, 0.05451202392578125, 0.06270980834960938, 0.0709075927734375, 0.07910537719726562, 0.08730316162109375, 0.09550094604492188, 0.10369873046875, 0.11189651489257812, 0.12009429931640625, 0.12829208374023438, 0.1364898681640625, 0.14468765258789062, 0.15288543701171875, 0.16108322143554688, 0.169281005859375, 0.17747879028320312, 0.18567657470703125, 0.19387435913085938, 0.2020721435546875, 0.21026992797851562, 0.21846771240234375, 0.22666549682617188, 0.23486328125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 10.0, 2.0, 4.0, 10.0, 19.0, 14.0, 23.0, 33.0, 58.0, 83.0, 125.0, 152.0, 127.0, 78.0, 74.0, 29.0, 25.0, 28.0, 23.0, 16.0, 8.0, 12.0, 4.0, 8.0, 4.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7415661811828613, -1.6925015449523926, -1.6434369087219238, -1.594372272491455, -1.5453076362609863, -1.496242880821228, -1.4471782445907593, -1.3981136083602905, -1.3490489721298218, -1.299984335899353, -1.2509196996688843, -1.2018550634384155, -1.1527903079986572, -1.1037256717681885, -1.0546610355377197, -1.005596399307251, -0.9565317630767822, -0.9074671268463135, -0.8584024906158447, -0.8093377947807312, -0.7602731585502625, -0.7112085223197937, -0.6621438264846802, -0.6130791902542114, -0.5640145540237427, -0.5149499177932739, -0.4658852517604828, -0.41682058572769165, -0.3677559494972229, -0.31869131326675415, -0.269626647233963, -0.22056198120117188, -0.17149722576141357, -0.12243257462978363, -0.07336792349815369, -0.024303272366523743, 0.0247613787651062, 0.07382602989673615, 0.12289068102836609, 0.17195534706115723, 0.22101998329162598, 0.2700846195220947, 0.31914928555488586, 0.368213951587677, 0.41727858781814575, 0.4663432240486145, 0.515407919883728, 0.5644725561141968, 0.6135371923446655, 0.6626018285751343, 0.711666464805603, 0.7607311606407166, 0.8097957968711853, 0.858860433101654, 0.9079251289367676, 0.9569897651672363, 1.006054401397705, 1.0551190376281738, 1.1041836738586426, 1.1532483100891113, 1.20231294631958, 1.2513777017593384, 1.3004423379898071, 1.3495069742202759, 1.3985716104507446]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 6.0, 12.0, 10.0, 14.0, 30.0, 26.0, 21.0, 24.0, 36.0, 41.0, 31.0, 35.0, 46.0, 43.0, 43.0, 40.0, 41.0, 50.0, 54.0, 41.0, 47.0, 35.0, 31.0, 35.0, 25.0, 28.0, 28.0, 28.0, 12.0, 11.0, 7.0, 8.0, 9.0, 9.0, 8.0, 7.0, 3.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0276708602905273, -0.9939342141151428, -0.9601975679397583, -0.9264609217643738, -0.8927242755889893, -0.85898756980896, -0.8252509236335754, -0.7915142774581909, -0.7577776312828064, -0.7240409851074219, -0.6903043389320374, -0.6565676927566528, -0.6228309869766235, -0.5890944004058838, -0.5553576946258545, -0.52162104845047, -0.48788440227508545, -0.4541477560997009, -0.4204111099243164, -0.3866744339466095, -0.352937787771225, -0.31920114159584045, -0.28546446561813354, -0.251727819442749, -0.2179911732673645, -0.18425452709197998, -0.15051786601543427, -0.11678121238946915, -0.08304455876350403, -0.04930791258811951, -0.015571251511573792, 0.018165409564971924, 0.051901936531066895, 0.08563859015703201, 0.11937524378299713, 0.15311190485954285, 0.18684855103492737, 0.2205851972103119, 0.2543218731880188, 0.2880585193634033, 0.32179516553878784, 0.35553181171417236, 0.3892684578895569, 0.4230051338672638, 0.4567417800426483, 0.49047842621803284, 0.5242151021957397, 0.5579517483711243, 0.5916883945465088, 0.6254250407218933, 0.6591616868972778, 0.6928983330726624, 0.7266349792480469, 0.7603716850280762, 0.7941083312034607, 0.8278449773788452, 0.8615816235542297, 0.8953182697296143, 0.9290549159049988, 0.9627915620803833, 0.9965282678604126, 1.0302648544311523, 1.0640015602111816, 1.097738265991211, 1.1314748525619507]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 13.0, 9.0, 10.0, 11.0, 15.0, 23.0, 30.0, 31.0, 52.0, 60.0, 75.0, 83.0, 139.0, 196.0, 215.0, 301.0, 490.0, 729.0, 1120.0, 2055.0, 4399.0, 10949.0, 33118.0, 136347.0, 666517.0, 137106.0, 33316.0, 10907.0, 4509.0, 2150.0, 1133.0, 698.0, 483.0, 291.0, 246.0, 167.0, 118.0, 109.0, 76.0, 58.0, 46.0, 29.0, 28.0, 27.0, 18.0, 16.0, 13.0, 4.0, 6.0, 4.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0], "bins": [-0.34765625, -0.3369598388671875, -0.326263427734375, -0.3155670166015625, -0.30487060546875, -0.2941741943359375, -0.283477783203125, -0.2727813720703125, -0.2620849609375, -0.2513885498046875, -0.240692138671875, -0.2299957275390625, -0.21929931640625, -0.2086029052734375, -0.197906494140625, -0.1872100830078125, -0.176513671875, -0.1658172607421875, -0.155120849609375, -0.1444244384765625, -0.13372802734375, -0.1230316162109375, -0.112335205078125, -0.1016387939453125, -0.0909423828125, -0.0802459716796875, -0.069549560546875, -0.0588531494140625, -0.04815673828125, -0.0374603271484375, -0.026763916015625, -0.0160675048828125, -0.00537109375, 0.0053253173828125, 0.016021728515625, 0.0267181396484375, 0.03741455078125, 0.0481109619140625, 0.058807373046875, 0.0695037841796875, 0.0802001953125, 0.0908966064453125, 0.101593017578125, 0.1122894287109375, 0.12298583984375, 0.1336822509765625, 0.144378662109375, 0.1550750732421875, 0.165771484375, 0.1764678955078125, 0.187164306640625, 0.1978607177734375, 0.20855712890625, 0.2192535400390625, 0.229949951171875, 0.2406463623046875, 0.2513427734375, 0.2620391845703125, 0.272735595703125, 0.2834320068359375, 0.29412841796875, 0.3048248291015625, 0.315521240234375, 0.3262176513671875, 0.3369140625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 15.0, 18.0, 30.0, 52.0, 73.0, 90.0, 133.0, 151.0, 134.0, 97.0, 74.0, 51.0, 32.0, 17.0, 10.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.132568359375, -0.12860584259033203, -0.12464332580566406, -0.1206808090209961, -0.11671829223632812, -0.11275577545166016, -0.10879325866699219, -0.10483074188232422, -0.10086822509765625, -0.09690570831298828, -0.09294319152832031, -0.08898067474365234, -0.08501815795898438, -0.0810556411743164, -0.07709312438964844, -0.07313060760498047, -0.0691680908203125, -0.06520557403564453, -0.06124305725097656, -0.057280540466308594, -0.053318023681640625, -0.049355506896972656, -0.04539299011230469, -0.04143047332763672, -0.03746795654296875, -0.03350543975830078, -0.029542922973632812, -0.025580406188964844, -0.021617889404296875, -0.017655372619628906, -0.013692855834960938, -0.009730339050292969, -0.005767822265625, -0.0018053054809570312, 0.0021572113037109375, 0.006119728088378906, 0.010082244873046875, 0.014044761657714844, 0.018007278442382812, 0.02196979522705078, 0.02593231201171875, 0.02989482879638672, 0.03385734558105469, 0.037819862365722656, 0.041782379150390625, 0.045744895935058594, 0.04970741271972656, 0.05366992950439453, 0.0576324462890625, 0.06159496307373047, 0.06555747985839844, 0.0695199966430664, 0.07348251342773438, 0.07744503021240234, 0.08140754699707031, 0.08537006378173828, 0.08933258056640625, 0.09329509735107422, 0.09725761413574219, 0.10122013092041016, 0.10518264770507812, 0.1091451644897461, 0.11310768127441406, 0.11707019805908203, 0.12103271484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 6.0, 9.0, 5.0, 10.0, 10.0, 13.0, 22.0, 33.0, 56.0, 125.0, 244.0, 580.0, 1508.0, 4143.0, 13864.0, 70803.0, 809563.0, 119296.0, 19553.0, 5493.0, 1876.0, 702.0, 291.0, 148.0, 76.0, 29.0, 31.0, 25.0, 13.0, 6.0, 9.0, 6.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51171875, -0.4917449951171875, -0.471771240234375, -0.4517974853515625, -0.43182373046875, -0.4118499755859375, -0.391876220703125, -0.3719024658203125, -0.3519287109375, -0.3319549560546875, -0.311981201171875, -0.2920074462890625, -0.27203369140625, -0.2520599365234375, -0.232086181640625, -0.2121124267578125, -0.192138671875, -0.1721649169921875, -0.152191162109375, -0.1322174072265625, -0.11224365234375, -0.0922698974609375, -0.072296142578125, -0.0523223876953125, -0.0323486328125, -0.0123748779296875, 0.007598876953125, 0.0275726318359375, 0.04754638671875, 0.0675201416015625, 0.087493896484375, 0.1074676513671875, 0.12744140625, 0.1474151611328125, 0.167388916015625, 0.1873626708984375, 0.20733642578125, 0.2273101806640625, 0.247283935546875, 0.2672576904296875, 0.2872314453125, 0.3072052001953125, 0.327178955078125, 0.3471527099609375, 0.36712646484375, 0.3871002197265625, 0.407073974609375, 0.4270477294921875, 0.447021484375, 0.4669952392578125, 0.486968994140625, 0.5069427490234375, 0.52691650390625, 0.5468902587890625, 0.566864013671875, 0.5868377685546875, 0.6068115234375, 0.6267852783203125, 0.646759033203125, 0.6667327880859375, 0.68670654296875, 0.7066802978515625, 0.726654052734375, 0.7466278076171875, 0.7666015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 4.0, 10.0, 7.0, 10.0, 19.0, 25.0, 29.0, 38.0, 37.0, 56.0, 74.0, 59.0, 72.0, 62.0, 77.0, 82.0, 65.0, 53.0, 44.0, 32.0, 25.0, 26.0, 14.0, 15.0, 15.0, 8.0, 10.0, 6.0, 4.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.274169921875, -0.2634429931640625, -0.252716064453125, -0.2419891357421875, -0.23126220703125, -0.2205352783203125, -0.209808349609375, -0.1990814208984375, -0.1883544921875, -0.1776275634765625, -0.166900634765625, -0.1561737060546875, -0.14544677734375, -0.1347198486328125, -0.123992919921875, -0.1132659912109375, -0.1025390625, -0.0918121337890625, -0.081085205078125, -0.0703582763671875, -0.05963134765625, -0.0489044189453125, -0.038177490234375, -0.0274505615234375, -0.0167236328125, -0.0059967041015625, 0.004730224609375, 0.0154571533203125, 0.02618408203125, 0.0369110107421875, 0.047637939453125, 0.0583648681640625, 0.069091796875, 0.0798187255859375, 0.090545654296875, 0.1012725830078125, 0.11199951171875, 0.1227264404296875, 0.133453369140625, 0.1441802978515625, 0.1549072265625, 0.1656341552734375, 0.176361083984375, 0.1870880126953125, 0.19781494140625, 0.2085418701171875, 0.219268798828125, 0.2299957275390625, 0.24072265625, 0.2514495849609375, 0.262176513671875, 0.2729034423828125, 0.28363037109375, 0.2943572998046875, 0.305084228515625, 0.3158111572265625, 0.3265380859375, 0.3372650146484375, 0.347991943359375, 0.3587188720703125, 0.36944580078125, 0.3801727294921875, 0.390899658203125, 0.4016265869140625, 0.412353515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 10.0, 18.0, 14.0, 25.0, 35.0, 59.0, 71.0, 140.0, 177.0, 290.0, 442.0, 698.0, 1108.0, 1829.0, 3279.0, 6070.0, 12528.0, 29648.0, 93694.0, 600216.0, 209131.0, 50735.0, 18891.0, 8622.0, 4509.0, 2422.0, 1466.0, 842.0, 538.0, 327.0, 226.0, 163.0, 94.0, 63.0, 43.0, 44.0, 21.0, 24.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0091094970703125, -0.008831381797790527, -0.008553266525268555, -0.008275151252746582, -0.00799703598022461, -0.007718920707702637, -0.007440805435180664, -0.007162690162658691, -0.006884574890136719, -0.006606459617614746, -0.0063283443450927734, -0.006050229072570801, -0.005772113800048828, -0.0054939985275268555, -0.005215883255004883, -0.00493776798248291, -0.0046596527099609375, -0.004381537437438965, -0.004103422164916992, -0.0038253068923950195, -0.003547191619873047, -0.0032690763473510742, -0.0029909610748291016, -0.002712845802307129, -0.0024347305297851562, -0.0021566152572631836, -0.001878499984741211, -0.0016003847122192383, -0.0013222694396972656, -0.001044154167175293, -0.0007660388946533203, -0.00048792362213134766, -0.000209808349609375, 6.830692291259766e-05, 0.0003464221954345703, 0.000624537467956543, 0.0009026527404785156, 0.0011807680130004883, 0.001458883285522461, 0.0017369985580444336, 0.0020151138305664062, 0.002293229103088379, 0.0025713443756103516, 0.0028494596481323242, 0.003127574920654297, 0.0034056901931762695, 0.003683805465698242, 0.003961920738220215, 0.0042400360107421875, 0.00451815128326416, 0.004796266555786133, 0.0050743818283081055, 0.005352497100830078, 0.005630612373352051, 0.0059087276458740234, 0.006186842918395996, 0.006464958190917969, 0.006743073463439941, 0.007021188735961914, 0.007299304008483887, 0.007577419281005859, 0.007855534553527832, 0.008133649826049805, 0.008411765098571777, 0.00868988037109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 1.0, 5.0, 3.0, 7.0, 12.0, 20.0, 24.0, 28.0, 34.0, 75.0, 89.0, 74.0, 95.0, 130.0, 80.0, 75.0, 61.0, 62.0, 31.0, 24.0, 22.0, 20.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.033348083496094e-06, -6.839632987976074e-06, -6.645917892456055e-06, -6.452202796936035e-06, -6.258487701416016e-06, -6.064772605895996e-06, -5.8710575103759766e-06, -5.677342414855957e-06, -5.4836273193359375e-06, -5.289912223815918e-06, -5.0961971282958984e-06, -4.902482032775879e-06, -4.708766937255859e-06, -4.51505184173584e-06, -4.32133674621582e-06, -4.127621650695801e-06, -3.933906555175781e-06, -3.7401914596557617e-06, -3.546476364135742e-06, -3.3527612686157227e-06, -3.159046173095703e-06, -2.9653310775756836e-06, -2.771615982055664e-06, -2.5779008865356445e-06, -2.384185791015625e-06, -2.1904706954956055e-06, -1.996755599975586e-06, -1.8030405044555664e-06, -1.6093254089355469e-06, -1.4156103134155273e-06, -1.2218952178955078e-06, -1.0281801223754883e-06, -8.344650268554688e-07, -6.407499313354492e-07, -4.470348358154297e-07, -2.5331974029541016e-07, -5.960464477539063e-08, 1.341104507446289e-07, 3.2782554626464844e-07, 5.21540641784668e-07, 7.152557373046875e-07, 9.08970832824707e-07, 1.1026859283447266e-06, 1.296401023864746e-06, 1.4901161193847656e-06, 1.6838312149047852e-06, 1.8775463104248047e-06, 2.0712614059448242e-06, 2.2649765014648438e-06, 2.4586915969848633e-06, 2.652406692504883e-06, 2.8461217880249023e-06, 3.039836883544922e-06, 3.2335519790649414e-06, 3.427267074584961e-06, 3.6209821701049805e-06, 3.814697265625e-06, 4.0084123611450195e-06, 4.202127456665039e-06, 4.395842552185059e-06, 4.589557647705078e-06, 4.783272743225098e-06, 4.976987838745117e-06, 5.170702934265137e-06, 5.364418029785156e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 2.0, 10.0, 4.0, 17.0, 13.0, 23.0, 31.0, 45.0, 103.0, 178.0, 382.0, 803.0, 1861.0, 5267.0, 17164.0, 86087.0, 790261.0, 115501.0, 20924.0, 5988.0, 2122.0, 880.0, 413.0, 208.0, 104.0, 55.0, 47.0, 15.0, 16.0, 4.0, 11.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01873779296875, -0.018124818801879883, -0.017511844635009766, -0.01689887046813965, -0.01628589630126953, -0.015672922134399414, -0.015059947967529297, -0.01444697380065918, -0.013833999633789062, -0.013221025466918945, -0.012608051300048828, -0.011995077133178711, -0.011382102966308594, -0.010769128799438477, -0.01015615463256836, -0.009543180465698242, -0.008930206298828125, -0.008317232131958008, -0.007704257965087891, -0.0070912837982177734, -0.006478309631347656, -0.005865335464477539, -0.005252361297607422, -0.004639387130737305, -0.0040264129638671875, -0.0034134387969970703, -0.002800464630126953, -0.002187490463256836, -0.0015745162963867188, -0.0009615421295166016, -0.0003485679626464844, 0.0002644062042236328, 0.00087738037109375, 0.0014903545379638672, 0.0021033287048339844, 0.0027163028717041016, 0.0033292770385742188, 0.003942251205444336, 0.004555225372314453, 0.00516819953918457, 0.0057811737060546875, 0.006394147872924805, 0.007007122039794922, 0.007620096206665039, 0.008233070373535156, 0.008846044540405273, 0.00945901870727539, 0.010071992874145508, 0.010684967041015625, 0.011297941207885742, 0.01191091537475586, 0.012523889541625977, 0.013136863708496094, 0.013749837875366211, 0.014362812042236328, 0.014975786209106445, 0.015588760375976562, 0.01620173454284668, 0.016814708709716797, 0.017427682876586914, 0.01804065704345703, 0.01865363121032715, 0.019266605377197266, 0.019879579544067383, 0.0204925537109375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 6.0, 3.0, 8.0, 11.0, 13.0, 17.0, 15.0, 16.0, 21.0, 33.0, 44.0, 48.0, 47.0, 71.0, 85.0, 79.0, 88.0, 70.0, 48.0, 56.0, 34.0, 31.0, 40.0, 33.0, 20.0, 19.0, 12.0, 9.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01031494140625, -0.009979605674743652, -0.009644269943237305, -0.009308934211730957, -0.00897359848022461, -0.008638262748718262, -0.008302927017211914, -0.007967591285705566, -0.007632255554199219, -0.007296919822692871, -0.0069615840911865234, -0.006626248359680176, -0.006290912628173828, -0.0059555768966674805, -0.005620241165161133, -0.005284905433654785, -0.0049495697021484375, -0.00461423397064209, -0.004278898239135742, -0.0039435625076293945, -0.003608226776123047, -0.0032728910446166992, -0.0029375553131103516, -0.002602219581604004, -0.0022668838500976562, -0.0019315481185913086, -0.001596212387084961, -0.0012608766555786133, -0.0009255409240722656, -0.000590205192565918, -0.0002548694610595703, 8.046627044677734e-05, 0.000415802001953125, 0.0007511377334594727, 0.0010864734649658203, 0.001421809196472168, 0.0017571449279785156, 0.0020924806594848633, 0.002427816390991211, 0.0027631521224975586, 0.0030984878540039062, 0.003433823585510254, 0.0037691593170166016, 0.004104495048522949, 0.004439830780029297, 0.0047751665115356445, 0.005110502243041992, 0.00544583797454834, 0.0057811737060546875, 0.006116509437561035, 0.006451845169067383, 0.0067871809005737305, 0.007122516632080078, 0.007457852363586426, 0.0077931880950927734, 0.008128523826599121, 0.008463859558105469, 0.008799195289611816, 0.009134531021118164, 0.009469866752624512, 0.00980520248413086, 0.010140538215637207, 0.010475873947143555, 0.010811209678649902, 0.01114654541015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 8.0, 7.0, 8.0, 8.0, 15.0, 23.0, 30.0, 55.0, 68.0, 144.0, 312.0, 133.0, 78.0, 36.0, 18.0, 17.0, 15.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1246178150177, -2.059148073196411, -1.9936785697937012, -1.9282089471817017, -1.8627393245697021, -1.797269582748413, -1.7317999601364136, -1.666330337524414, -1.6008607149124146, -1.535391092300415, -1.4699214696884155, -1.404451847076416, -1.338982105255127, -1.273512601852417, -1.208042860031128, -1.1425732374191284, -1.077103614807129, -1.0116339921951294, -0.9461643695831299, -0.8806946873664856, -0.8152250647544861, -0.7497554421424866, -0.6842857599258423, -0.6188161373138428, -0.5533465147018433, -0.48787689208984375, -0.42240723967552185, -0.35693758726119995, -0.29146796464920044, -0.22599834203720093, -0.16052868962287903, -0.09505903720855713, -0.029589176177978516, 0.03588046133518219, 0.1013500988483429, 0.1668197363615036, 0.2322893738746643, 0.2977589964866638, 0.3632286489009857, 0.4286983013153076, 0.49416792392730713, 0.5596375465393066, 0.6251071691513062, 0.6905768513679504, 0.75604647397995, 0.8215160965919495, 0.8869857788085938, 0.9524554014205933, 1.0179250240325928, 1.0833946466445923, 1.1488642692565918, 1.2143338918685913, 1.2798035144805908, 1.3452732563018799, 1.4107428789138794, 1.476212501525879, 1.5416821241378784, 1.607151746749878, 1.6726213693618774, 1.738090991973877, 1.803560733795166, 1.869030237197876, 1.934499979019165, 1.9999696016311646, 2.065439224243164]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 7.0, 2.0, 9.0, 10.0, 17.0, 27.0, 21.0, 21.0, 22.0, 28.0, 31.0, 37.0, 32.0, 52.0, 71.0, 82.0, 90.0, 71.0, 47.0, 52.0, 40.0, 35.0, 23.0, 30.0, 31.0, 22.0, 19.0, 18.0, 17.0, 11.0, 10.0, 10.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4406206607818604, -1.4028966426849365, -1.3651727437973022, -1.3274487257003784, -1.2897248268127441, -1.2520008087158203, -1.214276909828186, -1.1765528917312622, -1.138828992843628, -1.101104974746704, -1.0633810758590698, -1.025657057762146, -0.9879331588745117, -0.9502092003822327, -0.9124852418899536, -0.8747612237930298, -0.8370372653007507, -0.7993133068084717, -0.7615893483161926, -0.7238653898239136, -0.6861414313316345, -0.6484174728393555, -0.6106934547424316, -0.5729695558547974, -0.5352455377578735, -0.4975215792655945, -0.45979762077331543, -0.4220736622810364, -0.3843497037887573, -0.34662574529647827, -0.30890175700187683, -0.2711777985095978, -0.2334538698196411, -0.19572991132736206, -0.158005952835083, -0.12028197944164276, -0.08255802094936371, -0.044834062457084656, -0.007110089063644409, 0.030613869428634644, 0.0683378279209137, 0.10606178641319275, 0.1437857449054718, 0.18150971829891205, 0.2192336767911911, 0.25695765018463135, 0.2946816086769104, 0.33240556716918945, 0.3701295256614685, 0.40785348415374756, 0.4455774426460266, 0.48330140113830566, 0.5210253596305847, 0.5587493181228638, 0.5964733362197876, 0.6341972351074219, 0.6719212532043457, 0.7096452116966248, 0.7473691701889038, 0.7850931286811829, 0.8228170871734619, 0.860541045665741, 0.89826500415802, 0.9359890222549438, 0.9737129211425781]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 8.0, 8.0, 4.0, 8.0, 21.0, 17.0, 14.0, 29.0, 46.0, 61.0, 73.0, 122.0, 197.0, 366.0, 638.0, 1342.0, 3196.0, 10903.0, 122692.0, 4021741.0, 23150.0, 5654.0, 1996.0, 877.0, 374.0, 211.0, 139.0, 73.0, 42.0, 61.0, 45.0, 36.0, 28.0, 17.0, 16.0, 13.0, 10.0, 11.0, 9.0, 7.0, 4.0, 6.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3544921875, -0.3438301086425781, -0.33316802978515625, -0.3225059509277344, -0.3118438720703125, -0.3011817932128906, -0.29051971435546875, -0.2798576354980469, -0.269195556640625, -0.2585334777832031, -0.24787139892578125, -0.23720932006835938, -0.2265472412109375, -0.21588516235351562, -0.20522308349609375, -0.19456100463867188, -0.18389892578125, -0.17323684692382812, -0.16257476806640625, -0.15191268920898438, -0.1412506103515625, -0.13058853149414062, -0.11992645263671875, -0.10926437377929688, -0.098602294921875, -0.08794021606445312, -0.07727813720703125, -0.06661605834960938, -0.0559539794921875, -0.045291900634765625, -0.03462982177734375, -0.023967742919921875, -0.0133056640625, -0.002643585205078125, 0.00801849365234375, 0.018680572509765625, 0.0293426513671875, 0.040004730224609375, 0.05066680908203125, 0.061328887939453125, 0.071990966796875, 0.08265304565429688, 0.09331512451171875, 0.10397720336914062, 0.1146392822265625, 0.12530136108398438, 0.13596343994140625, 0.14662551879882812, 0.15728759765625, 0.16794967651367188, 0.17861175537109375, 0.18927383422851562, 0.1999359130859375, 0.21059799194335938, 0.22126007080078125, 0.23192214965820312, 0.242584228515625, 0.2532463073730469, 0.26390838623046875, 0.2745704650878906, 0.2852325439453125, 0.2958946228027344, 0.30655670166015625, 0.3172187805175781, 0.327880859375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 4.0, 5.0, 4.0, 11.0, 16.0, 34.0, 45.0, 75.0, 92.0, 136.0, 144.0, 141.0, 102.0, 71.0, 59.0, 30.0, 16.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1328125, -0.1288461685180664, -0.12487983703613281, -0.12091350555419922, -0.11694717407226562, -0.11298084259033203, -0.10901451110839844, -0.10504817962646484, -0.10108184814453125, -0.09711551666259766, -0.09314918518066406, -0.08918285369873047, -0.08521652221679688, -0.08125019073486328, -0.07728385925292969, -0.0733175277709961, -0.0693511962890625, -0.0653848648071289, -0.06141853332519531, -0.05745220184326172, -0.053485870361328125, -0.04951953887939453, -0.04555320739746094, -0.041586875915527344, -0.03762054443359375, -0.033654212951660156, -0.029687881469726562, -0.02572154998779297, -0.021755218505859375, -0.01778888702392578, -0.013822555541992188, -0.009856224060058594, -0.005889892578125, -0.0019235610961914062, 0.0020427703857421875, 0.006009101867675781, 0.009975433349609375, 0.013941764831542969, 0.017908096313476562, 0.021874427795410156, 0.02584075927734375, 0.029807090759277344, 0.03377342224121094, 0.03773975372314453, 0.041706085205078125, 0.04567241668701172, 0.04963874816894531, 0.053605079650878906, 0.0575714111328125, 0.061537742614746094, 0.06550407409667969, 0.06947040557861328, 0.07343673706054688, 0.07740306854248047, 0.08136940002441406, 0.08533573150634766, 0.08930206298828125, 0.09326839447021484, 0.09723472595214844, 0.10120105743408203, 0.10516738891601562, 0.10913372039794922, 0.11310005187988281, 0.1170663833618164, 0.12103271484375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 4.0, 5.0, 8.0, 2.0, 10.0, 18.0, 20.0, 62.0, 155.0, 290.0, 752.0, 1935.0, 6124.0, 34195.0, 4055938.0, 81629.0, 9063.0, 2445.0, 912.0, 367.0, 169.0, 73.0, 41.0, 16.0, 14.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.470703125, -0.45482635498046875, -0.4389495849609375, -0.42307281494140625, -0.407196044921875, -0.39131927490234375, -0.3754425048828125, -0.35956573486328125, -0.34368896484375, -0.32781219482421875, -0.3119354248046875, -0.29605865478515625, -0.280181884765625, -0.26430511474609375, -0.2484283447265625, -0.23255157470703125, -0.2166748046875, -0.20079803466796875, -0.1849212646484375, -0.16904449462890625, -0.153167724609375, -0.13729095458984375, -0.1214141845703125, -0.10553741455078125, -0.08966064453125, -0.07378387451171875, -0.0579071044921875, -0.04203033447265625, -0.026153564453125, -0.01027679443359375, 0.0055999755859375, 0.02147674560546875, 0.037353515625, 0.05323028564453125, 0.0691070556640625, 0.08498382568359375, 0.100860595703125, 0.11673736572265625, 0.1326141357421875, 0.14849090576171875, 0.16436767578125, 0.18024444580078125, 0.1961212158203125, 0.21199798583984375, 0.227874755859375, 0.24375152587890625, 0.2596282958984375, 0.27550506591796875, 0.2913818359375, 0.30725860595703125, 0.3231353759765625, 0.33901214599609375, 0.354888916015625, 0.37076568603515625, 0.3866424560546875, 0.40251922607421875, 0.41839599609375, 0.43427276611328125, 0.4501495361328125, 0.46602630615234375, 0.481903076171875, 0.49777984619140625, 0.5136566162109375, 0.5295333862304688, 0.54541015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 2.0, 4.0, 8.0, 8.0, 7.0, 14.0, 12.0, 32.0, 33.0, 68.0, 157.0, 401.0, 2461.0, 451.0, 186.0, 73.0, 34.0, 24.0, 19.0, 10.0, 14.0, 6.0, 7.0, 4.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1715087890625, -0.1656970977783203, -0.15988540649414062, -0.15407371520996094, -0.14826202392578125, -0.14245033264160156, -0.13663864135742188, -0.1308269500732422, -0.1250152587890625, -0.11920356750488281, -0.11339187622070312, -0.10758018493652344, -0.10176849365234375, -0.09595680236816406, -0.09014511108398438, -0.08433341979980469, -0.078521728515625, -0.07271003723144531, -0.06689834594726562, -0.06108665466308594, -0.05527496337890625, -0.04946327209472656, -0.043651580810546875, -0.03783988952636719, -0.0320281982421875, -0.026216506958007812, -0.020404815673828125, -0.014593124389648438, -0.00878143310546875, -0.0029697418212890625, 0.002841949462890625, 0.008653640747070312, 0.01446533203125, 0.020277023315429688, 0.026088714599609375, 0.03190040588378906, 0.03771209716796875, 0.04352378845214844, 0.049335479736328125, 0.05514717102050781, 0.0609588623046875, 0.06677055358886719, 0.07258224487304688, 0.07839393615722656, 0.08420562744140625, 0.09001731872558594, 0.09582901000976562, 0.10164070129394531, 0.107452392578125, 0.11326408386230469, 0.11907577514648438, 0.12488746643066406, 0.13069915771484375, 0.13651084899902344, 0.14232254028320312, 0.1481342315673828, 0.1539459228515625, 0.1597576141357422, 0.16556930541992188, 0.17138099670410156, 0.17719268798828125, 0.18300437927246094, 0.18881607055664062, 0.1946277618408203, 0.200439453125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 4.0, 3.0, 4.0, 4.0, 5.0, 4.0, 3.0, 9.0, 18.0, 14.0, 17.0, 24.0, 34.0, 46.0, 74.0, 105.0, 153.0, 148.0, 103.0, 66.0, 46.0, 18.0, 22.0, 16.0, 11.0, 12.0, 14.0, 5.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8650817275047302, -0.8403849005699158, -0.8156881332397461, -0.7909913063049316, -0.766294538974762, -0.7415977120399475, -0.7169009447097778, -0.6922041177749634, -0.6675072908401489, -0.6428104639053345, -0.6181136965751648, -0.5934168696403503, -0.5687201023101807, -0.5440232753753662, -0.5193264484405518, -0.4946296811103821, -0.4699329137802124, -0.44523611664772034, -0.42053931951522827, -0.3958424925804138, -0.37114572525024414, -0.3464488983154297, -0.3217521011829376, -0.29705530405044556, -0.2723585069179535, -0.24766170978546143, -0.22296491265296936, -0.1982681006193161, -0.17357130348682404, -0.14887450635433197, -0.12417769432067871, -0.09948089718818665, -0.07478410005569458, -0.050087299197912216, -0.025390498340129852, -0.0006936937570571899, 0.024003103375434875, 0.04869990050792694, 0.0733967125415802, 0.09809350967407227, 0.12279030680656433, 0.1474871039390564, 0.17218390107154846, 0.19688071310520172, 0.2215775102376938, 0.24627430737018585, 0.2709711194038391, 0.2956679165363312, 0.32036471366882324, 0.3450615108013153, 0.3697583079338074, 0.3944551348686218, 0.4191519021987915, 0.44384872913360596, 0.468545526266098, 0.4932423233985901, 0.5179390907287598, 0.5426359176635742, 0.5673326849937439, 0.5920295119285583, 0.616726279258728, 0.6414231061935425, 0.6661199331283569, 0.6908167004585266, 0.7155135273933411]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 7.0, 6.0, 8.0, 5.0, 16.0, 11.0, 9.0, 14.0, 20.0, 28.0, 28.0, 21.0, 44.0, 35.0, 44.0, 38.0, 44.0, 57.0, 39.0, 62.0, 68.0, 38.0, 54.0, 38.0, 27.0, 35.0, 28.0, 28.0, 26.0, 20.0, 16.0, 22.0, 15.0, 15.0, 10.0, 10.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5958070158958435, -0.578436017036438, -0.5610649585723877, -0.5436939597129822, -0.5263229608535767, -0.5089519023895264, -0.49158090353012085, -0.47420987486839294, -0.45683884620666504, -0.43946781754493713, -0.42209678888320923, -0.4047257900238037, -0.3873547613620758, -0.3699837327003479, -0.3526127338409424, -0.3352417051792145, -0.3178706765174866, -0.30049964785575867, -0.28312861919403076, -0.26575762033462524, -0.24838659167289734, -0.23101556301116943, -0.21364454925060272, -0.196273535490036, -0.1789025068283081, -0.1615314781665802, -0.1441604644060135, -0.12678945064544678, -0.10941842198371887, -0.09204740077257156, -0.07467637956142426, -0.05730535835027695, -0.03993427753448486, -0.022563256323337555, -0.005192235112190247, 0.012178786098957062, 0.02954980731010437, 0.04692082852125168, 0.06429184973239899, 0.0816628709435463, 0.0990338921546936, 0.11640491336584091, 0.13377593457698822, 0.15114694833755493, 0.16851797699928284, 0.18588900566101074, 0.20326001942157745, 0.22063103318214417, 0.23800206184387207, 0.2553730905056, 0.2727441191673279, 0.2901151180267334, 0.3074861466884613, 0.3248571753501892, 0.3422281742095947, 0.35959920287132263, 0.37697023153305054, 0.39434126019477844, 0.41171228885650635, 0.42908328771591187, 0.44645431637763977, 0.4638253450393677, 0.4811963438987732, 0.4985673725605011, 0.515938401222229]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 7.0, 6.0, 10.0, 11.0, 20.0, 19.0, 20.0, 44.0, 51.0, 78.0, 111.0, 172.0, 270.0, 394.0, 751.0, 1368.0, 3325.0, 9965.0, 49247.0, 721596.0, 224831.0, 24868.0, 6368.0, 2284.0, 1083.0, 578.0, 341.0, 224.0, 129.0, 115.0, 71.0, 46.0, 37.0, 30.0, 16.0, 15.0, 11.0, 9.0, 8.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80810546875, -0.7809982299804688, -0.7538909912109375, -0.7267837524414062, -0.699676513671875, -0.6725692749023438, -0.6454620361328125, -0.6183547973632812, -0.59124755859375, -0.5641403198242188, -0.5370330810546875, -0.5099258422851562, -0.482818603515625, -0.45571136474609375, -0.4286041259765625, -0.40149688720703125, -0.3743896484375, -0.34728240966796875, -0.3201751708984375, -0.29306793212890625, -0.265960693359375, -0.23885345458984375, -0.2117462158203125, -0.18463897705078125, -0.15753173828125, -0.13042449951171875, -0.1033172607421875, -0.07621002197265625, -0.049102783203125, -0.02199554443359375, 0.0051116943359375, 0.03221893310546875, 0.059326171875, 0.08643341064453125, 0.1135406494140625, 0.14064788818359375, 0.167755126953125, 0.19486236572265625, 0.2219696044921875, 0.24907684326171875, 0.27618408203125, 0.30329132080078125, 0.3303985595703125, 0.35750579833984375, 0.384613037109375, 0.41172027587890625, 0.4388275146484375, 0.46593475341796875, 0.4930419921875, 0.5201492309570312, 0.5472564697265625, 0.5743637084960938, 0.601470947265625, 0.6285781860351562, 0.6556854248046875, 0.6827926635742188, 0.70989990234375, 0.7370071411132812, 0.7641143798828125, 0.7912216186523438, 0.818328857421875, 0.8454360961914062, 0.8725433349609375, 0.8996505737304688, 0.9267578125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 5.0, 10.0, 16.0, 34.0, 49.0, 76.0, 88.0, 149.0, 138.0, 129.0, 114.0, 68.0, 63.0, 24.0, 11.0, 8.0, 9.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13232421875, -0.12836647033691406, -0.12440872192382812, -0.12045097351074219, -0.11649322509765625, -0.11253547668457031, -0.10857772827148438, -0.10461997985839844, -0.1006622314453125, -0.09670448303222656, -0.09274673461914062, -0.08878898620605469, -0.08483123779296875, -0.08087348937988281, -0.07691574096679688, -0.07295799255371094, -0.069000244140625, -0.06504249572753906, -0.061084747314453125, -0.05712699890136719, -0.05316925048828125, -0.04921150207519531, -0.045253753662109375, -0.04129600524902344, -0.0373382568359375, -0.03338050842285156, -0.029422760009765625, -0.025465011596679688, -0.02150726318359375, -0.017549514770507812, -0.013591766357421875, -0.009634017944335938, -0.00567626953125, -0.0017185211181640625, 0.002239227294921875, 0.0061969757080078125, 0.01015472412109375, 0.014112472534179688, 0.018070220947265625, 0.022027969360351562, 0.0259857177734375, 0.029943466186523438, 0.033901214599609375, 0.03785896301269531, 0.04181671142578125, 0.04577445983886719, 0.049732208251953125, 0.05368995666503906, 0.057647705078125, 0.06160545349121094, 0.06556320190429688, 0.06952095031738281, 0.07347869873046875, 0.07743644714355469, 0.08139419555664062, 0.08535194396972656, 0.0893096923828125, 0.09326744079589844, 0.09722518920898438, 0.10118293762207031, 0.10514068603515625, 0.10909843444824219, 0.11305618286132812, 0.11701393127441406, 0.1209716796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 4.0, 8.0, 11.0, 20.0, 34.0, 46.0, 91.0, 128.0, 256.0, 438.0, 915.0, 1960.0, 4991.0, 16036.0, 81992.0, 825466.0, 89991.0, 16796.0, 5270.0, 2045.0, 917.0, 499.0, 268.0, 143.0, 85.0, 40.0, 30.0, 23.0, 13.0, 10.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81787109375, -0.7934722900390625, -0.769073486328125, -0.7446746826171875, -0.72027587890625, -0.6958770751953125, -0.671478271484375, -0.6470794677734375, -0.6226806640625, -0.5982818603515625, -0.573883056640625, -0.5494842529296875, -0.52508544921875, -0.5006866455078125, -0.476287841796875, -0.4518890380859375, -0.427490234375, -0.4030914306640625, -0.378692626953125, -0.3542938232421875, -0.32989501953125, -0.3054962158203125, -0.281097412109375, -0.2566986083984375, -0.2322998046875, -0.2079010009765625, -0.183502197265625, -0.1591033935546875, -0.13470458984375, -0.1103057861328125, -0.085906982421875, -0.0615081787109375, -0.037109375, -0.0127105712890625, 0.011688232421875, 0.0360870361328125, 0.06048583984375, 0.0848846435546875, 0.109283447265625, 0.1336822509765625, 0.1580810546875, 0.1824798583984375, 0.206878662109375, 0.2312774658203125, 0.25567626953125, 0.2800750732421875, 0.304473876953125, 0.3288726806640625, 0.353271484375, 0.3776702880859375, 0.402069091796875, 0.4264678955078125, 0.45086669921875, 0.4752655029296875, 0.499664306640625, 0.5240631103515625, 0.5484619140625, 0.5728607177734375, 0.597259521484375, 0.6216583251953125, 0.64605712890625, 0.6704559326171875, 0.694854736328125, 0.7192535400390625, 0.74365234375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 0.0, 4.0, 8.0, 7.0, 5.0, 9.0, 13.0, 14.0, 19.0, 25.0, 30.0, 47.0, 35.0, 44.0, 61.0, 81.0, 46.0, 67.0, 75.0, 56.0, 66.0, 70.0, 51.0, 30.0, 35.0, 25.0, 16.0, 15.0, 10.0, 6.0, 8.0, 3.0, 4.0, 1.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.359375, -0.3489112854003906, -0.33844757080078125, -0.3279838562011719, -0.3175201416015625, -0.3070564270019531, -0.29659271240234375, -0.2861289978027344, -0.275665283203125, -0.2652015686035156, -0.25473785400390625, -0.24427413940429688, -0.2338104248046875, -0.22334671020507812, -0.21288299560546875, -0.20241928100585938, -0.19195556640625, -0.18149185180664062, -0.17102813720703125, -0.16056442260742188, -0.1501007080078125, -0.13963699340820312, -0.12917327880859375, -0.11870956420898438, -0.108245849609375, -0.09778213500976562, -0.08731842041015625, -0.07685470581054688, -0.0663909912109375, -0.055927276611328125, -0.04546356201171875, -0.034999847412109375, -0.0245361328125, -0.014072418212890625, -0.00360870361328125, 0.006855010986328125, 0.0173187255859375, 0.027782440185546875, 0.03824615478515625, 0.048709869384765625, 0.059173583984375, 0.06963729858398438, 0.08010101318359375, 0.09056472778320312, 0.1010284423828125, 0.11149215698242188, 0.12195587158203125, 0.13241958618164062, 0.14288330078125, 0.15334701538085938, 0.16381072998046875, 0.17427444458007812, 0.1847381591796875, 0.19520187377929688, 0.20566558837890625, 0.21612930297851562, 0.226593017578125, 0.23705673217773438, 0.24752044677734375, 0.2579841613769531, 0.2684478759765625, 0.2789115905761719, 0.28937530517578125, 0.2998390197753906, 0.310302734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 1.0, 5.0, 10.0, 24.0, 28.0, 35.0, 41.0, 73.0, 144.0, 169.0, 220.0, 364.0, 597.0, 864.0, 1376.0, 2317.0, 3999.0, 7441.0, 16068.0, 41451.0, 176961.0, 666149.0, 80087.0, 25544.0, 11142.0, 5501.0, 2960.0, 1748.0, 1129.0, 682.0, 482.0, 283.0, 212.0, 151.0, 95.0, 67.0, 42.0, 32.0, 15.0, 15.0, 12.0, 10.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0243988037109375, -0.023642539978027344, -0.022886276245117188, -0.02213001251220703, -0.021373748779296875, -0.02061748504638672, -0.019861221313476562, -0.019104957580566406, -0.01834869384765625, -0.017592430114746094, -0.016836166381835938, -0.01607990264892578, -0.015323638916015625, -0.014567375183105469, -0.013811111450195312, -0.013054847717285156, -0.012298583984375, -0.011542320251464844, -0.010786056518554688, -0.010029792785644531, -0.009273529052734375, -0.008517265319824219, -0.0077610015869140625, -0.007004737854003906, -0.00624847412109375, -0.005492210388183594, -0.0047359466552734375, -0.003979682922363281, -0.003223419189453125, -0.0024671554565429688, -0.0017108917236328125, -0.0009546279907226562, -0.0001983642578125, 0.0005578994750976562, 0.0013141632080078125, 0.0020704269409179688, 0.002826690673828125, 0.0035829544067382812, 0.0043392181396484375, 0.005095481872558594, 0.00585174560546875, 0.006608009338378906, 0.0073642730712890625, 0.008120536804199219, 0.008876800537109375, 0.009633064270019531, 0.010389328002929688, 0.011145591735839844, 0.01190185546875, 0.012658119201660156, 0.013414382934570312, 0.014170646667480469, 0.014926910400390625, 0.01568317413330078, 0.016439437866210938, 0.017195701599121094, 0.01795196533203125, 0.018708229064941406, 0.019464492797851562, 0.02022075653076172, 0.020977020263671875, 0.02173328399658203, 0.022489547729492188, 0.023245811462402344, 0.0240020751953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 11.0, 13.0, 7.0, 19.0, 31.0, 49.0, 62.0, 79.0, 98.0, 129.0, 149.0, 98.0, 77.0, 52.0, 39.0, 21.0, 25.0, 12.0, 6.0, 4.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2814998626708984e-05, -1.2448988854885101e-05, -1.2082979083061218e-05, -1.1716969311237335e-05, -1.1350959539413452e-05, -1.0984949767589569e-05, -1.0618939995765686e-05, -1.0252930223941803e-05, -9.88692045211792e-06, -9.520910680294037e-06, -9.154900908470154e-06, -8.78889113664627e-06, -8.422881364822388e-06, -8.056871592998505e-06, -7.690861821174622e-06, -7.3248520493507385e-06, -6.9588422775268555e-06, -6.592832505702972e-06, -6.226822733879089e-06, -5.860812962055206e-06, -5.494803190231323e-06, -5.12879341840744e-06, -4.762783646583557e-06, -4.396773874759674e-06, -4.030764102935791e-06, -3.664754331111908e-06, -3.298744559288025e-06, -2.932734787464142e-06, -2.566725015640259e-06, -2.2007152438163757e-06, -1.8347054719924927e-06, -1.4686957001686096e-06, -1.1026859283447266e-06, -7.366761565208435e-07, -3.7066638469696045e-07, -4.6566128730773926e-09, 3.6135315895080566e-07, 7.273629307746887e-07, 1.0933727025985718e-06, 1.4593824744224548e-06, 1.8253922462463379e-06, 2.191402018070221e-06, 2.557411789894104e-06, 2.923421561717987e-06, 3.28943133354187e-06, 3.655441105365753e-06, 4.021450877189636e-06, 4.387460649013519e-06, 4.753470420837402e-06, 5.119480192661285e-06, 5.4854899644851685e-06, 5.8514997363090515e-06, 6.2175095081329346e-06, 6.583519279956818e-06, 6.949529051780701e-06, 7.315538823604584e-06, 7.681548595428467e-06, 8.04755836725235e-06, 8.413568139076233e-06, 8.779577910900116e-06, 9.145587682723999e-06, 9.511597454547882e-06, 9.877607226371765e-06, 1.0243616998195648e-05, 1.0609626770019531e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 3.0, 7.0, 9.0, 19.0, 21.0, 30.0, 49.0, 92.0, 147.0, 262.0, 516.0, 1191.0, 2914.0, 9305.0, 48529.0, 871569.0, 93633.0, 13421.0, 3937.0, 1514.0, 632.0, 309.0, 151.0, 105.0, 57.0, 39.0, 35.0, 13.0, 10.0, 3.0, 13.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.0697021484375, -0.06802797317504883, -0.06635379791259766, -0.06467962265014648, -0.06300544738769531, -0.06133127212524414, -0.05965709686279297, -0.0579829216003418, -0.056308746337890625, -0.05463457107543945, -0.05296039581298828, -0.05128622055053711, -0.04961204528808594, -0.047937870025634766, -0.046263694763183594, -0.04458951950073242, -0.04291534423828125, -0.04124116897583008, -0.039566993713378906, -0.037892818450927734, -0.03621864318847656, -0.03454446792602539, -0.03287029266357422, -0.031196117401123047, -0.029521942138671875, -0.027847766876220703, -0.02617359161376953, -0.02449941635131836, -0.022825241088867188, -0.021151065826416016, -0.019476890563964844, -0.017802715301513672, -0.0161285400390625, -0.014454364776611328, -0.012780189514160156, -0.011106014251708984, -0.009431838989257812, -0.007757663726806641, -0.006083488464355469, -0.004409313201904297, -0.002735137939453125, -0.0010609626770019531, 0.0006132125854492188, 0.0022873878479003906, 0.0039615631103515625, 0.005635738372802734, 0.007309913635253906, 0.008984088897705078, 0.01065826416015625, 0.012332439422607422, 0.014006614685058594, 0.015680789947509766, 0.017354965209960938, 0.01902914047241211, 0.02070331573486328, 0.022377490997314453, 0.024051666259765625, 0.025725841522216797, 0.02740001678466797, 0.02907419204711914, 0.030748367309570312, 0.032422542572021484, 0.034096717834472656, 0.03577089309692383, 0.037445068359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 8.0, 18.0, 26.0, 20.0, 22.0, 41.0, 39.0, 62.0, 98.0, 125.0, 121.0, 107.0, 70.0, 57.0, 48.0, 31.0, 15.0, 10.0, 12.0, 10.0, 8.0, 11.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.029876708984375, -0.029152631759643555, -0.02842855453491211, -0.027704477310180664, -0.02698040008544922, -0.026256322860717773, -0.025532245635986328, -0.024808168411254883, -0.024084091186523438, -0.023360013961791992, -0.022635936737060547, -0.0219118595123291, -0.021187782287597656, -0.02046370506286621, -0.019739627838134766, -0.01901555061340332, -0.018291473388671875, -0.01756739616394043, -0.016843318939208984, -0.01611924171447754, -0.015395164489746094, -0.014671087265014648, -0.013947010040283203, -0.013222932815551758, -0.012498855590820312, -0.011774778366088867, -0.011050701141357422, -0.010326623916625977, -0.009602546691894531, -0.008878469467163086, -0.00815439224243164, -0.007430315017700195, -0.00670623779296875, -0.005982160568237305, -0.005258083343505859, -0.004534006118774414, -0.0038099288940429688, -0.0030858516693115234, -0.002361774444580078, -0.0016376972198486328, -0.0009136199951171875, -0.0001895427703857422, 0.0005345344543457031, 0.0012586116790771484, 0.0019826889038085938, 0.002706766128540039, 0.0034308433532714844, 0.00415492057800293, 0.004878997802734375, 0.00560307502746582, 0.006327152252197266, 0.007051229476928711, 0.007775306701660156, 0.008499383926391602, 0.009223461151123047, 0.009947538375854492, 0.010671615600585938, 0.011395692825317383, 0.012119770050048828, 0.012843847274780273, 0.013567924499511719, 0.014292001724243164, 0.01501607894897461, 0.015740156173706055, 0.0164642333984375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 6.0, 9.0, 15.0, 21.0, 13.0, 26.0, 24.0, 36.0, 52.0, 64.0, 111.0, 233.0, 96.0, 72.0, 46.0, 39.0, 23.0, 19.0, 10.0, 10.0, 7.0, 13.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1504859924316406, -1.1150015592575073, -1.079517126083374, -1.0440326929092407, -1.0085482597351074, -0.9730638265609741, -0.9375793933868408, -0.9020949602127075, -0.8666105270385742, -0.8311260938644409, -0.7956416606903076, -0.7601572275161743, -0.724672794342041, -0.6891883611679077, -0.6537039279937744, -0.6182194948196411, -0.5827350616455078, -0.5472506284713745, -0.5117661952972412, -0.4762817621231079, -0.4407973289489746, -0.4053128957748413, -0.369828462600708, -0.3343440294265747, -0.2988595962524414, -0.2633751630783081, -0.2278907299041748, -0.1924062967300415, -0.1569218635559082, -0.1214374303817749, -0.0859529972076416, -0.0504685640335083, -0.01498425006866455, 0.02050018310546875, 0.05598461627960205, 0.09146904945373535, 0.12695348262786865, 0.16243791580200195, 0.19792234897613525, 0.23340678215026855, 0.26889121532440186, 0.30437564849853516, 0.33986008167266846, 0.37534451484680176, 0.41082894802093506, 0.44631338119506836, 0.48179781436920166, 0.517282247543335, 0.5527666807174683, 0.5882511138916016, 0.6237355470657349, 0.6592199802398682, 0.6947044134140015, 0.7301888465881348, 0.7656732797622681, 0.8011577129364014, 0.8366421461105347, 0.872126579284668, 0.9076110124588013, 0.9430954456329346, 0.9785798788070679, 1.0140643119812012, 1.0495487451553345, 1.0850331783294678, 1.120517611503601]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 18.0, 18.0, 23.0, 18.0, 24.0, 26.0, 31.0, 43.0, 41.0, 56.0, 58.0, 77.0, 105.0, 77.0, 66.0, 37.0, 43.0, 39.0, 33.0, 27.0, 22.0, 29.0, 16.0, 12.0, 10.0, 10.0, 4.0, 7.0, 5.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9617964029312134, -0.9268282651901245, -0.8918601870536804, -0.8568920493125916, -0.8219239711761475, -0.7869558334350586, -0.7519876956939697, -0.7170195579528809, -0.6820514798164368, -0.6470833420753479, -0.6121152639389038, -0.5771471261978149, -0.5421789884567261, -0.507210910320282, -0.4722427725791931, -0.43727466464042664, -0.40230655670166016, -0.3673384487628937, -0.3323703408241272, -0.29740220308303833, -0.26243409514427185, -0.22746598720550537, -0.1924978643655777, -0.15752974152565002, -0.12256163358688354, -0.08759351819753647, -0.05262540280818939, -0.017657287418842316, 0.01731082797050476, 0.05227893590927124, 0.08724705874919891, 0.12221518158912659, 0.15718340873718262, 0.1921515166759491, 0.22711963951587677, 0.26208776235580444, 0.2970558702945709, 0.3320239782333374, 0.36699211597442627, 0.40196022391319275, 0.43692833185195923, 0.4718964397907257, 0.5068645477294922, 0.541832685470581, 0.5768008232116699, 0.611768901348114, 0.6467370390892029, 0.681705117225647, 0.7166732549667358, 0.7516413927078247, 0.7866094708442688, 0.8215776085853577, 0.8565456867218018, 0.8915138244628906, 0.9264819622039795, 0.9614500999450684, 0.9964181780815125, 1.0313862562179565, 1.0663543939590454, 1.1013225317001343, 1.1362906694412231, 1.1712586879730225, 1.2062268257141113, 1.2411949634552002, 1.276163101196289]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 9.0, 4.0, 8.0, 4.0, 10.0, 14.0, 32.0, 39.0, 63.0, 98.0, 150.0, 214.0, 355.0, 566.0, 1003.0, 2093.0, 5594.0, 18979.0, 122103.0, 3579716.0, 414614.0, 34332.0, 7418.0, 3001.0, 1542.0, 918.0, 605.0, 321.0, 164.0, 111.0, 68.0, 33.0, 21.0, 24.0, 14.0, 5.0, 6.0, 8.0, 7.0, 2.0, 5.0, 6.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.2861328125, -1.24908447265625, -1.2120361328125, -1.17498779296875, -1.137939453125, -1.10089111328125, -1.0638427734375, -1.02679443359375, -0.98974609375, -0.95269775390625, -0.9156494140625, -0.87860107421875, -0.841552734375, -0.80450439453125, -0.7674560546875, -0.73040771484375, -0.693359375, -0.65631103515625, -0.6192626953125, -0.58221435546875, -0.545166015625, -0.50811767578125, -0.4710693359375, -0.43402099609375, -0.39697265625, -0.35992431640625, -0.3228759765625, -0.28582763671875, -0.248779296875, -0.21173095703125, -0.1746826171875, -0.13763427734375, -0.1005859375, -0.06353759765625, -0.0264892578125, 0.01055908203125, 0.047607421875, 0.08465576171875, 0.1217041015625, 0.15875244140625, 0.19580078125, 0.23284912109375, 0.2698974609375, 0.30694580078125, 0.343994140625, 0.38104248046875, 0.4180908203125, 0.45513916015625, 0.4921875, 0.52923583984375, 0.5662841796875, 0.60333251953125, 0.640380859375, 0.67742919921875, 0.7144775390625, 0.75152587890625, 0.78857421875, 0.82562255859375, 0.8626708984375, 0.89971923828125, 0.936767578125, 0.97381591796875, 1.0108642578125, 1.04791259765625, 1.0849609375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 7.0, 18.0, 32.0, 46.0, 74.0, 96.0, 138.0, 162.0, 119.0, 103.0, 81.0, 55.0, 23.0, 17.0, 9.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.132568359375, -0.12860965728759766, -0.12465095520019531, -0.12069225311279297, -0.11673355102539062, -0.11277484893798828, -0.10881614685058594, -0.1048574447631836, -0.10089874267578125, -0.0969400405883789, -0.09298133850097656, -0.08902263641357422, -0.08506393432617188, -0.08110523223876953, -0.07714653015136719, -0.07318782806396484, -0.0692291259765625, -0.06527042388916016, -0.06131172180175781, -0.05735301971435547, -0.053394317626953125, -0.04943561553955078, -0.04547691345214844, -0.041518211364746094, -0.03755950927734375, -0.033600807189941406, -0.029642105102539062, -0.02568340301513672, -0.021724700927734375, -0.01776599884033203, -0.013807296752929688, -0.009848594665527344, -0.005889892578125, -0.0019311904907226562, 0.0020275115966796875, 0.005986213684082031, 0.009944915771484375, 0.013903617858886719, 0.017862319946289062, 0.021821022033691406, 0.02577972412109375, 0.029738426208496094, 0.03369712829589844, 0.03765583038330078, 0.041614532470703125, 0.04557323455810547, 0.04953193664550781, 0.053490638732910156, 0.0574493408203125, 0.061408042907714844, 0.06536674499511719, 0.06932544708251953, 0.07328414916992188, 0.07724285125732422, 0.08120155334472656, 0.0851602554321289, 0.08911895751953125, 0.0930776596069336, 0.09703636169433594, 0.10099506378173828, 0.10495376586914062, 0.10891246795654297, 0.11287117004394531, 0.11682987213134766, 0.12078857421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 10.0, 21.0, 25.0, 43.0, 62.0, 118.0, 169.0, 247.0, 376.0, 625.0, 1065.0, 1619.0, 2835.0, 4842.0, 8424.0, 15730.0, 31985.0, 68706.0, 172169.0, 568988.0, 2467282.0, 546866.0, 166846.0, 67503.0, 31083.0, 15834.0, 8527.0, 4761.0, 2845.0, 1783.0, 1068.0, 667.0, 416.0, 300.0, 155.0, 120.0, 57.0, 40.0, 24.0, 17.0, 9.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.251953125, -0.243408203125, -0.23486328125, -0.226318359375, -0.2177734375, -0.209228515625, -0.20068359375, -0.192138671875, -0.18359375, -0.175048828125, -0.16650390625, -0.157958984375, -0.1494140625, -0.140869140625, -0.13232421875, -0.123779296875, -0.115234375, -0.106689453125, -0.09814453125, -0.089599609375, -0.0810546875, -0.072509765625, -0.06396484375, -0.055419921875, -0.046875, -0.038330078125, -0.02978515625, -0.021240234375, -0.0126953125, -0.004150390625, 0.00439453125, 0.012939453125, 0.021484375, 0.030029296875, 0.03857421875, 0.047119140625, 0.0556640625, 0.064208984375, 0.07275390625, 0.081298828125, 0.08984375, 0.098388671875, 0.10693359375, 0.115478515625, 0.1240234375, 0.132568359375, 0.14111328125, 0.149658203125, 0.158203125, 0.166748046875, 0.17529296875, 0.183837890625, 0.1923828125, 0.200927734375, 0.20947265625, 0.218017578125, 0.2265625, 0.235107421875, 0.24365234375, 0.252197265625, 0.2607421875, 0.269287109375, 0.27783203125, 0.286376953125, 0.294921875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 12.0, 6.0, 11.0, 9.0, 9.0, 23.0, 20.0, 24.0, 54.0, 36.0, 53.0, 72.0, 103.0, 124.0, 136.0, 193.0, 218.0, 283.0, 536.0, 529.0, 336.0, 221.0, 205.0, 178.0, 134.0, 109.0, 86.0, 73.0, 58.0, 44.0, 41.0, 38.0, 22.0, 21.0, 16.0, 11.0, 11.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 3.0], "bins": [-0.4150390625, -0.4043998718261719, -0.39376068115234375, -0.3831214904785156, -0.3724822998046875, -0.3618431091308594, -0.35120391845703125, -0.3405647277832031, -0.329925537109375, -0.3192863464355469, -0.30864715576171875, -0.2980079650878906, -0.2873687744140625, -0.2767295837402344, -0.26609039306640625, -0.2554512023925781, -0.24481201171875, -0.23417282104492188, -0.22353363037109375, -0.21289443969726562, -0.2022552490234375, -0.19161605834960938, -0.18097686767578125, -0.17033767700195312, -0.159698486328125, -0.14905929565429688, -0.13842010498046875, -0.12778091430664062, -0.1171417236328125, -0.10650253295898438, -0.09586334228515625, -0.08522415161132812, -0.0745849609375, -0.06394577026367188, -0.05330657958984375, -0.042667388916015625, -0.0320281982421875, -0.021389007568359375, -0.01074981689453125, -0.000110626220703125, 0.010528564453125, 0.021167755126953125, 0.03180694580078125, 0.042446136474609375, 0.0530853271484375, 0.06372451782226562, 0.07436370849609375, 0.08500289916992188, 0.09564208984375, 0.10628128051757812, 0.11692047119140625, 0.12755966186523438, 0.1381988525390625, 0.14883804321289062, 0.15947723388671875, 0.17011642456054688, 0.180755615234375, 0.19139480590820312, 0.20203399658203125, 0.21267318725585938, 0.2233123779296875, 0.23395156860351562, 0.24459075927734375, 0.2552299499511719, 0.265869140625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 9.0, 11.0, 15.0, 10.0, 14.0, 29.0, 41.0, 66.0, 80.0, 126.0, 111.0, 85.0, 62.0, 54.0, 46.0, 29.0, 33.0, 27.0, 22.0, 26.0, 18.0, 9.0, 12.0, 11.0, 5.0, 4.0, 12.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.71455979347229, -2.607809543609619, -2.5010592937469482, -2.3943090438842773, -2.2875585556030273, -2.1808083057403564, -2.0740580558776855, -1.9673078060150146, -1.8605574369430542, -1.7538071870803833, -1.6470568180084229, -1.540306568145752, -1.433556318283081, -1.3268059492111206, -1.2200556993484497, -1.1133053302764893, -1.0065550804138184, -0.8998047709465027, -0.793054461479187, -0.6863042116165161, -0.5795539021492004, -0.47280359268188477, -0.36605334281921387, -0.2593030333518982, -0.15255272388458252, -0.04580242931842804, 0.06094786524772644, 0.16769814491271973, 0.2744484543800354, 0.3811987638473511, 0.487949013710022, 0.5946993231773376, 0.7014498710632324, 0.8082001805305481, 0.9149504899978638, 1.0217007398605347, 1.1284511089324951, 1.235201358795166, 1.341951608657837, 1.4487018585205078, 1.5554522275924683, 1.6622024774551392, 1.7689528465270996, 1.8757030963897705, 1.9824533462524414, 2.0892038345336914, 2.195953845977783, 2.302704334259033, 2.409454584121704, 2.516204833984375, 2.622955083847046, 2.729705333709717, 2.836455821990967, 2.9432060718536377, 3.0499563217163086, 3.1567065715789795, 3.2634568214416504, 3.3702070713043213, 3.476957321166992, 3.583707809448242, 3.690458059310913, 3.797208309173584, 3.903958559036255, 4.010708808898926, 4.117459297180176]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 8.0, 8.0, 10.0, 11.0, 9.0, 11.0, 17.0, 28.0, 37.0, 35.0, 40.0, 36.0, 28.0, 38.0, 37.0, 45.0, 39.0, 32.0, 39.0, 30.0, 25.0, 28.0, 36.0, 31.0, 32.0, 29.0, 36.0, 30.0, 29.0, 27.0, 27.0, 26.0, 24.0, 18.0, 11.0, 10.0, 9.0, 9.0, 3.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8354053497314453, -2.752150535583496, -2.668895959854126, -2.5856411457061768, -2.5023863315582275, -2.4191317558288574, -2.335876941680908, -2.252622127532959, -2.1693673133850098, -2.0861124992370605, -2.0028579235076904, -1.9196031093597412, -1.836348295211792, -1.7530936002731323, -1.6698389053344727, -1.5865840911865234, -1.5033295154571533, -1.4200748205184937, -1.3368200063705444, -1.2535653114318848, -1.1703104972839355, -1.0870558023452759, -1.0038011074066162, -0.9205463528633118, -0.8372915983200073, -0.7540368437767029, -0.6707820892333984, -0.5875273942947388, -0.5042726397514343, -0.4210178852081299, -0.3377631604671478, -0.25450843572616577, -0.17125344276428223, -0.08799870312213898, -0.0047439634799957275, 0.07851077616214752, 0.16176551580429077, 0.24502027034759521, 0.32827499508857727, 0.4115297198295593, 0.49478447437286377, 0.5780392289161682, 0.6612939834594727, 0.7445486783981323, 0.8278034329414368, 0.9110581874847412, 0.9943128824234009, 1.0775675773620605, 1.1608223915100098, 1.2440770864486694, 1.3273319005966187, 1.4105865955352783, 1.4938414096832275, 1.5770961046218872, 1.6603507995605469, 1.743605613708496, 1.8268603086471558, 1.9101150035858154, 1.9933698177337646, 2.076624631881714, 2.159879207611084, 2.243134021759033, 2.3263888359069824, 2.4096434116363525, 2.4928982257843018]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 8.0, 12.0, 12.0, 20.0, 30.0, 30.0, 60.0, 75.0, 134.0, 186.0, 313.0, 456.0, 747.0, 1215.0, 2200.0, 4177.0, 8511.0, 18030.0, 44039.0, 136621.0, 564326.0, 173801.0, 52730.0, 20780.0, 9192.0, 4604.0, 2519.0, 1459.0, 836.0, 512.0, 297.0, 189.0, 124.0, 81.0, 68.0, 40.0, 32.0, 20.0, 19.0, 10.0, 10.0, 10.0, 3.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.70751953125, -0.6858062744140625, -0.664093017578125, -0.6423797607421875, -0.62066650390625, -0.5989532470703125, -0.577239990234375, -0.5555267333984375, -0.5338134765625, -0.5121002197265625, -0.490386962890625, -0.4686737060546875, -0.44696044921875, -0.4252471923828125, -0.403533935546875, -0.3818206787109375, -0.360107421875, -0.3383941650390625, -0.316680908203125, -0.2949676513671875, -0.27325439453125, -0.2515411376953125, -0.229827880859375, -0.2081146240234375, -0.1864013671875, -0.1646881103515625, -0.142974853515625, -0.1212615966796875, -0.09954833984375, -0.0778350830078125, -0.056121826171875, -0.0344085693359375, -0.0126953125, 0.0090179443359375, 0.030731201171875, 0.0524444580078125, 0.07415771484375, 0.0958709716796875, 0.117584228515625, 0.1392974853515625, 0.1610107421875, 0.1827239990234375, 0.204437255859375, 0.2261505126953125, 0.24786376953125, 0.2695770263671875, 0.291290283203125, 0.3130035400390625, 0.334716796875, 0.3564300537109375, 0.378143310546875, 0.3998565673828125, 0.42156982421875, 0.4432830810546875, 0.464996337890625, 0.4867095947265625, 0.5084228515625, 0.5301361083984375, 0.551849365234375, 0.5735626220703125, 0.59527587890625, 0.6169891357421875, 0.638702392578125, 0.6604156494140625, 0.68212890625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 11.0, 13.0, 18.0, 17.0, 20.0, 22.0, 33.0, 35.0, 55.0, 70.0, 65.0, 62.0, 74.0, 68.0, 67.0, 58.0, 51.0, 60.0, 45.0, 37.0, 28.0, 21.0, 24.0, 16.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.141845703125, -0.13753700256347656, -0.13322830200195312, -0.1289196014404297, -0.12461090087890625, -0.12030220031738281, -0.11599349975585938, -0.11168479919433594, -0.1073760986328125, -0.10306739807128906, -0.09875869750976562, -0.09444999694824219, -0.09014129638671875, -0.08583259582519531, -0.08152389526367188, -0.07721519470214844, -0.072906494140625, -0.06859779357910156, -0.06428909301757812, -0.05998039245605469, -0.05567169189453125, -0.05136299133300781, -0.047054290771484375, -0.04274559020996094, -0.0384368896484375, -0.03412818908691406, -0.029819488525390625, -0.025510787963867188, -0.02120208740234375, -0.016893386840820312, -0.012584686279296875, -0.008275985717773438, -0.00396728515625, 0.0003414154052734375, 0.004650115966796875, 0.008958816528320312, 0.01326751708984375, 0.017576217651367188, 0.021884918212890625, 0.026193618774414062, 0.0305023193359375, 0.03481101989746094, 0.039119720458984375, 0.04342842102050781, 0.04773712158203125, 0.05204582214355469, 0.056354522705078125, 0.06066322326660156, 0.064971923828125, 0.06928062438964844, 0.07358932495117188, 0.07789802551269531, 0.08220672607421875, 0.08651542663574219, 0.09082412719726562, 0.09513282775878906, 0.0994415283203125, 0.10375022888183594, 0.10805892944335938, 0.11236763000488281, 0.11667633056640625, 0.12098503112792969, 0.12529373168945312, 0.12960243225097656, 0.1339111328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 7.0, 0.0, 2.0, 5.0, 10.0, 8.0, 10.0, 15.0, 19.0, 15.0, 46.0, 53.0, 77.0, 114.0, 175.0, 264.0, 423.0, 653.0, 1151.0, 1963.0, 3791.0, 8058.0, 19171.0, 62455.0, 678729.0, 203905.0, 39965.0, 14035.0, 6220.0, 3020.0, 1645.0, 924.0, 581.0, 356.0, 246.0, 140.0, 96.0, 67.0, 58.0, 28.0, 19.0, 9.0, 13.0, 7.0, 7.0, 2.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85302734375, -0.8278121948242188, -0.8025970458984375, -0.7773818969726562, -0.752166748046875, -0.7269515991210938, -0.7017364501953125, -0.6765213012695312, -0.65130615234375, -0.6260910034179688, -0.6008758544921875, -0.5756607055664062, -0.550445556640625, -0.5252304077148438, -0.5000152587890625, -0.47480010986328125, -0.4495849609375, -0.42436981201171875, -0.3991546630859375, -0.37393951416015625, -0.348724365234375, -0.32350921630859375, -0.2982940673828125, -0.27307891845703125, -0.24786376953125, -0.22264862060546875, -0.1974334716796875, -0.17221832275390625, -0.147003173828125, -0.12178802490234375, -0.0965728759765625, -0.07135772705078125, -0.046142578125, -0.02092742919921875, 0.0042877197265625, 0.02950286865234375, 0.054718017578125, 0.07993316650390625, 0.1051483154296875, 0.13036346435546875, 0.15557861328125, 0.18079376220703125, 0.2060089111328125, 0.23122406005859375, 0.256439208984375, 0.28165435791015625, 0.3068695068359375, 0.33208465576171875, 0.3572998046875, 0.38251495361328125, 0.4077301025390625, 0.43294525146484375, 0.458160400390625, 0.48337554931640625, 0.5085906982421875, 0.5338058471679688, 0.55902099609375, 0.5842361450195312, 0.6094512939453125, 0.6346664428710938, 0.659881591796875, 0.6850967407226562, 0.7103118896484375, 0.7355270385742188, 0.7607421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 6.0, 19.0, 14.0, 20.0, 27.0, 34.0, 43.0, 46.0, 61.0, 71.0, 66.0, 86.0, 71.0, 84.0, 56.0, 59.0, 39.0, 40.0, 15.0, 31.0, 18.0, 20.0, 7.0, 7.0, 7.0, 6.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.61865234375, -0.5985641479492188, -0.5784759521484375, -0.5583877563476562, -0.538299560546875, -0.5182113647460938, -0.4981231689453125, -0.47803497314453125, -0.45794677734375, -0.43785858154296875, -0.4177703857421875, -0.39768218994140625, -0.377593994140625, -0.35750579833984375, -0.3374176025390625, -0.31732940673828125, -0.2972412109375, -0.27715301513671875, -0.2570648193359375, -0.23697662353515625, -0.216888427734375, -0.19680023193359375, -0.1767120361328125, -0.15662384033203125, -0.13653564453125, -0.11644744873046875, -0.0963592529296875, -0.07627105712890625, -0.056182861328125, -0.03609466552734375, -0.0160064697265625, 0.00408172607421875, 0.024169921875, 0.04425811767578125, 0.0643463134765625, 0.08443450927734375, 0.104522705078125, 0.12461090087890625, 0.1446990966796875, 0.16478729248046875, 0.18487548828125, 0.20496368408203125, 0.2250518798828125, 0.24514007568359375, 0.265228271484375, 0.28531646728515625, 0.3054046630859375, 0.32549285888671875, 0.3455810546875, 0.36566925048828125, 0.3857574462890625, 0.40584564208984375, 0.425933837890625, 0.44602203369140625, 0.4661102294921875, 0.48619842529296875, 0.50628662109375, 0.5263748168945312, 0.5464630126953125, 0.5665512084960938, 0.586639404296875, 0.6067276000976562, 0.6268157958984375, 0.6469039916992188, 0.6669921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 9.0, 7.0, 13.0, 17.0, 16.0, 38.0, 61.0, 84.0, 151.0, 249.0, 450.0, 890.0, 1833.0, 4195.0, 12546.0, 72986.0, 880093.0, 56622.0, 11066.0, 3690.0, 1681.0, 824.0, 430.0, 231.0, 128.0, 71.0, 70.0, 31.0, 18.0, 20.0, 12.0, 3.0, 3.0, 9.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1180419921875, -0.114288330078125, -0.11053466796875, -0.106781005859375, -0.10302734375, -0.099273681640625, -0.09552001953125, -0.091766357421875, -0.0880126953125, -0.084259033203125, -0.08050537109375, -0.076751708984375, -0.072998046875, -0.069244384765625, -0.06549072265625, -0.061737060546875, -0.0579833984375, -0.054229736328125, -0.05047607421875, -0.046722412109375, -0.04296875, -0.039215087890625, -0.03546142578125, -0.031707763671875, -0.0279541015625, -0.024200439453125, -0.02044677734375, -0.016693115234375, -0.012939453125, -0.009185791015625, -0.00543212890625, -0.001678466796875, 0.0020751953125, 0.005828857421875, 0.00958251953125, 0.013336181640625, 0.01708984375, 0.020843505859375, 0.02459716796875, 0.028350830078125, 0.0321044921875, 0.035858154296875, 0.03961181640625, 0.043365478515625, 0.047119140625, 0.050872802734375, 0.05462646484375, 0.058380126953125, 0.0621337890625, 0.065887451171875, 0.06964111328125, 0.073394775390625, 0.0771484375, 0.080902099609375, 0.08465576171875, 0.088409423828125, 0.0921630859375, 0.095916748046875, 0.09967041015625, 0.103424072265625, 0.107177734375, 0.110931396484375, 0.11468505859375, 0.118438720703125, 0.1221923828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 8.0, 7.0, 10.0, 12.0, 9.0, 26.0, 26.0, 55.0, 90.0, 182.0, 189.0, 131.0, 84.0, 34.0, 35.0, 14.0, 16.0, 17.0, 8.0, 7.0, 11.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4318695068359375e-05, -2.354290336370468e-05, -2.2767111659049988e-05, -2.1991319954395294e-05, -2.12155282497406e-05, -2.0439736545085907e-05, -1.9663944840431213e-05, -1.888815313577652e-05, -1.8112361431121826e-05, -1.7336569726467133e-05, -1.656077802181244e-05, -1.5784986317157745e-05, -1.5009194612503052e-05, -1.4233402907848358e-05, -1.3457611203193665e-05, -1.2681819498538971e-05, -1.1906027793884277e-05, -1.1130236089229584e-05, -1.035444438457489e-05, -9.578652679920197e-06, -8.802860975265503e-06, -8.02706927061081e-06, -7.251277565956116e-06, -6.475485861301422e-06, -5.6996941566467285e-06, -4.923902451992035e-06, -4.148110747337341e-06, -3.3723190426826477e-06, -2.596527338027954e-06, -1.8207356333732605e-06, -1.044943928718567e-06, -2.691522240638733e-07, 5.066394805908203e-07, 1.282431185245514e-06, 2.0582228899002075e-06, 2.834014594554901e-06, 3.6098062992095947e-06, 4.385598003864288e-06, 5.161389708518982e-06, 5.9371814131736755e-06, 6.712973117828369e-06, 7.488764822483063e-06, 8.264556527137756e-06, 9.04034823179245e-06, 9.816139936447144e-06, 1.0591931641101837e-05, 1.136772334575653e-05, 1.2143515050411224e-05, 1.2919306755065918e-05, 1.3695098459720612e-05, 1.4470890164375305e-05, 1.5246681869029999e-05, 1.6022473573684692e-05, 1.6798265278339386e-05, 1.757405698299408e-05, 1.8349848687648773e-05, 1.9125640392303467e-05, 1.990143209695816e-05, 2.0677223801612854e-05, 2.1453015506267548e-05, 2.222880721092224e-05, 2.3004598915576935e-05, 2.378039062023163e-05, 2.4556182324886322e-05, 2.5331974029541016e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 13.0, 12.0, 19.0, 27.0, 39.0, 56.0, 72.0, 134.0, 210.0, 277.0, 422.0, 686.0, 1119.0, 1987.0, 3856.0, 8089.0, 20357.0, 84487.0, 797707.0, 90557.0, 21072.0, 8203.0, 3928.0, 2042.0, 1220.0, 690.0, 441.0, 252.0, 162.0, 124.0, 68.0, 61.0, 40.0, 36.0, 22.0, 12.0, 17.0, 6.0, 6.0, 6.0, 8.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07080078125, -0.06868839263916016, -0.06657600402832031, -0.06446361541748047, -0.062351226806640625, -0.06023883819580078, -0.05812644958496094, -0.056014060974121094, -0.05390167236328125, -0.051789283752441406, -0.04967689514160156, -0.04756450653076172, -0.045452117919921875, -0.04333972930908203, -0.04122734069824219, -0.039114952087402344, -0.0370025634765625, -0.034890174865722656, -0.03277778625488281, -0.03066539764404297, -0.028553009033203125, -0.02644062042236328, -0.024328231811523438, -0.022215843200683594, -0.02010345458984375, -0.017991065979003906, -0.015878677368164062, -0.013766288757324219, -0.011653900146484375, -0.009541511535644531, -0.0074291229248046875, -0.005316734313964844, -0.003204345703125, -0.0010919570922851562, 0.0010204315185546875, 0.0031328201293945312, 0.005245208740234375, 0.007357597351074219, 0.009469985961914062, 0.011582374572753906, 0.01369476318359375, 0.015807151794433594, 0.017919540405273438, 0.02003192901611328, 0.022144317626953125, 0.02425670623779297, 0.026369094848632812, 0.028481483459472656, 0.0305938720703125, 0.032706260681152344, 0.03481864929199219, 0.03693103790283203, 0.039043426513671875, 0.04115581512451172, 0.04326820373535156, 0.045380592346191406, 0.04749298095703125, 0.049605369567871094, 0.05171775817871094, 0.05383014678955078, 0.055942535400390625, 0.05805492401123047, 0.06016731262207031, 0.062279701232910156, 0.06439208984375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 4.0, 5.0, 2.0, 6.0, 8.0, 2.0, 4.0, 14.0, 21.0, 30.0, 28.0, 37.0, 58.0, 65.0, 98.0, 117.0, 117.0, 96.0, 79.0, 50.0, 27.0, 24.0, 14.0, 14.0, 13.0, 13.0, 10.0, 9.0, 5.0, 7.0, 2.0, 1.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.051300048828125, -0.04962635040283203, -0.04795265197753906, -0.046278953552246094, -0.044605255126953125, -0.042931556701660156, -0.04125785827636719, -0.03958415985107422, -0.03791046142578125, -0.03623676300048828, -0.03456306457519531, -0.032889366149902344, -0.031215667724609375, -0.029541969299316406, -0.027868270874023438, -0.02619457244873047, -0.0245208740234375, -0.02284717559814453, -0.021173477172851562, -0.019499778747558594, -0.017826080322265625, -0.016152381896972656, -0.014478683471679688, -0.012804985046386719, -0.01113128662109375, -0.009457588195800781, -0.0077838897705078125, -0.006110191345214844, -0.004436492919921875, -0.0027627944946289062, -0.0010890960693359375, 0.0005846023559570312, 0.00225830078125, 0.003931999206542969, 0.0056056976318359375, 0.007279396057128906, 0.008953094482421875, 0.010626792907714844, 0.012300491333007812, 0.013974189758300781, 0.01564788818359375, 0.01732158660888672, 0.018995285034179688, 0.020668983459472656, 0.022342681884765625, 0.024016380310058594, 0.025690078735351562, 0.02736377716064453, 0.0290374755859375, 0.03071117401123047, 0.03238487243652344, 0.034058570861816406, 0.035732269287109375, 0.037405967712402344, 0.03907966613769531, 0.04075336456298828, 0.04242706298828125, 0.04410076141357422, 0.04577445983886719, 0.047448158264160156, 0.049121856689453125, 0.050795555114746094, 0.05246925354003906, 0.05414295196533203, 0.055816650390625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 6.0, 17.0, 21.0, 29.0, 23.0, 36.0, 59.0, 90.0, 185.0, 289.0, 91.0, 46.0, 33.0, 22.0, 18.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.372138023376465, -4.2660064697265625, -4.159875392913818, -4.053743839263916, -3.9476125240325928, -3.8414812088012695, -3.7353498935699463, -3.629218578338623, -3.5230872631073, -3.4169559478759766, -3.3108246326446533, -3.20469331741333, -3.0985617637634277, -2.9924304485321045, -2.8862991333007812, -2.780167818069458, -2.6740365028381348, -2.5679051876068115, -2.4617738723754883, -2.355642318725586, -2.2495110034942627, -2.1433796882629395, -2.037248373031616, -1.931117057800293, -1.8249855041503906, -1.7188541889190674, -1.6127227544784546, -1.5065914392471313, -1.400460124015808, -1.2943286895751953, -1.188197374343872, -1.0820660591125488, -0.9759347438812256, -0.8698033690452576, -0.7636720538139343, -0.6575406789779663, -0.5514093637466431, -0.44527798891067505, -0.33914661407470703, -0.2330152988433838, -0.12688392400741577, -0.020752571523189545, 0.08537878096103668, 0.1915101408958435, 0.29764148592948914, 0.40377283096313477, 0.5099042057991028, 0.616035521030426, 0.722166895866394, 0.8282982707023621, 0.9344295859336853, 1.0405609607696533, 1.1466922760009766, 1.2528235912322998, 1.3589550256729126, 1.4650863409042358, 1.5712177753448486, 1.6773490905761719, 1.7834805250167847, 1.889611840248108, 1.9957431554794312, 2.101874589920044, 2.208005905151367, 2.3141372203826904, 2.4202685356140137]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 3.0, 8.0, 4.0, 5.0, 9.0, 8.0, 8.0, 10.0, 18.0, 21.0, 14.0, 27.0, 24.0, 27.0, 21.0, 28.0, 40.0, 26.0, 52.0, 72.0, 100.0, 91.0, 54.0, 48.0, 28.0, 29.0, 33.0, 31.0, 20.0, 22.0, 17.0, 17.0, 14.0, 17.0, 7.0, 5.0, 8.0, 5.0, 7.0, 3.0, 6.0, 3.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.649893045425415, -1.5982118844985962, -1.546530842781067, -1.494849681854248, -1.4431686401367188, -1.3914874792099, -1.339806318283081, -1.2881252765655518, -1.2364442348480225, -1.1847630739212036, -1.1330820322036743, -1.0814008712768555, -1.0297198295593262, -0.9780386686325073, -0.9263575673103333, -0.8746764659881592, -0.8229953050613403, -0.7713142037391663, -0.7196331024169922, -0.6679519414901733, -0.616270899772644, -0.5645897388458252, -0.5129086375236511, -0.46122753620147705, -0.409546434879303, -0.3578653335571289, -0.30618423223495483, -0.2545031011104584, -0.2028219997882843, -0.15114089846611023, -0.09945976734161377, -0.0477786660194397, 0.003902435302734375, 0.055583544075489044, 0.10726465284824371, 0.15894576907157898, 0.21062687039375305, 0.2623079717159271, 0.3139891028404236, 0.36567020416259766, 0.41735130548477173, 0.4690324068069458, 0.5207135081291199, 0.572394609451294, 0.6240757703781128, 0.6757568120956421, 0.7274379730224609, 0.779119074344635, 0.8308001756668091, 0.8824812769889832, 0.9341623783111572, 0.9858435392379761, 1.0375245809555054, 1.0892057418823242, 1.1408867835998535, 1.1925679445266724, 1.2442491054534912, 1.29593026638031, 1.3476113080978394, 1.3992924690246582, 1.4509735107421875, 1.5026546716690063, 1.5543358325958252, 1.6060168743133545, 1.6576979160308838]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 7.0, 20.0, 37.0, 38.0, 60.0, 73.0, 127.0, 135.0, 166.0, 274.0, 402.0, 835.0, 2136.0, 83465.0, 4098336.0, 5316.0, 1114.0, 610.0, 333.0, 240.0, 139.0, 109.0, 87.0, 63.0, 41.0, 19.0, 16.0, 11.0, 13.0, 11.0, 5.0, 4.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.1396484375, -1.1072921752929688, -1.0749359130859375, -1.0425796508789062, -1.010223388671875, -0.9778671264648438, -0.9455108642578125, -0.9131546020507812, -0.88079833984375, -0.8484420776367188, -0.8160858154296875, -0.7837295532226562, -0.751373291015625, -0.7190170288085938, -0.6866607666015625, -0.6543045043945312, -0.6219482421875, -0.5895919799804688, -0.5572357177734375, -0.5248794555664062, -0.492523193359375, -0.46016693115234375, -0.4278106689453125, -0.39545440673828125, -0.36309814453125, -0.33074188232421875, -0.2983856201171875, -0.26602935791015625, -0.233673095703125, -0.20131683349609375, -0.1689605712890625, -0.13660430908203125, -0.104248046875, -0.07189178466796875, -0.0395355224609375, -0.00717926025390625, 0.025177001953125, 0.05753326416015625, 0.0898895263671875, 0.12224578857421875, 0.15460205078125, 0.18695831298828125, 0.2193145751953125, 0.25167083740234375, 0.284027099609375, 0.31638336181640625, 0.3487396240234375, 0.38109588623046875, 0.4134521484375, 0.44580841064453125, 0.4781646728515625, 0.5105209350585938, 0.542877197265625, 0.5752334594726562, 0.6075897216796875, 0.6399459838867188, 0.67230224609375, 0.7046585083007812, 0.7370147705078125, 0.7693710327148438, 0.801727294921875, 0.8340835571289062, 0.8664398193359375, 0.8987960815429688, 0.93115234375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 12.0, 14.0, 17.0, 25.0, 27.0, 28.0, 36.0, 40.0, 61.0, 62.0, 60.0, 80.0, 75.0, 52.0, 60.0, 67.0, 62.0, 63.0, 38.0, 21.0, 27.0, 16.0, 19.0, 9.0, 6.0, 1.0, 4.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1419677734375, -0.13772010803222656, -0.13347244262695312, -0.1292247772216797, -0.12497711181640625, -0.12072944641113281, -0.11648178100585938, -0.11223411560058594, -0.1079864501953125, -0.10373878479003906, -0.09949111938476562, -0.09524345397949219, -0.09099578857421875, -0.08674812316894531, -0.08250045776367188, -0.07825279235839844, -0.074005126953125, -0.06975746154785156, -0.06550979614257812, -0.06126213073730469, -0.05701446533203125, -0.05276679992675781, -0.048519134521484375, -0.04427146911621094, -0.0400238037109375, -0.03577613830566406, -0.031528472900390625, -0.027280807495117188, -0.02303314208984375, -0.018785476684570312, -0.014537811279296875, -0.010290145874023438, -0.00604248046875, -0.0017948150634765625, 0.002452850341796875, 0.0067005157470703125, 0.01094818115234375, 0.015195846557617188, 0.019443511962890625, 0.023691177368164062, 0.0279388427734375, 0.03218650817871094, 0.036434173583984375, 0.04068183898925781, 0.04492950439453125, 0.04917716979980469, 0.053424835205078125, 0.05767250061035156, 0.061920166015625, 0.06616783142089844, 0.07041549682617188, 0.07466316223144531, 0.07891082763671875, 0.08315849304199219, 0.08740615844726562, 0.09165382385253906, 0.0959014892578125, 0.10014915466308594, 0.10439682006835938, 0.10864448547363281, 0.11289215087890625, 0.11713981628417969, 0.12138748168945312, 0.12563514709472656, 0.1298828125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 5.0, 6.0, 13.0, 21.0, 20.0, 31.0, 51.0, 71.0, 115.0, 210.0, 353.0, 531.0, 834.0, 1510.0, 3570.0, 17856.0, 2516488.0, 1627909.0, 16830.0, 3671.0, 1600.0, 890.0, 572.0, 421.0, 226.0, 162.0, 119.0, 82.0, 34.0, 27.0, 15.0, 13.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.68994140625, -0.66693115234375, -0.6439208984375, -0.62091064453125, -0.597900390625, -0.57489013671875, -0.5518798828125, -0.52886962890625, -0.505859375, -0.48284912109375, -0.4598388671875, -0.43682861328125, -0.413818359375, -0.39080810546875, -0.3677978515625, -0.34478759765625, -0.32177734375, -0.29876708984375, -0.2757568359375, -0.25274658203125, -0.229736328125, -0.20672607421875, -0.1837158203125, -0.16070556640625, -0.1376953125, -0.11468505859375, -0.0916748046875, -0.06866455078125, -0.045654296875, -0.02264404296875, 0.0003662109375, 0.02337646484375, 0.04638671875, 0.06939697265625, 0.0924072265625, 0.11541748046875, 0.138427734375, 0.16143798828125, 0.1844482421875, 0.20745849609375, 0.23046875, 0.25347900390625, 0.2764892578125, 0.29949951171875, 0.322509765625, 0.34552001953125, 0.3685302734375, 0.39154052734375, 0.41455078125, 0.43756103515625, 0.4605712890625, 0.48358154296875, 0.506591796875, 0.52960205078125, 0.5526123046875, 0.57562255859375, 0.5986328125, 0.62164306640625, 0.6446533203125, 0.66766357421875, 0.690673828125, 0.71368408203125, 0.7366943359375, 0.75970458984375, 0.78271484375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 10.0, 16.0, 26.0, 78.0, 146.0, 435.0, 1960.0, 1050.0, 182.0, 65.0, 34.0, 18.0, 8.0, 11.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.360595703125, -0.3390769958496094, -0.31755828857421875, -0.2960395812988281, -0.2745208740234375, -0.2530021667480469, -0.23148345947265625, -0.20996475219726562, -0.188446044921875, -0.16692733764648438, -0.14540863037109375, -0.12388992309570312, -0.1023712158203125, -0.08085250854492188, -0.05933380126953125, -0.037815093994140625, -0.01629638671875, 0.005222320556640625, 0.02674102783203125, 0.048259735107421875, 0.0697784423828125, 0.09129714965820312, 0.11281585693359375, 0.13433456420898438, 0.155853271484375, 0.17737197875976562, 0.19889068603515625, 0.22040939331054688, 0.2419281005859375, 0.2634468078613281, 0.28496551513671875, 0.3064842224121094, 0.3280029296875, 0.3495216369628906, 0.37104034423828125, 0.3925590515136719, 0.4140777587890625, 0.4355964660644531, 0.45711517333984375, 0.4786338806152344, 0.500152587890625, 0.5216712951660156, 0.5431900024414062, 0.5647087097167969, 0.5862274169921875, 0.6077461242675781, 0.6292648315429688, 0.6507835388183594, 0.67230224609375, 0.6938209533691406, 0.7153396606445312, 0.7368583679199219, 0.7583770751953125, 0.7798957824707031, 0.8014144897460938, 0.8229331970214844, 0.844451904296875, 0.8659706115722656, 0.8874893188476562, 0.9090080261230469, 0.9305267333984375, 0.9520454406738281, 0.9735641479492188, 0.9950828552246094, 1.0166015625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 8.0, 18.0, 33.0, 60.0, 105.0, 216.0, 177.0, 109.0, 75.0, 62.0, 35.0, 27.0, 17.0, 12.0, 10.0, 7.0, 4.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.118007659912109, -4.976589202880859, -4.835170269012451, -4.693751335144043, -4.552332878112793, -4.410914421081543, -4.269495487213135, -4.128076553344727, -3.9866580963134766, -3.8452394008636475, -3.7038207054138184, -3.5624020099639893, -3.42098331451416, -3.279564619064331, -3.138145923614502, -2.996727228164673, -2.8553085327148438, -2.7138898372650146, -2.5724711418151855, -2.4310524463653564, -2.2896337509155273, -2.1482150554656982, -2.006796360015869, -1.86537766456604, -1.723958969116211, -1.5825402736663818, -1.4411215782165527, -1.2997028827667236, -1.1582841873168945, -1.0168654918670654, -0.8754467964172363, -0.7340281009674072, -0.5926089286804199, -0.4511902332305908, -0.3097715377807617, -0.16835284233093262, -0.026934146881103516, 0.11448454856872559, 0.2559032440185547, 0.3973219394683838, 0.5387406349182129, 0.680159330368042, 0.8215780258178711, 0.9629967212677002, 1.1044154167175293, 1.2458341121673584, 1.3872528076171875, 1.5286715030670166, 1.6700901985168457, 1.8115088939666748, 1.952927589416504, 2.094346284866333, 2.235764980316162, 2.377183675765991, 2.5186023712158203, 2.6600210666656494, 2.8014397621154785, 2.9428584575653076, 3.0842771530151367, 3.225695848464966, 3.367114543914795, 3.508533239364624, 3.649951934814453, 3.7913706302642822, 3.9327893257141113]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 10.0, 9.0, 12.0, 22.0, 28.0, 22.0, 23.0, 34.0, 34.0, 32.0, 41.0, 48.0, 39.0, 66.0, 54.0, 59.0, 69.0, 61.0, 56.0, 36.0, 31.0, 35.0, 24.0, 28.0, 27.0, 24.0, 16.0, 14.0, 11.0, 11.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.838979959487915, -3.723130702972412, -3.6072816848754883, -3.4914324283599854, -3.3755831718444824, -3.2597341537475586, -3.1438848972320557, -3.0280356407165527, -2.912186622619629, -2.796337366104126, -2.680488348007202, -2.564639091491699, -2.4487900733947754, -2.3329408168792725, -2.2170915603637695, -2.1012425422668457, -1.9853932857513428, -1.8695441484451294, -1.753695011138916, -1.637845754623413, -1.5219966173171997, -1.4061474800109863, -1.2902982234954834, -1.17444908618927, -1.0585999488830566, -0.9427508115768433, -0.8269016146659851, -0.711052417755127, -0.5952032804489136, -0.4793541431427002, -0.36350494623184204, -0.2476557493209839, -0.1318066120147705, -0.01595744490623474, 0.09989172220230103, 0.2157408893108368, 0.33159005641937256, 0.44743919372558594, 0.5632883906364441, 0.6791375875473022, 0.7949867248535156, 0.910835862159729, 1.0266849994659424, 1.1425342559814453, 1.2583833932876587, 1.374232530593872, 1.490081787109375, 1.6059309244155884, 1.7217800617218018, 1.8376291990280151, 1.9534783363342285, 2.0693275928497314, 2.1851768493652344, 2.301025867462158, 2.416875123977661, 2.532724380493164, 2.648573398590088, 2.764422655105591, 2.8802716732025146, 2.9961209297180176, 3.1119699478149414, 3.2278192043304443, 3.3436684608459473, 3.459517478942871, 3.575366735458374]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 4.0, 7.0, 16.0, 33.0, 31.0, 57.0, 89.0, 133.0, 286.0, 445.0, 987.0, 2037.0, 5090.0, 14606.0, 59066.0, 581824.0, 323209.0, 41576.0, 11439.0, 4036.0, 1763.0, 821.0, 414.0, 233.0, 130.0, 78.0, 50.0, 36.0, 20.0, 8.0, 4.0, 9.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0927734375, -1.0614547729492188, -1.0301361083984375, -0.9988174438476562, -0.967498779296875, -0.9361801147460938, -0.9048614501953125, -0.8735427856445312, -0.84222412109375, -0.8109054565429688, -0.7795867919921875, -0.7482681274414062, -0.716949462890625, -0.6856307983398438, -0.6543121337890625, -0.6229934692382812, -0.5916748046875, -0.5603561401367188, -0.5290374755859375, -0.49771881103515625, -0.466400146484375, -0.43508148193359375, -0.4037628173828125, -0.37244415283203125, -0.34112548828125, -0.30980682373046875, -0.2784881591796875, -0.24716949462890625, -0.215850830078125, -0.18453216552734375, -0.1532135009765625, -0.12189483642578125, -0.090576171875, -0.05925750732421875, -0.0279388427734375, 0.00337982177734375, 0.034698486328125, 0.06601715087890625, 0.0973358154296875, 0.12865447998046875, 0.15997314453125, 0.19129180908203125, 0.2226104736328125, 0.25392913818359375, 0.285247802734375, 0.31656646728515625, 0.3478851318359375, 0.37920379638671875, 0.4105224609375, 0.44184112548828125, 0.4731597900390625, 0.5044784545898438, 0.535797119140625, 0.5671157836914062, 0.5984344482421875, 0.6297531127929688, 0.66107177734375, 0.6923904418945312, 0.7237091064453125, 0.7550277709960938, 0.786346435546875, 0.8176651000976562, 0.8489837646484375, 0.8803024291992188, 0.91162109375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 9.0, 9.0, 23.0, 16.0, 37.0, 27.0, 39.0, 50.0, 64.0, 70.0, 76.0, 68.0, 86.0, 75.0, 82.0, 57.0, 47.0, 32.0, 35.0, 35.0, 15.0, 15.0, 11.0, 7.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32080078125, -0.31163787841796875, -0.3024749755859375, -0.29331207275390625, -0.284149169921875, -0.27498626708984375, -0.2658233642578125, -0.25666046142578125, -0.24749755859375, -0.23833465576171875, -0.2291717529296875, -0.22000885009765625, -0.210845947265625, -0.20168304443359375, -0.1925201416015625, -0.18335723876953125, -0.1741943359375, -0.16503143310546875, -0.1558685302734375, -0.14670562744140625, -0.137542724609375, -0.12837982177734375, -0.1192169189453125, -0.11005401611328125, -0.10089111328125, -0.09172821044921875, -0.0825653076171875, -0.07340240478515625, -0.064239501953125, -0.05507659912109375, -0.0459136962890625, -0.03675079345703125, -0.027587890625, -0.01842498779296875, -0.0092620849609375, -9.918212890625e-05, 0.009063720703125, 0.01822662353515625, 0.0273895263671875, 0.03655242919921875, 0.04571533203125, 0.05487823486328125, 0.0640411376953125, 0.07320404052734375, 0.082366943359375, 0.09152984619140625, 0.1006927490234375, 0.10985565185546875, 0.1190185546875, 0.12818145751953125, 0.1373443603515625, 0.14650726318359375, 0.155670166015625, 0.16483306884765625, 0.1739959716796875, 0.18315887451171875, 0.19232177734375, 0.20148468017578125, 0.2106475830078125, 0.21981048583984375, 0.228973388671875, 0.23813629150390625, 0.2472991943359375, 0.25646209716796875, 0.265625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 2.0, 7.0, 6.0, 15.0, 20.0, 43.0, 76.0, 88.0, 180.0, 295.0, 629.0, 1359.0, 3580.0, 12045.0, 60285.0, 799186.0, 140787.0, 20824.0, 5513.0, 1914.0, 771.0, 379.0, 221.0, 116.0, 75.0, 48.0, 28.0, 18.0, 15.0, 10.0, 11.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82275390625, -0.7967910766601562, -0.7708282470703125, -0.7448654174804688, -0.718902587890625, -0.6929397583007812, -0.6669769287109375, -0.6410140991210938, -0.61505126953125, -0.5890884399414062, -0.5631256103515625, -0.5371627807617188, -0.511199951171875, -0.48523712158203125, -0.4592742919921875, -0.43331146240234375, -0.4073486328125, -0.38138580322265625, -0.3554229736328125, -0.32946014404296875, -0.303497314453125, -0.27753448486328125, -0.2515716552734375, -0.22560882568359375, -0.19964599609375, -0.17368316650390625, -0.1477203369140625, -0.12175750732421875, -0.095794677734375, -0.06983184814453125, -0.0438690185546875, -0.01790618896484375, 0.008056640625, 0.03401947021484375, 0.0599822998046875, 0.08594512939453125, 0.111907958984375, 0.13787078857421875, 0.1638336181640625, 0.18979644775390625, 0.21575927734375, 0.24172210693359375, 0.2676849365234375, 0.29364776611328125, 0.319610595703125, 0.34557342529296875, 0.3715362548828125, 0.39749908447265625, 0.4234619140625, 0.44942474365234375, 0.4753875732421875, 0.5013504028320312, 0.527313232421875, 0.5532760620117188, 0.5792388916015625, 0.6052017211914062, 0.63116455078125, 0.6571273803710938, 0.6830902099609375, 0.7090530395507812, 0.735015869140625, 0.7609786987304688, 0.7869415283203125, 0.8129043579101562, 0.8388671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 6.0, 5.0, 6.0, 14.0, 11.0, 15.0, 20.0, 21.0, 31.0, 25.0, 38.0, 48.0, 48.0, 52.0, 50.0, 62.0, 57.0, 69.0, 63.0, 58.0, 59.0, 33.0, 48.0, 23.0, 27.0, 26.0, 15.0, 16.0, 11.0, 7.0, 10.0, 5.0, 4.0, 7.0, 3.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87646484375, -0.8495941162109375, -0.822723388671875, -0.7958526611328125, -0.76898193359375, -0.7421112060546875, -0.715240478515625, -0.6883697509765625, -0.6614990234375, -0.6346282958984375, -0.607757568359375, -0.5808868408203125, -0.55401611328125, -0.5271453857421875, -0.500274658203125, -0.4734039306640625, -0.446533203125, -0.4196624755859375, -0.392791748046875, -0.3659210205078125, -0.33905029296875, -0.3121795654296875, -0.285308837890625, -0.2584381103515625, -0.2315673828125, -0.2046966552734375, -0.177825927734375, -0.1509552001953125, -0.12408447265625, -0.0972137451171875, -0.070343017578125, -0.0434722900390625, -0.0166015625, 0.0102691650390625, 0.037139892578125, 0.0640106201171875, 0.09088134765625, 0.1177520751953125, 0.144622802734375, 0.1714935302734375, 0.1983642578125, 0.2252349853515625, 0.252105712890625, 0.2789764404296875, 0.30584716796875, 0.3327178955078125, 0.359588623046875, 0.3864593505859375, 0.413330078125, 0.4402008056640625, 0.467071533203125, 0.4939422607421875, 0.52081298828125, 0.5476837158203125, 0.574554443359375, 0.6014251708984375, 0.6282958984375, 0.6551666259765625, 0.682037353515625, 0.7089080810546875, 0.73577880859375, 0.7626495361328125, 0.789520263671875, 0.8163909912109375, 0.84326171875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 18.0, 14.0, 26.0, 45.0, 78.0, 118.0, 297.0, 683.0, 2232.0, 13638.0, 931025.0, 92463.0, 5679.0, 1303.0, 479.0, 210.0, 83.0, 50.0, 23.0, 26.0, 21.0, 9.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.346923828125, -0.3339729309082031, -0.32102203369140625, -0.3080711364746094, -0.2951202392578125, -0.2821693420410156, -0.26921844482421875, -0.2562675476074219, -0.243316650390625, -0.23036575317382812, -0.21741485595703125, -0.20446395874023438, -0.1915130615234375, -0.17856216430664062, -0.16561126708984375, -0.15266036987304688, -0.13970947265625, -0.12675857543945312, -0.11380767822265625, -0.10085678100585938, -0.0879058837890625, -0.07495498657226562, -0.06200408935546875, -0.049053192138671875, -0.036102294921875, -0.023151397705078125, -0.01020050048828125, 0.002750396728515625, 0.0157012939453125, 0.028652191162109375, 0.04160308837890625, 0.054553985595703125, 0.0675048828125, 0.08045578002929688, 0.09340667724609375, 0.10635757446289062, 0.1193084716796875, 0.13225936889648438, 0.14521026611328125, 0.15816116333007812, 0.171112060546875, 0.18406295776367188, 0.19701385498046875, 0.20996475219726562, 0.2229156494140625, 0.23586654663085938, 0.24881744384765625, 0.2617683410644531, 0.27471923828125, 0.2876701354980469, 0.30062103271484375, 0.3135719299316406, 0.3265228271484375, 0.3394737243652344, 0.35242462158203125, 0.3653755187988281, 0.378326416015625, 0.3912773132324219, 0.40422821044921875, 0.4171791076660156, 0.4301300048828125, 0.4430809020996094, 0.45603179931640625, 0.4689826965332031, 0.48193359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 9.0, 15.0, 18.0, 26.0, 28.0, 65.0, 98.0, 116.0, 169.0, 168.0, 94.0, 49.0, 46.0, 31.0, 18.0, 15.0, 8.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6106834411621094e-05, -2.4956651031970978e-05, -2.3806467652320862e-05, -2.2656284272670746e-05, -2.150610089302063e-05, -2.0355917513370514e-05, -1.9205734133720398e-05, -1.8055550754070282e-05, -1.6905367374420166e-05, -1.575518399477005e-05, -1.4605000615119934e-05, -1.3454817235469818e-05, -1.2304633855819702e-05, -1.1154450476169586e-05, -1.000426709651947e-05, -8.854083716869354e-06, -7.703900337219238e-06, -6.553716957569122e-06, -5.403533577919006e-06, -4.25335019826889e-06, -3.1031668186187744e-06, -1.9529834389686584e-06, -8.028000593185425e-07, 3.473833203315735e-07, 1.4975666999816895e-06, 2.6477500796318054e-06, 3.7979334592819214e-06, 4.948116838932037e-06, 6.098300218582153e-06, 7.248483598232269e-06, 8.398666977882385e-06, 9.548850357532501e-06, 1.0699033737182617e-05, 1.1849217116832733e-05, 1.2999400496482849e-05, 1.4149583876132965e-05, 1.529976725578308e-05, 1.6449950635433197e-05, 1.7600134015083313e-05, 1.875031739473343e-05, 1.9900500774383545e-05, 2.105068415403366e-05, 2.2200867533683777e-05, 2.3351050913333893e-05, 2.450123429298401e-05, 2.5651417672634125e-05, 2.680160105228424e-05, 2.7951784431934357e-05, 2.9101967811584473e-05, 3.025215119123459e-05, 3.1402334570884705e-05, 3.255251795053482e-05, 3.3702701330184937e-05, 3.485288470983505e-05, 3.600306808948517e-05, 3.7153251469135284e-05, 3.83034348487854e-05, 3.9453618228435516e-05, 4.060380160808563e-05, 4.175398498773575e-05, 4.2904168367385864e-05, 4.405435174703598e-05, 4.5204535126686096e-05, 4.635471850633621e-05, 4.750490188598633e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 13.0, 19.0, 33.0, 45.0, 63.0, 116.0, 251.0, 572.0, 1747.0, 10916.0, 969684.0, 59730.0, 3631.0, 919.0, 373.0, 166.0, 100.0, 54.0, 39.0, 19.0, 12.0, 15.0, 11.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59912109375, -0.5828170776367188, -0.5665130615234375, -0.5502090454101562, -0.533905029296875, -0.5176010131835938, -0.5012969970703125, -0.48499298095703125, -0.46868896484375, -0.45238494873046875, -0.4360809326171875, -0.41977691650390625, -0.403472900390625, -0.38716888427734375, -0.3708648681640625, -0.35456085205078125, -0.3382568359375, -0.32195281982421875, -0.3056488037109375, -0.28934478759765625, -0.273040771484375, -0.25673675537109375, -0.2404327392578125, -0.22412872314453125, -0.20782470703125, -0.19152069091796875, -0.1752166748046875, -0.15891265869140625, -0.142608642578125, -0.12630462646484375, -0.1100006103515625, -0.09369659423828125, -0.077392578125, -0.06108856201171875, -0.0447845458984375, -0.02848052978515625, -0.012176513671875, 0.00412750244140625, 0.0204315185546875, 0.03673553466796875, 0.05303955078125, 0.06934356689453125, 0.0856475830078125, 0.10195159912109375, 0.118255615234375, 0.13455963134765625, 0.1508636474609375, 0.16716766357421875, 0.1834716796875, 0.19977569580078125, 0.2160797119140625, 0.23238372802734375, 0.248687744140625, 0.26499176025390625, 0.2812957763671875, 0.29759979248046875, 0.31390380859375, 0.33020782470703125, 0.3465118408203125, 0.36281585693359375, 0.379119873046875, 0.39542388916015625, 0.4117279052734375, 0.42803192138671875, 0.4443359375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 21.0, 25.0, 49.0, 127.0, 357.0, 229.0, 87.0, 49.0, 20.0, 13.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85302734375, -0.829833984375, -0.806640625, -0.783447265625, -0.76025390625, -0.737060546875, -0.7138671875, -0.690673828125, -0.66748046875, -0.644287109375, -0.62109375, -0.597900390625, -0.57470703125, -0.551513671875, -0.5283203125, -0.505126953125, -0.48193359375, -0.458740234375, -0.435546875, -0.412353515625, -0.38916015625, -0.365966796875, -0.3427734375, -0.319580078125, -0.29638671875, -0.273193359375, -0.25, -0.226806640625, -0.20361328125, -0.180419921875, -0.1572265625, -0.134033203125, -0.11083984375, -0.087646484375, -0.064453125, -0.041259765625, -0.01806640625, 0.005126953125, 0.0283203125, 0.051513671875, 0.07470703125, 0.097900390625, 0.12109375, 0.144287109375, 0.16748046875, 0.190673828125, 0.2138671875, 0.237060546875, 0.26025390625, 0.283447265625, 0.306640625, 0.329833984375, 0.35302734375, 0.376220703125, 0.3994140625, 0.422607421875, 0.44580078125, 0.468994140625, 0.4921875, 0.515380859375, 0.53857421875, 0.561767578125, 0.5849609375, 0.608154296875, 0.63134765625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 14.0, 109.0, 575.0, 182.0, 55.0, 35.0, 19.0, 11.0, 8.0, 2.0, 0.0, 1.0], "bins": [-26.248733520507812, -25.76715850830078, -25.28558349609375, -24.80400848388672, -24.322433471679688, -23.840858459472656, -23.359283447265625, -22.877708435058594, -22.396133422851562, -21.91455841064453, -21.4329833984375, -20.95140838623047, -20.469833374023438, -19.988258361816406, -19.506683349609375, -19.025108337402344, -18.543533325195312, -18.06195831298828, -17.58038330078125, -17.09880828857422, -16.617233276367188, -16.135658264160156, -15.654083251953125, -15.172508239746094, -14.690932273864746, -14.209357261657715, -13.727782249450684, -13.246207237243652, -12.764632225036621, -12.28305721282959, -11.801482200622559, -11.319907188415527, -10.838332176208496, -10.356757164001465, -9.875182151794434, -9.393607139587402, -8.912032127380371, -8.43045711517334, -7.948882102966309, -7.467307090759277, -6.985732078552246, -6.504157066345215, -6.022582054138184, -5.541007041931152, -5.059432029724121, -4.57785701751709, -4.096282005310059, -3.6147067546844482, -3.133131504058838, -2.6515564918518066, -2.1699814796447754, -1.6884063482284546, -1.2068313360214233, -0.7252562046051025, -0.2436811923980713, 0.23789381980895996, 0.7194688320159912, 1.2010438442230225, 1.6826188564300537, 2.164194107055664, 2.6457691192626953, 3.1273441314697266, 3.608919143676758, 4.090494155883789, 4.57206916809082]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 6.0, 5.0, 11.0, 12.0, 10.0, 18.0, 13.0, 20.0, 30.0, 27.0, 40.0, 62.0, 86.0, 83.0, 58.0, 61.0, 71.0, 86.0, 65.0, 49.0, 28.0, 39.0, 20.0, 23.0, 14.0, 14.0, 16.0, 6.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.384174346923828, -5.2064900398254395, -5.028805255889893, -4.851120948791504, -4.673436164855957, -4.495751857757568, -4.31806755065918, -4.140382766723633, -3.962698459625244, -3.7850139141082764, -3.6073293685913086, -3.42964506149292, -3.251960515975952, -3.0742759704589844, -2.8965914249420166, -2.718906879425049, -2.541222333908081, -2.3635377883911133, -2.1858532428741455, -2.0081686973571777, -1.830484390258789, -1.6527998447418213, -1.4751152992248535, -1.2974308729171753, -1.1197463274002075, -0.9420618414878845, -0.7643773555755615, -0.5866928100585938, -0.40900832414627075, -0.23132383823394775, -0.05363929271697998, 0.12404513359069824, 0.301729679107666, 0.479414165019989, 0.657098650932312, 0.8347831964492798, 1.012467622756958, 1.1901521682739258, 1.3678367137908936, 1.5455211400985718, 1.7232056856155396, 1.9008902311325073, 2.0785746574401855, 2.2562592029571533, 2.433943748474121, 2.6116280555725098, 2.7893128395080566, 2.9669971466064453, 3.144681692123413, 3.322366237640381, 3.5000507831573486, 3.6777353286743164, 3.855419635772705, 4.033103942871094, 4.210788726806641, 4.388473033905029, 4.566157817840576, 4.743842124938965, 4.921526908874512, 5.0992112159729, 5.276895999908447, 5.454580307006836, 5.632265090942383, 5.8099493980407715, 5.98763370513916]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 12.0, 18.0, 34.0, 37.0, 52.0, 64.0, 134.0, 177.0, 277.0, 415.0, 713.0, 1567.0, 4286.0, 33174.0, 559718.0, 3188132.0, 377547.0, 20463.0, 4097.0, 1469.0, 725.0, 387.0, 261.0, 153.0, 103.0, 87.0, 57.0, 36.0, 25.0, 9.0, 15.0, 8.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.44970703125, -0.4370155334472656, -0.42432403564453125, -0.4116325378417969, -0.3989410400390625, -0.3862495422363281, -0.37355804443359375, -0.3608665466308594, -0.348175048828125, -0.3354835510253906, -0.32279205322265625, -0.3101005554199219, -0.2974090576171875, -0.2847175598144531, -0.27202606201171875, -0.2593345642089844, -0.24664306640625, -0.23395156860351562, -0.22126007080078125, -0.20856857299804688, -0.1958770751953125, -0.18318557739257812, -0.17049407958984375, -0.15780258178710938, -0.145111083984375, -0.13241958618164062, -0.11972808837890625, -0.10703659057617188, -0.0943450927734375, -0.08165359497070312, -0.06896209716796875, -0.056270599365234375, -0.0435791015625, -0.030887603759765625, -0.01819610595703125, -0.005504608154296875, 0.0071868896484375, 0.019878387451171875, 0.03256988525390625, 0.045261383056640625, 0.057952880859375, 0.07064437866210938, 0.08333587646484375, 0.09602737426757812, 0.1087188720703125, 0.12141036987304688, 0.13410186767578125, 0.14679336547851562, 0.15948486328125, 0.17217636108398438, 0.18486785888671875, 0.19755935668945312, 0.2102508544921875, 0.22294235229492188, 0.23563385009765625, 0.24832534790039062, 0.261016845703125, 0.2737083435058594, 0.28639984130859375, 0.2990913391113281, 0.3117828369140625, 0.3244743347167969, 0.33716583251953125, 0.3498573303222656, 0.362548828125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 3.0, 8.0, 11.0, 12.0, 15.0, 22.0, 22.0, 24.0, 30.0, 33.0, 37.0, 43.0, 43.0, 51.0, 53.0, 55.0, 44.0, 52.0, 59.0, 51.0, 50.0, 41.0, 39.0, 29.0, 26.0, 17.0, 26.0, 20.0, 11.0, 21.0, 9.0, 8.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2568359375, -0.2496204376220703, -0.24240493774414062, -0.23518943786621094, -0.22797393798828125, -0.22075843811035156, -0.21354293823242188, -0.2063274383544922, -0.1991119384765625, -0.1918964385986328, -0.18468093872070312, -0.17746543884277344, -0.17024993896484375, -0.16303443908691406, -0.15581893920898438, -0.1486034393310547, -0.141387939453125, -0.1341724395751953, -0.12695693969726562, -0.11974143981933594, -0.11252593994140625, -0.10531044006347656, -0.09809494018554688, -0.09087944030761719, -0.0836639404296875, -0.07644844055175781, -0.06923294067382812, -0.06201744079589844, -0.05480194091796875, -0.04758644104003906, -0.040370941162109375, -0.03315544128417969, -0.02593994140625, -0.018724441528320312, -0.011508941650390625, -0.0042934417724609375, 0.00292205810546875, 0.010137557983398438, 0.017353057861328125, 0.024568557739257812, 0.0317840576171875, 0.03899955749511719, 0.046215057373046875, 0.05343055725097656, 0.06064605712890625, 0.06786155700683594, 0.07507705688476562, 0.08229255676269531, 0.089508056640625, 0.09672355651855469, 0.10393905639648438, 0.11115455627441406, 0.11837005615234375, 0.12558555603027344, 0.13280105590820312, 0.1400165557861328, 0.1472320556640625, 0.1544475555419922, 0.16166305541992188, 0.16887855529785156, 0.17609405517578125, 0.18330955505371094, 0.19052505493164062, 0.1977405548095703, 0.2049560546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 14.0, 30.0, 108.0, 447.0, 7417.0, 4183765.0, 1929.0, 385.0, 107.0, 36.0, 23.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.79339599609375, -5.6531982421875, -5.51300048828125, -5.372802734375, -5.23260498046875, -5.0924072265625, -4.95220947265625, -4.81201171875, -4.67181396484375, -4.5316162109375, -4.39141845703125, -4.251220703125, -4.11102294921875, -3.9708251953125, -3.83062744140625, -3.6904296875, -3.55023193359375, -3.4100341796875, -3.26983642578125, -3.129638671875, -2.98944091796875, -2.8492431640625, -2.70904541015625, -2.56884765625, -2.42864990234375, -2.2884521484375, -2.14825439453125, -2.008056640625, -1.86785888671875, -1.7276611328125, -1.58746337890625, -1.447265625, -1.30706787109375, -1.1668701171875, -1.02667236328125, -0.886474609375, -0.74627685546875, -0.6060791015625, -0.46588134765625, -0.32568359375, -0.18548583984375, -0.0452880859375, 0.09490966796875, 0.235107421875, 0.37530517578125, 0.5155029296875, 0.65570068359375, 0.7958984375, 0.93609619140625, 1.0762939453125, 1.21649169921875, 1.356689453125, 1.49688720703125, 1.6370849609375, 1.77728271484375, 1.91748046875, 2.05767822265625, 2.1978759765625, 2.33807373046875, 2.478271484375, 2.61846923828125, 2.7586669921875, 2.89886474609375, 3.0390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 5.0, 12.0, 24.0, 75.0, 189.0, 621.0, 2252.0, 698.0, 117.0, 50.0, 12.0, 12.0, 9.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74853515625, -0.6891403198242188, -0.6297454833984375, -0.5703506469726562, -0.510955810546875, -0.45156097412109375, -0.3921661376953125, -0.33277130126953125, -0.27337646484375, -0.21398162841796875, -0.1545867919921875, -0.09519195556640625, -0.035797119140625, 0.02359771728515625, 0.0829925537109375, 0.14238739013671875, 0.2017822265625, 0.26117706298828125, 0.3205718994140625, 0.37996673583984375, 0.439361572265625, 0.49875640869140625, 0.5581512451171875, 0.6175460815429688, 0.67694091796875, 0.7363357543945312, 0.7957305908203125, 0.8551254272460938, 0.914520263671875, 0.9739151000976562, 1.0333099365234375, 1.0927047729492188, 1.152099609375, 1.2114944458007812, 1.2708892822265625, 1.3302841186523438, 1.389678955078125, 1.4490737915039062, 1.5084686279296875, 1.5678634643554688, 1.62725830078125, 1.6866531372070312, 1.7460479736328125, 1.8054428100585938, 1.864837646484375, 1.9242324829101562, 1.9836273193359375, 2.0430221557617188, 2.1024169921875, 2.1618118286132812, 2.2212066650390625, 2.2806015014648438, 2.339996337890625, 2.3993911743164062, 2.4587860107421875, 2.5181808471679688, 2.57757568359375, 2.6369705200195312, 2.6963653564453125, 2.7557601928710938, 2.815155029296875, 2.8745498657226562, 2.9339447021484375, 2.9933395385742188, 3.052734375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 11.0, 19.0, 30.0, 137.0, 457.0, 246.0, 55.0, 16.0, 10.0, 13.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25665283203125, -7.771399021148682, -7.286145210266113, -6.800890922546387, -6.315637588500977, -5.83038330078125, -5.345129489898682, -4.859875679016113, -4.374621868133545, -3.8893680572509766, -3.404114246368408, -2.9188601970672607, -2.4336063861846924, -1.948352575302124, -1.4630985260009766, -0.9778447151184082, -0.49259090423583984, -0.007337033748626709, 0.4779168367385864, 0.9631707668304443, 1.4484245777130127, 1.933678388595581, 2.4189324378967285, 2.904186248779297, 3.3894400596618652, 3.8746938705444336, 4.359947681427002, 4.84520149230957, 5.330455780029297, 5.815709114074707, 6.300963401794434, 6.786217212677002, 7.27147102355957, 7.756724834442139, 8.241978645324707, 8.727232933044434, 9.212486267089844, 9.69774055480957, 10.182994842529297, 10.668248176574707, 11.153501510620117, 11.638755798339844, 12.124009132385254, 12.60926342010498, 13.09451675415039, 13.579771041870117, 14.065025329589844, 14.550278663635254, 15.03553295135498, 15.520787239074707, 16.006040573120117, 16.491294860839844, 16.97654914855957, 17.461801528930664, 17.94705581665039, 18.432310104370117, 18.917564392089844, 19.40281867980957, 19.888072967529297, 20.37332534790039, 20.858579635620117, 21.343833923339844, 21.82908821105957, 22.314342498779297, 22.79959487915039]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 10.0, 5.0, 15.0, 22.0, 24.0, 45.0, 42.0, 51.0, 66.0, 97.0, 92.0, 104.0, 88.0, 73.0, 55.0, 37.0, 40.0, 42.0, 18.0, 13.0, 13.0, 11.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.028036117553711, -8.798752784729004, -8.569469451904297, -8.340187072753906, -8.1109037399292, -7.881620407104492, -7.652337074279785, -7.423053741455078, -7.193770885467529, -6.964487552642822, -6.735204696655273, -6.505921363830566, -6.276638031005859, -6.0473551750183105, -5.8180718421936035, -5.588788986206055, -5.359505653381348, -5.130222320556641, -4.900939464569092, -4.671656131744385, -4.442373275756836, -4.213089942932129, -3.983806610107422, -3.754523515701294, -3.525240421295166, -3.295957326889038, -3.06667423248291, -2.837390899658203, -2.608107805252075, -2.3788247108459473, -2.1495413780212402, -1.9202582836151123, -1.6909751892089844, -1.4616920948028564, -1.232408881187439, -1.0031256675720215, -0.7738425731658936, -0.5445594787597656, -0.31527626514434814, -0.08599305152893066, 0.14329004287719727, 0.37257319688796997, 0.6018563508987427, 0.8311395049095154, 1.060422658920288, 1.289705753326416, 1.5189889669418335, 1.748272180557251, 1.977555274963379, 2.206838369369507, 2.4361214637756348, 2.665404796600342, 2.8946878910064697, 3.1239709854125977, 3.3532543182373047, 3.5825374126434326, 3.8118205070495605, 4.041103839874268, 4.270386695861816, 4.499670028686523, 4.7289533615112305, 4.958236217498779, 5.187519550323486, 5.416802406311035, 5.646085739135742]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 16.0, 6.0, 7.0, 16.0, 10.0, 25.0, 28.0, 38.0, 49.0, 67.0, 99.0, 157.0, 203.0, 374.0, 526.0, 906.0, 1576.0, 2948.0, 6116.0, 15065.0, 50596.0, 338610.0, 530530.0, 66784.0, 18633.0, 7066.0, 3449.0, 1780.0, 1045.0, 683.0, 347.0, 251.0, 152.0, 104.0, 65.0, 48.0, 43.0, 30.0, 28.0, 17.0, 17.0, 16.0, 7.0, 7.0, 7.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.57861328125, -0.5621261596679688, -0.5456390380859375, -0.5291519165039062, -0.512664794921875, -0.49617767333984375, -0.4796905517578125, -0.46320343017578125, -0.44671630859375, -0.43022918701171875, -0.4137420654296875, -0.39725494384765625, -0.380767822265625, -0.36428070068359375, -0.3477935791015625, -0.33130645751953125, -0.3148193359375, -0.29833221435546875, -0.2818450927734375, -0.26535797119140625, -0.248870849609375, -0.23238372802734375, -0.2158966064453125, -0.19940948486328125, -0.18292236328125, -0.16643524169921875, -0.1499481201171875, -0.13346099853515625, -0.116973876953125, -0.10048675537109375, -0.0839996337890625, -0.06751251220703125, -0.051025390625, -0.03453826904296875, -0.0180511474609375, -0.00156402587890625, 0.014923095703125, 0.03141021728515625, 0.0478973388671875, 0.06438446044921875, 0.08087158203125, 0.09735870361328125, 0.1138458251953125, 0.13033294677734375, 0.146820068359375, 0.16330718994140625, 0.1797943115234375, 0.19628143310546875, 0.2127685546875, 0.22925567626953125, 0.2457427978515625, 0.26222991943359375, 0.278717041015625, 0.29520416259765625, 0.3116912841796875, 0.32817840576171875, 0.34466552734375, 0.36115264892578125, 0.3776397705078125, 0.39412689208984375, 0.410614013671875, 0.42710113525390625, 0.4435882568359375, 0.46007537841796875, 0.4765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 10.0, 9.0, 21.0, 21.0, 29.0, 25.0, 40.0, 42.0, 76.0, 85.0, 93.0, 82.0, 83.0, 71.0, 67.0, 49.0, 48.0, 40.0, 27.0, 20.0, 12.0, 16.0, 5.0, 2.0, 9.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.467041015625, -0.45343017578125, -0.4398193359375, -0.42620849609375, -0.41259765625, -0.39898681640625, -0.3853759765625, -0.37176513671875, -0.358154296875, -0.34454345703125, -0.3309326171875, -0.31732177734375, -0.3037109375, -0.29010009765625, -0.2764892578125, -0.26287841796875, -0.249267578125, -0.23565673828125, -0.2220458984375, -0.20843505859375, -0.19482421875, -0.18121337890625, -0.1676025390625, -0.15399169921875, -0.140380859375, -0.12677001953125, -0.1131591796875, -0.09954833984375, -0.0859375, -0.07232666015625, -0.0587158203125, -0.04510498046875, -0.031494140625, -0.01788330078125, -0.0042724609375, 0.00933837890625, 0.02294921875, 0.03656005859375, 0.0501708984375, 0.06378173828125, 0.077392578125, 0.09100341796875, 0.1046142578125, 0.11822509765625, 0.1318359375, 0.14544677734375, 0.1590576171875, 0.17266845703125, 0.186279296875, 0.19989013671875, 0.2135009765625, 0.22711181640625, 0.24072265625, 0.25433349609375, 0.2679443359375, 0.28155517578125, 0.295166015625, 0.30877685546875, 0.3223876953125, 0.33599853515625, 0.349609375, 0.36322021484375, 0.3768310546875, 0.39044189453125, 0.404052734375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 2.0, 7.0, 9.0, 3.0, 7.0, 17.0, 12.0, 18.0, 22.0, 52.0, 62.0, 67.0, 95.0, 146.0, 220.0, 347.0, 645.0, 1191.0, 2722.0, 8610.0, 50376.0, 878701.0, 86589.0, 11945.0, 3489.0, 1403.0, 704.0, 378.0, 237.0, 139.0, 102.0, 67.0, 37.0, 32.0, 38.0, 22.0, 13.0, 13.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6508712768554688, -0.6288909912109375, -0.6069107055664062, -0.584930419921875, -0.5629501342773438, -0.5409698486328125, -0.5189895629882812, -0.49700927734375, -0.47502899169921875, -0.4530487060546875, -0.43106842041015625, -0.409088134765625, -0.38710784912109375, -0.3651275634765625, -0.34314727783203125, -0.3211669921875, -0.29918670654296875, -0.2772064208984375, -0.25522613525390625, -0.233245849609375, -0.21126556396484375, -0.1892852783203125, -0.16730499267578125, -0.14532470703125, -0.12334442138671875, -0.1013641357421875, -0.07938385009765625, -0.057403564453125, -0.03542327880859375, -0.0134429931640625, 0.00853729248046875, 0.030517578125, 0.05249786376953125, 0.0744781494140625, 0.09645843505859375, 0.118438720703125, 0.14041900634765625, 0.1623992919921875, 0.18437957763671875, 0.20635986328125, 0.22834014892578125, 0.2503204345703125, 0.27230072021484375, 0.294281005859375, 0.31626129150390625, 0.3382415771484375, 0.36022186279296875, 0.3822021484375, 0.40418243408203125, 0.4261627197265625, 0.44814300537109375, 0.470123291015625, 0.49210357666015625, 0.5140838623046875, 0.5360641479492188, 0.55804443359375, 0.5800247192382812, 0.6020050048828125, 0.6239852905273438, 0.645965576171875, 0.6679458618164062, 0.6899261474609375, 0.7119064331054688, 0.73388671875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 1.0, 10.0, 11.0, 9.0, 10.0, 12.0, 11.0, 29.0, 24.0, 38.0, 52.0, 52.0, 73.0, 67.0, 75.0, 66.0, 56.0, 63.0, 63.0, 64.0, 45.0, 33.0, 25.0, 24.0, 18.0, 13.0, 8.0, 10.0, 11.0, 4.0, 8.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4765625, -1.427978515625, -1.37939453125, -1.330810546875, -1.2822265625, -1.233642578125, -1.18505859375, -1.136474609375, -1.087890625, -1.039306640625, -0.99072265625, -0.942138671875, -0.8935546875, -0.844970703125, -0.79638671875, -0.747802734375, -0.69921875, -0.650634765625, -0.60205078125, -0.553466796875, -0.5048828125, -0.456298828125, -0.40771484375, -0.359130859375, -0.310546875, -0.261962890625, -0.21337890625, -0.164794921875, -0.1162109375, -0.067626953125, -0.01904296875, 0.029541015625, 0.078125, 0.126708984375, 0.17529296875, 0.223876953125, 0.2724609375, 0.321044921875, 0.36962890625, 0.418212890625, 0.466796875, 0.515380859375, 0.56396484375, 0.612548828125, 0.6611328125, 0.709716796875, 0.75830078125, 0.806884765625, 0.85546875, 0.904052734375, 0.95263671875, 1.001220703125, 1.0498046875, 1.098388671875, 1.14697265625, 1.195556640625, 1.244140625, 1.292724609375, 1.34130859375, 1.389892578125, 1.4384765625, 1.487060546875, 1.53564453125, 1.584228515625, 1.6328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 2.0, 6.0, 7.0, 12.0, 18.0, 12.0, 19.0, 17.0, 36.0, 40.0, 64.0, 103.0, 152.0, 256.0, 519.0, 1125.0, 2740.0, 11680.0, 942576.0, 79702.0, 5801.0, 1829.0, 798.0, 391.0, 195.0, 137.0, 81.0, 39.0, 38.0, 30.0, 23.0, 23.0, 16.0, 13.0, 10.0, 8.0, 8.0, 8.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.32373046875, -0.3135528564453125, -0.303375244140625, -0.2931976318359375, -0.28302001953125, -0.2728424072265625, -0.262664794921875, -0.2524871826171875, -0.2423095703125, -0.2321319580078125, -0.221954345703125, -0.2117767333984375, -0.20159912109375, -0.1914215087890625, -0.181243896484375, -0.1710662841796875, -0.160888671875, -0.1507110595703125, -0.140533447265625, -0.1303558349609375, -0.12017822265625, -0.1100006103515625, -0.099822998046875, -0.0896453857421875, -0.0794677734375, -0.0692901611328125, -0.059112548828125, -0.0489349365234375, -0.03875732421875, -0.0285797119140625, -0.018402099609375, -0.0082244873046875, 0.001953125, 0.0121307373046875, 0.022308349609375, 0.0324859619140625, 0.04266357421875, 0.0528411865234375, 0.063018798828125, 0.0731964111328125, 0.0833740234375, 0.0935516357421875, 0.103729248046875, 0.1139068603515625, 0.12408447265625, 0.1342620849609375, 0.144439697265625, 0.1546173095703125, 0.164794921875, 0.1749725341796875, 0.185150146484375, 0.1953277587890625, 0.20550537109375, 0.2156829833984375, 0.225860595703125, 0.2360382080078125, 0.2462158203125, 0.2563934326171875, 0.266571044921875, 0.2767486572265625, 0.28692626953125, 0.2971038818359375, 0.307281494140625, 0.3174591064453125, 0.32763671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 14.0, 17.0, 19.0, 39.0, 71.0, 166.0, 308.0, 169.0, 79.0, 41.0, 14.0, 19.0, 7.0, 3.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18832015991211e-05, -6.980262696743011e-05, -6.772205233573914e-05, -6.564147770404816e-05, -6.356090307235718e-05, -6.14803284406662e-05, -5.939975380897522e-05, -5.731917917728424e-05, -5.523860454559326e-05, -5.315802991390228e-05, -5.1077455282211304e-05, -4.8996880650520325e-05, -4.6916306018829346e-05, -4.483573138713837e-05, -4.275515675544739e-05, -4.067458212375641e-05, -3.859400749206543e-05, -3.651343286037445e-05, -3.443285822868347e-05, -3.235228359699249e-05, -3.0271708965301514e-05, -2.8191134333610535e-05, -2.6110559701919556e-05, -2.4029985070228577e-05, -2.1949410438537598e-05, -1.986883580684662e-05, -1.778826117515564e-05, -1.570768654346466e-05, -1.3627111911773682e-05, -1.1546537280082703e-05, -9.465962648391724e-06, -7.385388016700745e-06, -5.304813385009766e-06, -3.2242387533187866e-06, -1.1436641216278076e-06, 9.369105100631714e-07, 3.0174851417541504e-06, 5.098059773445129e-06, 7.178634405136108e-06, 9.259209036827087e-06, 1.1339783668518066e-05, 1.3420358300209045e-05, 1.5500932931900024e-05, 1.7581507563591003e-05, 1.9662082195281982e-05, 2.174265682697296e-05, 2.382323145866394e-05, 2.590380609035492e-05, 2.79843807220459e-05, 3.0064955353736877e-05, 3.2145529985427856e-05, 3.4226104617118835e-05, 3.6306679248809814e-05, 3.8387253880500793e-05, 4.046782851219177e-05, 4.254840314388275e-05, 4.462897777557373e-05, 4.670955240726471e-05, 4.879012703895569e-05, 5.087070167064667e-05, 5.2951276302337646e-05, 5.5031850934028625e-05, 5.7112425565719604e-05, 5.9193000197410583e-05, 6.127357482910156e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 9.0, 5.0, 10.0, 11.0, 19.0, 25.0, 32.0, 37.0, 51.0, 69.0, 93.0, 136.0, 245.0, 480.0, 1057.0, 2585.0, 8694.0, 71016.0, 924134.0, 30394.0, 5690.0, 1832.0, 834.0, 378.0, 222.0, 128.0, 84.0, 67.0, 41.0, 41.0, 21.0, 21.0, 12.0, 13.0, 23.0, 11.0, 5.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08978271484375, -0.08623981475830078, -0.08269691467285156, -0.07915401458740234, -0.07561111450195312, -0.0720682144165039, -0.06852531433105469, -0.06498241424560547, -0.06143951416015625, -0.05789661407470703, -0.05435371398925781, -0.050810813903808594, -0.047267913818359375, -0.043725013732910156, -0.04018211364746094, -0.03663921356201172, -0.0330963134765625, -0.02955341339111328, -0.026010513305664062, -0.022467613220214844, -0.018924713134765625, -0.015381813049316406, -0.011838912963867188, -0.008296012878417969, -0.00475311279296875, -0.0012102127075195312, 0.0023326873779296875, 0.005875587463378906, 0.009418487548828125, 0.012961387634277344, 0.016504287719726562, 0.02004718780517578, 0.023590087890625, 0.02713298797607422, 0.030675888061523438, 0.034218788146972656, 0.037761688232421875, 0.041304588317871094, 0.04484748840332031, 0.04839038848876953, 0.05193328857421875, 0.05547618865966797, 0.05901908874511719, 0.0625619888305664, 0.06610488891601562, 0.06964778900146484, 0.07319068908691406, 0.07673358917236328, 0.0802764892578125, 0.08381938934326172, 0.08736228942871094, 0.09090518951416016, 0.09444808959960938, 0.0979909896850586, 0.10153388977050781, 0.10507678985595703, 0.10861968994140625, 0.11216259002685547, 0.11570549011230469, 0.1192483901977539, 0.12279129028320312, 0.12633419036865234, 0.12987709045410156, 0.13341999053955078, 0.136962890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 12.0, 10.0, 14.0, 31.0, 52.0, 66.0, 142.0, 207.0, 178.0, 96.0, 55.0, 38.0, 25.0, 12.0, 12.0, 8.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2052001953125, -0.1969127655029297, -0.18862533569335938, -0.18033790588378906, -0.17205047607421875, -0.16376304626464844, -0.15547561645507812, -0.1471881866455078, -0.1389007568359375, -0.1306133270263672, -0.12232589721679688, -0.11403846740722656, -0.10575103759765625, -0.09746360778808594, -0.08917617797851562, -0.08088874816894531, -0.072601318359375, -0.06431388854980469, -0.056026458740234375, -0.04773902893066406, -0.03945159912109375, -0.031164169311523438, -0.022876739501953125, -0.014589309692382812, -0.0063018798828125, 0.0019855499267578125, 0.010272979736328125, 0.018560409545898438, 0.02684783935546875, 0.03513526916503906, 0.043422698974609375, 0.05171012878417969, 0.05999755859375, 0.06828498840332031, 0.07657241821289062, 0.08485984802246094, 0.09314727783203125, 0.10143470764160156, 0.10972213745117188, 0.11800956726074219, 0.1262969970703125, 0.1345844268798828, 0.14287185668945312, 0.15115928649902344, 0.15944671630859375, 0.16773414611816406, 0.17602157592773438, 0.1843090057373047, 0.192596435546875, 0.2008838653564453, 0.20917129516601562, 0.21745872497558594, 0.22574615478515625, 0.23403358459472656, 0.24232101440429688, 0.2506084442138672, 0.2588958740234375, 0.2671833038330078, 0.2754707336425781, 0.28375816345214844, 0.29204559326171875, 0.30033302307128906, 0.3086204528808594, 0.3169078826904297, 0.3251953125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 14.0, 13.0, 71.0, 309.0, 393.0, 110.0, 45.0, 22.0, 14.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.451303482055664, -6.073531150817871, -5.69575834274292, -5.317986011505127, -4.940213203430176, -4.562440872192383, -4.18466854095459, -3.8068959712982178, -3.4291234016418457, -3.0513508319854736, -2.6735782623291016, -2.2958059310913086, -1.9180333614349365, -1.5402607917785645, -1.1624884605407715, -0.7847158908843994, -0.40694332122802734, -0.02917081117630005, 0.34860169887542725, 0.7263741493225098, 1.1041467189788818, 1.481919288635254, 1.8596916198730469, 2.237464189529419, 2.615236759185791, 2.993009328842163, 3.370781898498535, 3.748554229736328, 4.126326560974121, 4.504099369049072, 4.881871700286865, 5.259644508361816, 5.637416839599609, 6.015189170837402, 6.3929619789123535, 6.7707343101501465, 7.148507118225098, 7.526279449462891, 7.904051780700684, 8.281824111938477, 8.659597396850586, 9.037369728088379, 9.415142059326172, 9.792915344238281, 10.170687675476074, 10.548460006713867, 10.92623233795166, 11.304004669189453, 11.681777000427246, 12.059549331665039, 12.437321662902832, 12.815093994140625, 13.192867279052734, 13.570639610290527, 13.94841194152832, 14.326184272766113, 14.703956604003906, 15.0817289352417, 15.459501266479492, 15.837274551391602, 16.215045928955078, 16.592819213867188, 16.970592498779297, 17.348363876342773, 17.726137161254883]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 4.0, 7.0, 2.0, 13.0, 13.0, 13.0, 14.0, 26.0, 23.0, 39.0, 124.0, 93.0, 51.0, 43.0, 39.0, 48.0, 64.0, 140.0, 81.0, 21.0, 18.0, 29.0, 16.0, 14.0, 9.0, 12.0, 11.0, 4.0, 5.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.614171981811523, -5.440032958984375, -5.265893936157227, -5.091754913330078, -4.91761589050293, -4.743476867675781, -4.569337844848633, -4.395198822021484, -4.221059799194336, -4.0469207763671875, -3.872781753540039, -3.6986427307128906, -3.524503707885742, -3.3503646850585938, -3.176225423812866, -3.0020864009857178, -2.8279471397399902, -2.653808116912842, -2.4796690940856934, -2.305530071258545, -2.1313910484313965, -1.9572519063949585, -1.7831127643585205, -1.608973741531372, -1.4348347187042236, -1.2606956958770752, -1.0865566730499268, -0.9124175310134888, -0.7382785081863403, -0.5641394853591919, -0.3900003433227539, -0.21586132049560547, -0.04172229766845703, 0.1324167549610138, 0.3065558075904846, 0.48069489002227783, 0.6548339128494263, 0.8289729356765747, 1.0031120777130127, 1.1772511005401611, 1.3513901233673096, 1.525529146194458, 1.6996681690216064, 1.8738073110580444, 2.0479464530944824, 2.222085475921631, 2.3962244987487793, 2.5703635215759277, 2.744502544403076, 2.9186415672302246, 3.092780590057373, 3.2669196128845215, 3.44105863571167, 3.6151976585388184, 3.789336919784546, 3.9634759426116943, 4.137615203857422, 4.31175422668457, 4.485893249511719, 4.660032272338867, 4.834171295166016, 5.008310317993164, 5.1824493408203125, 5.356588363647461, 5.530727386474609]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 9.0, 5.0, 4.0, 15.0, 13.0, 18.0, 20.0, 15.0, 30.0, 29.0, 36.0, 52.0, 92.0, 286.0, 112.0, 52.0, 33.0, 25.0, 20.0, 16.0, 23.0, 16.0, 12.0, 11.0, 7.0, 6.0, 11.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2939453125, -0.2852058410644531, -0.27646636962890625, -0.2677268981933594, -0.2589874267578125, -0.2502479553222656, -0.24150848388671875, -0.23276901245117188, -0.224029541015625, -0.21529006958007812, -0.20655059814453125, -0.19781112670898438, -0.1890716552734375, -0.18033218383789062, -0.17159271240234375, -0.16285324096679688, -0.15411376953125, -0.14537429809570312, -0.13663482666015625, -0.12789535522460938, -0.1191558837890625, -0.11041641235351562, -0.10167694091796875, -0.09293746948242188, -0.084197998046875, -0.07545852661132812, -0.06671905517578125, -0.057979583740234375, -0.0492401123046875, -0.040500640869140625, -0.03176116943359375, -0.023021697998046875, -0.0142822265625, -0.005542755126953125, 0.00319671630859375, 0.011936187744140625, 0.0206756591796875, 0.029415130615234375, 0.03815460205078125, 0.046894073486328125, 0.055633544921875, 0.06437301635742188, 0.07311248779296875, 0.08185195922851562, 0.0905914306640625, 0.09933090209960938, 0.10807037353515625, 0.11680984497070312, 0.12554931640625, 0.13428878784179688, 0.14302825927734375, 0.15176773071289062, 0.1605072021484375, 0.16924667358398438, 0.17798614501953125, 0.18672561645507812, 0.195465087890625, 0.20420455932617188, 0.21294403076171875, 0.22168350219726562, 0.2304229736328125, 0.23916244506835938, 0.24790191650390625, 0.2566413879394531, 0.265380859375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 11.0, 22.0, 10.0, 9.0, 7.0, 36.0, 56.0, 63.0, 203.0, 646.0, 3704.0, 8365542.0, 16170.0, 1385.0, 306.0, 144.0, 93.0, 49.0, 25.0, 10.0, 12.0, 22.0, 5.0, 8.0, 2.0, 0.0, 9.0, 6.0, 1.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0], "bins": [-3.158407211303711, -3.067457675933838, -2.976508140563965, -2.8855583667755127, -2.7946088314056396, -2.7036592960357666, -2.6127095222473145, -2.5217599868774414, -2.4308104515075684, -2.3398609161376953, -2.2489113807678223, -2.15796160697937, -2.067012071609497, -1.976062536239624, -1.8851128816604614, -1.7941632270812988, -1.7032136917114258, -1.6122641563415527, -1.5213145017623901, -1.4303648471832275, -1.3394153118133545, -1.2484657764434814, -1.1575161218643188, -1.0665664672851562, -0.9756169319152832, -0.8846673369407654, -0.7937177419662476, -0.7027681469917297, -0.6118185520172119, -0.5208689570426941, -0.42991936206817627, -0.33896976709365845, -0.24802041053771973, -0.1570708155632019, -0.06612122058868408, 0.02482837438583374, 0.11577796936035156, 0.20672756433486938, 0.2976771593093872, 0.38862675428390503, 0.47957634925842285, 0.5705259442329407, 0.6614755392074585, 0.7524251341819763, 0.8433747291564941, 0.934324324131012, 1.0252739191055298, 1.1162235736846924, 1.2071731090545654, 1.2981226444244385, 1.389072299003601, 1.4800219535827637, 1.5709714889526367, 1.6619210243225098, 1.7528706789016724, 1.843820333480835, 1.934769868850708, 2.025719404220581, 2.116669178009033, 2.2076187133789062, 2.2985682487487793, 2.3895177841186523, 2.4804673194885254, 2.5714170932769775, 2.6623666286468506]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 7.0, 8.0, 4.0, 3.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3165010213851929, -1.2922567129135132, -1.2680124044418335, -1.2437680959701538, -1.2195237874984741, -1.1952793598175049, -1.1710350513458252, -1.1467907428741455, -1.1225464344024658, -1.0983021259307861, -1.0740578174591064, -1.0498135089874268, -1.025569200515747, -1.0013248920440674, -0.9770805239677429, -0.9528362154960632, -0.9285919070243835, -0.9043475985527039, -0.8801032900810242, -0.8558589220046997, -0.83161461353302, -0.8073703050613403, -0.7831259965896606, -0.758881688117981, -0.7346373796463013, -0.7103930711746216, -0.6861487627029419, -0.6619044542312622, -0.6376600861549377, -0.6134157776832581, -0.5891714692115784, -0.5649271607398987, -0.5406827926635742, -0.5164384841918945, -0.49219414591789246, -0.46794983744621277, -0.4437054991722107, -0.419461190700531, -0.3952168822288513, -0.37097257375717163, -0.34672826528549194, -0.32248395681381226, -0.2982396185398102, -0.2739953100681305, -0.2497509866952896, -0.22550666332244873, -0.20126235485076904, -0.17701803147792816, -0.1527736932039261, -0.1285293698310852, -0.10428505390882492, -0.08004073798656464, -0.055796414613723755, -0.031552091240882874, -0.007307782769203186, 0.016936540603637695, 0.04118086397647858, 0.06542518734931946, 0.08966950327157974, 0.11391381919384003, 0.1381581425666809, 0.1624024659395218, 0.18664677441120148, 0.21089109778404236, 0.23513542115688324]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 11.0, 14.0, 20.0, 25.0, 53.0, 92.0, 128.0, 234.0, 592.0, 1324.0, 4448.0, 17484.0, 107062.0, 315499.0, 61507.0, 11062.0, 2893.0, 957.0, 395.0, 176.0, 95.0, 63.0, 31.0, 28.0, 11.0, 7.0, 9.0, 7.0, 8.0, 4.0, 2.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.017578125, -1.9635772705078125, -1.909576416015625, -1.8555755615234375, -1.80157470703125, -1.7475738525390625, -1.693572998046875, -1.6395721435546875, -1.5855712890625, -1.5315704345703125, -1.477569580078125, -1.4235687255859375, -1.36956787109375, -1.3155670166015625, -1.261566162109375, -1.2075653076171875, -1.153564453125, -1.0995635986328125, -1.045562744140625, -0.9915618896484375, -0.93756103515625, -0.8835601806640625, -0.829559326171875, -0.7755584716796875, -0.7215576171875, -0.6675567626953125, -0.613555908203125, -0.5595550537109375, -0.50555419921875, -0.4515533447265625, -0.397552490234375, -0.3435516357421875, -0.28955078125, -0.2355499267578125, -0.181549072265625, -0.1275482177734375, -0.07354736328125, -0.0195465087890625, 0.034454345703125, 0.0884552001953125, 0.1424560546875, 0.1964569091796875, 0.250457763671875, 0.3044586181640625, 0.35845947265625, 0.4124603271484375, 0.466461181640625, 0.5204620361328125, 0.574462890625, 0.6284637451171875, 0.682464599609375, 0.7364654541015625, 0.79046630859375, 0.8444671630859375, 0.898468017578125, 0.9524688720703125, 1.0064697265625, 1.0604705810546875, 1.114471435546875, 1.1684722900390625, 1.22247314453125, 1.2764739990234375, 1.330474853515625, 1.3844757080078125, 1.4384765625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 7.0, 8.0, 9.0, 6.0, 17.0, 10.0, 17.0, 24.0, 24.0, 29.0, 34.0, 51.0, 79.0, 62.0, 80.0, 69.0, 68.0, 62.0, 58.0, 54.0, 58.0, 31.0, 22.0, 34.0, 20.0, 17.0, 11.0, 8.0, 11.0, 1.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.384521484375, -0.3737335205078125, -0.362945556640625, -0.3521575927734375, -0.34136962890625, -0.3305816650390625, -0.319793701171875, -0.3090057373046875, -0.2982177734375, -0.2874298095703125, -0.276641845703125, -0.2658538818359375, -0.25506591796875, -0.2442779541015625, -0.233489990234375, -0.2227020263671875, -0.2119140625, -0.2011260986328125, -0.190338134765625, -0.1795501708984375, -0.16876220703125, -0.1579742431640625, -0.147186279296875, -0.1363983154296875, -0.1256103515625, -0.1148223876953125, -0.104034423828125, -0.0932464599609375, -0.08245849609375, -0.0716705322265625, -0.060882568359375, -0.0500946044921875, -0.039306640625, -0.0285186767578125, -0.017730712890625, -0.0069427490234375, 0.00384521484375, 0.0146331787109375, 0.025421142578125, 0.0362091064453125, 0.0469970703125, 0.0577850341796875, 0.068572998046875, 0.0793609619140625, 0.09014892578125, 0.1009368896484375, 0.111724853515625, 0.1225128173828125, 0.13330078125, 0.1440887451171875, 0.154876708984375, 0.1656646728515625, 0.17645263671875, 0.1872406005859375, 0.198028564453125, 0.2088165283203125, 0.2196044921875, 0.2303924560546875, 0.241180419921875, 0.2519683837890625, 0.26275634765625, 0.2735443115234375, 0.284332275390625, 0.2951202392578125, 0.305908203125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 5.0, 13.0, 14.0, 22.0, 52.0, 247.0, 118.0, 11.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1787147521972656, -3.008788585662842, -2.838862180709839, -2.668936014175415, -2.499009609222412, -2.3290834426879883, -2.1591572761535645, -1.989230990409851, -1.8193047046661377, -1.6493784189224243, -1.479452133178711, -1.309525966644287, -1.1395996809005737, -0.9696733951568604, -0.7997472286224365, -0.6298209428787231, -0.45989465713500977, -0.2899684011936188, -0.12004214525222778, 0.04988408088684082, 0.2198103666305542, 0.3897366523742676, 0.5596628189086914, 0.7295891046524048, 0.8995153903961182, 1.0694416761398315, 1.239367961883545, 1.4092941284179688, 1.5792204141616821, 1.7491466999053955, 1.9190728664398193, 2.0889992713928223, 2.258925437927246, 2.42885160446167, 2.598778009414673, 2.7687041759490967, 2.9386305809020996, 3.1085567474365234, 3.2784829139709473, 3.448409080505371, 3.618335485458374, 3.788261651992798, 3.958188056945801, 4.128114223480225, 4.298040390014648, 4.4679670333862305, 4.637892723083496, 4.807819366455078, 4.977745532989502, 5.147671699523926, 5.31759786605835, 5.487524032592773, 5.6574506759643555, 5.827376842498779, 5.997303009033203, 6.167229175567627, 6.337155342102051, 6.507081508636475, 6.677007675170898, 6.8469343185424805, 7.016860485076904, 7.186786651611328, 7.356712818145752, 7.526638984680176, 7.696565628051758]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 5.0, 5.0, 4.0, 11.0, 7.0, 29.0, 58.0, 83.0, 109.0, 70.0, 37.0, 15.0, 11.0, 4.0, 7.0, 6.0, 3.0, 4.0, 2.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.472254753112793, -2.3982508182525635, -2.324246644973755, -2.2502427101135254, -2.176238775253296, -2.1022348403930664, -2.028230667114258, -1.9542267322540283, -1.8802226781845093, -1.8062186241149902, -1.7322146892547607, -1.6582106351852417, -1.5842065811157227, -1.5102026462554932, -1.4361985921859741, -1.362194538116455, -1.2881906032562256, -1.2141865491867065, -1.140182614326477, -1.066178560256958, -0.9921745657920837, -0.9181705713272095, -0.8441665172576904, -0.7701625227928162, -0.6961585283279419, -0.6221545338630676, -0.5481505393981934, -0.4741464853286743, -0.40014249086380005, -0.3261384963989258, -0.2521344721317291, -0.17813044786453247, -0.1041264533996582, -0.03012244403362274, 0.04388156533241272, 0.11788557469844818, 0.19188958406448364, 0.2658935785293579, 0.33989760279655457, 0.4139016270637512, 0.4879056215286255, 0.5619096159934998, 0.635913610458374, 0.7099176645278931, 0.7839216589927673, 0.8579256534576416, 0.9319297075271606, 1.0059337615966797, 1.0799376964569092, 1.1539417505264282, 1.2279456853866577, 1.3019497394561768, 1.3759536743164062, 1.4499577283859253, 1.5239617824554443, 1.5979657173156738, 1.6719697713851929, 1.745973825454712, 1.8199777603149414, 1.8939818143844604, 1.9679858684539795, 2.041989803314209, 2.1159937381744385, 2.189997911453247, 2.2640018463134766]}, "eval/loss": 4.591245651245117, "eval/wer": 1.96449821499405, "eval/runtime": 931.3082, "eval/samples_per_second": 2.837, "eval/steps_per_second": 0.355} \ No newline at end of file