diff --git "a/wandb/run-20220302_085255-16llzpbl/files/wandb-summary.json" "b/wandb/run-20220302_085255-16llzpbl/files/wandb-summary.json" --- "a/wandb/run-20220302_085255-16llzpbl/files/wandb-summary.json" +++ "b/wandb/run-20220302_085255-16llzpbl/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.584, "train/learning_rate": 6.728971962616821e-05, "train/epoch": 0.84, "train/global_step": 1500, "_runtime": 7602, "_timestamp": 1646218777, "_step": 1502, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1000.0, 17.0], "bins": [-1409.9154052734375, -1387.4149169921875, -1364.9144287109375, -1342.4139404296875, -1319.913330078125, -1297.412841796875, -1274.912353515625, -1252.411865234375, -1229.911376953125, -1207.410888671875, -1184.910400390625, -1162.409912109375, -1139.9093017578125, -1117.4088134765625, -1094.9083251953125, -1072.4078369140625, -1049.9073486328125, -1027.4068603515625, -1004.9063110351562, -982.4058227539062, -959.9053344726562, -937.4048461914062, -914.904296875, -892.40380859375, -869.9032592773438, -847.4027709960938, -824.9022216796875, -802.4017333984375, -779.9012451171875, -757.4007568359375, -734.9002075195312, -712.3997192382812, -689.8992309570312, -667.3987426757812, -644.898193359375, -622.397705078125, -599.897216796875, -577.396728515625, -554.8961791992188, -532.3956909179688, -509.8951721191406, -487.3946533203125, -464.8941650390625, -442.3936462402344, -419.8931579589844, -397.39263916015625, -374.89215087890625, -352.3916320800781, -329.8911437988281, -307.390625, -284.89013671875, -262.3896179199219, -239.88912963867188, -217.38861083984375, -194.8881072998047, -172.38760375976562, -149.8870849609375, -127.38658142089844, -104.88607788085938, -82.38556671142578, -59.88506317138672, -37.384559631347656, -14.884048461914062, 7.616455078125, 30.116952896118164]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 15.0, 10.0, 19.0, 30.0, 29.0, 47.0, 37.0, 49.0, 50.0, 55.0, 87.0, 83.0, 74.0, 69.0, 65.0, 61.0, 54.0, 50.0, 31.0, 25.0, 18.0, 14.0, 16.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.76513671875, -121.13980102539062, -117.51445770263672, -113.88911437988281, -110.26377868652344, -106.63844299316406, -103.01309967041016, -99.38775634765625, -95.76242065429688, -92.1370849609375, -88.5117416381836, -84.88639831542969, -81.26106262207031, -77.63572692871094, -74.01038360595703, -70.38504028320312, -66.75970458984375, -63.13436508178711, -59.50902557373047, -55.88368606567383, -52.25834655761719, -48.63300704956055, -45.007667541503906, -41.382328033447266, -37.756988525390625, -34.131649017333984, -30.506309509277344, -26.880970001220703, -23.255630493164062, -19.630290985107422, -16.00495147705078, -12.37961196899414, -8.7542724609375, -5.128932952880859, -1.5035934448242188, 2.121746063232422, 5.7470855712890625, 9.372425079345703, 12.997764587402344, 16.623104095458984, 20.248443603515625, 23.873783111572266, 27.499122619628906, 31.124462127685547, 34.74980163574219, 38.37514114379883, 42.00048065185547, 45.62582015991211, 49.25115966796875, 52.87649917602539, 56.50183868408203, 60.12717819213867, 63.75251770019531, 67.37785339355469, 71.0031967163086, 74.6285400390625, 78.25387573242188, 81.87921142578125, 85.50455474853516, 89.12989807128906, 92.75523376464844, 96.38056945800781, 100.00591278076172, 103.63125610351562, 107.256591796875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 5.0, 11.0, 15.0, 12.0, 24.0, 17.0, 25.0, 33.0, 23.0, 47.0, 32.0, 36.0, 45.0, 40.0, 38.0, 58.0, 47.0, 37.0, 46.0, 52.0, 37.0, 53.0, 36.0, 43.0, 29.0, 28.0, 28.0, 31.0, 17.0, 12.0, 10.0, 6.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.9755859375, -1.922882080078125, -1.87017822265625, -1.817474365234375, -1.7647705078125, -1.712066650390625, -1.65936279296875, -1.606658935546875, -1.553955078125, -1.501251220703125, -1.44854736328125, -1.395843505859375, -1.3431396484375, -1.290435791015625, -1.23773193359375, -1.185028076171875, -1.13232421875, -1.079620361328125, -1.02691650390625, -0.974212646484375, -0.9215087890625, -0.868804931640625, -0.81610107421875, -0.763397216796875, -0.710693359375, -0.657989501953125, -0.60528564453125, -0.552581787109375, -0.4998779296875, -0.447174072265625, -0.39447021484375, -0.341766357421875, -0.2890625, -0.236358642578125, -0.18365478515625, -0.130950927734375, -0.0782470703125, -0.025543212890625, 0.02716064453125, 0.079864501953125, 0.132568359375, 0.185272216796875, 0.23797607421875, 0.290679931640625, 0.3433837890625, 0.396087646484375, 0.44879150390625, 0.501495361328125, 0.55419921875, 0.606903076171875, 0.65960693359375, 0.712310791015625, 0.7650146484375, 0.817718505859375, 0.87042236328125, 0.923126220703125, 0.975830078125, 1.028533935546875, 1.08123779296875, 1.133941650390625, 1.1866455078125, 1.239349365234375, 1.29205322265625, 1.344757080078125, 1.3974609375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 15.0, 6.0, 18.0, 19.0, 23.0, 38.0, 45.0, 53.0, 104.0, 124.0, 154.0, 217.0, 303.0, 446.0, 682.0, 992.0, 1660.0, 3267.0, 8986.0, 41399.0, 661063.0, 3326052.0, 120138.0, 17255.0, 5100.0, 2287.0, 1224.0, 835.0, 525.0, 353.0, 208.0, 185.0, 137.0, 98.0, 64.0, 53.0, 41.0, 30.0, 20.0, 11.0, 16.0, 9.0, 6.0, 9.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0], "bins": [-12.109375, -11.7557373046875, -11.402099609375, -11.0484619140625, -10.69482421875, -10.3411865234375, -9.987548828125, -9.6339111328125, -9.2802734375, -8.9266357421875, -8.572998046875, -8.2193603515625, -7.86572265625, -7.5120849609375, -7.158447265625, -6.8048095703125, -6.451171875, -6.0975341796875, -5.743896484375, -5.3902587890625, -5.03662109375, -4.6829833984375, -4.329345703125, -3.9757080078125, -3.6220703125, -3.2684326171875, -2.914794921875, -2.5611572265625, -2.20751953125, -1.8538818359375, -1.500244140625, -1.1466064453125, -0.79296875, -0.4393310546875, -0.085693359375, 0.2679443359375, 0.62158203125, 0.9752197265625, 1.328857421875, 1.6824951171875, 2.0361328125, 2.3897705078125, 2.743408203125, 3.0970458984375, 3.45068359375, 3.8043212890625, 4.157958984375, 4.5115966796875, 4.865234375, 5.2188720703125, 5.572509765625, 5.9261474609375, 6.27978515625, 6.6334228515625, 6.987060546875, 7.3406982421875, 7.6943359375, 8.0479736328125, 8.401611328125, 8.7552490234375, 9.10888671875, 9.4625244140625, 9.816162109375, 10.1697998046875, 10.5234375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 8.0, 7.0, 9.0, 28.0, 58.0, 110.0, 190.0, 416.0, 830.0, 1144.0, 663.0, 311.0, 148.0, 81.0, 36.0, 19.0, 5.0, 7.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.6875, -17.2386474609375, -16.789794921875, -16.3409423828125, -15.89208984375, -15.4432373046875, -14.994384765625, -14.5455322265625, -14.0966796875, -13.6478271484375, -13.198974609375, -12.7501220703125, -12.30126953125, -11.8524169921875, -11.403564453125, -10.9547119140625, -10.505859375, -10.0570068359375, -9.608154296875, -9.1593017578125, -8.71044921875, -8.2615966796875, -7.812744140625, -7.3638916015625, -6.9150390625, -6.4661865234375, -6.017333984375, -5.5684814453125, -5.11962890625, -4.6707763671875, -4.221923828125, -3.7730712890625, -3.32421875, -2.8753662109375, -2.426513671875, -1.9776611328125, -1.52880859375, -1.0799560546875, -0.631103515625, -0.1822509765625, 0.2666015625, 0.7154541015625, 1.164306640625, 1.6131591796875, 2.06201171875, 2.5108642578125, 2.959716796875, 3.4085693359375, 3.857421875, 4.3062744140625, 4.755126953125, 5.2039794921875, 5.65283203125, 6.1016845703125, 6.550537109375, 6.9993896484375, 7.4482421875, 7.8970947265625, 8.345947265625, 8.7947998046875, 9.24365234375, 9.6925048828125, 10.141357421875, 10.5902099609375, 11.0390625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 12.0, 10.0, 19.0, 38.0, 91.0, 222.0, 511.0, 1534.0, 19336.0, 4134956.0, 34886.0, 1670.0, 553.0, 241.0, 97.0, 39.0, 35.0, 20.0, 8.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.8125, -37.40380859375, -35.9951171875, -34.58642578125, -33.177734375, -31.76904296875, -30.3603515625, -28.95166015625, -27.54296875, -26.13427734375, -24.7255859375, -23.31689453125, -21.908203125, -20.49951171875, -19.0908203125, -17.68212890625, -16.2734375, -14.86474609375, -13.4560546875, -12.04736328125, -10.638671875, -9.22998046875, -7.8212890625, -6.41259765625, -5.00390625, -3.59521484375, -2.1865234375, -0.77783203125, 0.630859375, 2.03955078125, 3.4482421875, 4.85693359375, 6.265625, 7.67431640625, 9.0830078125, 10.49169921875, 11.900390625, 13.30908203125, 14.7177734375, 16.12646484375, 17.53515625, 18.94384765625, 20.3525390625, 21.76123046875, 23.169921875, 24.57861328125, 25.9873046875, 27.39599609375, 28.8046875, 30.21337890625, 31.6220703125, 33.03076171875, 34.439453125, 35.84814453125, 37.2568359375, 38.66552734375, 40.07421875, 41.48291015625, 42.8916015625, 44.30029296875, 45.708984375, 47.11767578125, 48.5263671875, 49.93505859375, 51.34375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 197.0, 790.0, 29.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.370916366577148, -8.736455917358398, -2.101996421813965, 4.532463073730469, 11.166923522949219, 17.801382064819336, 24.435842514038086, 31.070302963256836, 37.70476531982422, 44.33922576904297, 50.97368621826172, 57.60814666748047, 64.24260711669922, 70.87705993652344, 77.51152038574219, 84.14598083496094, 90.78044128417969, 97.41490173339844, 104.04936218261719, 110.68382263183594, 117.31828308105469, 123.95274353027344, 130.5872039794922, 137.22166442871094, 143.8561248779297, 150.49058532714844, 157.1250457763672, 163.75950622558594, 170.3939666748047, 177.02842712402344, 183.6628875732422, 190.29734802246094, 196.9318084716797, 203.56626892089844, 210.2007293701172, 216.83518981933594, 223.4696502685547, 230.10411071777344, 236.7385711669922, 243.37303161621094, 250.0074920654297, 256.6419372558594, 263.2763977050781, 269.9108581542969, 276.5453186035156, 283.1797790527344, 289.8142395019531, 296.4486999511719, 303.0831604003906, 309.7176208496094, 316.3520812988281, 322.9865417480469, 329.6210021972656, 336.2554626464844, 342.8899230957031, 349.5243835449219, 356.1588439941406, 362.7933044433594, 369.4277648925781, 376.0622253417969, 382.6966857910156, 389.3311462402344, 395.9656066894531, 402.6000671386719, 409.2345275878906]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 10.0, 2.0, 7.0, 10.0, 14.0, 14.0, 27.0, 20.0, 20.0, 30.0, 43.0, 42.0, 36.0, 49.0, 45.0, 48.0, 55.0, 51.0, 49.0, 49.0, 42.0, 52.0, 33.0, 41.0, 36.0, 47.0, 24.0, 22.0, 17.0, 18.0, 11.0, 9.0, 8.0, 9.0, 2.0, 10.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.17803192138672, -26.27369499206543, -25.369359970092773, -24.465023040771484, -23.560688018798828, -22.65635108947754, -21.75201416015625, -20.847679138183594, -19.943344116210938, -19.03900718688965, -18.134672164916992, -17.230335235595703, -16.326000213623047, -15.421663284301758, -14.517327308654785, -13.612991333007812, -12.708654403686523, -11.80431842803955, -10.899982452392578, -9.995645523071289, -9.091310501098633, -8.186973571777344, -7.282637596130371, -6.378301620483398, -5.473965644836426, -4.569629669189453, -3.6652934551239014, -2.7609572410583496, -1.856621265411377, -0.9522852897644043, -0.04794883728027344, 0.8563871383666992, 1.7607231140136719, 2.6650590896606445, 3.5693953037261963, 4.473731517791748, 5.378067493438721, 6.282403469085693, 7.186739921569824, 8.091075897216797, 8.99541187286377, 9.899747848510742, 10.804083824157715, 11.708419799804688, 12.612756729125977, 13.517091751098633, 14.421428680419922, 15.325764656066895, 16.230100631713867, 17.134437561035156, 18.038772583007812, 18.9431095123291, 19.847444534301758, 20.751781463623047, 21.656116485595703, 22.560453414916992, 23.46479034423828, 24.36912727355957, 25.273462295532227, 26.177799224853516, 27.082134246826172, 27.98647117614746, 28.89080810546875, 29.795143127441406, 30.699478149414062]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 9.0, 11.0, 14.0, 14.0, 13.0, 24.0, 26.0, 24.0, 34.0, 35.0, 44.0, 34.0, 42.0, 31.0, 34.0, 28.0, 34.0, 55.0, 38.0, 36.0, 47.0, 38.0, 41.0, 40.0, 38.0, 36.0, 26.0, 24.0, 32.0, 15.0, 11.0, 13.0, 14.0, 7.0, 10.0, 5.0, 3.0, 0.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.8076171875, -1.7589874267578125, -1.710357666015625, -1.6617279052734375, -1.61309814453125, -1.5644683837890625, -1.515838623046875, -1.4672088623046875, -1.4185791015625, -1.3699493408203125, -1.321319580078125, -1.2726898193359375, -1.22406005859375, -1.1754302978515625, -1.126800537109375, -1.0781707763671875, -1.029541015625, -0.9809112548828125, -0.932281494140625, -0.8836517333984375, -0.83502197265625, -0.7863922119140625, -0.737762451171875, -0.6891326904296875, -0.6405029296875, -0.5918731689453125, -0.543243408203125, -0.4946136474609375, -0.44598388671875, -0.3973541259765625, -0.348724365234375, -0.3000946044921875, -0.25146484375, -0.2028350830078125, -0.154205322265625, -0.1055755615234375, -0.05694580078125, -0.0083160400390625, 0.040313720703125, 0.0889434814453125, 0.1375732421875, 0.1862030029296875, 0.234832763671875, 0.2834625244140625, 0.33209228515625, 0.3807220458984375, 0.429351806640625, 0.4779815673828125, 0.526611328125, 0.5752410888671875, 0.623870849609375, 0.6725006103515625, 0.72113037109375, 0.7697601318359375, 0.818389892578125, 0.8670196533203125, 0.9156494140625, 0.9642791748046875, 1.012908935546875, 1.0615386962890625, 1.11016845703125, 1.1587982177734375, 1.207427978515625, 1.2560577392578125, 1.3046875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 10.0, 17.0, 17.0, 33.0, 30.0, 55.0, 82.0, 125.0, 207.0, 278.0, 413.0, 603.0, 873.0, 1294.0, 1961.0, 2715.0, 4184.0, 6164.0, 9389.0, 14220.0, 22004.0, 34557.0, 55488.0, 89530.0, 155683.0, 259905.0, 151144.0, 87082.0, 53687.0, 33501.0, 21383.0, 13792.0, 9272.0, 6024.0, 4199.0, 2757.0, 1856.0, 1318.0, 847.0, 577.0, 424.0, 268.0, 168.0, 155.0, 73.0, 58.0, 53.0, 29.0, 20.0, 14.0, 4.0, 10.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.05462646484375, -0.052890777587890625, -0.05115509033203125, -0.049419403076171875, -0.0476837158203125, -0.045948028564453125, -0.04421234130859375, -0.042476654052734375, -0.040740966796875, -0.039005279541015625, -0.03726959228515625, -0.035533905029296875, -0.0337982177734375, -0.032062530517578125, -0.03032684326171875, -0.028591156005859375, -0.02685546875, -0.025119781494140625, -0.02338409423828125, -0.021648406982421875, -0.0199127197265625, -0.018177032470703125, -0.01644134521484375, -0.014705657958984375, -0.012969970703125, -0.011234283447265625, -0.00949859619140625, -0.007762908935546875, -0.0060272216796875, -0.004291534423828125, -0.00255584716796875, -0.000820159912109375, 0.00091552734375, 0.002651214599609375, 0.00438690185546875, 0.006122589111328125, 0.0078582763671875, 0.009593963623046875, 0.01132965087890625, 0.013065338134765625, 0.014801025390625, 0.016536712646484375, 0.01827239990234375, 0.020008087158203125, 0.0217437744140625, 0.023479461669921875, 0.02521514892578125, 0.026950836181640625, 0.0286865234375, 0.030422210693359375, 0.03215789794921875, 0.033893585205078125, 0.0356292724609375, 0.037364959716796875, 0.03910064697265625, 0.040836334228515625, 0.042572021484375, 0.044307708740234375, 0.04604339599609375, 0.047779083251953125, 0.0495147705078125, 0.051250457763671875, 0.05298614501953125, 0.054721832275390625, 0.05645751953125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 15.0, 9.0, 13.0, 14.0, 22.0, 22.0, 24.0, 31.0, 33.0, 32.0, 39.0, 46.0, 45.0, 31.0, 37.0, 58.0, 1055.0, 46.0, 34.0, 64.0, 46.0, 47.0, 38.0, 38.0, 21.0, 25.0, 37.0, 16.0, 19.0, 9.0, 10.0, 9.0, 6.0, 8.0, 5.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.125, -1.08660888671875, -1.0482177734375, -1.00982666015625, -0.971435546875, -0.93304443359375, -0.8946533203125, -0.85626220703125, -0.81787109375, -0.77947998046875, -0.7410888671875, -0.70269775390625, -0.664306640625, -0.62591552734375, -0.5875244140625, -0.54913330078125, -0.5107421875, -0.47235107421875, -0.4339599609375, -0.39556884765625, -0.357177734375, -0.31878662109375, -0.2803955078125, -0.24200439453125, -0.20361328125, -0.16522216796875, -0.1268310546875, -0.08843994140625, -0.050048828125, -0.01165771484375, 0.0267333984375, 0.06512451171875, 0.103515625, 0.14190673828125, 0.1802978515625, 0.21868896484375, 0.257080078125, 0.29547119140625, 0.3338623046875, 0.37225341796875, 0.41064453125, 0.44903564453125, 0.4874267578125, 0.52581787109375, 0.564208984375, 0.60260009765625, 0.6409912109375, 0.67938232421875, 0.7177734375, 0.75616455078125, 0.7945556640625, 0.83294677734375, 0.871337890625, 0.90972900390625, 0.9481201171875, 0.98651123046875, 1.02490234375, 1.06329345703125, 1.1016845703125, 1.14007568359375, 1.178466796875, 1.21685791015625, 1.2552490234375, 1.29364013671875, 1.33203125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 1.0, 4.0, 9.0, 11.0, 12.0, 11.0, 36.0, 43.0, 85.0, 116.0, 165.0, 241.0, 410.0, 576.0, 823.0, 1257.0, 1838.0, 2634.0, 3938.0, 5817.0, 8757.0, 13410.0, 20695.0, 32115.0, 52011.0, 89509.0, 170643.0, 1325427.0, 150987.0, 81111.0, 48326.0, 29658.0, 18820.0, 12416.0, 8333.0, 5518.0, 3617.0, 2487.0, 1754.0, 1146.0, 780.0, 520.0, 364.0, 246.0, 143.0, 97.0, 73.0, 48.0, 39.0, 22.0, 17.0, 8.0, 9.0, 4.0, 3.0, 0.0, 1.0], "bins": [-0.029144287109375, -0.02829742431640625, -0.0274505615234375, -0.02660369873046875, -0.0257568359375, -0.02490997314453125, -0.0240631103515625, -0.02321624755859375, -0.022369384765625, -0.02152252197265625, -0.0206756591796875, -0.01982879638671875, -0.01898193359375, -0.01813507080078125, -0.0172882080078125, -0.01644134521484375, -0.015594482421875, -0.01474761962890625, -0.0139007568359375, -0.01305389404296875, -0.01220703125, -0.01136016845703125, -0.0105133056640625, -0.00966644287109375, -0.008819580078125, -0.00797271728515625, -0.0071258544921875, -0.00627899169921875, -0.00543212890625, -0.00458526611328125, -0.0037384033203125, -0.00289154052734375, -0.002044677734375, -0.00119781494140625, -0.0003509521484375, 0.00049591064453125, 0.0013427734375, 0.00218963623046875, 0.0030364990234375, 0.00388336181640625, 0.004730224609375, 0.00557708740234375, 0.0064239501953125, 0.00727081298828125, 0.00811767578125, 0.00896453857421875, 0.0098114013671875, 0.01065826416015625, 0.011505126953125, 0.01235198974609375, 0.0131988525390625, 0.01404571533203125, 0.014892578125, 0.01573944091796875, 0.0165863037109375, 0.01743316650390625, 0.018280029296875, 0.01912689208984375, 0.0199737548828125, 0.02082061767578125, 0.02166748046875, 0.02251434326171875, 0.0233612060546875, 0.02420806884765625, 0.025054931640625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 10.0, 5.0, 7.0, 11.0, 15.0, 13.0, 10.0, 11.0, 18.0, 42.0, 36.0, 43.0, 26.0, 34.0, 50.0, 55.0, 55.0, 45.0, 62.0, 53.0, 46.0, 40.0, 32.0, 39.0, 38.0, 32.0, 25.0, 22.0, 25.0, 19.0, 16.0, 14.0, 12.0, 6.0, 6.0, 5.0, 9.0, 3.0, 4.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0], "bins": [-1.722574234008789e-05, -1.6761943697929382e-05, -1.6298145055770874e-05, -1.5834346413612366e-05, -1.5370547771453857e-05, -1.4906749129295349e-05, -1.444295048713684e-05, -1.3979151844978333e-05, -1.3515353202819824e-05, -1.3051554560661316e-05, -1.2587755918502808e-05, -1.21239572763443e-05, -1.1660158634185791e-05, -1.1196359992027283e-05, -1.0732561349868774e-05, -1.0268762707710266e-05, -9.804964065551758e-06, -9.34116542339325e-06, -8.877366781234741e-06, -8.413568139076233e-06, -7.949769496917725e-06, -7.485970854759216e-06, -7.022172212600708e-06, -6.5583735704422e-06, -6.094574928283691e-06, -5.630776286125183e-06, -5.166977643966675e-06, -4.7031790018081665e-06, -4.239380359649658e-06, -3.77558171749115e-06, -3.3117830753326416e-06, -2.8479844331741333e-06, -2.384185791015625e-06, -1.9203871488571167e-06, -1.4565885066986084e-06, -9.927898645401e-07, -5.289912223815918e-07, -6.51925802230835e-08, 3.986060619354248e-07, 8.624047040939331e-07, 1.3262033462524414e-06, 1.7900019884109497e-06, 2.253800630569458e-06, 2.7175992727279663e-06, 3.1813979148864746e-06, 3.645196557044983e-06, 4.108995199203491e-06, 4.5727938413619995e-06, 5.036592483520508e-06, 5.500391125679016e-06, 5.964189767837524e-06, 6.427988409996033e-06, 6.891787052154541e-06, 7.355585694313049e-06, 7.819384336471558e-06, 8.283182978630066e-06, 8.746981620788574e-06, 9.210780262947083e-06, 9.67457890510559e-06, 1.0138377547264099e-05, 1.0602176189422607e-05, 1.1065974831581116e-05, 1.1529773473739624e-05, 1.1993572115898132e-05, 1.245737075805664e-05]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 8.0, 6.0, 15.0, 7.0, 11.0, 19.0, 20.0, 27.0, 39.0, 51.0, 45.0, 71.0, 49.0, 91.0, 132.0, 180.0, 176.0, 266.0, 516.0, 3018.0, 1040803.0, 1429.0, 405.0, 257.0, 185.0, 147.0, 108.0, 103.0, 86.0, 69.0, 46.0, 30.0, 29.0, 28.0, 27.0, 9.0, 12.0, 14.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000255584716796875, -0.0002462528645992279, -0.0002369210124015808, -0.00022758916020393372, -0.00021825730800628662, -0.00020892545580863953, -0.00019959360361099243, -0.00019026175141334534, -0.00018092989921569824, -0.00017159804701805115, -0.00016226619482040405, -0.00015293434262275696, -0.00014360249042510986, -0.00013427063822746277, -0.00012493878602981567, -0.00011560693383216858, -0.00010627508163452148, -9.694322943687439e-05, -8.76113772392273e-05, -7.82795250415802e-05, -6.89476728439331e-05, -5.961582064628601e-05, -5.0283968448638916e-05, -4.095211625099182e-05, -3.1620264053344727e-05, -2.2288411855697632e-05, -1.2956559658050537e-05, -3.6247074604034424e-06, 5.707144737243652e-06, 1.5038996934890747e-05, 2.4370849132537842e-05, 3.3702701330184937e-05, 4.303455352783203e-05, 5.2366405725479126e-05, 6.169825792312622e-05, 7.103011012077332e-05, 8.036196231842041e-05, 8.96938145160675e-05, 9.90256667137146e-05, 0.0001083575189113617, 0.00011768937110900879, 0.00012702122330665588, 0.00013635307550430298, 0.00014568492770195007, 0.00015501677989959717, 0.00016434863209724426, 0.00017368048429489136, 0.00018301233649253845, 0.00019234418869018555, 0.00020167604088783264, 0.00021100789308547974, 0.00022033974528312683, 0.00022967159748077393, 0.00023900344967842102, 0.0002483353018760681, 0.0002576671540737152, 0.0002669990062713623, 0.0002763308584690094, 0.0002856627106666565, 0.0002949945628643036, 0.0003043264150619507, 0.0003136582672595978, 0.0003229901194572449, 0.00033232197165489197, 0.00034165382385253906]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 636.0, 381.0, 1.0], "bins": [-0.0003590731939766556, -0.00035328048397786915, -0.00034748780308291316, -0.0003416950930841267, -0.0003359024121891707, -0.00033010970219038427, -0.0003243170212954283, -0.0003185243112966418, -0.00031273163040168583, -0.0003069389204028994, -0.0003011462395079434, -0.00029535352950915694, -0.00028956084861420095, -0.0002837681386154145, -0.0002779754577204585, -0.00027218274772167206, -0.0002663900377228856, -0.00026059732772409916, -0.00025480464682914317, -0.0002490119368303567, -0.00024321925593540072, -0.00023742654593661427, -0.00023163386504165828, -0.00022584115504287183, -0.00022004847414791584, -0.00021425577870104462, -0.0002084630832541734, -0.00020267038780730218, -0.00019687769236043096, -0.0001910849823616445, -0.00018529230146668851, -0.00017949959146790206, -0.00017370691057294607, -0.00016791421512607485, -0.00016212151967920363, -0.0001563288242323324, -0.0001505361287854612, -0.00014474341878667474, -0.00013895073789171875, -0.0001331580278929323, -0.00012736533244606107, -0.00012157263699918985, -0.00011577994155231863, -0.00010998724610544741, -0.00010419454338261858, -9.840184793574736e-05, -9.260915248887613e-05, -8.68164497660473e-05, -8.102375431917608e-05, -7.523105887230486e-05, -6.943836342543364e-05, -6.364566797856241e-05, -5.785296525573358e-05, -5.206026980886236e-05, -4.626757436199114e-05, -4.047487527714111e-05, -3.4682183468248695e-05, -2.888948620238807e-05, -2.3096788936527446e-05, -1.7304093489656225e-05, -1.15113962237956e-05, -5.718698957934976e-06, 7.399648893624544e-08, 5.866695573786274e-06, 1.1659392839646898e-05]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 3.0, 9.0, 15.0, 16.0, 30.0, 30.0, 29.0, 48.0, 75.0, 62.0, 85.0, 83.0, 61.0, 77.0, 77.0, 58.0, 68.0, 34.0, 43.0, 28.0, 28.0, 14.0, 9.0, 10.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.621246337890625e-05, -1.5694648027420044e-05, -1.5176832675933838e-05, -1.4659017324447632e-05, -1.4141201972961426e-05, -1.362338662147522e-05, -1.3105571269989014e-05, -1.2587755918502808e-05, -1.2069940567016602e-05, -1.1552125215530396e-05, -1.103430986404419e-05, -1.0516494512557983e-05, -9.998679161071777e-06, -9.480863809585571e-06, -8.963048458099365e-06, -8.44523310661316e-06, -7.927417755126953e-06, -7.409602403640747e-06, -6.891787052154541e-06, -6.373971700668335e-06, -5.856156349182129e-06, -5.338340997695923e-06, -4.820525646209717e-06, -4.302710294723511e-06, -3.7848949432373047e-06, -3.2670795917510986e-06, -2.7492642402648926e-06, -2.2314488887786865e-06, -1.7136335372924805e-06, -1.1958181858062744e-06, -6.780028343200684e-07, -1.601874828338623e-07, 3.5762786865234375e-07, 8.754432201385498e-07, 1.3932585716247559e-06, 1.911073923110962e-06, 2.428889274597168e-06, 2.946704626083374e-06, 3.46451997756958e-06, 3.982335329055786e-06, 4.500150680541992e-06, 5.017966032028198e-06, 5.535781383514404e-06, 6.05359673500061e-06, 6.571412086486816e-06, 7.0892274379730225e-06, 7.6070427894592285e-06, 8.124858140945435e-06, 8.64267349243164e-06, 9.160488843917847e-06, 9.678304195404053e-06, 1.0196119546890259e-05, 1.0713934898376465e-05, 1.1231750249862671e-05, 1.1749565601348877e-05, 1.2267380952835083e-05, 1.2785196304321289e-05, 1.3303011655807495e-05, 1.3820827007293701e-05, 1.4338642358779907e-05, 1.4856457710266113e-05, 1.537427306175232e-05, 1.5892088413238525e-05, 1.640990376472473e-05, 1.6927719116210938e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 9.0, 11.0, 14.0, 14.0, 13.0, 24.0, 26.0, 24.0, 34.0, 35.0, 44.0, 34.0, 42.0, 31.0, 34.0, 28.0, 34.0, 55.0, 38.0, 36.0, 47.0, 38.0, 41.0, 40.0, 38.0, 36.0, 26.0, 24.0, 32.0, 15.0, 11.0, 13.0, 14.0, 7.0, 10.0, 5.0, 3.0, 0.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.8076171875, -1.7589874267578125, -1.710357666015625, -1.6617279052734375, -1.61309814453125, -1.5644683837890625, -1.515838623046875, -1.4672088623046875, -1.4185791015625, -1.3699493408203125, -1.321319580078125, -1.2726898193359375, -1.22406005859375, -1.1754302978515625, -1.126800537109375, -1.0781707763671875, -1.029541015625, -0.9809112548828125, -0.932281494140625, -0.8836517333984375, -0.83502197265625, -0.7863922119140625, -0.737762451171875, -0.6891326904296875, -0.6405029296875, -0.5918731689453125, -0.543243408203125, -0.4946136474609375, -0.44598388671875, -0.3973541259765625, -0.348724365234375, -0.3000946044921875, -0.25146484375, -0.2028350830078125, -0.154205322265625, -0.1055755615234375, -0.05694580078125, -0.0083160400390625, 0.040313720703125, 0.0889434814453125, 0.1375732421875, 0.1862030029296875, 0.234832763671875, 0.2834625244140625, 0.33209228515625, 0.3807220458984375, 0.429351806640625, 0.4779815673828125, 0.526611328125, 0.5752410888671875, 0.623870849609375, 0.6725006103515625, 0.72113037109375, 0.7697601318359375, 0.818389892578125, 0.8670196533203125, 0.9156494140625, 0.9642791748046875, 1.012908935546875, 1.0615386962890625, 1.11016845703125, 1.1587982177734375, 1.207427978515625, 1.2560577392578125, 1.3046875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 6.0, 14.0, 27.0, 27.0, 49.0, 77.0, 137.0, 245.0, 407.0, 686.0, 1311.0, 2319.0, 4505.0, 9360.0, 25172.0, 144815.0, 714443.0, 105928.0, 21596.0, 8457.0, 4084.0, 2131.0, 1181.0, 624.0, 376.0, 230.0, 143.0, 78.0, 48.0, 32.0, 17.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.390625, -9.10107421875, -8.8115234375, -8.52197265625, -8.232421875, -7.94287109375, -7.6533203125, -7.36376953125, -7.07421875, -6.78466796875, -6.4951171875, -6.20556640625, -5.916015625, -5.62646484375, -5.3369140625, -5.04736328125, -4.7578125, -4.46826171875, -4.1787109375, -3.88916015625, -3.599609375, -3.31005859375, -3.0205078125, -2.73095703125, -2.44140625, -2.15185546875, -1.8623046875, -1.57275390625, -1.283203125, -0.99365234375, -0.7041015625, -0.41455078125, -0.125, 0.16455078125, 0.4541015625, 0.74365234375, 1.033203125, 1.32275390625, 1.6123046875, 1.90185546875, 2.19140625, 2.48095703125, 2.7705078125, 3.06005859375, 3.349609375, 3.63916015625, 3.9287109375, 4.21826171875, 4.5078125, 4.79736328125, 5.0869140625, 5.37646484375, 5.666015625, 5.95556640625, 6.2451171875, 6.53466796875, 6.82421875, 7.11376953125, 7.4033203125, 7.69287109375, 7.982421875, 8.27197265625, 8.5615234375, 8.85107421875, 9.140625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 13.0, 10.0, 10.0, 14.0, 20.0, 25.0, 24.0, 22.0, 39.0, 27.0, 49.0, 42.0, 51.0, 77.0, 89.0, 121.0, 167.0, 1452.0, 174.0, 115.0, 82.0, 58.0, 55.0, 53.0, 52.0, 33.0, 24.0, 25.0, 20.0, 21.0, 6.0, 11.0, 17.0, 6.0, 8.0, 8.0, 3.0, 7.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.40234375, -5.2452392578125, -5.088134765625, -4.9310302734375, -4.77392578125, -4.6168212890625, -4.459716796875, -4.3026123046875, -4.1455078125, -3.9884033203125, -3.831298828125, -3.6741943359375, -3.51708984375, -3.3599853515625, -3.202880859375, -3.0457763671875, -2.888671875, -2.7315673828125, -2.574462890625, -2.4173583984375, -2.26025390625, -2.1031494140625, -1.946044921875, -1.7889404296875, -1.6318359375, -1.4747314453125, -1.317626953125, -1.1605224609375, -1.00341796875, -0.8463134765625, -0.689208984375, -0.5321044921875, -0.375, -0.2178955078125, -0.060791015625, 0.0963134765625, 0.25341796875, 0.4105224609375, 0.567626953125, 0.7247314453125, 0.8818359375, 1.0389404296875, 1.196044921875, 1.3531494140625, 1.51025390625, 1.6673583984375, 1.824462890625, 1.9815673828125, 2.138671875, 2.2957763671875, 2.452880859375, 2.6099853515625, 2.76708984375, 2.9241943359375, 3.081298828125, 3.2384033203125, 3.3955078125, 3.5526123046875, 3.709716796875, 3.8668212890625, 4.02392578125, 4.1810302734375, 4.338134765625, 4.4952392578125, 4.65234375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 3.0, 9.0, 10.0, 12.0, 14.0, 15.0, 15.0, 18.0, 21.0, 25.0, 39.0, 57.0, 70.0, 108.0, 246.0, 644.0, 4240.0, 2802074.0, 334908.0, 2051.0, 500.0, 193.0, 90.0, 57.0, 52.0, 32.0, 36.0, 29.0, 21.0, 17.0, 17.0, 11.0, 19.0, 9.0, 6.0, 7.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.90625, -21.1728515625, -20.439453125, -19.7060546875, -18.97265625, -18.2392578125, -17.505859375, -16.7724609375, -16.0390625, -15.3056640625, -14.572265625, -13.8388671875, -13.10546875, -12.3720703125, -11.638671875, -10.9052734375, -10.171875, -9.4384765625, -8.705078125, -7.9716796875, -7.23828125, -6.5048828125, -5.771484375, -5.0380859375, -4.3046875, -3.5712890625, -2.837890625, -2.1044921875, -1.37109375, -0.6376953125, 0.095703125, 0.8291015625, 1.5625, 2.2958984375, 3.029296875, 3.7626953125, 4.49609375, 5.2294921875, 5.962890625, 6.6962890625, 7.4296875, 8.1630859375, 8.896484375, 9.6298828125, 10.36328125, 11.0966796875, 11.830078125, 12.5634765625, 13.296875, 14.0302734375, 14.763671875, 15.4970703125, 16.23046875, 16.9638671875, 17.697265625, 18.4306640625, 19.1640625, 19.8974609375, 20.630859375, 21.3642578125, 22.09765625, 22.8310546875, 23.564453125, 24.2978515625, 25.03125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 24.0, 128.0, 327.0, 356.0, 125.0, 41.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.879621505737305, -18.87913703918457, -17.87865447998047, -16.878170013427734, -15.877685546875, -14.877201080322266, -13.876717567443848, -12.87623405456543, -11.875749588012695, -10.875265121459961, -9.874781608581543, -8.874298095703125, -7.873813629150391, -6.8733296394348145, -5.872845649719238, -4.872361660003662, -3.871877670288086, -2.8713936805725098, -1.8709096908569336, -0.8704257011413574, 0.13005828857421875, 1.130542278289795, 2.131026268005371, 3.1315102577209473, 4.131994247436523, 5.1324782371521, 6.132962226867676, 7.133446216583252, 8.133930206298828, 9.134414672851562, 10.13489818572998, 11.135381698608398, 12.135868072509766, 13.1363525390625, 14.136836051940918, 15.137319564819336, 16.13780403137207, 17.138288497924805, 18.138771057128906, 19.13925552368164, 20.139739990234375, 21.14022445678711, 22.140708923339844, 23.141191482543945, 24.14167594909668, 25.142160415649414, 26.142642974853516, 27.14312744140625, 28.143611907958984, 29.14409637451172, 30.144580841064453, 31.145063400268555, 32.145545959472656, 33.14603042602539, 34.146514892578125, 35.14699935913086, 36.147483825683594, 37.14796829223633, 38.14845275878906, 39.1489372253418, 40.14942169189453, 41.14990234375, 42.150386810302734, 43.15087127685547, 44.1513557434082]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 19.0, 5.0, 12.0, 17.0, 14.0, 20.0, 22.0, 25.0, 22.0, 42.0, 34.0, 41.0, 49.0, 46.0, 40.0, 45.0, 39.0, 47.0, 45.0, 36.0, 36.0, 43.0, 35.0, 30.0, 35.0, 28.0, 24.0, 28.0, 24.0, 13.0, 15.0, 10.0, 8.0, 10.0, 13.0, 6.0, 1.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-22.5528564453125, -21.899646759033203, -21.246435165405273, -20.593223571777344, -19.940013885498047, -19.28680419921875, -18.63359260559082, -17.98038101196289, -17.327171325683594, -16.673961639404297, -16.020750045776367, -15.367539405822754, -14.71432876586914, -14.061118125915527, -13.407907485961914, -12.7546968460083, -12.101486206054688, -11.448275566101074, -10.795064926147461, -10.141854286193848, -9.488643646240234, -8.835433006286621, -8.182222366333008, -7.5290117263793945, -6.875801086425781, -6.222590446472168, -5.569379806518555, -4.916169166564941, -4.262958526611328, -3.609747886657715, -2.9565372467041016, -2.3033266067504883, -1.650115966796875, -0.9969053268432617, -0.34369468688964844, 0.30951595306396484, 0.9627265930175781, 1.6159372329711914, 2.2691478729248047, 2.922358512878418, 3.5755691528320312, 4.2287797927856445, 4.881990432739258, 5.535201072692871, 6.188411712646484, 6.841622352600098, 7.494832992553711, 8.148043632507324, 8.801254272460938, 9.45446491241455, 10.107675552368164, 10.760886192321777, 11.41409683227539, 12.067307472229004, 12.720518112182617, 13.37372875213623, 14.026939392089844, 14.680150032043457, 15.33336067199707, 15.986571311950684, 16.639781951904297, 17.292991638183594, 17.946203231811523, 18.599414825439453, 19.25262451171875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 9.0, 15.0, 13.0, 11.0, 18.0, 20.0, 21.0, 25.0, 33.0, 28.0, 35.0, 41.0, 31.0, 39.0, 32.0, 38.0, 49.0, 39.0, 40.0, 33.0, 44.0, 42.0, 42.0, 44.0, 40.0, 36.0, 25.0, 20.0, 25.0, 25.0, 20.0, 11.0, 11.0, 8.0, 7.0, 10.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.8671875, -1.8161163330078125, -1.765045166015625, -1.7139739990234375, -1.66290283203125, -1.6118316650390625, -1.560760498046875, -1.5096893310546875, -1.4586181640625, -1.4075469970703125, -1.356475830078125, -1.3054046630859375, -1.25433349609375, -1.2032623291015625, -1.152191162109375, -1.1011199951171875, -1.050048828125, -0.9989776611328125, -0.947906494140625, -0.8968353271484375, -0.84576416015625, -0.7946929931640625, -0.743621826171875, -0.6925506591796875, -0.6414794921875, -0.5904083251953125, -0.539337158203125, -0.4882659912109375, -0.43719482421875, -0.3861236572265625, -0.335052490234375, -0.2839813232421875, -0.23291015625, -0.1818389892578125, -0.130767822265625, -0.0796966552734375, -0.02862548828125, 0.0224456787109375, 0.073516845703125, 0.1245880126953125, 0.1756591796875, 0.2267303466796875, 0.277801513671875, 0.3288726806640625, 0.37994384765625, 0.4310150146484375, 0.482086181640625, 0.5331573486328125, 0.584228515625, 0.6352996826171875, 0.686370849609375, 0.7374420166015625, 0.78851318359375, 0.8395843505859375, 0.890655517578125, 0.9417266845703125, 0.9927978515625, 1.0438690185546875, 1.094940185546875, 1.1460113525390625, 1.19708251953125, 1.2481536865234375, 1.299224853515625, 1.3502960205078125, 1.4013671875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 4.0, 12.0, 10.0, 14.0, 25.0, 24.0, 40.0, 44.0, 71.0, 97.0, 157.0, 234.0, 311.0, 541.0, 1003.0, 2428.0, 8371.0, 46563.0, 493389.0, 3322236.0, 277272.0, 30751.0, 6301.0, 2055.0, 896.0, 464.0, 272.0, 214.0, 147.0, 92.0, 68.0, 45.0, 26.0, 21.0, 14.0, 17.0, 14.0, 11.0, 7.0, 3.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7734375, -8.4644775390625, -8.155517578125, -7.8465576171875, -7.53759765625, -7.2286376953125, -6.919677734375, -6.6107177734375, -6.3017578125, -5.9927978515625, -5.683837890625, -5.3748779296875, -5.06591796875, -4.7569580078125, -4.447998046875, -4.1390380859375, -3.830078125, -3.5211181640625, -3.212158203125, -2.9031982421875, -2.59423828125, -2.2852783203125, -1.976318359375, -1.6673583984375, -1.3583984375, -1.0494384765625, -0.740478515625, -0.4315185546875, -0.12255859375, 0.1864013671875, 0.495361328125, 0.8043212890625, 1.11328125, 1.4222412109375, 1.731201171875, 2.0401611328125, 2.34912109375, 2.6580810546875, 2.967041015625, 3.2760009765625, 3.5849609375, 3.8939208984375, 4.202880859375, 4.5118408203125, 4.82080078125, 5.1297607421875, 5.438720703125, 5.7476806640625, 6.056640625, 6.3656005859375, 6.674560546875, 6.9835205078125, 7.29248046875, 7.6014404296875, 7.910400390625, 8.2193603515625, 8.5283203125, 8.8372802734375, 9.146240234375, 9.4552001953125, 9.76416015625, 10.0731201171875, 10.382080078125, 10.6910400390625, 11.0]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 6.0, 4.0, 14.0, 14.0, 28.0, 28.0, 43.0, 56.0, 97.0, 152.0, 170.0, 266.0, 375.0, 541.0, 647.0, 496.0, 350.0, 244.0, 184.0, 99.0, 79.0, 53.0, 42.0, 32.0, 20.0, 17.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.62109375, -4.39398193359375, -4.1668701171875, -3.93975830078125, -3.712646484375, -3.48553466796875, -3.2584228515625, -3.03131103515625, -2.80419921875, -2.57708740234375, -2.3499755859375, -2.12286376953125, -1.895751953125, -1.66864013671875, -1.4415283203125, -1.21441650390625, -0.9873046875, -0.76019287109375, -0.5330810546875, -0.30596923828125, -0.078857421875, 0.14825439453125, 0.3753662109375, 0.60247802734375, 0.82958984375, 1.05670166015625, 1.2838134765625, 1.51092529296875, 1.738037109375, 1.96514892578125, 2.1922607421875, 2.41937255859375, 2.646484375, 2.87359619140625, 3.1007080078125, 3.32781982421875, 3.554931640625, 3.78204345703125, 4.0091552734375, 4.23626708984375, 4.46337890625, 4.69049072265625, 4.9176025390625, 5.14471435546875, 5.371826171875, 5.59893798828125, 5.8260498046875, 6.05316162109375, 6.2802734375, 6.50738525390625, 6.7344970703125, 6.96160888671875, 7.188720703125, 7.41583251953125, 7.6429443359375, 7.87005615234375, 8.09716796875, 8.32427978515625, 8.5513916015625, 8.77850341796875, 9.005615234375, 9.23272705078125, 9.4598388671875, 9.68695068359375, 9.9140625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 10.0, 11.0, 25.0, 33.0, 57.0, 90.0, 181.0, 439.0, 1132.0, 4412.0, 36393.0, 846859.0, 3171086.0, 120648.0, 9727.0, 1991.0, 641.0, 281.0, 127.0, 52.0, 33.0, 21.0, 9.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.609375, -17.006591796875, -16.40380859375, -15.801025390625, -15.1982421875, -14.595458984375, -13.99267578125, -13.389892578125, -12.787109375, -12.184326171875, -11.58154296875, -10.978759765625, -10.3759765625, -9.773193359375, -9.17041015625, -8.567626953125, -7.96484375, -7.362060546875, -6.75927734375, -6.156494140625, -5.5537109375, -4.950927734375, -4.34814453125, -3.745361328125, -3.142578125, -2.539794921875, -1.93701171875, -1.334228515625, -0.7314453125, -0.128662109375, 0.47412109375, 1.076904296875, 1.6796875, 2.282470703125, 2.88525390625, 3.488037109375, 4.0908203125, 4.693603515625, 5.29638671875, 5.899169921875, 6.501953125, 7.104736328125, 7.70751953125, 8.310302734375, 8.9130859375, 9.515869140625, 10.11865234375, 10.721435546875, 11.32421875, 11.927001953125, 12.52978515625, 13.132568359375, 13.7353515625, 14.338134765625, 14.94091796875, 15.543701171875, 16.146484375, 16.749267578125, 17.35205078125, 17.954833984375, 18.5576171875, 19.160400390625, 19.76318359375, 20.365966796875, 20.96875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 32.0, 305.0, 513.0, 154.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.835845947265625, -18.562938690185547, -14.290033340454102, -10.01712703704834, -5.744220733642578, -1.4713134765625, 2.8015918731689453, 7.074497222900391, 11.347404479980469, 15.62031078338623, 19.893217086791992, 24.166122436523438, 28.439029693603516, 32.711936950683594, 36.984840393066406, 41.257747650146484, 45.53065490722656, 49.80356216430664, 54.07646942138672, 58.34937286376953, 62.62228012084961, 66.89518737792969, 71.1680908203125, 75.44099426269531, 79.71390533447266, 83.98680877685547, 88.25971984863281, 92.53262329101562, 96.80552673339844, 101.07843780517578, 105.3513412475586, 109.62425231933594, 113.89714050292969, 118.1700439453125, 122.44295501708984, 126.71585845947266, 130.98876953125, 135.2616729736328, 139.53457641601562, 143.80747985839844, 148.08038330078125, 152.35328674316406, 156.62619018554688, 160.89910888671875, 165.17201232910156, 169.44491577148438, 173.7178192138672, 177.99072265625, 182.26364135742188, 186.5365447998047, 190.8094482421875, 195.08236694335938, 199.3552703857422, 203.628173828125, 207.9010772705078, 212.17398071289062, 216.4468994140625, 220.7198028564453, 224.99270629882812, 229.265625, 233.5385284423828, 237.81143188476562, 242.08433532714844, 246.35723876953125, 250.63014221191406]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 2.0, 7.0, 8.0, 7.0, 7.0, 14.0, 10.0, 14.0, 16.0, 25.0, 26.0, 25.0, 34.0, 37.0, 34.0, 33.0, 43.0, 48.0, 45.0, 33.0, 45.0, 39.0, 41.0, 45.0, 46.0, 37.0, 33.0, 24.0, 29.0, 23.0, 29.0, 24.0, 25.0, 18.0, 11.0, 12.0, 11.0, 9.0, 6.0, 8.0, 8.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.81810760498047, -18.187110900878906, -17.55611228942871, -16.92511558532715, -16.294116973876953, -15.66312026977539, -15.032122611999512, -14.401124954223633, -13.770127296447754, -13.139129638671875, -12.508131980895996, -11.877134323120117, -11.246137619018555, -10.61513900756836, -9.984142303466797, -9.353144645690918, -8.722146987915039, -8.09114933013916, -7.460151672363281, -6.8291544914245605, -6.198156833648682, -5.567159175872803, -4.936161994934082, -4.305164337158203, -3.674166679382324, -3.0431690216064453, -2.4121716022491455, -1.7811740636825562, -1.1501765251159668, -0.5191788673400879, 0.11181855201721191, 0.7428159713745117, 1.3738136291503906, 2.0048112869262695, 2.6358087062835693, 3.266806125640869, 3.897803783416748, 4.528801441192627, 5.159798622131348, 5.790796279907227, 6.4217939376831055, 7.052791595458984, 7.683789253234863, 8.314786911010742, 8.945783615112305, 9.5767822265625, 10.207778930664062, 10.838776588439941, 11.46977424621582, 12.1007719039917, 12.731769561767578, 13.362767219543457, 13.993764877319336, 14.624761581420898, 15.255759239196777, 15.886756896972656, 16.51775360107422, 17.14875030517578, 17.779748916625977, 18.41074562072754, 19.041744232177734, 19.672740936279297, 20.303739547729492, 20.934736251831055, 21.56573486328125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 8.0, 6.0, 7.0, 13.0, 13.0, 16.0, 25.0, 22.0, 26.0, 27.0, 28.0, 27.0, 31.0, 42.0, 31.0, 40.0, 36.0, 44.0, 38.0, 39.0, 34.0, 31.0, 34.0, 45.0, 45.0, 46.0, 37.0, 26.0, 30.0, 28.0, 24.0, 18.0, 21.0, 13.0, 9.0, 12.0, 9.0, 7.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7255859375, -1.6736907958984375, -1.621795654296875, -1.5699005126953125, -1.51800537109375, -1.4661102294921875, -1.414215087890625, -1.3623199462890625, -1.3104248046875, -1.2585296630859375, -1.206634521484375, -1.1547393798828125, -1.10284423828125, -1.0509490966796875, -0.999053955078125, -0.9471588134765625, -0.895263671875, -0.8433685302734375, -0.791473388671875, -0.7395782470703125, -0.68768310546875, -0.6357879638671875, -0.583892822265625, -0.5319976806640625, -0.4801025390625, -0.4282073974609375, -0.376312255859375, -0.3244171142578125, -0.27252197265625, -0.2206268310546875, -0.168731689453125, -0.1168365478515625, -0.06494140625, -0.0130462646484375, 0.038848876953125, 0.0907440185546875, 0.14263916015625, 0.1945343017578125, 0.246429443359375, 0.2983245849609375, 0.3502197265625, 0.4021148681640625, 0.454010009765625, 0.5059051513671875, 0.55780029296875, 0.6096954345703125, 0.661590576171875, 0.7134857177734375, 0.765380859375, 0.8172760009765625, 0.869171142578125, 0.9210662841796875, 0.97296142578125, 1.0248565673828125, 1.076751708984375, 1.1286468505859375, 1.1805419921875, 1.2324371337890625, 1.284332275390625, 1.3362274169921875, 1.38812255859375, 1.4400177001953125, 1.491912841796875, 1.5438079833984375, 1.595703125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 0.0, 7.0, 9.0, 17.0, 19.0, 39.0, 64.0, 64.0, 124.0, 181.0, 232.0, 406.0, 609.0, 997.0, 1508.0, 2386.0, 3637.0, 6157.0, 10108.0, 16519.0, 27811.0, 48338.0, 88623.0, 187028.0, 334384.0, 144161.0, 73365.0, 40930.0, 23728.0, 14070.0, 8728.0, 5297.0, 3254.0, 2051.0, 1336.0, 841.0, 525.0, 330.0, 225.0, 162.0, 94.0, 73.0, 36.0, 37.0, 13.0, 18.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0679931640625, -0.06589126586914062, -0.06378936767578125, -0.061687469482421875, -0.0595855712890625, -0.057483673095703125, -0.05538177490234375, -0.053279876708984375, -0.051177978515625, -0.049076080322265625, -0.04697418212890625, -0.044872283935546875, -0.0427703857421875, -0.040668487548828125, -0.03856658935546875, -0.036464691162109375, -0.03436279296875, -0.032260894775390625, -0.03015899658203125, -0.028057098388671875, -0.0259552001953125, -0.023853302001953125, -0.02175140380859375, -0.019649505615234375, -0.017547607421875, -0.015445709228515625, -0.01334381103515625, -0.011241912841796875, -0.0091400146484375, -0.007038116455078125, -0.00493621826171875, -0.002834320068359375, -0.000732421875, 0.001369476318359375, 0.00347137451171875, 0.005573272705078125, 0.0076751708984375, 0.009777069091796875, 0.01187896728515625, 0.013980865478515625, 0.016082763671875, 0.018184661865234375, 0.02028656005859375, 0.022388458251953125, 0.0244903564453125, 0.026592254638671875, 0.02869415283203125, 0.030796051025390625, 0.03289794921875, 0.034999847412109375, 0.03710174560546875, 0.039203643798828125, 0.0413055419921875, 0.043407440185546875, 0.04550933837890625, 0.047611236572265625, 0.049713134765625, 0.051815032958984375, 0.05391693115234375, 0.056018829345703125, 0.0581207275390625, 0.060222625732421875, 0.06232452392578125, 0.06442642211914062, 0.0665283203125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 11.0, 12.0, 7.0, 18.0, 13.0, 10.0, 19.0, 25.0, 23.0, 26.0, 43.0, 32.0, 50.0, 48.0, 34.0, 35.0, 46.0, 40.0, 1072.0, 34.0, 47.0, 45.0, 36.0, 35.0, 36.0, 35.0, 34.0, 20.0, 27.0, 26.0, 14.0, 15.0, 9.0, 13.0, 10.0, 7.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1875, -1.150482177734375, -1.11346435546875, -1.076446533203125, -1.0394287109375, -1.002410888671875, -0.96539306640625, -0.928375244140625, -0.891357421875, -0.854339599609375, -0.81732177734375, -0.780303955078125, -0.7432861328125, -0.706268310546875, -0.66925048828125, -0.632232666015625, -0.59521484375, -0.558197021484375, -0.52117919921875, -0.484161376953125, -0.4471435546875, -0.410125732421875, -0.37310791015625, -0.336090087890625, -0.299072265625, -0.262054443359375, -0.22503662109375, -0.188018798828125, -0.1510009765625, -0.113983154296875, -0.07696533203125, -0.039947509765625, -0.0029296875, 0.034088134765625, 0.07110595703125, 0.108123779296875, 0.1451416015625, 0.182159423828125, 0.21917724609375, 0.256195068359375, 0.293212890625, 0.330230712890625, 0.36724853515625, 0.404266357421875, 0.4412841796875, 0.478302001953125, 0.51531982421875, 0.552337646484375, 0.58935546875, 0.626373291015625, 0.66339111328125, 0.700408935546875, 0.7374267578125, 0.774444580078125, 0.81146240234375, 0.848480224609375, 0.885498046875, 0.922515869140625, 0.95953369140625, 0.996551513671875, 1.0335693359375, 1.070587158203125, 1.10760498046875, 1.144622802734375, 1.181640625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 7.0, 15.0, 16.0, 23.0, 47.0, 70.0, 92.0, 148.0, 218.0, 330.0, 516.0, 790.0, 1216.0, 1838.0, 2985.0, 4738.0, 7346.0, 11855.0, 19656.0, 32274.0, 56294.0, 103094.0, 215110.0, 1332665.0, 133892.0, 69719.0, 40151.0, 23477.0, 14384.0, 8813.0, 5456.0, 3524.0, 2229.0, 1458.0, 939.0, 587.0, 415.0, 252.0, 162.0, 101.0, 83.0, 43.0, 34.0, 24.0, 17.0, 10.0, 8.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02899169921875, -0.02799844741821289, -0.02700519561767578, -0.026011943817138672, -0.025018692016601562, -0.024025440216064453, -0.023032188415527344, -0.022038936614990234, -0.021045684814453125, -0.020052433013916016, -0.019059181213378906, -0.018065929412841797, -0.017072677612304688, -0.016079425811767578, -0.015086174011230469, -0.01409292221069336, -0.01309967041015625, -0.01210641860961914, -0.011113166809082031, -0.010119915008544922, -0.009126663208007812, -0.008133411407470703, -0.007140159606933594, -0.006146907806396484, -0.005153656005859375, -0.004160404205322266, -0.0031671524047851562, -0.002173900604248047, -0.0011806488037109375, -0.00018739700317382812, 0.0008058547973632812, 0.0017991065979003906, 0.0027923583984375, 0.0037856101989746094, 0.004778861999511719, 0.005772113800048828, 0.0067653656005859375, 0.007758617401123047, 0.008751869201660156, 0.009745121002197266, 0.010738372802734375, 0.011731624603271484, 0.012724876403808594, 0.013718128204345703, 0.014711380004882812, 0.015704631805419922, 0.01669788360595703, 0.01769113540649414, 0.01868438720703125, 0.01967763900756836, 0.02067089080810547, 0.021664142608642578, 0.022657394409179688, 0.023650646209716797, 0.024643898010253906, 0.025637149810791016, 0.026630401611328125, 0.027623653411865234, 0.028616905212402344, 0.029610157012939453, 0.030603408813476562, 0.03159666061401367, 0.03258991241455078, 0.03358316421508789, 0.034576416015625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 7.0, 1.0, 7.0, 7.0, 7.0, 16.0, 8.0, 16.0, 17.0, 22.0, 24.0, 22.0, 33.0, 50.0, 45.0, 51.0, 50.0, 71.0, 83.0, 82.0, 82.0, 50.0, 47.0, 34.0, 43.0, 22.0, 21.0, 23.0, 21.0, 11.0, 4.0, 4.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1742115020751953e-05, -1.1353753507137299e-05, -1.0965391993522644e-05, -1.057703047990799e-05, -1.0188668966293335e-05, -9.80030745267868e-06, -9.411945939064026e-06, -9.023584425449371e-06, -8.635222911834717e-06, -8.246861398220062e-06, -7.858499884605408e-06, -7.470138370990753e-06, -7.081776857376099e-06, -6.693415343761444e-06, -6.3050538301467896e-06, -5.916692316532135e-06, -5.5283308029174805e-06, -5.139969289302826e-06, -4.751607775688171e-06, -4.363246262073517e-06, -3.974884748458862e-06, -3.5865232348442078e-06, -3.1981617212295532e-06, -2.8098002076148987e-06, -2.421438694000244e-06, -2.0330771803855896e-06, -1.644715666770935e-06, -1.2563541531562805e-06, -8.67992639541626e-07, -4.796311259269714e-07, -9.12696123123169e-08, 2.9709190130233765e-07, 6.854534149169922e-07, 1.0738149285316467e-06, 1.4621764421463013e-06, 1.8505379557609558e-06, 2.2388994693756104e-06, 2.627260982990265e-06, 3.0156224966049194e-06, 3.403984010219574e-06, 3.7923455238342285e-06, 4.180707037448883e-06, 4.569068551063538e-06, 4.957430064678192e-06, 5.345791578292847e-06, 5.734153091907501e-06, 6.122514605522156e-06, 6.51087611913681e-06, 6.899237632751465e-06, 7.287599146366119e-06, 7.675960659980774e-06, 8.064322173595428e-06, 8.452683687210083e-06, 8.841045200824738e-06, 9.229406714439392e-06, 9.617768228054047e-06, 1.0006129741668701e-05, 1.0394491255283356e-05, 1.078285276889801e-05, 1.1171214282512665e-05, 1.155957579612732e-05, 1.1947937309741974e-05, 1.2336298823356628e-05, 1.2724660336971283e-05, 1.3113021850585938e-05]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 4.0, 15.0, 16.0, 23.0, 31.0, 34.0, 41.0, 47.0, 62.0, 64.0, 88.0, 121.0, 151.0, 247.0, 567.0, 67680.0, 977154.0, 1167.0, 284.0, 181.0, 112.0, 99.0, 72.0, 62.0, 40.0, 40.0, 23.0, 20.0, 18.0, 16.0, 14.0, 12.0, 13.0, 7.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024962425231933594, -0.000242527574300766, -0.00023543089628219604, -0.0002283342182636261, -0.00022123754024505615, -0.0002141408622264862, -0.00020704418420791626, -0.0001999475061893463, -0.00019285082817077637, -0.00018575415015220642, -0.00017865747213363647, -0.00017156079411506653, -0.00016446411609649658, -0.00015736743807792664, -0.0001502707600593567, -0.00014317408204078674, -0.0001360774040222168, -0.00012898072600364685, -0.0001218840479850769, -0.00011478736996650696, -0.00010769069194793701, -0.00010059401392936707, -9.349733591079712e-05, -8.640065789222717e-05, -7.930397987365723e-05, -7.220730185508728e-05, -6.511062383651733e-05, -5.801394581794739e-05, -5.091726779937744e-05, -4.3820589780807495e-05, -3.672391176223755e-05, -2.9627233743667603e-05, -2.2530555725097656e-05, -1.543387770652771e-05, -8.337199687957764e-06, -1.2405216693878174e-06, 5.856156349182129e-06, 1.2952834367752075e-05, 2.004951238632202e-05, 2.7146190404891968e-05, 3.4242868423461914e-05, 4.133954644203186e-05, 4.843622446060181e-05, 5.553290247917175e-05, 6.26295804977417e-05, 6.972625851631165e-05, 7.682293653488159e-05, 8.391961455345154e-05, 9.101629257202148e-05, 9.811297059059143e-05, 0.00010520964860916138, 0.00011230632662773132, 0.00011940300464630127, 0.00012649968266487122, 0.00013359636068344116, 0.0001406930387020111, 0.00014778971672058105, 0.000154886394739151, 0.00016198307275772095, 0.0001690797507762909, 0.00017617642879486084, 0.00018327310681343079, 0.00019036978483200073, 0.00019746646285057068, 0.00020456314086914062]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 64.0, 953.0, 3.0], "bins": [-0.0002125888131558895, -0.00020917571964673698, -0.00020576264068949968, -0.00020234954718034714, -0.0001989364536711946, -0.0001955233747139573, -0.00019211028120480478, -0.00018869718769565225, -0.00018528409418649971, -0.00018187100067734718, -0.00017845792172010988, -0.00017504482821095735, -0.00017163173470180482, -0.0001682186557445675, -0.00016480556223541498, -0.00016139246872626245, -0.00015797938976902515, -0.00015456629625987262, -0.0001511532173026353, -0.00014774012379348278, -0.00014432703028433025, -0.00014091393677517772, -0.00013750085781794041, -0.00013408776430878788, -0.00013067468535155058, -0.00012726159184239805, -0.00012384851288516074, -0.00012043541937600821, -0.00011702232586685568, -0.00011360923963366076, -0.00011019615340046585, -0.00010678305989131331, -0.00010336996638216078, -9.995688014896587e-05, -9.654378663981333e-05, -9.313070040661842e-05, -8.971760689746588e-05, -8.630452066427097e-05, -8.289143443107605e-05, -7.947834092192352e-05, -7.60652546887286e-05, -7.265216845553368e-05, -6.923907494638115e-05, -6.582598871318623e-05, -6.241290247999132e-05, -5.8999808970838785e-05, -5.558672273764387e-05, -5.217363286647014e-05, -4.876054299529642e-05, -4.5347453124122694e-05, -4.193436325294897e-05, -3.852127701975405e-05, -3.510818714858033e-05, -3.16950972774066e-05, -2.8282009225222282e-05, -2.486892117303796e-05, -2.1455831301864237e-05, -1.8042741430690512e-05, -1.4629653378506191e-05, -1.1216564416827168e-05, -7.803475455148146e-06, -4.390385583974421e-06, -9.772975317901e-07, 2.435790520394221e-06, 5.848879482073244e-06]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 6.0, 7.0, 8.0, 7.0, 13.0, 15.0, 18.0, 23.0, 13.0, 30.0, 19.0, 44.0, 38.0, 45.0, 71.0, 56.0, 49.0, 52.0, 62.0, 61.0, 46.0, 52.0, 60.0, 41.0, 31.0, 26.0, 19.0, 21.0, 9.0, 17.0, 14.0, 7.0, 5.0, 6.0, 9.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.033348083496094e-06, -6.778165698051453e-06, -6.5229833126068115e-06, -6.26780092716217e-06, -6.012618541717529e-06, -5.757436156272888e-06, -5.502253770828247e-06, -5.247071385383606e-06, -4.991888999938965e-06, -4.736706614494324e-06, -4.481524229049683e-06, -4.2263418436050415e-06, -3.9711594581604e-06, -3.7159770727157593e-06, -3.460794687271118e-06, -3.205612301826477e-06, -2.950429916381836e-06, -2.695247530937195e-06, -2.4400651454925537e-06, -2.1848827600479126e-06, -1.9297003746032715e-06, -1.6745179891586304e-06, -1.4193356037139893e-06, -1.1641532182693481e-06, -9.08970832824707e-07, -6.537884473800659e-07, -3.986060619354248e-07, -1.434236764907837e-07, 1.1175870895385742e-07, 3.6694109439849854e-07, 6.221234798431396e-07, 8.773058652877808e-07, 1.1324882507324219e-06, 1.387670636177063e-06, 1.642853021621704e-06, 1.8980354070663452e-06, 2.1532177925109863e-06, 2.4084001779556274e-06, 2.6635825634002686e-06, 2.9187649488449097e-06, 3.1739473342895508e-06, 3.429129719734192e-06, 3.684312105178833e-06, 3.939494490623474e-06, 4.194676876068115e-06, 4.449859261512756e-06, 4.7050416469573975e-06, 4.9602240324020386e-06, 5.21540641784668e-06, 5.470588803291321e-06, 5.725771188735962e-06, 5.980953574180603e-06, 6.236135959625244e-06, 6.491318345069885e-06, 6.746500730514526e-06, 7.0016831159591675e-06, 7.256865501403809e-06, 7.51204788684845e-06, 7.76723027229309e-06, 8.022412657737732e-06, 8.277595043182373e-06, 8.532777428627014e-06, 8.787959814071655e-06, 9.043142199516296e-06, 9.298324584960938e-06]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 8.0, 6.0, 7.0, 13.0, 13.0, 16.0, 25.0, 22.0, 26.0, 27.0, 28.0, 27.0, 31.0, 42.0, 31.0, 40.0, 36.0, 44.0, 38.0, 39.0, 34.0, 31.0, 34.0, 45.0, 45.0, 46.0, 37.0, 26.0, 30.0, 28.0, 24.0, 18.0, 21.0, 13.0, 9.0, 12.0, 9.0, 7.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7255859375, -1.6736907958984375, -1.621795654296875, -1.5699005126953125, -1.51800537109375, -1.4661102294921875, -1.414215087890625, -1.3623199462890625, -1.3104248046875, -1.2585296630859375, -1.206634521484375, -1.1547393798828125, -1.10284423828125, -1.0509490966796875, -0.999053955078125, -0.9471588134765625, -0.895263671875, -0.8433685302734375, -0.791473388671875, -0.7395782470703125, -0.68768310546875, -0.6357879638671875, -0.583892822265625, -0.5319976806640625, -0.4801025390625, -0.4282073974609375, -0.376312255859375, -0.3244171142578125, -0.27252197265625, -0.2206268310546875, -0.168731689453125, -0.1168365478515625, -0.06494140625, -0.0130462646484375, 0.038848876953125, 0.0907440185546875, 0.14263916015625, 0.1945343017578125, 0.246429443359375, 0.2983245849609375, 0.3502197265625, 0.4021148681640625, 0.454010009765625, 0.5059051513671875, 0.55780029296875, 0.6096954345703125, 0.661590576171875, 0.7134857177734375, 0.765380859375, 0.8172760009765625, 0.869171142578125, 0.9210662841796875, 0.97296142578125, 1.0248565673828125, 1.076751708984375, 1.1286468505859375, 1.1805419921875, 1.2324371337890625, 1.284332275390625, 1.3362274169921875, 1.38812255859375, 1.4400177001953125, 1.491912841796875, 1.5438079833984375, 1.595703125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 12.0, 16.0, 22.0, 27.0, 31.0, 53.0, 82.0, 115.0, 154.0, 193.0, 399.0, 569.0, 1023.0, 1686.0, 2958.0, 5602.0, 10748.0, 21927.0, 49020.0, 119435.0, 301609.0, 310889.0, 124478.0, 50160.0, 23050.0, 11173.0, 5616.0, 3124.0, 1663.0, 994.0, 579.0, 383.0, 248.0, 170.0, 100.0, 68.0, 54.0, 40.0, 30.0, 19.0, 13.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5458984375, -1.496063232421875, -1.44622802734375, -1.396392822265625, -1.3465576171875, -1.296722412109375, -1.24688720703125, -1.197052001953125, -1.147216796875, -1.097381591796875, -1.04754638671875, -0.997711181640625, -0.9478759765625, -0.898040771484375, -0.84820556640625, -0.798370361328125, -0.74853515625, -0.698699951171875, -0.64886474609375, -0.599029541015625, -0.5491943359375, -0.499359130859375, -0.44952392578125, -0.399688720703125, -0.349853515625, -0.300018310546875, -0.25018310546875, -0.200347900390625, -0.1505126953125, -0.100677490234375, -0.05084228515625, -0.001007080078125, 0.048828125, 0.098663330078125, 0.14849853515625, 0.198333740234375, 0.2481689453125, 0.298004150390625, 0.34783935546875, 0.397674560546875, 0.447509765625, 0.497344970703125, 0.54718017578125, 0.597015380859375, 0.6468505859375, 0.696685791015625, 0.74652099609375, 0.796356201171875, 0.84619140625, 0.896026611328125, 0.94586181640625, 0.995697021484375, 1.0455322265625, 1.095367431640625, 1.14520263671875, 1.195037841796875, 1.244873046875, 1.294708251953125, 1.34454345703125, 1.394378662109375, 1.4442138671875, 1.494049072265625, 1.54388427734375, 1.593719482421875, 1.6435546875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 8.0, 7.0, 14.0, 13.0, 16.0, 20.0, 21.0, 39.0, 29.0, 45.0, 35.0, 60.0, 76.0, 113.0, 371.0, 1556.0, 173.0, 85.0, 56.0, 45.0, 47.0, 30.0, 39.0, 32.0, 24.0, 17.0, 21.0, 14.0, 7.0, 8.0, 7.0, 5.0, 5.0, 1.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.5390625, -8.3031005859375, -8.067138671875, -7.8311767578125, -7.59521484375, -7.3592529296875, -7.123291015625, -6.8873291015625, -6.6513671875, -6.4154052734375, -6.179443359375, -5.9434814453125, -5.70751953125, -5.4715576171875, -5.235595703125, -4.9996337890625, -4.763671875, -4.5277099609375, -4.291748046875, -4.0557861328125, -3.81982421875, -3.5838623046875, -3.347900390625, -3.1119384765625, -2.8759765625, -2.6400146484375, -2.404052734375, -2.1680908203125, -1.93212890625, -1.6961669921875, -1.460205078125, -1.2242431640625, -0.98828125, -0.7523193359375, -0.516357421875, -0.2803955078125, -0.04443359375, 0.1915283203125, 0.427490234375, 0.6634521484375, 0.8994140625, 1.1353759765625, 1.371337890625, 1.6072998046875, 1.84326171875, 2.0792236328125, 2.315185546875, 2.5511474609375, 2.787109375, 3.0230712890625, 3.259033203125, 3.4949951171875, 3.73095703125, 3.9669189453125, 4.202880859375, 4.4388427734375, 4.6748046875, 4.9107666015625, 5.146728515625, 5.3826904296875, 5.61865234375, 5.8546142578125, 6.090576171875, 6.3265380859375, 6.5625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 7.0, 3.0, 7.0, 6.0, 15.0, 13.0, 17.0, 23.0, 27.0, 29.0, 41.0, 51.0, 73.0, 113.0, 183.0, 483.0, 2211.0, 43724.0, 3073048.0, 22975.0, 1692.0, 410.0, 182.0, 83.0, 75.0, 42.0, 39.0, 33.0, 13.0, 20.0, 17.0, 13.0, 11.0, 6.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.9765625, -12.5201416015625, -12.063720703125, -11.6072998046875, -11.15087890625, -10.6944580078125, -10.238037109375, -9.7816162109375, -9.3251953125, -8.8687744140625, -8.412353515625, -7.9559326171875, -7.49951171875, -7.0430908203125, -6.586669921875, -6.1302490234375, -5.673828125, -5.2174072265625, -4.760986328125, -4.3045654296875, -3.84814453125, -3.3917236328125, -2.935302734375, -2.4788818359375, -2.0224609375, -1.5660400390625, -1.109619140625, -0.6531982421875, -0.19677734375, 0.2596435546875, 0.716064453125, 1.1724853515625, 1.62890625, 2.0853271484375, 2.541748046875, 2.9981689453125, 3.45458984375, 3.9110107421875, 4.367431640625, 4.8238525390625, 5.2802734375, 5.7366943359375, 6.193115234375, 6.6495361328125, 7.10595703125, 7.5623779296875, 8.018798828125, 8.4752197265625, 8.931640625, 9.3880615234375, 9.844482421875, 10.3009033203125, 10.75732421875, 11.2137451171875, 11.670166015625, 12.1265869140625, 12.5830078125, 13.0394287109375, 13.495849609375, 13.9522705078125, 14.40869140625, 14.8651123046875, 15.321533203125, 15.7779541015625, 16.234375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 160.0, 632.0, 196.0, 16.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.008544921875, -19.73766326904297, -18.466781616210938, -17.195899963378906, -15.925019264221191, -14.65413761138916, -13.383256912231445, -12.112375259399414, -10.841493606567383, -9.570611953735352, -8.29973030090332, -7.0288496017456055, -5.757967948913574, -4.487086296081543, -3.21620512008667, -1.9453239440917969, -0.6744422912597656, 0.5964391231536865, 1.8673205375671387, 3.138201951980591, 4.409083366394043, 5.679965019226074, 6.950846195220947, 8.22172737121582, 9.492609024047852, 10.763490676879883, 12.034372329711914, 13.305253028869629, 14.57613468170166, 15.847016334533691, 17.117897033691406, 18.388778686523438, 19.659656524658203, 20.930538177490234, 22.201419830322266, 23.472301483154297, 24.743183135986328, 26.01406478881836, 27.284944534301758, 28.55582618713379, 29.82670783996582, 31.09758949279785, 32.36846923828125, 33.63935089111328, 34.91023254394531, 36.181114196777344, 37.451995849609375, 38.722877502441406, 39.99375915527344, 41.26464080810547, 42.5355224609375, 43.80640411376953, 45.07728576660156, 46.348167419433594, 47.619049072265625, 48.889930725097656, 50.16081237792969, 51.43169403076172, 52.70257568359375, 53.97345733642578, 55.24433898925781, 56.515220642089844, 57.786102294921875, 59.056983947753906, 60.32786178588867]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 6.0, 10.0, 10.0, 7.0, 17.0, 19.0, 22.0, 27.0, 17.0, 38.0, 38.0, 27.0, 37.0, 52.0, 54.0, 50.0, 45.0, 38.0, 41.0, 46.0, 32.0, 45.0, 37.0, 33.0, 27.0, 30.0, 30.0, 30.0, 17.0, 17.0, 21.0, 15.0, 17.0, 9.0, 7.0, 4.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-20.333335876464844, -19.726058959960938, -19.1187801361084, -18.511503219604492, -17.904224395751953, -17.296947479248047, -16.689668655395508, -16.0823917388916, -15.475113868713379, -14.867835998535156, -14.260558128356934, -13.653280258178711, -13.046003341674805, -12.438724517822266, -11.83144760131836, -11.224169731140137, -10.616891860961914, -10.009613990783691, -9.402336120605469, -8.795058250427246, -8.187780380249023, -7.580502986907959, -6.9732255935668945, -6.365947723388672, -5.758669853210449, -5.151391983032227, -4.544114112854004, -3.9368367195129395, -3.329558849334717, -2.722280979156494, -2.1150033473968506, -1.507725715637207, -0.9004478454589844, -0.29317009449005127, 0.31410765647888184, 0.9213854074478149, 1.528663158416748, 2.1359410285949707, 2.7432186603546143, 3.350496292114258, 3.9577741622924805, 4.565052032470703, 5.172329902648926, 5.77960729598999, 6.386885166168213, 6.9941630363464355, 7.6014404296875, 8.208718299865723, 8.815996170043945, 9.423274040222168, 10.03055191040039, 10.637829780578613, 11.245107650756836, 11.852384567260742, 12.459662437438965, 13.066940307617188, 13.67421817779541, 14.281496047973633, 14.888773918151855, 15.496051788330078, 16.103328704833984, 16.710607528686523, 17.31788444519043, 17.92516326904297, 18.532440185546875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 9.0, 8.0, 6.0, 15.0, 17.0, 12.0, 22.0, 23.0, 26.0, 34.0, 29.0, 28.0, 33.0, 36.0, 46.0, 30.0, 41.0, 34.0, 46.0, 38.0, 36.0, 23.0, 43.0, 43.0, 52.0, 34.0, 30.0, 35.0, 28.0, 27.0, 21.0, 21.0, 16.0, 10.0, 16.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7236328125, -1.6712188720703125, -1.618804931640625, -1.5663909912109375, -1.51397705078125, -1.4615631103515625, -1.409149169921875, -1.3567352294921875, -1.3043212890625, -1.2519073486328125, -1.199493408203125, -1.1470794677734375, -1.09466552734375, -1.0422515869140625, -0.989837646484375, -0.9374237060546875, -0.885009765625, -0.8325958251953125, -0.780181884765625, -0.7277679443359375, -0.67535400390625, -0.6229400634765625, -0.570526123046875, -0.5181121826171875, -0.4656982421875, -0.4132843017578125, -0.360870361328125, -0.3084564208984375, -0.25604248046875, -0.2036285400390625, -0.151214599609375, -0.0988006591796875, -0.04638671875, 0.0060272216796875, 0.058441162109375, 0.1108551025390625, 0.16326904296875, 0.2156829833984375, 0.268096923828125, 0.3205108642578125, 0.3729248046875, 0.4253387451171875, 0.477752685546875, 0.5301666259765625, 0.58258056640625, 0.6349945068359375, 0.687408447265625, 0.7398223876953125, 0.792236328125, 0.8446502685546875, 0.897064208984375, 0.9494781494140625, 1.00189208984375, 1.0543060302734375, 1.106719970703125, 1.1591339111328125, 1.2115478515625, 1.2639617919921875, 1.316375732421875, 1.3687896728515625, 1.42120361328125, 1.4736175537109375, 1.526031494140625, 1.5784454345703125, 1.630859375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 8.0, 7.0, 6.0, 19.0, 23.0, 21.0, 32.0, 30.0, 45.0, 56.0, 78.0, 98.0, 140.0, 208.0, 437.0, 1238.0, 3995.0, 16345.0, 91312.0, 1021017.0, 2806143.0, 210158.0, 32025.0, 7095.0, 2049.0, 727.0, 296.0, 187.0, 114.0, 77.0, 71.0, 51.0, 34.0, 27.0, 33.0, 24.0, 11.0, 12.0, 12.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.6015625, -9.33636474609375, -9.0711669921875, -8.80596923828125, -8.540771484375, -8.27557373046875, -8.0103759765625, -7.74517822265625, -7.47998046875, -7.21478271484375, -6.9495849609375, -6.68438720703125, -6.419189453125, -6.15399169921875, -5.8887939453125, -5.62359619140625, -5.3583984375, -5.09320068359375, -4.8280029296875, -4.56280517578125, -4.297607421875, -4.03240966796875, -3.7672119140625, -3.50201416015625, -3.23681640625, -2.97161865234375, -2.7064208984375, -2.44122314453125, -2.176025390625, -1.91082763671875, -1.6456298828125, -1.38043212890625, -1.115234375, -0.85003662109375, -0.5848388671875, -0.31964111328125, -0.054443359375, 0.21075439453125, 0.4759521484375, 0.74114990234375, 1.00634765625, 1.27154541015625, 1.5367431640625, 1.80194091796875, 2.067138671875, 2.33233642578125, 2.5975341796875, 2.86273193359375, 3.1279296875, 3.39312744140625, 3.6583251953125, 3.92352294921875, 4.188720703125, 4.45391845703125, 4.7191162109375, 4.98431396484375, 5.24951171875, 5.51470947265625, 5.7799072265625, 6.04510498046875, 6.310302734375, 6.57550048828125, 6.8406982421875, 7.10589599609375, 7.37109375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 9.0, 8.0, 13.0, 14.0, 21.0, 44.0, 53.0, 50.0, 65.0, 110.0, 133.0, 177.0, 213.0, 319.0, 363.0, 436.0, 461.0, 372.0, 305.0, 217.0, 160.0, 137.0, 96.0, 76.0, 58.0, 42.0, 32.0, 19.0, 13.0, 14.0, 8.0, 5.0, 7.0, 1.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.76171875, -6.5880126953125, -6.414306640625, -6.2406005859375, -6.06689453125, -5.8931884765625, -5.719482421875, -5.5457763671875, -5.3720703125, -5.1983642578125, -5.024658203125, -4.8509521484375, -4.67724609375, -4.5035400390625, -4.329833984375, -4.1561279296875, -3.982421875, -3.8087158203125, -3.635009765625, -3.4613037109375, -3.28759765625, -3.1138916015625, -2.940185546875, -2.7664794921875, -2.5927734375, -2.4190673828125, -2.245361328125, -2.0716552734375, -1.89794921875, -1.7242431640625, -1.550537109375, -1.3768310546875, -1.203125, -1.0294189453125, -0.855712890625, -0.6820068359375, -0.50830078125, -0.3345947265625, -0.160888671875, 0.0128173828125, 0.1865234375, 0.3602294921875, 0.533935546875, 0.7076416015625, 0.88134765625, 1.0550537109375, 1.228759765625, 1.4024658203125, 1.576171875, 1.7498779296875, 1.923583984375, 2.0972900390625, 2.27099609375, 2.4447021484375, 2.618408203125, 2.7921142578125, 2.9658203125, 3.1395263671875, 3.313232421875, 3.4869384765625, 3.66064453125, 3.8343505859375, 4.008056640625, 4.1817626953125, 4.35546875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 5.0, 2.0, 1.0, 14.0, 15.0, 21.0, 31.0, 38.0, 72.0, 128.0, 161.0, 312.0, 560.0, 1173.0, 2717.0, 7395.0, 23271.0, 95663.0, 521568.0, 2586074.0, 776765.0, 132362.0, 30750.0, 9043.0, 3171.0, 1419.0, 625.0, 361.0, 205.0, 127.0, 75.0, 50.0, 29.0, 19.0, 19.0, 17.0, 6.0, 8.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-11.875, -11.5592041015625, -11.243408203125, -10.9276123046875, -10.61181640625, -10.2960205078125, -9.980224609375, -9.6644287109375, -9.3486328125, -9.0328369140625, -8.717041015625, -8.4012451171875, -8.08544921875, -7.7696533203125, -7.453857421875, -7.1380615234375, -6.822265625, -6.5064697265625, -6.190673828125, -5.8748779296875, -5.55908203125, -5.2432861328125, -4.927490234375, -4.6116943359375, -4.2958984375, -3.9801025390625, -3.664306640625, -3.3485107421875, -3.03271484375, -2.7169189453125, -2.401123046875, -2.0853271484375, -1.76953125, -1.4537353515625, -1.137939453125, -0.8221435546875, -0.50634765625, -0.1905517578125, 0.125244140625, 0.4410400390625, 0.7568359375, 1.0726318359375, 1.388427734375, 1.7042236328125, 2.02001953125, 2.3358154296875, 2.651611328125, 2.9674072265625, 3.283203125, 3.5989990234375, 3.914794921875, 4.2305908203125, 4.54638671875, 4.8621826171875, 5.177978515625, 5.4937744140625, 5.8095703125, 6.1253662109375, 6.441162109375, 6.7569580078125, 7.07275390625, 7.3885498046875, 7.704345703125, 8.0201416015625, 8.3359375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 14.0, 24.0, 49.0, 66.0, 97.0, 167.0, 125.0, 131.0, 109.0, 88.0, 63.0, 28.0, 19.0, 10.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.50980758666992, -47.31346893310547, -46.117130279541016, -44.92079162597656, -43.72445297241211, -42.528114318847656, -41.33177185058594, -40.135433197021484, -38.93909454345703, -37.74275588989258, -36.546417236328125, -35.35007858276367, -34.15373992919922, -32.9573974609375, -31.76106071472168, -30.564720153808594, -29.368383407592773, -28.17204475402832, -26.975706100463867, -25.77936553955078, -24.583026885986328, -23.386688232421875, -22.190349578857422, -20.99401092529297, -19.797672271728516, -18.601333618164062, -17.40499496459961, -16.208656311035156, -15.01231575012207, -13.815977096557617, -12.619638442993164, -11.423298835754395, -10.226957321166992, -9.030618667602539, -7.8342790603637695, -6.637940406799316, -5.441601276397705, -4.245262145996094, -3.0489234924316406, -1.852583885192871, -0.656245231628418, 0.5400937795639038, 1.7364327907562256, 2.932771682739258, 4.129110813140869, 5.3254499435424805, 6.521788597106934, 7.718128204345703, 8.914466857910156, 10.11080551147461, 11.307145118713379, 12.503483772277832, 13.699823379516602, 14.896162033081055, 16.092500686645508, 17.288841247558594, 18.485179901123047, 19.6815185546875, 20.877857208251953, 22.074195861816406, 23.270536422729492, 24.466875076293945, 25.6632137298584, 26.859554290771484, 28.055891036987305]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 2.0, 9.0, 4.0, 7.0, 8.0, 14.0, 10.0, 12.0, 25.0, 26.0, 28.0, 21.0, 31.0, 32.0, 39.0, 26.0, 35.0, 35.0, 52.0, 34.0, 35.0, 40.0, 49.0, 33.0, 31.0, 34.0, 30.0, 33.0, 43.0, 28.0, 23.0, 15.0, 29.0, 20.0, 19.0, 18.0, 15.0, 6.0, 11.0, 10.0, 5.0, 8.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-19.312026977539062, -18.7178897857666, -18.123754501342773, -17.529617309570312, -16.935482025146484, -16.341344833374023, -15.747208595275879, -15.153072357177734, -14.55893611907959, -13.964799880981445, -13.3706636428833, -12.776527404785156, -12.182390213012695, -11.588254928588867, -10.994117736816406, -10.399981498718262, -9.805845260620117, -9.211709022521973, -8.617572784423828, -8.023436546325684, -7.429299831390381, -6.835163593292236, -6.241026878356934, -5.646890640258789, -5.0527544021606445, -4.4586181640625, -3.8644816875457764, -3.2703452110290527, -2.676208972930908, -2.0820727348327637, -1.48793625831604, -0.8937997817993164, -0.2996635437011719, 0.2944728136062622, 0.8886091709136963, 1.4827455282211304, 2.0768818855285645, 2.671018123626709, 3.2651546001434326, 3.8592910766601562, 4.453427314758301, 5.047563552856445, 5.64169979095459, 6.235836505889893, 6.829972743988037, 7.424108982086182, 8.018245697021484, 8.612381935119629, 9.206518173217773, 9.800654411315918, 10.394790649414062, 10.988926887512207, 11.583063125610352, 12.177200317382812, 12.771336555480957, 13.365472793579102, 13.959609031677246, 14.55374526977539, 15.147881507873535, 15.74201774597168, 16.33615493774414, 16.93029022216797, 17.52442741394043, 18.11856460571289, 18.71269989013672]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 3.0, 11.0, 12.0, 11.0, 9.0, 18.0, 24.0, 26.0, 26.0, 27.0, 27.0, 37.0, 37.0, 26.0, 42.0, 36.0, 28.0, 48.0, 42.0, 39.0, 33.0, 41.0, 29.0, 36.0, 38.0, 44.0, 35.0, 34.0, 24.0, 28.0, 16.0, 26.0, 13.0, 9.0, 12.0, 15.0, 9.0, 4.0, 8.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.9755859375, -1.92218017578125, -1.8687744140625, -1.81536865234375, -1.761962890625, -1.70855712890625, -1.6551513671875, -1.60174560546875, -1.54833984375, -1.49493408203125, -1.4415283203125, -1.38812255859375, -1.334716796875, -1.28131103515625, -1.2279052734375, -1.17449951171875, -1.12109375, -1.06768798828125, -1.0142822265625, -0.96087646484375, -0.907470703125, -0.85406494140625, -0.8006591796875, -0.74725341796875, -0.69384765625, -0.64044189453125, -0.5870361328125, -0.53363037109375, -0.480224609375, -0.42681884765625, -0.3734130859375, -0.32000732421875, -0.2666015625, -0.21319580078125, -0.1597900390625, -0.10638427734375, -0.052978515625, 0.00042724609375, 0.0538330078125, 0.10723876953125, 0.16064453125, 0.21405029296875, 0.2674560546875, 0.32086181640625, 0.374267578125, 0.42767333984375, 0.4810791015625, 0.53448486328125, 0.587890625, 0.64129638671875, 0.6947021484375, 0.74810791015625, 0.801513671875, 0.85491943359375, 0.9083251953125, 0.96173095703125, 1.01513671875, 1.06854248046875, 1.1219482421875, 1.17535400390625, 1.228759765625, 1.28216552734375, 1.3355712890625, 1.38897705078125, 1.4423828125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 5.0, 6.0, 6.0, 19.0, 9.0, 18.0, 16.0, 36.0, 53.0, 87.0, 129.0, 193.0, 247.0, 376.0, 483.0, 685.0, 1015.0, 1620.0, 2403.0, 3529.0, 4998.0, 7245.0, 11105.0, 16561.0, 24400.0, 37227.0, 57326.0, 93901.0, 173155.0, 258080.0, 133259.0, 76493.0, 48170.0, 31327.0, 21269.0, 13784.0, 9442.0, 6406.0, 4278.0, 2926.0, 2005.0, 1364.0, 913.0, 603.0, 404.0, 280.0, 215.0, 159.0, 109.0, 75.0, 46.0, 29.0, 23.0, 15.0, 6.0, 9.0, 7.0, 5.0, 7.0, 3.0, 2.0, 2.0], "bins": [-0.054595947265625, -0.05285167694091797, -0.05110740661621094, -0.049363136291503906, -0.047618865966796875, -0.045874595642089844, -0.04413032531738281, -0.04238605499267578, -0.04064178466796875, -0.03889751434326172, -0.03715324401855469, -0.035408973693847656, -0.033664703369140625, -0.031920433044433594, -0.030176162719726562, -0.02843189239501953, -0.0266876220703125, -0.02494335174560547, -0.023199081420898438, -0.021454811096191406, -0.019710540771484375, -0.017966270446777344, -0.016222000122070312, -0.014477729797363281, -0.01273345947265625, -0.010989189147949219, -0.009244918823242188, -0.007500648498535156, -0.005756378173828125, -0.004012107849121094, -0.0022678375244140625, -0.0005235671997070312, 0.001220703125, 0.0029649734497070312, 0.0047092437744140625, 0.006453514099121094, 0.008197784423828125, 0.009942054748535156, 0.011686325073242188, 0.013430595397949219, 0.01517486572265625, 0.01691913604736328, 0.018663406372070312, 0.020407676696777344, 0.022151947021484375, 0.023896217346191406, 0.025640487670898438, 0.02738475799560547, 0.0291290283203125, 0.03087329864501953, 0.03261756896972656, 0.034361839294433594, 0.036106109619140625, 0.037850379943847656, 0.03959465026855469, 0.04133892059326172, 0.04308319091796875, 0.04482746124267578, 0.04657173156738281, 0.048316001892089844, 0.050060272216796875, 0.051804542541503906, 0.05354881286621094, 0.05529308319091797, 0.057037353515625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 12.0, 7.0, 12.0, 17.0, 13.0, 16.0, 19.0, 20.0, 24.0, 14.0, 23.0, 13.0, 27.0, 25.0, 29.0, 39.0, 33.0, 40.0, 25.0, 41.0, 1066.0, 29.0, 37.0, 50.0, 35.0, 40.0, 28.0, 39.0, 30.0, 34.0, 29.0, 14.0, 25.0, 17.0, 19.0, 5.0, 11.0, 8.0, 9.0, 8.0, 12.0, 9.0, 2.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0224609375, -0.9888153076171875, -0.955169677734375, -0.9215240478515625, -0.88787841796875, -0.8542327880859375, -0.820587158203125, -0.7869415283203125, -0.7532958984375, -0.7196502685546875, -0.686004638671875, -0.6523590087890625, -0.61871337890625, -0.5850677490234375, -0.551422119140625, -0.5177764892578125, -0.484130859375, -0.4504852294921875, -0.416839599609375, -0.3831939697265625, -0.34954833984375, -0.3159027099609375, -0.282257080078125, -0.2486114501953125, -0.2149658203125, -0.1813201904296875, -0.147674560546875, -0.1140289306640625, -0.08038330078125, -0.0467376708984375, -0.013092041015625, 0.0205535888671875, 0.05419921875, 0.0878448486328125, 0.121490478515625, 0.1551361083984375, 0.18878173828125, 0.2224273681640625, 0.256072998046875, 0.2897186279296875, 0.3233642578125, 0.3570098876953125, 0.390655517578125, 0.4243011474609375, 0.45794677734375, 0.4915924072265625, 0.525238037109375, 0.5588836669921875, 0.592529296875, 0.6261749267578125, 0.659820556640625, 0.6934661865234375, 0.72711181640625, 0.7607574462890625, 0.794403076171875, 0.8280487060546875, 0.8616943359375, 0.8953399658203125, 0.928985595703125, 0.9626312255859375, 0.99627685546875, 1.0299224853515625, 1.063568115234375, 1.0972137451171875, 1.130859375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 6.0, 14.0, 25.0, 18.0, 35.0, 57.0, 93.0, 137.0, 260.0, 385.0, 555.0, 963.0, 1570.0, 2271.0, 3774.0, 5937.0, 9796.0, 16113.0, 27353.0, 47919.0, 89808.0, 192341.0, 1366513.0, 153945.0, 75431.0, 41154.0, 23563.0, 14192.0, 8764.0, 5206.0, 3303.0, 2107.0, 1283.0, 793.0, 527.0, 335.0, 218.0, 117.0, 79.0, 62.0, 44.0, 20.0, 20.0, 10.0, 10.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03558349609375, -0.034449100494384766, -0.03331470489501953, -0.0321803092956543, -0.031045913696289062, -0.029911518096923828, -0.028777122497558594, -0.02764272689819336, -0.026508331298828125, -0.02537393569946289, -0.024239540100097656, -0.023105144500732422, -0.021970748901367188, -0.020836353302001953, -0.01970195770263672, -0.018567562103271484, -0.01743316650390625, -0.016298770904541016, -0.015164375305175781, -0.014029979705810547, -0.012895584106445312, -0.011761188507080078, -0.010626792907714844, -0.00949239730834961, -0.008358001708984375, -0.007223606109619141, -0.006089210510253906, -0.004954814910888672, -0.0038204193115234375, -0.002686023712158203, -0.0015516281127929688, -0.0004172325134277344, 0.0007171630859375, 0.0018515586853027344, 0.0029859542846679688, 0.004120349884033203, 0.0052547454833984375, 0.006389141082763672, 0.007523536682128906, 0.00865793228149414, 0.009792327880859375, 0.01092672348022461, 0.012061119079589844, 0.013195514678955078, 0.014329910278320312, 0.015464305877685547, 0.01659870147705078, 0.017733097076416016, 0.01886749267578125, 0.020001888275146484, 0.02113628387451172, 0.022270679473876953, 0.023405075073242188, 0.024539470672607422, 0.025673866271972656, 0.02680826187133789, 0.027942657470703125, 0.02907705307006836, 0.030211448669433594, 0.03134584426879883, 0.03248023986816406, 0.0336146354675293, 0.03474903106689453, 0.035883426666259766, 0.037017822265625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 8.0, 6.0, 4.0, 5.0, 10.0, 7.0, 8.0, 13.0, 16.0, 20.0, 33.0, 36.0, 39.0, 41.0, 44.0, 55.0, 49.0, 72.0, 103.0, 51.0, 55.0, 53.0, 50.0, 28.0, 30.0, 34.0, 18.0, 17.0, 16.0, 12.0, 12.0, 11.0, 10.0, 7.0, 4.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6748905181884766e-05, -1.6194768249988556e-05, -1.5640631318092346e-05, -1.5086494386196136e-05, -1.4532357454299927e-05, -1.3978220522403717e-05, -1.3424083590507507e-05, -1.2869946658611298e-05, -1.2315809726715088e-05, -1.1761672794818878e-05, -1.1207535862922668e-05, -1.0653398931026459e-05, -1.0099261999130249e-05, -9.54512506723404e-06, -8.99098813533783e-06, -8.43685120344162e-06, -7.88271427154541e-06, -7.3285773396492004e-06, -6.774440407752991e-06, -6.220303475856781e-06, -5.666166543960571e-06, -5.1120296120643616e-06, -4.557892680168152e-06, -4.003755748271942e-06, -3.4496188163757324e-06, -2.8954818844795227e-06, -2.341344952583313e-06, -1.7872080206871033e-06, -1.2330710887908936e-06, -6.789341568946838e-07, -1.2479722499847412e-07, 4.293397068977356e-07, 9.834766387939453e-07, 1.537613570690155e-06, 2.0917505025863647e-06, 2.6458874344825745e-06, 3.200024366378784e-06, 3.754161298274994e-06, 4.308298230171204e-06, 4.862435162067413e-06, 5.416572093963623e-06, 5.970709025859833e-06, 6.5248459577560425e-06, 7.078982889652252e-06, 7.633119821548462e-06, 8.187256753444672e-06, 8.741393685340881e-06, 9.295530617237091e-06, 9.8496675491333e-06, 1.040380448102951e-05, 1.095794141292572e-05, 1.151207834482193e-05, 1.206621527671814e-05, 1.262035220861435e-05, 1.3174489140510559e-05, 1.3728626072406769e-05, 1.4282763004302979e-05, 1.4836899936199188e-05, 1.5391036868095398e-05, 1.5945173799991608e-05, 1.6499310731887817e-05, 1.7053447663784027e-05, 1.7607584595680237e-05, 1.8161721527576447e-05, 1.8715858459472656e-05]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 6.0, 9.0, 13.0, 11.0, 11.0, 19.0, 25.0, 25.0, 36.0, 46.0, 61.0, 69.0, 105.0, 171.0, 222.0, 424.0, 1989.0, 1018203.0, 25497.0, 600.0, 274.0, 179.0, 117.0, 109.0, 71.0, 64.0, 54.0, 22.0, 32.0, 12.0, 15.0, 10.0, 7.0, 3.0, 7.0, 5.0, 8.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0003554821014404297, -0.00034493952989578247, -0.00033439695835113525, -0.00032385438680648804, -0.0003133118152618408, -0.0003027692437171936, -0.0002922266721725464, -0.00028168410062789917, -0.00027114152908325195, -0.00026059895753860474, -0.0002500563859939575, -0.0002395138144493103, -0.00022897124290466309, -0.00021842867136001587, -0.00020788609981536865, -0.00019734352827072144, -0.00018680095672607422, -0.000176258385181427, -0.00016571581363677979, -0.00015517324209213257, -0.00014463067054748535, -0.00013408809900283813, -0.00012354552745819092, -0.0001130029559135437, -0.00010246038436889648, -9.191781282424927e-05, -8.137524127960205e-05, -7.083266973495483e-05, -6.029009819030762e-05, -4.97475266456604e-05, -3.9204955101013184e-05, -2.8662383556365967e-05, -1.811981201171875e-05, -7.577240467071533e-06, 2.9653310775756836e-06, 1.35079026222229e-05, 2.4050474166870117e-05, 3.4593045711517334e-05, 4.513561725616455e-05, 5.567818880081177e-05, 6.622076034545898e-05, 7.67633318901062e-05, 8.730590343475342e-05, 9.784847497940063e-05, 0.00010839104652404785, 0.00011893361806869507, 0.00012947618961334229, 0.0001400187611579895, 0.00015056133270263672, 0.00016110390424728394, 0.00017164647579193115, 0.00018218904733657837, 0.00019273161888122559, 0.0002032741904258728, 0.00021381676197052002, 0.00022435933351516724, 0.00023490190505981445, 0.00024544447660446167, 0.0002559870481491089, 0.0002665296196937561, 0.0002770721912384033, 0.00028761476278305054, 0.00029815733432769775, 0.00030869990587234497, 0.0003192424774169922]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 20.0, 57.0, 182.0, 360.0, 251.0, 94.0, 26.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.2677176932338625e-05, -3.205612301826477e-05, -3.1435069104190916e-05, -3.0814011552138254e-05, -3.01929576380644e-05, -2.9571903723990545e-05, -2.895084980991669e-05, -2.8329795895842835e-05, -2.7708740162779577e-05, -2.7087686248705722e-05, -2.6466630515642464e-05, -2.584557660156861e-05, -2.5224522687494755e-05, -2.4603466954431497e-05, -2.3982413040357642e-05, -2.3361357307294384e-05, -2.274030339322053e-05, -2.2119249479146674e-05, -2.1498193746083416e-05, -2.087713983200956e-05, -2.0256084098946303e-05, -1.963503018487245e-05, -1.9013976270798594e-05, -1.839292235672474e-05, -1.777186662366148e-05, -1.7150812709587626e-05, -1.6529756976524368e-05, -1.5908703062450513e-05, -1.528764914837666e-05, -1.46665934153134e-05, -1.4045539501239546e-05, -1.342448467767099e-05, -1.2803429854102433e-05, -1.2182375030533876e-05, -1.156132020696532e-05, -1.0940266292891465e-05, -1.0319211469322909e-05, -9.698156645754352e-06, -9.077102731680498e-06, -8.456047908111941e-06, -7.834993084543385e-06, -7.213938260974828e-06, -6.592883892153623e-06, -5.971829523332417e-06, -5.3507746997638606e-06, -4.729719876195304e-06, -4.1086655073740985e-06, -3.487611138552893e-06, -2.8665558602369856e-06, -2.2455012640421046e-06, -1.6244466678472236e-06, -1.0033920716523426e-06, -3.8233747545746155e-07, 2.3871712073741946e-07, 8.597717169323005e-07, 1.480826085753506e-06, 2.1018809093220625e-06, 2.7229355055169435e-06, 3.3439901017118245e-06, 3.965044925280381e-06, 4.5860992941015866e-06, 5.207153662922792e-06, 5.828208486491349e-06, 6.449262855312554e-06, 7.070317678881111e-06]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 4.0, 7.0, 10.0, 7.0, 9.0, 16.0, 11.0, 25.0, 13.0, 26.0, 20.0, 33.0, 33.0, 26.0, 29.0, 37.0, 38.0, 50.0, 47.0, 48.0, 38.0, 48.0, 37.0, 37.0, 43.0, 43.0, 27.0, 27.0, 29.0, 31.0, 22.0, 22.0, 23.0, 9.0, 16.0, 10.0, 13.0, 4.0, 5.0, 5.0, 10.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.138448715209961e-05, -1.1062249541282654e-05, -1.0740011930465698e-05, -1.0417774319648743e-05, -1.0095536708831787e-05, -9.773299098014832e-06, -9.451061487197876e-06, -9.12882387638092e-06, -8.806586265563965e-06, -8.48434865474701e-06, -8.162111043930054e-06, -7.839873433113098e-06, -7.517635822296143e-06, -7.195398211479187e-06, -6.8731606006622314e-06, -6.550922989845276e-06, -6.22868537902832e-06, -5.906447768211365e-06, -5.584210157394409e-06, -5.261972546577454e-06, -4.939734935760498e-06, -4.6174973249435425e-06, -4.295259714126587e-06, -3.973022103309631e-06, -3.6507844924926758e-06, -3.3285468816757202e-06, -3.0063092708587646e-06, -2.684071660041809e-06, -2.3618340492248535e-06, -2.039596438407898e-06, -1.7173588275909424e-06, -1.3951212167739868e-06, -1.0728836059570312e-06, -7.506459951400757e-07, -4.284083843231201e-07, -1.0617077350616455e-07, 2.1606683731079102e-07, 5.383044481277466e-07, 8.605420589447021e-07, 1.1827796697616577e-06, 1.5050172805786133e-06, 1.8272548913955688e-06, 2.1494925022125244e-06, 2.47173011302948e-06, 2.7939677238464355e-06, 3.116205334663391e-06, 3.4384429454803467e-06, 3.7606805562973022e-06, 4.082918167114258e-06, 4.405155777931213e-06, 4.727393388748169e-06, 5.0496309995651245e-06, 5.37186861038208e-06, 5.694106221199036e-06, 6.016343832015991e-06, 6.338581442832947e-06, 6.660819053649902e-06, 6.983056664466858e-06, 7.3052942752838135e-06, 7.627531886100769e-06, 7.949769496917725e-06, 8.27200710773468e-06, 8.594244718551636e-06, 8.916482329368591e-06, 9.238719940185547e-06]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 3.0, 11.0, 12.0, 11.0, 9.0, 18.0, 24.0, 26.0, 26.0, 27.0, 27.0, 37.0, 37.0, 26.0, 42.0, 36.0, 28.0, 48.0, 42.0, 39.0, 33.0, 41.0, 29.0, 36.0, 38.0, 44.0, 35.0, 34.0, 24.0, 28.0, 16.0, 26.0, 13.0, 9.0, 12.0, 15.0, 9.0, 4.0, 8.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.9755859375, -1.92218017578125, -1.8687744140625, -1.81536865234375, -1.761962890625, -1.70855712890625, -1.6551513671875, -1.60174560546875, -1.54833984375, -1.49493408203125, -1.4415283203125, -1.38812255859375, -1.334716796875, -1.28131103515625, -1.2279052734375, -1.17449951171875, -1.12109375, -1.06768798828125, -1.0142822265625, -0.96087646484375, -0.907470703125, -0.85406494140625, -0.8006591796875, -0.74725341796875, -0.69384765625, -0.64044189453125, -0.5870361328125, -0.53363037109375, -0.480224609375, -0.42681884765625, -0.3734130859375, -0.32000732421875, -0.2666015625, -0.21319580078125, -0.1597900390625, -0.10638427734375, -0.052978515625, 0.00042724609375, 0.0538330078125, 0.10723876953125, 0.16064453125, 0.21405029296875, 0.2674560546875, 0.32086181640625, 0.374267578125, 0.42767333984375, 0.4810791015625, 0.53448486328125, 0.587890625, 0.64129638671875, 0.6947021484375, 0.74810791015625, 0.801513671875, 0.85491943359375, 0.9083251953125, 0.96173095703125, 1.01513671875, 1.06854248046875, 1.1219482421875, 1.17535400390625, 1.228759765625, 1.28216552734375, 1.3355712890625, 1.38897705078125, 1.4423828125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 11.0, 10.0, 31.0, 42.0, 58.0, 88.0, 131.0, 253.0, 400.0, 698.0, 1184.0, 2088.0, 3657.0, 6834.0, 12919.0, 28778.0, 102181.0, 702409.0, 124572.0, 31822.0, 13885.0, 7313.0, 3999.0, 2160.0, 1210.0, 741.0, 431.0, 236.0, 159.0, 89.0, 47.0, 41.0, 33.0, 12.0, 5.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.974609375, -2.87042236328125, -2.7662353515625, -2.66204833984375, -2.557861328125, -2.45367431640625, -2.3494873046875, -2.24530029296875, -2.14111328125, -2.03692626953125, -1.9327392578125, -1.82855224609375, -1.724365234375, -1.62017822265625, -1.5159912109375, -1.41180419921875, -1.3076171875, -1.20343017578125, -1.0992431640625, -0.99505615234375, -0.890869140625, -0.78668212890625, -0.6824951171875, -0.57830810546875, -0.47412109375, -0.36993408203125, -0.2657470703125, -0.16156005859375, -0.057373046875, 0.04681396484375, 0.1510009765625, 0.25518798828125, 0.359375, 0.46356201171875, 0.5677490234375, 0.67193603515625, 0.776123046875, 0.88031005859375, 0.9844970703125, 1.08868408203125, 1.19287109375, 1.29705810546875, 1.4012451171875, 1.50543212890625, 1.609619140625, 1.71380615234375, 1.8179931640625, 1.92218017578125, 2.0263671875, 2.13055419921875, 2.2347412109375, 2.33892822265625, 2.443115234375, 2.54730224609375, 2.6514892578125, 2.75567626953125, 2.85986328125, 2.96405029296875, 3.0682373046875, 3.17242431640625, 3.276611328125, 3.38079833984375, 3.4849853515625, 3.58917236328125, 3.693359375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 4.0, 13.0, 13.0, 17.0, 18.0, 18.0, 19.0, 25.0, 22.0, 27.0, 42.0, 36.0, 41.0, 37.0, 68.0, 96.0, 194.0, 1739.0, 143.0, 71.0, 53.0, 38.0, 44.0, 28.0, 33.0, 38.0, 24.0, 25.0, 17.0, 19.0, 10.0, 18.0, 7.0, 9.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.79296875, -6.58929443359375, -6.3856201171875, -6.18194580078125, -5.978271484375, -5.77459716796875, -5.5709228515625, -5.36724853515625, -5.16357421875, -4.95989990234375, -4.7562255859375, -4.55255126953125, -4.348876953125, -4.14520263671875, -3.9415283203125, -3.73785400390625, -3.5341796875, -3.33050537109375, -3.1268310546875, -2.92315673828125, -2.719482421875, -2.51580810546875, -2.3121337890625, -2.10845947265625, -1.90478515625, -1.70111083984375, -1.4974365234375, -1.29376220703125, -1.090087890625, -0.88641357421875, -0.6827392578125, -0.47906494140625, -0.275390625, -0.07171630859375, 0.1319580078125, 0.33563232421875, 0.539306640625, 0.74298095703125, 0.9466552734375, 1.15032958984375, 1.35400390625, 1.55767822265625, 1.7613525390625, 1.96502685546875, 2.168701171875, 2.37237548828125, 2.5760498046875, 2.77972412109375, 2.9833984375, 3.18707275390625, 3.3907470703125, 3.59442138671875, 3.798095703125, 4.00177001953125, 4.2054443359375, 4.40911865234375, 4.61279296875, 4.81646728515625, 5.0201416015625, 5.22381591796875, 5.427490234375, 5.63116455078125, 5.8348388671875, 6.03851318359375, 6.2421875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 7.0, 10.0, 8.0, 14.0, 9.0, 21.0, 28.0, 26.0, 28.0, 54.0, 73.0, 112.0, 166.0, 320.0, 1001.0, 4792.0, 40687.0, 2868887.0, 213070.0, 13045.0, 2107.0, 519.0, 242.0, 134.0, 77.0, 60.0, 36.0, 37.0, 22.0, 24.0, 20.0, 16.0, 11.0, 11.0, 3.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.6328125, -10.2869873046875, -9.941162109375, -9.5953369140625, -9.24951171875, -8.9036865234375, -8.557861328125, -8.2120361328125, -7.8662109375, -7.5203857421875, -7.174560546875, -6.8287353515625, -6.48291015625, -6.1370849609375, -5.791259765625, -5.4454345703125, -5.099609375, -4.7537841796875, -4.407958984375, -4.0621337890625, -3.71630859375, -3.3704833984375, -3.024658203125, -2.6788330078125, -2.3330078125, -1.9871826171875, -1.641357421875, -1.2955322265625, -0.94970703125, -0.6038818359375, -0.258056640625, 0.0877685546875, 0.43359375, 0.7794189453125, 1.125244140625, 1.4710693359375, 1.81689453125, 2.1627197265625, 2.508544921875, 2.8543701171875, 3.2001953125, 3.5460205078125, 3.891845703125, 4.2376708984375, 4.58349609375, 4.9293212890625, 5.275146484375, 5.6209716796875, 5.966796875, 6.3126220703125, 6.658447265625, 7.0042724609375, 7.35009765625, 7.6959228515625, 8.041748046875, 8.3875732421875, 8.7333984375, 9.0792236328125, 9.425048828125, 9.7708740234375, 10.11669921875, 10.4625244140625, 10.808349609375, 11.1541748046875, 11.5]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 19.0, 64.0, 156.0, 215.0, 243.0, 197.0, 82.0, 23.0, 9.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.509864807128906, -20.821853637695312, -20.133840560913086, -19.445829391479492, -18.757816314697266, -18.069805145263672, -17.381793975830078, -16.693782806396484, -16.005769729614258, -15.317757606506348, -14.629745483398438, -13.941734313964844, -13.253722190856934, -12.565710067749023, -11.87769889831543, -11.18968677520752, -10.50167465209961, -9.8136625289917, -9.125650405883789, -8.437639236450195, -7.749627113342285, -7.061614990234375, -6.373603343963623, -5.685591697692871, -4.997579574584961, -4.309567451477051, -3.621555805206299, -2.9335439205169678, -2.2455320358276367, -1.5575201511383057, -0.8695082664489746, -0.18149662017822266, 0.5065135955810547, 1.1945254802703857, 1.8825373649597168, 2.570549249649048, 3.258561134338379, 3.94657301902771, 4.634584903717041, 5.322596549987793, 6.010608673095703, 6.698620796203613, 7.386632442474365, 8.074644088745117, 8.762656211853027, 9.450668334960938, 10.138679504394531, 10.826691627502441, 11.514703750610352, 12.202715873718262, 12.890727996826172, 13.578739166259766, 14.266751289367676, 14.954763412475586, 15.64277458190918, 16.330787658691406, 17.018798828125, 17.706809997558594, 18.39482307434082, 19.082834243774414, 19.77084732055664, 20.458858489990234, 21.146869659423828, 21.834880828857422, 22.52289390563965]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 7.0, 7.0, 6.0, 15.0, 11.0, 14.0, 14.0, 18.0, 24.0, 14.0, 35.0, 18.0, 39.0, 42.0, 43.0, 39.0, 51.0, 40.0, 37.0, 52.0, 53.0, 35.0, 41.0, 33.0, 26.0, 40.0, 32.0, 37.0, 15.0, 24.0, 19.0, 17.0, 17.0, 17.0, 14.0, 15.0, 8.0, 9.0, 7.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-23.87796974182129, -23.20223617553711, -22.52650260925293, -21.85076904296875, -21.17503547668457, -20.49930191040039, -19.82356834411621, -19.14783477783203, -18.47210121154785, -17.796367645263672, -17.120634078979492, -16.444900512695312, -15.769166946411133, -15.093433380126953, -14.417699813842773, -13.741966247558594, -13.066232681274414, -12.390499114990234, -11.714765548706055, -11.039031982421875, -10.363298416137695, -9.687564849853516, -9.011831283569336, -8.336097717285156, -7.660364151000977, -6.984630584716797, -6.308897018432617, -5.6331634521484375, -4.957429885864258, -4.281696319580078, -3.6059627532958984, -2.9302291870117188, -2.254497528076172, -1.5787639617919922, -0.9030303955078125, -0.2272968292236328, 0.4484367370605469, 1.1241703033447266, 1.7999038696289062, 2.475637435913086, 3.1513710021972656, 3.8271045684814453, 4.502838134765625, 5.178571701049805, 5.854305267333984, 6.530038833618164, 7.205772399902344, 7.881505966186523, 8.557239532470703, 9.232973098754883, 9.908706665039062, 10.584440231323242, 11.260173797607422, 11.935907363891602, 12.611640930175781, 13.287374496459961, 13.96310806274414, 14.63884162902832, 15.3145751953125, 15.99030876159668, 16.66604232788086, 17.34177589416504, 18.01750946044922, 18.6932430267334, 19.368976593017578]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 2.0, 3.0, 12.0, 12.0, 10.0, 17.0, 18.0, 14.0, 24.0, 24.0, 35.0, 30.0, 31.0, 34.0, 29.0, 35.0, 35.0, 39.0, 37.0, 39.0, 34.0, 47.0, 31.0, 30.0, 37.0, 43.0, 31.0, 41.0, 36.0, 39.0, 16.0, 22.0, 18.0, 16.0, 14.0, 13.0, 11.0, 10.0, 7.0, 8.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.9580078125, -1.9039306640625, -1.849853515625, -1.7957763671875, -1.74169921875, -1.6876220703125, -1.633544921875, -1.5794677734375, -1.525390625, -1.4713134765625, -1.417236328125, -1.3631591796875, -1.30908203125, -1.2550048828125, -1.200927734375, -1.1468505859375, -1.0927734375, -1.0386962890625, -0.984619140625, -0.9305419921875, -0.87646484375, -0.8223876953125, -0.768310546875, -0.7142333984375, -0.66015625, -0.6060791015625, -0.552001953125, -0.4979248046875, -0.44384765625, -0.3897705078125, -0.335693359375, -0.2816162109375, -0.2275390625, -0.1734619140625, -0.119384765625, -0.0653076171875, -0.01123046875, 0.0428466796875, 0.096923828125, 0.1510009765625, 0.205078125, 0.2591552734375, 0.313232421875, 0.3673095703125, 0.42138671875, 0.4754638671875, 0.529541015625, 0.5836181640625, 0.6376953125, 0.6917724609375, 0.745849609375, 0.7999267578125, 0.85400390625, 0.9080810546875, 0.962158203125, 1.0162353515625, 1.0703125, 1.1243896484375, 1.178466796875, 1.2325439453125, 1.28662109375, 1.3406982421875, 1.394775390625, 1.4488525390625, 1.5029296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 3.0, 9.0, 12.0, 10.0, 16.0, 11.0, 15.0, 23.0, 24.0, 39.0, 39.0, 65.0, 74.0, 93.0, 129.0, 270.0, 520.0, 1059.0, 2821.0, 7870.0, 26752.0, 120849.0, 1022026.0, 2647717.0, 289820.0, 52666.0, 13343.0, 4552.0, 1697.0, 754.0, 348.0, 170.0, 112.0, 71.0, 66.0, 54.0, 44.0, 24.0, 22.0, 25.0, 10.0, 8.0, 14.0, 8.0, 5.0, 11.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-7.19140625, -6.96832275390625, -6.7452392578125, -6.52215576171875, -6.299072265625, -6.07598876953125, -5.8529052734375, -5.62982177734375, -5.40673828125, -5.18365478515625, -4.9605712890625, -4.73748779296875, -4.514404296875, -4.29132080078125, -4.0682373046875, -3.84515380859375, -3.6220703125, -3.39898681640625, -3.1759033203125, -2.95281982421875, -2.729736328125, -2.50665283203125, -2.2835693359375, -2.06048583984375, -1.83740234375, -1.61431884765625, -1.3912353515625, -1.16815185546875, -0.945068359375, -0.72198486328125, -0.4989013671875, -0.27581787109375, -0.052734375, 0.17034912109375, 0.3934326171875, 0.61651611328125, 0.839599609375, 1.06268310546875, 1.2857666015625, 1.50885009765625, 1.73193359375, 1.95501708984375, 2.1781005859375, 2.40118408203125, 2.624267578125, 2.84735107421875, 3.0704345703125, 3.29351806640625, 3.5166015625, 3.73968505859375, 3.9627685546875, 4.18585205078125, 4.408935546875, 4.63201904296875, 4.8551025390625, 5.07818603515625, 5.30126953125, 5.52435302734375, 5.7474365234375, 5.97052001953125, 6.193603515625, 6.41668701171875, 6.6397705078125, 6.86285400390625, 7.0859375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 9.0, 3.0, 6.0, 19.0, 23.0, 32.0, 41.0, 61.0, 86.0, 138.0, 196.0, 255.0, 368.0, 512.0, 592.0, 467.0, 362.0, 281.0, 196.0, 139.0, 83.0, 55.0, 53.0, 40.0, 24.0, 10.0, 10.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.375, -7.1549072265625, -6.934814453125, -6.7147216796875, -6.49462890625, -6.2745361328125, -6.054443359375, -5.8343505859375, -5.6142578125, -5.3941650390625, -5.174072265625, -4.9539794921875, -4.73388671875, -4.5137939453125, -4.293701171875, -4.0736083984375, -3.853515625, -3.6334228515625, -3.413330078125, -3.1932373046875, -2.97314453125, -2.7530517578125, -2.532958984375, -2.3128662109375, -2.0927734375, -1.8726806640625, -1.652587890625, -1.4324951171875, -1.21240234375, -0.9923095703125, -0.772216796875, -0.5521240234375, -0.33203125, -0.1119384765625, 0.108154296875, 0.3282470703125, 0.54833984375, 0.7684326171875, 0.988525390625, 1.2086181640625, 1.4287109375, 1.6488037109375, 1.868896484375, 2.0889892578125, 2.30908203125, 2.5291748046875, 2.749267578125, 2.9693603515625, 3.189453125, 3.4095458984375, 3.629638671875, 3.8497314453125, 4.06982421875, 4.2899169921875, 4.510009765625, 4.7301025390625, 4.9501953125, 5.1702880859375, 5.390380859375, 5.6104736328125, 5.83056640625, 6.0506591796875, 6.270751953125, 6.4908447265625, 6.7109375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 9.0, 9.0, 29.0, 39.0, 64.0, 81.0, 203.0, 299.0, 495.0, 1126.0, 3427.0, 16272.0, 134097.0, 2080670.0, 1817190.0, 119760.0, 15004.0, 3204.0, 1104.0, 496.0, 262.0, 163.0, 98.0, 57.0, 41.0, 29.0, 14.0, 10.0, 6.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.5234375, -15.0379638671875, -14.552490234375, -14.0670166015625, -13.58154296875, -13.0960693359375, -12.610595703125, -12.1251220703125, -11.6396484375, -11.1541748046875, -10.668701171875, -10.1832275390625, -9.69775390625, -9.2122802734375, -8.726806640625, -8.2413330078125, -7.755859375, -7.2703857421875, -6.784912109375, -6.2994384765625, -5.81396484375, -5.3284912109375, -4.843017578125, -4.3575439453125, -3.8720703125, -3.3865966796875, -2.901123046875, -2.4156494140625, -1.93017578125, -1.4447021484375, -0.959228515625, -0.4737548828125, 0.01171875, 0.4971923828125, 0.982666015625, 1.4681396484375, 1.95361328125, 2.4390869140625, 2.924560546875, 3.4100341796875, 3.8955078125, 4.3809814453125, 4.866455078125, 5.3519287109375, 5.83740234375, 6.3228759765625, 6.808349609375, 7.2938232421875, 7.779296875, 8.2647705078125, 8.750244140625, 9.2357177734375, 9.72119140625, 10.2066650390625, 10.692138671875, 11.1776123046875, 11.6630859375, 12.1485595703125, 12.634033203125, 13.1195068359375, 13.60498046875, 14.0904541015625, 14.575927734375, 15.0614013671875, 15.546875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 18.0, 22.0, 25.0, 30.0, 51.0, 66.0, 94.0, 113.0, 114.0, 92.0, 99.0, 94.0, 71.0, 46.0, 26.0, 22.0, 10.0, 10.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.51186752319336, -47.4510498046875, -46.390228271484375, -45.329410552978516, -44.268592834472656, -43.20777130126953, -42.14695358276367, -41.08613586425781, -40.02531433105469, -38.96449661254883, -37.9036750793457, -36.842857360839844, -35.782039642333984, -34.721221923828125, -33.660400390625, -32.59958267211914, -31.53876495361328, -30.47794532775879, -29.41712760925293, -28.356307983398438, -27.295490264892578, -26.234670639038086, -25.173851013183594, -24.113033294677734, -23.052213668823242, -21.99139404296875, -20.93057632446289, -19.8697566986084, -18.808937072753906, -17.748119354248047, -16.687299728393555, -15.626481056213379, -14.565666198730469, -13.504847526550293, -12.444028854370117, -11.383209228515625, -10.32239055633545, -9.261571884155273, -8.200752258300781, -7.1399335861206055, -6.07911491394043, -5.018296241760254, -3.95747709274292, -2.896658182144165, -1.8358392715454102, -0.7750205993652344, 0.2857985496520996, 1.3466176986694336, 2.4074363708496094, 3.4682552814483643, 4.529074192047119, 5.589893341064453, 6.650712013244629, 7.711530685424805, 8.772350311279297, 9.833168983459473, 10.893987655639648, 11.954806327819824, 13.015625, 14.076444625854492, 15.137263298034668, 16.198081970214844, 17.258901596069336, 18.319721221923828, 19.380538940429688]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 2.0, 3.0, 8.0, 6.0, 2.0, 5.0, 8.0, 14.0, 15.0, 14.0, 13.0, 22.0, 21.0, 24.0, 20.0, 32.0, 25.0, 27.0, 32.0, 31.0, 47.0, 37.0, 43.0, 38.0, 42.0, 46.0, 28.0, 34.0, 32.0, 39.0, 36.0, 23.0, 31.0, 25.0, 29.0, 24.0, 19.0, 16.0, 15.0, 18.0, 15.0, 12.0, 6.0, 6.0, 5.0, 2.0, 4.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.701385498046875, -16.091327667236328, -15.481270790100098, -14.87121295928955, -14.26115608215332, -13.651098251342773, -13.041040420532227, -12.43098258972168, -11.82092571258545, -11.210867881774902, -10.600811004638672, -9.990753173828125, -9.380695343017578, -8.770638465881348, -8.1605806350708, -7.550523281097412, -6.940465927124023, -6.330408573150635, -5.720351219177246, -5.110293388366699, -4.5002360343933105, -3.890178680419922, -3.280121088027954, -2.6700634956359863, -2.0600061416625977, -1.4499486684799194, -0.8398911952972412, -0.229833722114563, 0.38022375106811523, 0.9902811050415039, 1.6003386974334717, 2.2103962898254395, 2.820453643798828, 3.430510997772217, 4.0405683517456055, 4.650626182556152, 5.260683536529541, 5.87074089050293, 6.480798721313477, 7.090856075286865, 7.700913429260254, 8.3109712600708, 8.921028137207031, 9.531085968017578, 10.141143798828125, 10.751200675964355, 11.361258506774902, 11.971315383911133, 12.58137321472168, 13.191431045532227, 13.801487922668457, 14.411545753479004, 15.021602630615234, 15.631660461425781, 16.241718292236328, 16.851776123046875, 17.461833953857422, 18.07189178466797, 18.681949615478516, 19.29200553894043, 19.902063369750977, 20.512121200561523, 21.12217903137207, 21.732236862182617, 22.34229278564453]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 2.0, 6.0, 10.0, 15.0, 15.0, 18.0, 11.0, 19.0, 21.0, 31.0, 24.0, 40.0, 39.0, 32.0, 39.0, 33.0, 35.0, 42.0, 34.0, 45.0, 44.0, 40.0, 39.0, 46.0, 44.0, 30.0, 39.0, 32.0, 27.0, 29.0, 19.0, 18.0, 18.0, 10.0, 14.0, 8.0, 8.0, 9.0, 1.0, 8.0, 4.0, 8.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.97076416015625, -1.9102783203125, -1.84979248046875, -1.789306640625, -1.72882080078125, -1.6683349609375, -1.60784912109375, -1.54736328125, -1.48687744140625, -1.4263916015625, -1.36590576171875, -1.305419921875, -1.24493408203125, -1.1844482421875, -1.12396240234375, -1.0634765625, -1.00299072265625, -0.9425048828125, -0.88201904296875, -0.821533203125, -0.76104736328125, -0.7005615234375, -0.64007568359375, -0.57958984375, -0.51910400390625, -0.4586181640625, -0.39813232421875, -0.337646484375, -0.27716064453125, -0.2166748046875, -0.15618896484375, -0.095703125, -0.03521728515625, 0.0252685546875, 0.08575439453125, 0.146240234375, 0.20672607421875, 0.2672119140625, 0.32769775390625, 0.38818359375, 0.44866943359375, 0.5091552734375, 0.56964111328125, 0.630126953125, 0.69061279296875, 0.7510986328125, 0.81158447265625, 0.8720703125, 0.93255615234375, 0.9930419921875, 1.05352783203125, 1.114013671875, 1.17449951171875, 1.2349853515625, 1.29547119140625, 1.35595703125, 1.41644287109375, 1.4769287109375, 1.53741455078125, 1.597900390625, 1.65838623046875, 1.7188720703125, 1.77935791015625, 1.83984375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 8.0, 13.0, 14.0, 23.0, 39.0, 47.0, 61.0, 96.0, 193.0, 358.0, 488.0, 892.0, 1451.0, 2597.0, 4310.0, 7205.0, 12053.0, 21104.0, 36622.0, 68368.0, 135384.0, 327007.0, 213732.0, 96885.0, 51169.0, 28434.0, 16431.0, 9551.0, 5661.0, 3422.0, 1956.0, 1213.0, 693.0, 428.0, 235.0, 145.0, 96.0, 54.0, 38.0, 32.0, 16.0, 8.0, 10.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.084228515625, -0.08165836334228516, -0.07908821105957031, -0.07651805877685547, -0.07394790649414062, -0.07137775421142578, -0.06880760192871094, -0.0662374496459961, -0.06366729736328125, -0.061097145080566406, -0.05852699279785156, -0.05595684051513672, -0.053386688232421875, -0.05081653594970703, -0.04824638366699219, -0.045676231384277344, -0.0431060791015625, -0.040535926818847656, -0.03796577453613281, -0.03539562225341797, -0.032825469970703125, -0.03025531768798828, -0.027685165405273438, -0.025115013122558594, -0.02254486083984375, -0.019974708557128906, -0.017404556274414062, -0.014834403991699219, -0.012264251708984375, -0.009694099426269531, -0.0071239471435546875, -0.004553794860839844, -0.001983642578125, 0.0005865097045898438, 0.0031566619873046875, 0.005726814270019531, 0.008296966552734375, 0.010867118835449219, 0.013437271118164062, 0.016007423400878906, 0.01857757568359375, 0.021147727966308594, 0.023717880249023438, 0.02628803253173828, 0.028858184814453125, 0.03142833709716797, 0.03399848937988281, 0.036568641662597656, 0.0391387939453125, 0.041708946228027344, 0.04427909851074219, 0.04684925079345703, 0.049419403076171875, 0.05198955535888672, 0.05455970764160156, 0.057129859924316406, 0.05970001220703125, 0.062270164489746094, 0.06484031677246094, 0.06741046905517578, 0.06998062133789062, 0.07255077362060547, 0.07512092590332031, 0.07769107818603516, 0.08026123046875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 3.0, 3.0, 8.0, 6.0, 17.0, 12.0, 13.0, 12.0, 15.0, 26.0, 20.0, 21.0, 21.0, 30.0, 22.0, 34.0, 37.0, 31.0, 39.0, 31.0, 41.0, 50.0, 1064.0, 33.0, 24.0, 41.0, 38.0, 27.0, 32.0, 31.0, 31.0, 30.0, 22.0, 26.0, 24.0, 22.0, 10.0, 11.0, 13.0, 3.0, 12.0, 12.0, 5.0, 1.0, 1.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1650390625, -1.1281890869140625, -1.091339111328125, -1.0544891357421875, -1.01763916015625, -0.9807891845703125, -0.943939208984375, -0.9070892333984375, -0.8702392578125, -0.8333892822265625, -0.796539306640625, -0.7596893310546875, -0.72283935546875, -0.6859893798828125, -0.649139404296875, -0.6122894287109375, -0.575439453125, -0.5385894775390625, -0.501739501953125, -0.4648895263671875, -0.42803955078125, -0.3911895751953125, -0.354339599609375, -0.3174896240234375, -0.2806396484375, -0.2437896728515625, -0.206939697265625, -0.1700897216796875, -0.13323974609375, -0.0963897705078125, -0.059539794921875, -0.0226898193359375, 0.01416015625, 0.0510101318359375, 0.087860107421875, 0.1247100830078125, 0.16156005859375, 0.1984100341796875, 0.235260009765625, 0.2721099853515625, 0.3089599609375, 0.3458099365234375, 0.382659912109375, 0.4195098876953125, 0.45635986328125, 0.4932098388671875, 0.530059814453125, 0.5669097900390625, 0.603759765625, 0.6406097412109375, 0.677459716796875, 0.7143096923828125, 0.75115966796875, 0.7880096435546875, 0.824859619140625, 0.8617095947265625, 0.8985595703125, 0.9354095458984375, 0.972259521484375, 1.0091094970703125, 1.04595947265625, 1.0828094482421875, 1.119659423828125, 1.1565093994140625, 1.193359375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 10.0, 12.0, 25.0, 31.0, 48.0, 97.0, 107.0, 186.0, 280.0, 389.0, 602.0, 874.0, 1314.0, 1919.0, 2879.0, 4314.0, 6579.0, 9845.0, 15090.0, 23143.0, 37383.0, 61071.0, 107397.0, 206014.0, 1298553.0, 127329.0, 71597.0, 42915.0, 26808.0, 17075.0, 11152.0, 7388.0, 4743.0, 3268.0, 2180.0, 1447.0, 962.0, 678.0, 466.0, 304.0, 215.0, 150.0, 104.0, 55.0, 41.0, 28.0, 20.0, 12.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0], "bins": [-0.03277587890625, -0.03181600570678711, -0.03085613250732422, -0.029896259307861328, -0.028936386108398438, -0.027976512908935547, -0.027016639709472656, -0.026056766510009766, -0.025096893310546875, -0.024137020111083984, -0.023177146911621094, -0.022217273712158203, -0.021257400512695312, -0.020297527313232422, -0.01933765411376953, -0.01837778091430664, -0.01741790771484375, -0.01645803451538086, -0.015498161315917969, -0.014538288116455078, -0.013578414916992188, -0.012618541717529297, -0.011658668518066406, -0.010698795318603516, -0.009738922119140625, -0.008779048919677734, -0.007819175720214844, -0.006859302520751953, -0.0058994293212890625, -0.004939556121826172, -0.003979682922363281, -0.0030198097229003906, -0.0020599365234375, -0.0011000633239746094, -0.00014019012451171875, 0.0008196830749511719, 0.0017795562744140625, 0.002739429473876953, 0.0036993026733398438, 0.004659175872802734, 0.005619049072265625, 0.006578922271728516, 0.007538795471191406, 0.008498668670654297, 0.009458541870117188, 0.010418415069580078, 0.011378288269042969, 0.01233816146850586, 0.01329803466796875, 0.01425790786743164, 0.015217781066894531, 0.016177654266357422, 0.017137527465820312, 0.018097400665283203, 0.019057273864746094, 0.020017147064208984, 0.020977020263671875, 0.021936893463134766, 0.022896766662597656, 0.023856639862060547, 0.024816513061523438, 0.025776386260986328, 0.02673625946044922, 0.02769613265991211, 0.028656005859375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 14.0, 7.0, 11.0, 14.0, 22.0, 24.0, 32.0, 35.0, 35.0, 48.0, 56.0, 66.0, 56.0, 50.0, 70.0, 62.0, 67.0, 67.0, 46.0, 45.0, 27.0, 25.0, 30.0, 18.0, 14.0, 11.0, 14.0, 11.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.704692840576172e-05, -1.637544482946396e-05, -1.57039612531662e-05, -1.5032477676868439e-05, -1.4360994100570679e-05, -1.3689510524272919e-05, -1.3018026947975159e-05, -1.2346543371677399e-05, -1.1675059795379639e-05, -1.1003576219081879e-05, -1.0332092642784119e-05, -9.660609066486359e-06, -8.989125490188599e-06, -8.317641913890839e-06, -7.646158337593079e-06, -6.974674761295319e-06, -6.303191184997559e-06, -5.631707608699799e-06, -4.9602240324020386e-06, -4.2887404561042786e-06, -3.6172568798065186e-06, -2.9457733035087585e-06, -2.2742897272109985e-06, -1.6028061509132385e-06, -9.313225746154785e-07, -2.598389983177185e-07, 4.116445779800415e-07, 1.0831281542778015e-06, 1.7546117305755615e-06, 2.4260953068733215e-06, 3.0975788831710815e-06, 3.7690624594688416e-06, 4.4405460357666016e-06, 5.1120296120643616e-06, 5.783513188362122e-06, 6.454996764659882e-06, 7.126480340957642e-06, 7.797963917255402e-06, 8.469447493553162e-06, 9.140931069850922e-06, 9.812414646148682e-06, 1.0483898222446442e-05, 1.1155381798744202e-05, 1.1826865375041962e-05, 1.2498348951339722e-05, 1.3169832527637482e-05, 1.3841316103935242e-05, 1.4512799680233002e-05, 1.5184283256530762e-05, 1.5855766832828522e-05, 1.6527250409126282e-05, 1.7198733985424042e-05, 1.7870217561721802e-05, 1.8541701138019562e-05, 1.9213184714317322e-05, 1.9884668290615082e-05, 2.0556151866912842e-05, 2.1227635443210602e-05, 2.1899119019508362e-05, 2.2570602595806122e-05, 2.3242086172103882e-05, 2.3913569748401642e-05, 2.4585053324699402e-05, 2.5256536900997162e-05, 2.5928020477294922e-05]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 8.0, 11.0, 13.0, 15.0, 16.0, 22.0, 36.0, 45.0, 55.0, 103.0, 153.0, 234.0, 413.0, 1218.0, 968257.0, 76272.0, 742.0, 286.0, 196.0, 129.0, 88.0, 69.0, 41.0, 39.0, 23.0, 18.0, 14.0, 10.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0005278587341308594, -0.0005142726004123688, -0.0005006864666938782, -0.0004871003329753876, -0.00047351419925689697, -0.00045992806553840637, -0.00044634193181991577, -0.00043275579810142517, -0.00041916966438293457, -0.00040558353066444397, -0.00039199739694595337, -0.00037841126322746277, -0.00036482512950897217, -0.00035123899579048157, -0.00033765286207199097, -0.00032406672835350037, -0.00031048059463500977, -0.00029689446091651917, -0.00028330832719802856, -0.00026972219347953796, -0.00025613605976104736, -0.00024254992604255676, -0.00022896379232406616, -0.00021537765860557556, -0.00020179152488708496, -0.00018820539116859436, -0.00017461925745010376, -0.00016103312373161316, -0.00014744699001312256, -0.00013386085629463196, -0.00012027472257614136, -0.00010668858885765076, -9.310245513916016e-05, -7.951632142066956e-05, -6.593018770217896e-05, -5.2344053983688354e-05, -3.8757920265197754e-05, -2.5171786546707153e-05, -1.1585652828216553e-05, 2.000480890274048e-06, 1.558661460876465e-05, 2.917274832725525e-05, 4.275888204574585e-05, 5.634501576423645e-05, 6.993114948272705e-05, 8.351728320121765e-05, 9.710341691970825e-05, 0.00011068955063819885, 0.00012427568435668945, 0.00013786181807518005, 0.00015144795179367065, 0.00016503408551216125, 0.00017862021923065186, 0.00019220635294914246, 0.00020579248666763306, 0.00021937862038612366, 0.00023296475410461426, 0.00024655088782310486, 0.00026013702154159546, 0.00027372315526008606, 0.00028730928897857666, 0.00030089542269706726, 0.00031448155641555786, 0.00032806769013404846, 0.00034165382385253906]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 19.0, 422.0, 553.0, 22.0, 0.0, 1.0, 1.0], "bins": [-0.00015350784815382212, -0.0001509089197497815, -0.00014830997679382563, -0.000145711048389785, -0.00014311211998574436, -0.0001405131770297885, -0.00013791424862574786, -0.00013531532022170722, -0.00013271637726575136, -0.00013011744886171073, -0.00012751850590575486, -0.00012491957750171423, -0.0001223206490976736, -0.00011972171341767535, -0.0001171227777376771, -0.00011452384933363646, -0.00011192492092959583, -0.00010932598524959758, -0.00010672705684555694, -0.0001041281211655587, -0.00010152919276151806, -9.893025708151981e-05, -9.633132140152156e-05, -9.373239299748093e-05, -9.113345731748268e-05, -8.853452163748443e-05, -8.59355932334438e-05, -8.333665755344555e-05, -8.07377218734473e-05, -7.813879346940666e-05, -7.553985778940842e-05, -7.294092210941017e-05, -7.034199370536953e-05, -6.774305802537128e-05, -6.514412962133065e-05, -6.25451939413324e-05, -5.994626189931296e-05, -5.7347329857293516e-05, -5.474839417729527e-05, -5.2149462135275826e-05, -4.9550530093256384e-05, -4.695159805123694e-05, -4.43526660092175e-05, -4.175373032921925e-05, -3.915479828719981e-05, -3.655586624518037e-05, -3.395693056518212e-05, -3.135799852316268e-05, -2.8759064662153833e-05, -2.6160130801144987e-05, -2.3561198759125546e-05, -2.0962266717106104e-05, -1.836333285609726e-05, -1.5764398995088413e-05, -1.3165466953068972e-05, -1.0566533092060126e-05, -7.967601050040685e-06, -5.368668098526541e-06, -2.7697351470123976e-06, -1.7080219549825415e-07, 2.4281307560158893e-06, 5.027063707530033e-06, 7.625996659044176e-06, 1.0224930520053022e-05, 1.2823862562072463e-05]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 8.0, 11.0, 7.0, 11.0, 17.0, 17.0, 15.0, 22.0, 26.0, 21.0, 30.0, 35.0, 30.0, 39.0, 35.0, 42.0, 41.0, 48.0, 48.0, 53.0, 38.0, 38.0, 36.0, 34.0, 42.0, 30.0, 35.0, 26.0, 21.0, 28.0, 20.0, 10.0, 15.0, 18.0, 8.0, 8.0, 11.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.1444091796875e-05, -1.107342541217804e-05, -1.0702759027481079e-05, -1.0332092642784119e-05, -9.961426258087158e-06, -9.590759873390198e-06, -9.220093488693237e-06, -8.849427103996277e-06, -8.478760719299316e-06, -8.108094334602356e-06, -7.737427949905396e-06, -7.366761565208435e-06, -6.996095180511475e-06, -6.625428795814514e-06, -6.254762411117554e-06, -5.884096026420593e-06, -5.513429641723633e-06, -5.142763257026672e-06, -4.772096872329712e-06, -4.4014304876327515e-06, -4.030764102935791e-06, -3.6600977182388306e-06, -3.28943133354187e-06, -2.9187649488449097e-06, -2.5480985641479492e-06, -2.1774321794509888e-06, -1.8067657947540283e-06, -1.4360994100570679e-06, -1.0654330253601074e-06, -6.94766640663147e-07, -3.241002559661865e-07, 4.6566128730773926e-08, 4.172325134277344e-07, 7.878988981246948e-07, 1.1585652828216553e-06, 1.5292316675186157e-06, 1.8998980522155762e-06, 2.2705644369125366e-06, 2.641230821609497e-06, 3.0118972063064575e-06, 3.382563591003418e-06, 3.7532299757003784e-06, 4.123896360397339e-06, 4.494562745094299e-06, 4.86522912979126e-06, 5.23589551448822e-06, 5.606561899185181e-06, 5.977228283882141e-06, 6.3478946685791016e-06, 6.718561053276062e-06, 7.0892274379730225e-06, 7.459893822669983e-06, 7.830560207366943e-06, 8.201226592063904e-06, 8.571892976760864e-06, 8.942559361457825e-06, 9.313225746154785e-06, 9.683892130851746e-06, 1.0054558515548706e-05, 1.0425224900245667e-05, 1.0795891284942627e-05, 1.1166557669639587e-05, 1.1537224054336548e-05, 1.1907890439033508e-05, 1.2278556823730469e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 2.0, 6.0, 10.0, 15.0, 15.0, 18.0, 11.0, 19.0, 21.0, 31.0, 24.0, 40.0, 39.0, 32.0, 39.0, 33.0, 35.0, 42.0, 34.0, 45.0, 44.0, 40.0, 39.0, 46.0, 44.0, 30.0, 39.0, 32.0, 27.0, 29.0, 19.0, 18.0, 18.0, 10.0, 14.0, 8.0, 8.0, 9.0, 1.0, 8.0, 4.0, 8.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.97076416015625, -1.9102783203125, -1.84979248046875, -1.789306640625, -1.72882080078125, -1.6683349609375, -1.60784912109375, -1.54736328125, -1.48687744140625, -1.4263916015625, -1.36590576171875, -1.305419921875, -1.24493408203125, -1.1844482421875, -1.12396240234375, -1.0634765625, -1.00299072265625, -0.9425048828125, -0.88201904296875, -0.821533203125, -0.76104736328125, -0.7005615234375, -0.64007568359375, -0.57958984375, -0.51910400390625, -0.4586181640625, -0.39813232421875, -0.337646484375, -0.27716064453125, -0.2166748046875, -0.15618896484375, -0.095703125, -0.03521728515625, 0.0252685546875, 0.08575439453125, 0.146240234375, 0.20672607421875, 0.2672119140625, 0.32769775390625, 0.38818359375, 0.44866943359375, 0.5091552734375, 0.56964111328125, 0.630126953125, 0.69061279296875, 0.7510986328125, 0.81158447265625, 0.8720703125, 0.93255615234375, 0.9930419921875, 1.05352783203125, 1.114013671875, 1.17449951171875, 1.2349853515625, 1.29547119140625, 1.35595703125, 1.41644287109375, 1.4769287109375, 1.53741455078125, 1.597900390625, 1.65838623046875, 1.7188720703125, 1.77935791015625, 1.83984375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 14.0, 11.0, 23.0, 61.0, 93.0, 164.0, 303.0, 635.0, 1241.0, 2509.0, 5321.0, 11791.0, 28547.0, 82139.0, 335307.0, 419955.0, 101722.0, 33355.0, 13569.0, 6085.0, 2913.0, 1307.0, 666.0, 360.0, 214.0, 92.0, 60.0, 33.0, 26.0, 9.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.8671875, -1.808990478515625, -1.75079345703125, -1.692596435546875, -1.6343994140625, -1.576202392578125, -1.51800537109375, -1.459808349609375, -1.401611328125, -1.343414306640625, -1.28521728515625, -1.227020263671875, -1.1688232421875, -1.110626220703125, -1.05242919921875, -0.994232177734375, -0.93603515625, -0.877838134765625, -0.81964111328125, -0.761444091796875, -0.7032470703125, -0.645050048828125, -0.58685302734375, -0.528656005859375, -0.470458984375, -0.412261962890625, -0.35406494140625, -0.295867919921875, -0.2376708984375, -0.179473876953125, -0.12127685546875, -0.063079833984375, -0.0048828125, 0.053314208984375, 0.11151123046875, 0.169708251953125, 0.2279052734375, 0.286102294921875, 0.34429931640625, 0.402496337890625, 0.460693359375, 0.518890380859375, 0.57708740234375, 0.635284423828125, 0.6934814453125, 0.751678466796875, 0.80987548828125, 0.868072509765625, 0.92626953125, 0.984466552734375, 1.04266357421875, 1.100860595703125, 1.1590576171875, 1.217254638671875, 1.27545166015625, 1.333648681640625, 1.391845703125, 1.450042724609375, 1.50823974609375, 1.566436767578125, 1.6246337890625, 1.682830810546875, 1.74102783203125, 1.799224853515625, 1.857421875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 7.0, 7.0, 6.0, 6.0, 6.0, 13.0, 13.0, 11.0, 14.0, 18.0, 20.0, 23.0, 40.0, 30.0, 42.0, 53.0, 32.0, 51.0, 73.0, 155.0, 1577.0, 329.0, 121.0, 56.0, 36.0, 38.0, 36.0, 32.0, 26.0, 25.0, 22.0, 28.0, 16.0, 6.0, 16.0, 12.0, 7.0, 11.0, 7.0, 5.0, 6.0, 6.0, 7.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.765625, -5.57220458984375, -5.3787841796875, -5.18536376953125, -4.991943359375, -4.79852294921875, -4.6051025390625, -4.41168212890625, -4.21826171875, -4.02484130859375, -3.8314208984375, -3.63800048828125, -3.444580078125, -3.25115966796875, -3.0577392578125, -2.86431884765625, -2.6708984375, -2.47747802734375, -2.2840576171875, -2.09063720703125, -1.897216796875, -1.70379638671875, -1.5103759765625, -1.31695556640625, -1.12353515625, -0.93011474609375, -0.7366943359375, -0.54327392578125, -0.349853515625, -0.15643310546875, 0.0369873046875, 0.23040771484375, 0.423828125, 0.61724853515625, 0.8106689453125, 1.00408935546875, 1.197509765625, 1.39093017578125, 1.5843505859375, 1.77777099609375, 1.97119140625, 2.16461181640625, 2.3580322265625, 2.55145263671875, 2.744873046875, 2.93829345703125, 3.1317138671875, 3.32513427734375, 3.5185546875, 3.71197509765625, 3.9053955078125, 4.09881591796875, 4.292236328125, 4.48565673828125, 4.6790771484375, 4.87249755859375, 5.06591796875, 5.25933837890625, 5.4527587890625, 5.64617919921875, 5.839599609375, 6.03302001953125, 6.2264404296875, 6.41986083984375, 6.61328125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 9.0, 4.0, 3.0, 7.0, 7.0, 10.0, 8.0, 9.0, 13.0, 14.0, 18.0, 29.0, 25.0, 50.0, 51.0, 71.0, 117.0, 171.0, 337.0, 748.0, 3450.0, 48565.0, 2935064.0, 148601.0, 6051.0, 1153.0, 401.0, 190.0, 147.0, 100.0, 64.0, 49.0, 35.0, 27.0, 20.0, 19.0, 13.0, 12.0, 10.0, 5.0, 7.0, 6.0, 6.0, 7.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.21875, -8.9447021484375, -8.670654296875, -8.3966064453125, -8.12255859375, -7.8485107421875, -7.574462890625, -7.3004150390625, -7.0263671875, -6.7523193359375, -6.478271484375, -6.2042236328125, -5.93017578125, -5.6561279296875, -5.382080078125, -5.1080322265625, -4.833984375, -4.5599365234375, -4.285888671875, -4.0118408203125, -3.73779296875, -3.4637451171875, -3.189697265625, -2.9156494140625, -2.6416015625, -2.3675537109375, -2.093505859375, -1.8194580078125, -1.54541015625, -1.2713623046875, -0.997314453125, -0.7232666015625, -0.44921875, -0.1751708984375, 0.098876953125, 0.3729248046875, 0.64697265625, 0.9210205078125, 1.195068359375, 1.4691162109375, 1.7431640625, 2.0172119140625, 2.291259765625, 2.5653076171875, 2.83935546875, 3.1134033203125, 3.387451171875, 3.6614990234375, 3.935546875, 4.2095947265625, 4.483642578125, 4.7576904296875, 5.03173828125, 5.3057861328125, 5.579833984375, 5.8538818359375, 6.1279296875, 6.4019775390625, 6.676025390625, 6.9500732421875, 7.22412109375, 7.4981689453125, 7.772216796875, 8.0462646484375, 8.3203125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.0, 766.0, 211.0, 4.0, 0.0, 2.0], "bins": [-128.45249938964844, -126.30015563964844, -124.1478042602539, -121.9954605102539, -119.84310913085938, -117.69076538085938, -115.53842163085938, -113.38607025146484, -111.23372650146484, -109.08138275146484, -106.92903137207031, -104.77668762207031, -102.62434387207031, -100.47199249267578, -98.31964874267578, -96.16729736328125, -94.01495361328125, -91.86260986328125, -89.71025848388672, -87.55791473388672, -85.40556335449219, -83.25321960449219, -81.10087585449219, -78.94852447509766, -76.79618072509766, -74.64383697509766, -72.49148559570312, -70.33914184570312, -68.18679809570312, -66.0344467163086, -63.882102966308594, -61.72975540161133, -59.57741165161133, -57.42506408691406, -55.27272033691406, -53.1203727722168, -50.96802520751953, -48.815677642822266, -46.663330078125, -44.510986328125, -42.358638763427734, -40.20629119873047, -38.05394744873047, -35.9015998840332, -33.74925231933594, -31.596904754638672, -29.44455909729004, -27.292213439941406, -25.13986587524414, -22.987518310546875, -20.835172653198242, -18.68282699584961, -16.530479431152344, -14.378132820129395, -12.225786209106445, -10.073439598083496, -7.9210920333862305, -5.768745422363281, -3.616398811340332, -1.4640522003173828, 0.6882944107055664, 2.8406410217285156, 4.992987632751465, 7.145334243774414, 9.297680854797363]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 4.0, 3.0, 6.0, 7.0, 7.0, 5.0, 7.0, 7.0, 17.0, 14.0, 16.0, 26.0, 31.0, 15.0, 26.0, 35.0, 25.0, 34.0, 18.0, 33.0, 42.0, 39.0, 36.0, 35.0, 27.0, 35.0, 35.0, 33.0, 44.0, 36.0, 38.0, 23.0, 30.0, 33.0, 18.0, 18.0, 25.0, 14.0, 17.0, 22.0, 12.0, 13.0, 6.0, 10.0, 11.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-17.849258422851562, -17.30141258239746, -16.75356674194336, -16.205720901489258, -15.657876014709473, -15.110030174255371, -14.562185287475586, -14.014339447021484, -13.466493606567383, -12.918647766113281, -12.37080192565918, -11.822957038879395, -11.275111198425293, -10.727265357971191, -10.179420471191406, -9.631574630737305, -9.083728790283203, -8.535882949829102, -7.988037586212158, -7.440192222595215, -6.892346382141113, -6.344500541687012, -5.796655178070068, -5.248809814453125, -4.700963973999023, -4.153118133544922, -3.6052727699279785, -3.057427167892456, -2.5095815658569336, -1.9617359638214111, -1.4138903617858887, -0.8660447597503662, -0.31819915771484375, 0.2296464443206787, 0.7774920463562012, 1.3253376483917236, 1.873183250427246, 2.4210288524627686, 2.968874454498291, 3.5167200565338135, 4.064565658569336, 4.6124114990234375, 5.160256862640381, 5.708102226257324, 6.255948066711426, 6.803793907165527, 7.351639270782471, 7.899484634399414, 8.447330474853516, 8.995176315307617, 9.543022155761719, 10.090867042541504, 10.638712882995605, 11.186558723449707, 11.734403610229492, 12.282249450683594, 12.830095291137695, 13.377941131591797, 13.925786972045898, 14.473631858825684, 15.021477699279785, 15.569323539733887, 16.117168426513672, 16.665014266967773, 17.212860107421875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 6.0, 6.0, 11.0, 11.0, 17.0, 11.0, 21.0, 24.0, 14.0, 33.0, 32.0, 35.0, 42.0, 38.0, 34.0, 30.0, 39.0, 47.0, 40.0, 40.0, 45.0, 39.0, 44.0, 48.0, 39.0, 38.0, 30.0, 24.0, 35.0, 21.0, 18.0, 21.0, 17.0, 7.0, 11.0, 6.0, 5.0, 8.0, 5.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.05499267578125, -1.9927978515625, -1.93060302734375, -1.868408203125, -1.80621337890625, -1.7440185546875, -1.68182373046875, -1.61962890625, -1.55743408203125, -1.4952392578125, -1.43304443359375, -1.370849609375, -1.30865478515625, -1.2464599609375, -1.18426513671875, -1.1220703125, -1.05987548828125, -0.9976806640625, -0.93548583984375, -0.873291015625, -0.81109619140625, -0.7489013671875, -0.68670654296875, -0.62451171875, -0.56231689453125, -0.5001220703125, -0.43792724609375, -0.375732421875, -0.31353759765625, -0.2513427734375, -0.18914794921875, -0.126953125, -0.06475830078125, -0.0025634765625, 0.05963134765625, 0.121826171875, 0.18402099609375, 0.2462158203125, 0.30841064453125, 0.37060546875, 0.43280029296875, 0.4949951171875, 0.55718994140625, 0.619384765625, 0.68157958984375, 0.7437744140625, 0.80596923828125, 0.8681640625, 0.93035888671875, 0.9925537109375, 1.05474853515625, 1.116943359375, 1.17913818359375, 1.2413330078125, 1.30352783203125, 1.36572265625, 1.42791748046875, 1.4901123046875, 1.55230712890625, 1.614501953125, 1.67669677734375, 1.7388916015625, 1.80108642578125, 1.86328125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 10.0, 5.0, 8.0, 14.0, 21.0, 21.0, 41.0, 51.0, 76.0, 139.0, 232.0, 503.0, 893.0, 2001.0, 4399.0, 10939.0, 29577.0, 91622.0, 361316.0, 2058514.0, 1305285.0, 228853.0, 63461.0, 21578.0, 8104.0, 3438.0, 1533.0, 729.0, 384.0, 209.0, 122.0, 73.0, 45.0, 28.0, 17.0, 14.0, 10.0, 7.0, 7.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.12677001953125, -4.9605712890625, -4.79437255859375, -4.628173828125, -4.46197509765625, -4.2957763671875, -4.12957763671875, -3.96337890625, -3.79718017578125, -3.6309814453125, -3.46478271484375, -3.298583984375, -3.13238525390625, -2.9661865234375, -2.79998779296875, -2.6337890625, -2.46759033203125, -2.3013916015625, -2.13519287109375, -1.968994140625, -1.80279541015625, -1.6365966796875, -1.47039794921875, -1.30419921875, -1.13800048828125, -0.9718017578125, -0.80560302734375, -0.639404296875, -0.47320556640625, -0.3070068359375, -0.14080810546875, 0.025390625, 0.19158935546875, 0.3577880859375, 0.52398681640625, 0.690185546875, 0.85638427734375, 1.0225830078125, 1.18878173828125, 1.35498046875, 1.52117919921875, 1.6873779296875, 1.85357666015625, 2.019775390625, 2.18597412109375, 2.3521728515625, 2.51837158203125, 2.6845703125, 2.85076904296875, 3.0169677734375, 3.18316650390625, 3.349365234375, 3.51556396484375, 3.6817626953125, 3.84796142578125, 4.01416015625, 4.18035888671875, 4.3465576171875, 4.51275634765625, 4.678955078125, 4.84515380859375, 5.0113525390625, 5.17755126953125, 5.34375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 9.0, 5.0, 20.0, 26.0, 44.0, 63.0, 116.0, 198.0, 314.0, 533.0, 739.0, 743.0, 469.0, 326.0, 209.0, 95.0, 79.0, 38.0, 24.0, 8.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.1640625, -10.8536376953125, -10.543212890625, -10.2327880859375, -9.92236328125, -9.6119384765625, -9.301513671875, -8.9910888671875, -8.6806640625, -8.3702392578125, -8.059814453125, -7.7493896484375, -7.43896484375, -7.1285400390625, -6.818115234375, -6.5076904296875, -6.197265625, -5.8868408203125, -5.576416015625, -5.2659912109375, -4.95556640625, -4.6451416015625, -4.334716796875, -4.0242919921875, -3.7138671875, -3.4034423828125, -3.093017578125, -2.7825927734375, -2.47216796875, -2.1617431640625, -1.851318359375, -1.5408935546875, -1.23046875, -0.9200439453125, -0.609619140625, -0.2991943359375, 0.01123046875, 0.3216552734375, 0.632080078125, 0.9425048828125, 1.2529296875, 1.5633544921875, 1.873779296875, 2.1842041015625, 2.49462890625, 2.8050537109375, 3.115478515625, 3.4259033203125, 3.736328125, 4.0467529296875, 4.357177734375, 4.6676025390625, 4.97802734375, 5.2884521484375, 5.598876953125, 5.9093017578125, 6.2197265625, 6.5301513671875, 6.840576171875, 7.1510009765625, 7.46142578125, 7.7718505859375, 8.082275390625, 8.3927001953125, 8.703125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 10.0, 7.0, 10.0, 16.0, 30.0, 37.0, 42.0, 59.0, 76.0, 169.0, 256.0, 514.0, 1328.0, 4526.0, 28537.0, 395629.0, 3358909.0, 369741.0, 27391.0, 4392.0, 1349.0, 544.0, 267.0, 145.0, 83.0, 71.0, 31.0, 27.0, 29.0, 11.0, 12.0, 11.0, 2.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.59375, -21.03271484375, -20.4716796875, -19.91064453125, -19.349609375, -18.78857421875, -18.2275390625, -17.66650390625, -17.10546875, -16.54443359375, -15.9833984375, -15.42236328125, -14.861328125, -14.30029296875, -13.7392578125, -13.17822265625, -12.6171875, -12.05615234375, -11.4951171875, -10.93408203125, -10.373046875, -9.81201171875, -9.2509765625, -8.68994140625, -8.12890625, -7.56787109375, -7.0068359375, -6.44580078125, -5.884765625, -5.32373046875, -4.7626953125, -4.20166015625, -3.640625, -3.07958984375, -2.5185546875, -1.95751953125, -1.396484375, -0.83544921875, -0.2744140625, 0.28662109375, 0.84765625, 1.40869140625, 1.9697265625, 2.53076171875, 3.091796875, 3.65283203125, 4.2138671875, 4.77490234375, 5.3359375, 5.89697265625, 6.4580078125, 7.01904296875, 7.580078125, 8.14111328125, 8.7021484375, 9.26318359375, 9.82421875, 10.38525390625, 10.9462890625, 11.50732421875, 12.068359375, 12.62939453125, 13.1904296875, 13.75146484375, 14.3125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 9.0, 9.0, 8.0, 19.0, 25.0, 34.0, 51.0, 51.0, 74.0, 92.0, 97.0, 89.0, 82.0, 74.0, 70.0, 69.0, 48.0, 27.0, 22.0, 25.0, 9.0, 4.0, 7.0, 1.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.53931427001953, -33.57227325439453, -32.605228424072266, -31.638187408447266, -30.671144485473633, -29.7041015625, -28.737060546875, -27.770017623901367, -26.802974700927734, -25.8359317779541, -24.86888885498047, -23.90184783935547, -22.934804916381836, -21.967761993408203, -21.000720977783203, -20.03367805480957, -19.066635131835938, -18.099592208862305, -17.132549285888672, -16.165508270263672, -15.198465347290039, -14.231422424316406, -13.26438045501709, -12.297338485717773, -11.33029556274414, -10.363252639770508, -9.396210670471191, -8.429168701171875, -7.462125778198242, -6.495083332061768, -5.528040885925293, -4.560998439788818, -3.593954086303711, -2.6269116401672363, -1.6598691940307617, -0.6928267478942871, 0.2742156982421875, 1.241258144378662, 2.2083005905151367, 3.1753430366516113, 4.142385482788086, 5.1094279289245605, 6.076470375061035, 7.04351282119751, 8.010555267333984, 8.977598190307617, 9.944640159606934, 10.91168212890625, 11.878725051879883, 12.845767974853516, 13.812809944152832, 14.779851913452148, 15.746894836425781, 16.713937759399414, 17.680980682373047, 18.648021697998047, 19.61506462097168, 20.582107543945312, 21.549148559570312, 22.516191482543945, 23.483234405517578, 24.45027732849121, 25.417320251464844, 26.384361267089844, 27.351404190063477]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 9.0, 7.0, 8.0, 10.0, 11.0, 13.0, 23.0, 24.0, 24.0, 24.0, 48.0, 26.0, 32.0, 34.0, 41.0, 46.0, 39.0, 44.0, 53.0, 49.0, 44.0, 45.0, 45.0, 36.0, 25.0, 29.0, 35.0, 29.0, 28.0, 28.0, 15.0, 14.0, 12.0, 11.0, 9.0, 9.0, 4.0, 7.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.921066284179688, -25.16924476623535, -24.41742515563965, -23.665603637695312, -22.91378402709961, -22.161962509155273, -21.410140991210938, -20.658321380615234, -19.9064998626709, -19.154678344726562, -18.40285873413086, -17.651037216186523, -16.899215698242188, -16.147396087646484, -15.395574569702148, -14.643754005432129, -13.89193344116211, -13.14011287689209, -12.38829231262207, -11.636470794677734, -10.884650230407715, -10.132829666137695, -9.38100814819336, -8.62918758392334, -7.87736701965332, -7.125546455383301, -6.373725414276123, -5.621904373168945, -4.870083808898926, -4.118263244628906, -3.3664422035217285, -2.614621162414551, -1.8628005981445312, -1.1109797954559326, -0.359158992767334, 0.39266180992126465, 1.1444826126098633, 1.896303415298462, 2.6481242179870605, 3.3999452590942383, 4.151765823364258, 4.903586387634277, 5.655407428741455, 6.407228469848633, 7.159049034118652, 7.910869598388672, 8.662691116333008, 9.414511680603027, 10.166332244873047, 10.918152809143066, 11.669973373413086, 12.421794891357422, 13.173615455627441, 13.925436019897461, 14.677257537841797, 15.429078102111816, 16.180898666381836, 16.932720184326172, 17.684539794921875, 18.43636131286621, 19.188182830810547, 19.94000244140625, 20.691823959350586, 21.443645477294922, 22.195465087890625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 4.0, 5.0, 12.0, 11.0, 10.0, 22.0, 18.0, 26.0, 19.0, 29.0, 30.0, 32.0, 35.0, 46.0, 41.0, 43.0, 39.0, 43.0, 41.0, 55.0, 36.0, 49.0, 26.0, 39.0, 29.0, 39.0, 26.0, 32.0, 29.0, 30.0, 13.0, 16.0, 18.0, 11.0, 12.0, 11.0, 3.0, 1.0, 3.0, 7.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-2.42578125, -2.35986328125, -2.2939453125, -2.22802734375, -2.162109375, -2.09619140625, -2.0302734375, -1.96435546875, -1.8984375, -1.83251953125, -1.7666015625, -1.70068359375, -1.634765625, -1.56884765625, -1.5029296875, -1.43701171875, -1.37109375, -1.30517578125, -1.2392578125, -1.17333984375, -1.107421875, -1.04150390625, -0.9755859375, -0.90966796875, -0.84375, -0.77783203125, -0.7119140625, -0.64599609375, -0.580078125, -0.51416015625, -0.4482421875, -0.38232421875, -0.31640625, -0.25048828125, -0.1845703125, -0.11865234375, -0.052734375, 0.01318359375, 0.0791015625, 0.14501953125, 0.2109375, 0.27685546875, 0.3427734375, 0.40869140625, 0.474609375, 0.54052734375, 0.6064453125, 0.67236328125, 0.73828125, 0.80419921875, 0.8701171875, 0.93603515625, 1.001953125, 1.06787109375, 1.1337890625, 1.19970703125, 1.265625, 1.33154296875, 1.3974609375, 1.46337890625, 1.529296875, 1.59521484375, 1.6611328125, 1.72705078125, 1.79296875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 14.0, 6.0, 17.0, 23.0, 44.0, 54.0, 74.0, 114.0, 157.0, 243.0, 341.0, 507.0, 748.0, 1122.0, 1557.0, 2408.0, 3538.0, 5284.0, 8103.0, 12422.0, 18485.0, 28293.0, 44460.0, 74701.0, 143072.0, 286950.0, 179985.0, 89369.0, 51271.0, 32118.0, 21409.0, 13944.0, 9181.0, 6164.0, 4060.0, 2686.0, 1721.0, 1280.0, 806.0, 574.0, 418.0, 242.0, 180.0, 124.0, 97.0, 61.0, 30.0, 29.0, 24.0, 13.0, 14.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.06658935546875, -0.06448554992675781, -0.062381744384765625, -0.06027793884277344, -0.05817413330078125, -0.05607032775878906, -0.053966522216796875, -0.05186271667480469, -0.0497589111328125, -0.04765510559082031, -0.045551300048828125, -0.04344749450683594, -0.04134368896484375, -0.03923988342285156, -0.037136077880859375, -0.03503227233886719, -0.032928466796875, -0.030824661254882812, -0.028720855712890625, -0.026617050170898438, -0.02451324462890625, -0.022409439086914062, -0.020305633544921875, -0.018201828002929688, -0.0160980224609375, -0.013994216918945312, -0.011890411376953125, -0.009786605834960938, -0.00768280029296875, -0.0055789947509765625, -0.003475189208984375, -0.0013713836669921875, 0.000732421875, 0.0028362274169921875, 0.004940032958984375, 0.0070438385009765625, 0.00914764404296875, 0.011251449584960938, 0.013355255126953125, 0.015459060668945312, 0.0175628662109375, 0.019666671752929688, 0.021770477294921875, 0.023874282836914062, 0.02597808837890625, 0.028081893920898438, 0.030185699462890625, 0.03228950500488281, 0.034393310546875, 0.03649711608886719, 0.038600921630859375, 0.04070472717285156, 0.04280853271484375, 0.04491233825683594, 0.047016143798828125, 0.04911994934082031, 0.0512237548828125, 0.05332756042480469, 0.055431365966796875, 0.05753517150878906, 0.05963897705078125, 0.06174278259277344, 0.06384658813476562, 0.06595039367675781, 0.06805419921875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 7.0, 12.0, 10.0, 14.0, 10.0, 15.0, 22.0, 23.0, 32.0, 34.0, 39.0, 41.0, 38.0, 35.0, 42.0, 45.0, 52.0, 1068.0, 45.0, 46.0, 42.0, 46.0, 37.0, 18.0, 38.0, 28.0, 26.0, 32.0, 17.0, 17.0, 17.0, 11.0, 12.0, 6.0, 10.0, 7.0, 2.0, 5.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.556640625, -1.51202392578125, -1.4674072265625, -1.42279052734375, -1.378173828125, -1.33355712890625, -1.2889404296875, -1.24432373046875, -1.19970703125, -1.15509033203125, -1.1104736328125, -1.06585693359375, -1.021240234375, -0.97662353515625, -0.9320068359375, -0.88739013671875, -0.8427734375, -0.79815673828125, -0.7535400390625, -0.70892333984375, -0.664306640625, -0.61968994140625, -0.5750732421875, -0.53045654296875, -0.48583984375, -0.44122314453125, -0.3966064453125, -0.35198974609375, -0.307373046875, -0.26275634765625, -0.2181396484375, -0.17352294921875, -0.12890625, -0.08428955078125, -0.0396728515625, 0.00494384765625, 0.049560546875, 0.09417724609375, 0.1387939453125, 0.18341064453125, 0.22802734375, 0.27264404296875, 0.3172607421875, 0.36187744140625, 0.406494140625, 0.45111083984375, 0.4957275390625, 0.54034423828125, 0.5849609375, 0.62957763671875, 0.6741943359375, 0.71881103515625, 0.763427734375, 0.80804443359375, 0.8526611328125, 0.89727783203125, 0.94189453125, 0.98651123046875, 1.0311279296875, 1.07574462890625, 1.120361328125, 1.16497802734375, 1.2095947265625, 1.25421142578125, 1.298828125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 15.0, 27.0, 28.0, 50.0, 76.0, 110.0, 181.0, 239.0, 411.0, 538.0, 903.0, 1344.0, 2057.0, 3171.0, 4945.0, 7974.0, 12787.0, 20975.0, 34707.0, 61826.0, 116139.0, 308039.0, 1250540.0, 116812.0, 61946.0, 35408.0, 20969.0, 12773.0, 7864.0, 4990.0, 3214.0, 2086.0, 1383.0, 888.0, 584.0, 378.0, 254.0, 164.0, 113.0, 60.0, 55.0, 36.0, 15.0, 20.0, 11.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.04193115234375, -0.04069805145263672, -0.03946495056152344, -0.038231849670410156, -0.036998748779296875, -0.035765647888183594, -0.03453254699707031, -0.03329944610595703, -0.03206634521484375, -0.03083324432373047, -0.029600143432617188, -0.028367042541503906, -0.027133941650390625, -0.025900840759277344, -0.024667739868164062, -0.02343463897705078, -0.0222015380859375, -0.02096843719482422, -0.019735336303710938, -0.018502235412597656, -0.017269134521484375, -0.016036033630371094, -0.014802932739257812, -0.013569831848144531, -0.01233673095703125, -0.011103630065917969, -0.009870529174804688, -0.008637428283691406, -0.007404327392578125, -0.006171226501464844, -0.0049381256103515625, -0.0037050247192382812, -0.002471923828125, -0.0012388229370117188, -5.7220458984375e-06, 0.0012273788452148438, 0.002460479736328125, 0.0036935806274414062, 0.0049266815185546875, 0.006159782409667969, 0.00739288330078125, 0.008625984191894531, 0.009859085083007812, 0.011092185974121094, 0.012325286865234375, 0.013558387756347656, 0.014791488647460938, 0.01602458953857422, 0.0172576904296875, 0.01849079132080078, 0.019723892211914062, 0.020956993103027344, 0.022190093994140625, 0.023423194885253906, 0.024656295776367188, 0.02588939666748047, 0.02712249755859375, 0.02835559844970703, 0.029588699340820312, 0.030821800231933594, 0.032054901123046875, 0.033288002014160156, 0.03452110290527344, 0.03575420379638672, 0.0369873046875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 7.0, 11.0, 8.0, 13.0, 15.0, 18.0, 17.0, 26.0, 24.0, 32.0, 36.0, 43.0, 34.0, 48.0, 41.0, 63.0, 60.0, 52.0, 47.0, 41.0, 35.0, 41.0, 43.0, 38.0, 32.0, 25.0, 28.0, 15.0, 13.0, 18.0, 10.0, 9.0, 9.0, 4.0, 10.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.6689300537109375e-05, -1.618172973394394e-05, -1.5674158930778503e-05, -1.5166588127613068e-05, -1.4659017324447632e-05, -1.4151446521282196e-05, -1.364387571811676e-05, -1.3136304914951324e-05, -1.2628734111785889e-05, -1.2121163308620453e-05, -1.1613592505455017e-05, -1.1106021702289581e-05, -1.0598450899124146e-05, -1.009088009595871e-05, -9.583309292793274e-06, -9.075738489627838e-06, -8.568167686462402e-06, -8.060596883296967e-06, -7.553026080131531e-06, -7.045455276966095e-06, -6.537884473800659e-06, -6.030313670635223e-06, -5.522742867469788e-06, -5.015172064304352e-06, -4.507601261138916e-06, -4.00003045797348e-06, -3.4924596548080444e-06, -2.9848888516426086e-06, -2.477318048477173e-06, -1.969747245311737e-06, -1.4621764421463013e-06, -9.546056389808655e-07, -4.470348358154297e-07, 6.05359673500061e-08, 5.681067705154419e-07, 1.0756775736808777e-06, 1.5832483768463135e-06, 2.0908191800117493e-06, 2.598389983177185e-06, 3.105960786342621e-06, 3.6135315895080566e-06, 4.1211023926734924e-06, 4.628673195838928e-06, 5.136243999004364e-06, 5.6438148021698e-06, 6.151385605335236e-06, 6.658956408500671e-06, 7.166527211666107e-06, 7.674098014831543e-06, 8.181668817996979e-06, 8.689239621162415e-06, 9.19681042432785e-06, 9.704381227493286e-06, 1.0211952030658722e-05, 1.0719522833824158e-05, 1.1227093636989594e-05, 1.173466444015503e-05, 1.2242235243320465e-05, 1.2749806046485901e-05, 1.3257376849651337e-05, 1.3764947652816772e-05, 1.4272518455982208e-05, 1.4780089259147644e-05, 1.528766006231308e-05, 1.5795230865478516e-05]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 8.0, 8.0, 6.0, 11.0, 5.0, 8.0, 15.0, 15.0, 27.0, 35.0, 27.0, 35.0, 54.0, 64.0, 95.0, 109.0, 184.0, 280.0, 636.0, 5528.0, 1012764.0, 26702.0, 795.0, 407.0, 187.0, 120.0, 93.0, 73.0, 50.0, 36.0, 38.0, 24.0, 26.0, 14.0, 13.0, 16.0, 6.0, 8.0, 8.0, 7.0, 6.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0003123283386230469, -0.0003021322190761566, -0.00029193609952926636, -0.0002817399799823761, -0.00027154386043548584, -0.0002613477408885956, -0.0002511516213417053, -0.00024095550179481506, -0.0002307593822479248, -0.00022056326270103455, -0.0002103671431541443, -0.00020017102360725403, -0.00018997490406036377, -0.0001797787845134735, -0.00016958266496658325, -0.000159386545419693, -0.00014919042587280273, -0.00013899430632591248, -0.00012879818677902222, -0.00011860206723213196, -0.0001084059476852417, -9.820982813835144e-05, -8.801370859146118e-05, -7.781758904457092e-05, -6.762146949768066e-05, -5.7425349950790405e-05, -4.7229230403900146e-05, -3.703311085700989e-05, -2.683699131011963e-05, -1.664087176322937e-05, -6.444752216339111e-06, 3.7513673305511475e-06, 1.3947486877441406e-05, 2.4143606424331665e-05, 3.4339725971221924e-05, 4.453584551811218e-05, 5.473196506500244e-05, 6.49280846118927e-05, 7.512420415878296e-05, 8.532032370567322e-05, 9.551644325256348e-05, 0.00010571256279945374, 0.000115908682346344, 0.00012610480189323425, 0.0001363009214401245, 0.00014649704098701477, 0.00015669316053390503, 0.0001668892800807953, 0.00017708539962768555, 0.0001872815191745758, 0.00019747763872146606, 0.00020767375826835632, 0.00021786987781524658, 0.00022806599736213684, 0.0002382621169090271, 0.00024845823645591736, 0.0002586543560028076, 0.0002688504755496979, 0.00027904659509658813, 0.0002892427146434784, 0.00029943883419036865, 0.0003096349537372589, 0.00031983107328414917, 0.00033002719283103943, 0.0003402233123779297]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 11.0, 36.0, 316.0, 511.0, 114.0, 22.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.436301919165999e-05, -6.290770397754386e-05, -6.145239603938535e-05, -5.999708082526922e-05, -5.85417692491319e-05, -5.7086457672994584e-05, -5.563114245887846e-05, -5.417583088274114e-05, -5.272051930660382e-05, -5.12652077304665e-05, -4.980989615432918e-05, -4.8354580940213054e-05, -4.6899269364075735e-05, -4.5443957787938416e-05, -4.398864257382229e-05, -4.253333099768497e-05, -4.107801942154765e-05, -3.962270784541033e-05, -3.816739626927301e-05, -3.6712081055156887e-05, -3.525676947901957e-05, -3.380145790288225e-05, -3.234614268876612e-05, -3.08908311126288e-05, -2.9435519536491483e-05, -2.7980207960354164e-05, -2.652489456522744e-05, -2.506958117010072e-05, -2.36142695939634e-05, -2.215895801782608e-05, -2.0703644622699358e-05, -1.9248331227572635e-05, -1.779302147042472e-05, -1.6337708075297996e-05, -1.4882396499160677e-05, -1.3427084013528656e-05, -1.1971771527896635e-05, -1.0516459042264614e-05, -9.061146556632593e-06, -7.605834071000572e-06, -6.150521585368551e-06, -4.69520909973653e-06, -3.2398966141045094e-06, -1.7845841284724884e-06, -3.292716428404674e-07, 1.1260408427915536e-06, 2.5813533284235746e-06, 4.0366658140555955e-06, 5.4919782996876165e-06, 6.9472907853196375e-06, 8.402603270951658e-06, 9.85791575658368e-06, 1.13132282422157e-05, 1.2768540727847721e-05, 1.4223853213479742e-05, 1.567916478961706e-05, 1.7134478184743784e-05, 1.8589791579870507e-05, 2.0045103156007826e-05, 2.1500414732145146e-05, 2.2955728127271868e-05, 2.441104152239859e-05, 2.586635309853591e-05, 2.732166467467323e-05, 2.8776978069799952e-05]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 3.0, 3.0, 9.0, 10.0, 7.0, 16.0, 7.0, 7.0, 18.0, 14.0, 17.0, 23.0, 25.0, 25.0, 31.0, 37.0, 31.0, 39.0, 27.0, 33.0, 45.0, 38.0, 45.0, 40.0, 44.0, 37.0, 29.0, 27.0, 30.0, 41.0, 33.0, 27.0, 18.0, 19.0, 18.0, 11.0, 24.0, 16.0, 10.0, 5.0, 15.0, 8.0, 9.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0], "bins": [-1.049041748046875e-05, -1.0186806321144104e-05, -9.883195161819458e-06, -9.579584002494812e-06, -9.275972843170166e-06, -8.97236168384552e-06, -8.668750524520874e-06, -8.365139365196228e-06, -8.061528205871582e-06, -7.757917046546936e-06, -7.45430588722229e-06, -7.150694727897644e-06, -6.847083568572998e-06, -6.543472409248352e-06, -6.239861249923706e-06, -5.93625009059906e-06, -5.632638931274414e-06, -5.329027771949768e-06, -5.025416612625122e-06, -4.721805453300476e-06, -4.41819429397583e-06, -4.114583134651184e-06, -3.810971975326538e-06, -3.507360816001892e-06, -3.203749656677246e-06, -2.9001384973526e-06, -2.596527338027954e-06, -2.292916178703308e-06, -1.989305019378662e-06, -1.6856938600540161e-06, -1.3820827007293701e-06, -1.0784715414047241e-06, -7.748603820800781e-07, -4.7124922275543213e-07, -1.6763806343078613e-07, 1.3597309589385986e-07, 4.3958425521850586e-07, 7.431954145431519e-07, 1.0468065738677979e-06, 1.3504177331924438e-06, 1.6540288925170898e-06, 1.957640051841736e-06, 2.261251211166382e-06, 2.564862370491028e-06, 2.868473529815674e-06, 3.17208468914032e-06, 3.475695848464966e-06, 3.779307007789612e-06, 4.082918167114258e-06, 4.386529326438904e-06, 4.69014048576355e-06, 4.993751645088196e-06, 5.297362804412842e-06, 5.600973963737488e-06, 5.904585123062134e-06, 6.20819628238678e-06, 6.511807441711426e-06, 6.815418601036072e-06, 7.119029760360718e-06, 7.422640919685364e-06, 7.72625207901001e-06, 8.029863238334656e-06, 8.333474397659302e-06, 8.637085556983948e-06, 8.940696716308594e-06]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 4.0, 5.0, 12.0, 11.0, 10.0, 22.0, 18.0, 26.0, 19.0, 29.0, 30.0, 32.0, 35.0, 46.0, 41.0, 43.0, 39.0, 43.0, 41.0, 55.0, 36.0, 49.0, 26.0, 39.0, 29.0, 39.0, 26.0, 32.0, 29.0, 30.0, 13.0, 16.0, 18.0, 11.0, 12.0, 11.0, 3.0, 1.0, 3.0, 7.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-2.42578125, -2.35986328125, -2.2939453125, -2.22802734375, -2.162109375, -2.09619140625, -2.0302734375, -1.96435546875, -1.8984375, -1.83251953125, -1.7666015625, -1.70068359375, -1.634765625, -1.56884765625, -1.5029296875, -1.43701171875, -1.37109375, -1.30517578125, -1.2392578125, -1.17333984375, -1.107421875, -1.04150390625, -0.9755859375, -0.90966796875, -0.84375, -0.77783203125, -0.7119140625, -0.64599609375, -0.580078125, -0.51416015625, -0.4482421875, -0.38232421875, -0.31640625, -0.25048828125, -0.1845703125, -0.11865234375, -0.052734375, 0.01318359375, 0.0791015625, 0.14501953125, 0.2109375, 0.27685546875, 0.3427734375, 0.40869140625, 0.474609375, 0.54052734375, 0.6064453125, 0.67236328125, 0.73828125, 0.80419921875, 0.8701171875, 0.93603515625, 1.001953125, 1.06787109375, 1.1337890625, 1.19970703125, 1.265625, 1.33154296875, 1.3974609375, 1.46337890625, 1.529296875, 1.59521484375, 1.6611328125, 1.72705078125, 1.79296875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 7.0, 11.0, 15.0, 25.0, 34.0, 46.0, 79.0, 96.0, 151.0, 211.0, 348.0, 633.0, 973.0, 1455.0, 2398.0, 4141.0, 6984.0, 12905.0, 25919.0, 62218.0, 191701.0, 437917.0, 184713.0, 60121.0, 25459.0, 12657.0, 6856.0, 4042.0, 2382.0, 1417.0, 916.0, 601.0, 379.0, 237.0, 155.0, 96.0, 56.0, 73.0, 37.0, 22.0, 15.0, 15.0, 3.0, 6.0, 10.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-2.421875, -2.34954833984375, -2.2772216796875, -2.20489501953125, -2.132568359375, -2.06024169921875, -1.9879150390625, -1.91558837890625, -1.84326171875, -1.77093505859375, -1.6986083984375, -1.62628173828125, -1.553955078125, -1.48162841796875, -1.4093017578125, -1.33697509765625, -1.2646484375, -1.19232177734375, -1.1199951171875, -1.04766845703125, -0.975341796875, -0.90301513671875, -0.8306884765625, -0.75836181640625, -0.68603515625, -0.61370849609375, -0.5413818359375, -0.46905517578125, -0.396728515625, -0.32440185546875, -0.2520751953125, -0.17974853515625, -0.107421875, -0.03509521484375, 0.0372314453125, 0.10955810546875, 0.181884765625, 0.25421142578125, 0.3265380859375, 0.39886474609375, 0.47119140625, 0.54351806640625, 0.6158447265625, 0.68817138671875, 0.760498046875, 0.83282470703125, 0.9051513671875, 0.97747802734375, 1.0498046875, 1.12213134765625, 1.1944580078125, 1.26678466796875, 1.339111328125, 1.41143798828125, 1.4837646484375, 1.55609130859375, 1.62841796875, 1.70074462890625, 1.7730712890625, 1.84539794921875, 1.917724609375, 1.99005126953125, 2.0623779296875, 2.13470458984375, 2.20703125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 13.0, 7.0, 8.0, 11.0, 14.0, 13.0, 24.0, 25.0, 30.0, 34.0, 43.0, 47.0, 40.0, 59.0, 79.0, 121.0, 1494.0, 402.0, 124.0, 72.0, 60.0, 47.0, 50.0, 33.0, 34.0, 34.0, 26.0, 20.0, 20.0, 14.0, 12.0, 9.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.81365966796875, -6.5609130859375, -6.30816650390625, -6.055419921875, -5.80267333984375, -5.5499267578125, -5.29718017578125, -5.04443359375, -4.79168701171875, -4.5389404296875, -4.28619384765625, -4.033447265625, -3.78070068359375, -3.5279541015625, -3.27520751953125, -3.0224609375, -2.76971435546875, -2.5169677734375, -2.26422119140625, -2.011474609375, -1.75872802734375, -1.5059814453125, -1.25323486328125, -1.00048828125, -0.74774169921875, -0.4949951171875, -0.24224853515625, 0.010498046875, 0.26324462890625, 0.5159912109375, 0.76873779296875, 1.021484375, 1.27423095703125, 1.5269775390625, 1.77972412109375, 2.032470703125, 2.28521728515625, 2.5379638671875, 2.79071044921875, 3.04345703125, 3.29620361328125, 3.5489501953125, 3.80169677734375, 4.054443359375, 4.30718994140625, 4.5599365234375, 4.81268310546875, 5.0654296875, 5.31817626953125, 5.5709228515625, 5.82366943359375, 6.076416015625, 6.32916259765625, 6.5819091796875, 6.83465576171875, 7.08740234375, 7.34014892578125, 7.5928955078125, 7.84564208984375, 8.098388671875, 8.35113525390625, 8.6038818359375, 8.85662841796875, 9.109375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 4.0, 3.0, 10.0, 9.0, 11.0, 14.0, 26.0, 22.0, 31.0, 45.0, 58.0, 84.0, 151.0, 324.0, 872.0, 2954.0, 18045.0, 701281.0, 2387826.0, 28150.0, 3835.0, 1075.0, 367.0, 166.0, 96.0, 57.0, 40.0, 31.0, 34.0, 20.0, 14.0, 10.0, 10.0, 6.0, 6.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.2265625, -13.8323974609375, -13.438232421875, -13.0440673828125, -12.64990234375, -12.2557373046875, -11.861572265625, -11.4674072265625, -11.0732421875, -10.6790771484375, -10.284912109375, -9.8907470703125, -9.49658203125, -9.1024169921875, -8.708251953125, -8.3140869140625, -7.919921875, -7.5257568359375, -7.131591796875, -6.7374267578125, -6.34326171875, -5.9490966796875, -5.554931640625, -5.1607666015625, -4.7666015625, -4.3724365234375, -3.978271484375, -3.5841064453125, -3.18994140625, -2.7957763671875, -2.401611328125, -2.0074462890625, -1.61328125, -1.2191162109375, -0.824951171875, -0.4307861328125, -0.03662109375, 0.3575439453125, 0.751708984375, 1.1458740234375, 1.5400390625, 1.9342041015625, 2.328369140625, 2.7225341796875, 3.11669921875, 3.5108642578125, 3.905029296875, 4.2991943359375, 4.693359375, 5.0875244140625, 5.481689453125, 5.8758544921875, 6.27001953125, 6.6641845703125, 7.058349609375, 7.4525146484375, 7.8466796875, 8.2408447265625, 8.635009765625, 9.0291748046875, 9.42333984375, 9.8175048828125, 10.211669921875, 10.6058349609375, 11.0]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 23.0, 598.0, 391.0, 8.0], "bins": [-220.234619140625, -216.67408752441406, -213.11355590820312, -209.5530242919922, -205.99249267578125, -202.43194580078125, -198.8714141845703, -195.31088256835938, -191.75035095214844, -188.1898193359375, -184.62928771972656, -181.06875610351562, -177.5082244873047, -173.94769287109375, -170.38714599609375, -166.8266143798828, -163.26608276367188, -159.70555114746094, -156.14501953125, -152.58448791503906, -149.02395629882812, -145.46340942382812, -141.9028778076172, -138.34234619140625, -134.7818145751953, -131.22128295898438, -127.66075134277344, -124.10021209716797, -120.53968048095703, -116.9791488647461, -113.41861724853516, -109.85807800292969, -106.29755401611328, -102.73702239990234, -99.1764907836914, -95.61595153808594, -92.055419921875, -88.49488830566406, -84.93435668945312, -81.37382507324219, -77.81328582763672, -74.25275421142578, -70.69222259521484, -67.13168334960938, -63.57115173339844, -60.0106201171875, -56.45008850097656, -52.88955307006836, -49.32902145385742, -45.768489837646484, -42.20795440673828, -38.647422790527344, -35.08688735961914, -31.526355743408203, -27.965822219848633, -24.405288696289062, -20.844757080078125, -17.284223556518555, -13.723690032958984, -10.16315746307373, -6.60262393951416, -3.0420913696289062, 0.5184421539306641, 4.078975677490234, 7.639510154724121]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 6.0, 6.0, 7.0, 8.0, 13.0, 12.0, 8.0, 20.0, 20.0, 25.0, 28.0, 36.0, 29.0, 36.0, 36.0, 42.0, 26.0, 50.0, 45.0, 44.0, 41.0, 45.0, 47.0, 44.0, 42.0, 36.0, 44.0, 24.0, 25.0, 27.0, 29.0, 16.0, 14.0, 12.0, 11.0, 12.0, 7.0, 5.0, 8.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-28.225393295288086, -27.43456268310547, -26.64373016357422, -25.8528995513916, -25.06206703186035, -24.271236419677734, -23.480403900146484, -22.689573287963867, -21.898740768432617, -21.10791015625, -20.31707763671875, -19.526247024536133, -18.735414505004883, -17.944583892822266, -17.153751373291016, -16.3629207611084, -15.572089195251465, -14.781257629394531, -13.990426063537598, -13.199594497680664, -12.40876293182373, -11.617931365966797, -10.82710075378418, -10.03626823425293, -9.245437622070312, -8.454606056213379, -7.663774490356445, -6.872942924499512, -6.082111358642578, -5.2912797927856445, -4.500448703765869, -3.7096171379089355, -2.9187850952148438, -2.12795352935791, -1.3371220827102661, -0.5462906360626221, 0.24454092979431152, 1.0353724956512451, 1.8262038230895996, 2.617035388946533, 3.407866954803467, 4.1986985206604, 4.989530086517334, 5.780361175537109, 6.571192741394043, 7.362024307250977, 8.15285587310791, 8.943687438964844, 9.734519004821777, 10.525350570678711, 11.316182136535645, 12.107013702392578, 12.897845268249512, 13.688676834106445, 14.479507446289062, 15.270339965820312, 16.06117057800293, 16.852001190185547, 17.642833709716797, 18.433664321899414, 19.224496841430664, 20.01532745361328, 20.80615997314453, 21.59699058532715, 22.3878231048584]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 10.0, 10.0, 9.0, 15.0, 19.0, 13.0, 27.0, 21.0, 28.0, 31.0, 30.0, 44.0, 39.0, 41.0, 51.0, 24.0, 45.0, 51.0, 39.0, 40.0, 43.0, 45.0, 25.0, 40.0, 39.0, 27.0, 31.0, 27.0, 27.0, 22.0, 16.0, 10.0, 16.0, 8.0, 6.0, 7.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.400390625, -2.3333587646484375, -2.266326904296875, -2.1992950439453125, -2.13226318359375, -2.0652313232421875, -1.998199462890625, -1.9311676025390625, -1.8641357421875, -1.7971038818359375, -1.730072021484375, -1.6630401611328125, -1.59600830078125, -1.5289764404296875, -1.461944580078125, -1.3949127197265625, -1.327880859375, -1.2608489990234375, -1.193817138671875, -1.1267852783203125, -1.05975341796875, -0.9927215576171875, -0.925689697265625, -0.8586578369140625, -0.7916259765625, -0.7245941162109375, -0.657562255859375, -0.5905303955078125, -0.52349853515625, -0.4564666748046875, -0.389434814453125, -0.3224029541015625, -0.25537109375, -0.1883392333984375, -0.121307373046875, -0.0542755126953125, 0.01275634765625, 0.0797882080078125, 0.146820068359375, 0.2138519287109375, 0.2808837890625, 0.3479156494140625, 0.414947509765625, 0.4819793701171875, 0.54901123046875, 0.6160430908203125, 0.683074951171875, 0.7501068115234375, 0.817138671875, 0.8841705322265625, 0.951202392578125, 1.0182342529296875, 1.08526611328125, 1.1522979736328125, 1.219329833984375, 1.2863616943359375, 1.3533935546875, 1.4204254150390625, 1.487457275390625, 1.5544891357421875, 1.62152099609375, 1.6885528564453125, 1.755584716796875, 1.8226165771484375, 1.8896484375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 8.0, 5.0, 8.0, 7.0, 10.0, 8.0, 17.0, 24.0, 20.0, 25.0, 50.0, 62.0, 86.0, 155.0, 277.0, 506.0, 977.0, 2201.0, 5092.0, 14246.0, 43134.0, 148737.0, 710831.0, 2378439.0, 680980.0, 143741.0, 41581.0, 13812.0, 5081.0, 2035.0, 946.0, 468.0, 250.0, 157.0, 98.0, 69.0, 36.0, 31.0, 18.0, 16.0, 11.0, 6.0, 14.0, 5.0, 5.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.58984375, -4.41656494140625, -4.2432861328125, -4.07000732421875, -3.896728515625, -3.72344970703125, -3.5501708984375, -3.37689208984375, -3.20361328125, -3.03033447265625, -2.8570556640625, -2.68377685546875, -2.510498046875, -2.33721923828125, -2.1639404296875, -1.99066162109375, -1.8173828125, -1.64410400390625, -1.4708251953125, -1.29754638671875, -1.124267578125, -0.95098876953125, -0.7777099609375, -0.60443115234375, -0.43115234375, -0.25787353515625, -0.0845947265625, 0.08868408203125, 0.261962890625, 0.43524169921875, 0.6085205078125, 0.78179931640625, 0.955078125, 1.12835693359375, 1.3016357421875, 1.47491455078125, 1.648193359375, 1.82147216796875, 1.9947509765625, 2.16802978515625, 2.34130859375, 2.51458740234375, 2.6878662109375, 2.86114501953125, 3.034423828125, 3.20770263671875, 3.3809814453125, 3.55426025390625, 3.7275390625, 3.90081787109375, 4.0740966796875, 4.24737548828125, 4.420654296875, 4.59393310546875, 4.7672119140625, 4.94049072265625, 5.11376953125, 5.28704833984375, 5.4603271484375, 5.63360595703125, 5.806884765625, 5.98016357421875, 6.1534423828125, 6.32672119140625, 6.5]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 8.0, 12.0, 9.0, 16.0, 21.0, 32.0, 53.0, 70.0, 57.0, 107.0, 148.0, 208.0, 287.0, 409.0, 490.0, 503.0, 430.0, 316.0, 256.0, 188.0, 110.0, 93.0, 66.0, 55.0, 44.0, 23.0, 17.0, 13.0, 12.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.03515625, -5.82208251953125, -5.6090087890625, -5.39593505859375, -5.182861328125, -4.96978759765625, -4.7567138671875, -4.54364013671875, -4.33056640625, -4.11749267578125, -3.9044189453125, -3.69134521484375, -3.478271484375, -3.26519775390625, -3.0521240234375, -2.83905029296875, -2.6259765625, -2.41290283203125, -2.1998291015625, -1.98675537109375, -1.773681640625, -1.56060791015625, -1.3475341796875, -1.13446044921875, -0.92138671875, -0.70831298828125, -0.4952392578125, -0.28216552734375, -0.069091796875, 0.14398193359375, 0.3570556640625, 0.57012939453125, 0.783203125, 0.99627685546875, 1.2093505859375, 1.42242431640625, 1.635498046875, 1.84857177734375, 2.0616455078125, 2.27471923828125, 2.48779296875, 2.70086669921875, 2.9139404296875, 3.12701416015625, 3.340087890625, 3.55316162109375, 3.7662353515625, 3.97930908203125, 4.1923828125, 4.40545654296875, 4.6185302734375, 4.83160400390625, 5.044677734375, 5.25775146484375, 5.4708251953125, 5.68389892578125, 5.89697265625, 6.11004638671875, 6.3231201171875, 6.53619384765625, 6.749267578125, 6.96234130859375, 7.1754150390625, 7.38848876953125, 7.6015625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 12.0, 14.0, 14.0, 20.0, 28.0, 46.0, 73.0, 127.0, 204.0, 367.0, 806.0, 1847.0, 4982.0, 18464.0, 94688.0, 716209.0, 2777276.0, 488239.0, 69156.0, 14455.0, 4094.0, 1609.0, 667.0, 366.0, 197.0, 106.0, 67.0, 42.0, 45.0, 24.0, 15.0, 9.0, 12.0, 3.0, 4.0, 0.0, 3.0], "bins": [-16.953125, -16.5626220703125, -16.172119140625, -15.7816162109375, -15.39111328125, -15.0006103515625, -14.610107421875, -14.2196044921875, -13.8291015625, -13.4385986328125, -13.048095703125, -12.6575927734375, -12.26708984375, -11.8765869140625, -11.486083984375, -11.0955810546875, -10.705078125, -10.3145751953125, -9.924072265625, -9.5335693359375, -9.14306640625, -8.7525634765625, -8.362060546875, -7.9715576171875, -7.5810546875, -7.1905517578125, -6.800048828125, -6.4095458984375, -6.01904296875, -5.6285400390625, -5.238037109375, -4.8475341796875, -4.45703125, -4.0665283203125, -3.676025390625, -3.2855224609375, -2.89501953125, -2.5045166015625, -2.114013671875, -1.7235107421875, -1.3330078125, -0.9425048828125, -0.552001953125, -0.1614990234375, 0.22900390625, 0.6195068359375, 1.010009765625, 1.4005126953125, 1.791015625, 2.1815185546875, 2.572021484375, 2.9625244140625, 3.35302734375, 3.7435302734375, 4.134033203125, 4.5245361328125, 4.9150390625, 5.3055419921875, 5.696044921875, 6.0865478515625, 6.47705078125, 6.8675537109375, 7.258056640625, 7.6485595703125, 8.0390625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 4.0, 15.0, 14.0, 28.0, 39.0, 46.0, 60.0, 84.0, 71.0, 96.0, 95.0, 83.0, 83.0, 74.0, 60.0, 26.0, 45.0, 26.0, 18.0, 8.0, 7.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.34174728393555, -41.32365417480469, -40.30556106567383, -39.28746795654297, -38.26937484741211, -37.25128173828125, -36.23318862915039, -35.21509552001953, -34.19700622558594, -33.17891311645508, -32.16082000732422, -31.14272689819336, -30.1246337890625, -29.10654067993164, -28.088449478149414, -27.070356369018555, -26.052261352539062, -25.034168243408203, -24.016075134277344, -22.997982025146484, -21.979888916015625, -20.961795806884766, -19.94370460510254, -18.92561149597168, -17.90751838684082, -16.88942527770996, -15.871332168579102, -14.853240013122559, -13.8351469039917, -12.81705379486084, -11.798961639404297, -10.780868530273438, -9.762775421142578, -8.744682312011719, -7.726589679718018, -6.708497047424316, -5.690403938293457, -4.672310829162598, -3.6542181968688965, -2.6361255645751953, -1.618032455444336, -0.5999395847320557, 0.4181532859802246, 1.4362461566925049, 2.454339027404785, 3.4724321365356445, 4.490524768829346, 5.508617401123047, 6.526710510253906, 7.544803619384766, 8.562896728515625, 9.580988883972168, 10.599081993103027, 11.617175102233887, 12.63526725769043, 13.653360366821289, 14.671453475952148, 15.689546585083008, 16.707639694213867, 17.725732803344727, 18.743824005126953, 19.761917114257812, 20.780010223388672, 21.79810333251953, 22.81619644165039]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 11.0, 12.0, 8.0, 8.0, 9.0, 24.0, 14.0, 17.0, 22.0, 15.0, 35.0, 29.0, 30.0, 28.0, 33.0, 33.0, 36.0, 20.0, 32.0, 35.0, 35.0, 34.0, 40.0, 30.0, 31.0, 34.0, 34.0, 34.0, 28.0, 37.0, 33.0, 27.0, 27.0, 15.0, 20.0, 12.0, 13.0, 9.0, 14.0, 12.0, 7.0, 4.0, 0.0, 4.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.326324462890625, -16.727331161499023, -16.128337860107422, -15.529343605041504, -14.930349349975586, -14.331356048583984, -13.732362747192383, -13.133369445800781, -12.534375190734863, -11.935381889343262, -11.336387634277344, -10.737394332885742, -10.13840103149414, -9.539406776428223, -8.940413475036621, -8.341419219970703, -7.742425918579102, -7.143432140350342, -6.544438362121582, -5.9454450607299805, -5.346451282501221, -4.747457504272461, -4.148464202880859, -3.5494704246520996, -2.95047664642334, -2.35148286819458, -1.7524893283843994, -1.1534956693649292, -0.554502010345459, 0.04449176788330078, 0.6434853076934814, 1.242478847503662, 1.8414726257324219, 2.4404664039611816, 3.0394599437713623, 3.638453483581543, 4.237447261810303, 4.8364410400390625, 5.435434341430664, 6.034428119659424, 6.633421897888184, 7.232415676116943, 7.831409454345703, 8.430402755737305, 9.029396057128906, 9.628390312194824, 10.227383613586426, 10.826377868652344, 11.425371170043945, 12.024364471435547, 12.623358726501465, 13.222352027893066, 13.821346282958984, 14.420339584350586, 15.019332885742188, 15.618326187133789, 16.21731948852539, 16.816312789916992, 17.415306091308594, 18.014301300048828, 18.61329460144043, 19.21228790283203, 19.811281204223633, 20.410274505615234, 21.00926971435547]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 5.0, 2.0, 11.0, 19.0, 17.0, 22.0, 19.0, 25.0, 29.0, 34.0, 27.0, 34.0, 34.0, 38.0, 48.0, 47.0, 42.0, 36.0, 41.0, 38.0, 41.0, 37.0, 32.0, 43.0, 40.0, 35.0, 28.0, 33.0, 34.0, 20.0, 23.0, 12.0, 13.0, 6.0, 6.0, 8.0, 3.0, 4.0, 10.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.24609375, -2.176483154296875, -2.10687255859375, -2.037261962890625, -1.9676513671875, -1.898040771484375, -1.82843017578125, -1.758819580078125, -1.689208984375, -1.619598388671875, -1.54998779296875, -1.480377197265625, -1.4107666015625, -1.341156005859375, -1.27154541015625, -1.201934814453125, -1.13232421875, -1.062713623046875, -0.99310302734375, -0.923492431640625, -0.8538818359375, -0.784271240234375, -0.71466064453125, -0.645050048828125, -0.575439453125, -0.505828857421875, -0.43621826171875, -0.366607666015625, -0.2969970703125, -0.227386474609375, -0.15777587890625, -0.088165283203125, -0.0185546875, 0.051055908203125, 0.12066650390625, 0.190277099609375, 0.2598876953125, 0.329498291015625, 0.39910888671875, 0.468719482421875, 0.538330078125, 0.607940673828125, 0.67755126953125, 0.747161865234375, 0.8167724609375, 0.886383056640625, 0.95599365234375, 1.025604248046875, 1.09521484375, 1.164825439453125, 1.23443603515625, 1.304046630859375, 1.3736572265625, 1.443267822265625, 1.51287841796875, 1.582489013671875, 1.652099609375, 1.721710205078125, 1.79132080078125, 1.860931396484375, 1.9305419921875, 2.000152587890625, 2.06976318359375, 2.139373779296875, 2.208984375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 4.0, 7.0, 17.0, 17.0, 27.0, 41.0, 54.0, 97.0, 156.0, 235.0, 354.0, 621.0, 939.0, 1479.0, 2474.0, 3970.0, 6236.0, 9990.0, 16260.0, 27092.0, 46444.0, 84250.0, 179994.0, 335404.0, 151940.0, 74712.0, 42107.0, 24464.0, 14698.0, 9106.0, 5706.0, 3617.0, 2237.0, 1461.0, 829.0, 549.0, 354.0, 205.0, 136.0, 94.0, 65.0, 46.0, 20.0, 23.0, 9.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09027099609375, -0.08748531341552734, -0.08469963073730469, -0.08191394805908203, -0.07912826538085938, -0.07634258270263672, -0.07355690002441406, -0.0707712173461914, -0.06798553466796875, -0.0651998519897461, -0.06241416931152344, -0.05962848663330078, -0.056842803955078125, -0.05405712127685547, -0.05127143859863281, -0.048485755920410156, -0.0457000732421875, -0.042914390563964844, -0.04012870788574219, -0.03734302520751953, -0.034557342529296875, -0.03177165985107422, -0.028985977172851562, -0.026200294494628906, -0.02341461181640625, -0.020628929138183594, -0.017843246459960938, -0.015057563781738281, -0.012271881103515625, -0.009486198425292969, -0.0067005157470703125, -0.003914833068847656, -0.001129150390625, 0.0016565322875976562, 0.0044422149658203125, 0.007227897644042969, 0.010013580322265625, 0.012799263000488281, 0.015584945678710938, 0.018370628356933594, 0.02115631103515625, 0.023941993713378906, 0.026727676391601562, 0.02951335906982422, 0.032299041748046875, 0.03508472442626953, 0.03787040710449219, 0.040656089782714844, 0.0434417724609375, 0.046227455139160156, 0.04901313781738281, 0.05179882049560547, 0.054584503173828125, 0.05737018585205078, 0.06015586853027344, 0.0629415512084961, 0.06572723388671875, 0.0685129165649414, 0.07129859924316406, 0.07408428192138672, 0.07686996459960938, 0.07965564727783203, 0.08244132995605469, 0.08522701263427734, 0.0880126953125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 9.0, 5.0, 9.0, 8.0, 9.0, 13.0, 20.0, 33.0, 19.0, 35.0, 31.0, 27.0, 36.0, 46.0, 42.0, 58.0, 36.0, 40.0, 1064.0, 41.0, 49.0, 45.0, 36.0, 39.0, 29.0, 28.0, 32.0, 22.0, 29.0, 23.0, 23.0, 23.0, 17.0, 14.0, 5.0, 8.0, 6.0, 2.0, 5.0, 1.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3125, -1.2652130126953125, -1.217926025390625, -1.1706390380859375, -1.12335205078125, -1.0760650634765625, -1.028778076171875, -0.9814910888671875, -0.9342041015625, -0.8869171142578125, -0.839630126953125, -0.7923431396484375, -0.74505615234375, -0.6977691650390625, -0.650482177734375, -0.6031951904296875, -0.555908203125, -0.5086212158203125, -0.461334228515625, -0.4140472412109375, -0.36676025390625, -0.3194732666015625, -0.272186279296875, -0.2248992919921875, -0.1776123046875, -0.1303253173828125, -0.083038330078125, -0.0357513427734375, 0.01153564453125, 0.0588226318359375, 0.106109619140625, 0.1533966064453125, 0.20068359375, 0.2479705810546875, 0.295257568359375, 0.3425445556640625, 0.38983154296875, 0.4371185302734375, 0.484405517578125, 0.5316925048828125, 0.5789794921875, 0.6262664794921875, 0.673553466796875, 0.7208404541015625, 0.76812744140625, 0.8154144287109375, 0.862701416015625, 0.9099884033203125, 0.957275390625, 1.0045623779296875, 1.051849365234375, 1.0991363525390625, 1.14642333984375, 1.1937103271484375, 1.240997314453125, 1.2882843017578125, 1.3355712890625, 1.3828582763671875, 1.430145263671875, 1.4774322509765625, 1.52471923828125, 1.5720062255859375, 1.619293212890625, 1.6665802001953125, 1.7138671875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 4.0, 7.0, 13.0, 21.0, 27.0, 45.0, 57.0, 90.0, 169.0, 242.0, 339.0, 488.0, 787.0, 1173.0, 1805.0, 2594.0, 4094.0, 6230.0, 9495.0, 15030.0, 23318.0, 37211.0, 61250.0, 108226.0, 225563.0, 1300188.0, 120470.0, 66970.0, 40150.0, 25434.0, 16007.0, 10105.0, 6661.0, 4321.0, 2909.0, 1908.0, 1296.0, 783.0, 573.0, 356.0, 242.0, 172.0, 97.0, 72.0, 47.0, 38.0, 17.0, 17.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03619384765625, -0.035065650939941406, -0.03393745422363281, -0.03280925750732422, -0.031681060791015625, -0.03055286407470703, -0.029424667358398438, -0.028296470642089844, -0.02716827392578125, -0.026040077209472656, -0.024911880493164062, -0.02378368377685547, -0.022655487060546875, -0.02152729034423828, -0.020399093627929688, -0.019270896911621094, -0.0181427001953125, -0.017014503479003906, -0.015886306762695312, -0.014758110046386719, -0.013629913330078125, -0.012501716613769531, -0.011373519897460938, -0.010245323181152344, -0.00911712646484375, -0.007988929748535156, -0.0068607330322265625, -0.005732536315917969, -0.004604339599609375, -0.0034761428833007812, -0.0023479461669921875, -0.0012197494506835938, -9.1552734375e-05, 0.0010366439819335938, 0.0021648406982421875, 0.0032930374145507812, 0.004421234130859375, 0.005549430847167969, 0.0066776275634765625, 0.007805824279785156, 0.00893402099609375, 0.010062217712402344, 0.011190414428710938, 0.012318611145019531, 0.013446807861328125, 0.014575004577636719, 0.015703201293945312, 0.016831398010253906, 0.0179595947265625, 0.019087791442871094, 0.020215988159179688, 0.02134418487548828, 0.022472381591796875, 0.02360057830810547, 0.024728775024414062, 0.025856971740722656, 0.02698516845703125, 0.028113365173339844, 0.029241561889648438, 0.03036975860595703, 0.031497955322265625, 0.03262615203857422, 0.03375434875488281, 0.034882545471191406, 0.0360107421875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 9.0, 3.0, 8.0, 9.0, 17.0, 21.0, 23.0, 27.0, 42.0, 45.0, 40.0, 49.0, 87.0, 86.0, 82.0, 60.0, 49.0, 66.0, 58.0, 48.0, 29.0, 19.0, 26.0, 20.0, 26.0, 8.0, 10.0, 5.0, 5.0, 5.0, 6.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.8789043426513672e-05, -2.7943402528762817e-05, -2.7097761631011963e-05, -2.625212073326111e-05, -2.5406479835510254e-05, -2.45608389377594e-05, -2.3715198040008545e-05, -2.286955714225769e-05, -2.2023916244506836e-05, -2.117827534675598e-05, -2.0332634449005127e-05, -1.9486993551254272e-05, -1.8641352653503418e-05, -1.7795711755752563e-05, -1.695007085800171e-05, -1.6104429960250854e-05, -1.52587890625e-05, -1.4413148164749146e-05, -1.3567507266998291e-05, -1.2721866369247437e-05, -1.1876225471496582e-05, -1.1030584573745728e-05, -1.0184943675994873e-05, -9.339302778244019e-06, -8.493661880493164e-06, -7.64802098274231e-06, -6.802380084991455e-06, -5.956739187240601e-06, -5.111098289489746e-06, -4.265457391738892e-06, -3.419816493988037e-06, -2.5741755962371826e-06, -1.7285346984863281e-06, -8.828938007354736e-07, -3.725290298461914e-08, 8.083879947662354e-07, 1.6540288925170898e-06, 2.4996697902679443e-06, 3.345310688018799e-06, 4.190951585769653e-06, 5.036592483520508e-06, 5.882233381271362e-06, 6.727874279022217e-06, 7.573515176773071e-06, 8.419156074523926e-06, 9.26479697227478e-06, 1.0110437870025635e-05, 1.095607876777649e-05, 1.1801719665527344e-05, 1.2647360563278198e-05, 1.3493001461029053e-05, 1.4338642358779907e-05, 1.5184283256530762e-05, 1.6029924154281616e-05, 1.687556505203247e-05, 1.7721205949783325e-05, 1.856684684753418e-05, 1.9412487745285034e-05, 2.025812864303589e-05, 2.1103769540786743e-05, 2.1949410438537598e-05, 2.2795051336288452e-05, 2.3640692234039307e-05, 2.448633313179016e-05, 2.5331974029541016e-05]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 7.0, 8.0, 9.0, 10.0, 10.0, 15.0, 19.0, 32.0, 35.0, 31.0, 51.0, 93.0, 129.0, 214.0, 436.0, 1710.0, 937648.0, 106240.0, 922.0, 303.0, 185.0, 117.0, 69.0, 58.0, 39.0, 35.0, 32.0, 19.0, 23.0, 6.0, 13.0, 6.0, 8.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00047087669372558594, -0.00045510753989219666, -0.0004393383860588074, -0.0004235692322254181, -0.0004078000783920288, -0.0003920309245586395, -0.00037626177072525024, -0.00036049261689186096, -0.0003447234630584717, -0.0003289543092250824, -0.0003131851553916931, -0.00029741600155830383, -0.00028164684772491455, -0.00026587769389152527, -0.000250108540058136, -0.0002343393862247467, -0.00021857023239135742, -0.00020280107855796814, -0.00018703192472457886, -0.00017126277089118958, -0.0001554936170578003, -0.000139724463224411, -0.00012395530939102173, -0.00010818615555763245, -9.241700172424316e-05, -7.664784789085388e-05, -6.08786940574646e-05, -4.510954022407532e-05, -2.9340386390686035e-05, -1.3571232557296753e-05, 2.1979212760925293e-06, 1.796707510948181e-05, 3.3736228942871094e-05, 4.9505382776260376e-05, 6.527453660964966e-05, 8.104369044303894e-05, 9.681284427642822e-05, 0.0001125819981098175, 0.0001283511519432068, 0.00014412030577659607, 0.00015988945960998535, 0.00017565861344337463, 0.00019142776727676392, 0.0002071969211101532, 0.00022296607494354248, 0.00023873522877693176, 0.00025450438261032104, 0.00027027353644371033, 0.0002860426902770996, 0.0003018118441104889, 0.0003175809979438782, 0.00033335015177726746, 0.00034911930561065674, 0.000364888459444046, 0.0003806576132774353, 0.0003964267671108246, 0.00041219592094421387, 0.00042796507477760315, 0.00044373422861099243, 0.0004595033824443817, 0.000475272536277771, 0.0004910416901111603, 0.0005068108439445496, 0.0005225799977779388, 0.0005383491516113281]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 42.0, 212.0, 477.0, 197.0, 61.0, 13.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5357243682956323e-05, -1.3890138689021114e-05, -1.2423033695085905e-05, -1.0955927791655995e-05, -9.488822797720786e-06, -8.021717803785577e-06, -6.554611900355667e-06, -5.087506906420458e-06, -3.6204019124852493e-06, -2.153296691176365e-06, -6.861914698674809e-07, 7.809139788150787e-07, 2.2480189727502875e-06, 3.7151239666854963e-06, 5.182229870115407e-06, 6.649334864050616e-06, 8.116439857985824e-06, 9.583544851921033e-06, 1.1050649845856242e-05, 1.2517755749286152e-05, 1.3984860743221361e-05, 1.545196573715657e-05, 1.691907164058648e-05, 1.838617754401639e-05, 1.9853281628456898e-05, 2.132038753188681e-05, 2.2787491616327316e-05, 2.4254597519757226e-05, 2.5721703423187137e-05, 2.7188807507627644e-05, 2.8655913411057554e-05, 3.012301749549806e-05, 3.1590119760949165e-05, 3.3057225664379075e-05, 3.4524331567808986e-05, 3.599143383326009e-05, 3.745853973669e-05, 3.892564564011991e-05, 4.039275154354982e-05, 4.185985744697973e-05, 4.3326959712430835e-05, 4.4794065615860745e-05, 4.6261171519290656e-05, 4.772827378474176e-05, 4.919537968817167e-05, 5.066248559160158e-05, 5.212959149503149e-05, 5.35966973984614e-05, 5.506380330189131e-05, 5.653090920532122e-05, 5.799801510875113e-05, 5.9465121012181044e-05, 6.093222327763215e-05, 6.239932554308325e-05, 6.386643508449197e-05, 6.533353734994307e-05, 6.680064689135179e-05, 6.826774915680289e-05, 6.973485869821161e-05, 7.120196096366271e-05, 7.266907050507143e-05, 7.413617277052253e-05, 7.560328231193125e-05, 7.707038457738236e-05, 7.853748684283346e-05]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 6.0, 5.0, 4.0, 10.0, 6.0, 10.0, 8.0, 13.0, 16.0, 24.0, 18.0, 16.0, 23.0, 27.0, 41.0, 28.0, 44.0, 50.0, 33.0, 44.0, 38.0, 33.0, 40.0, 49.0, 40.0, 45.0, 34.0, 38.0, 38.0, 29.0, 35.0, 25.0, 17.0, 23.0, 17.0, 14.0, 20.0, 10.0, 10.0, 11.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2755393981933594e-05, -1.2295320630073547e-05, -1.1835247278213501e-05, -1.1375173926353455e-05, -1.0915100574493408e-05, -1.0455027222633362e-05, -9.994953870773315e-06, -9.534880518913269e-06, -9.074807167053223e-06, -8.614733815193176e-06, -8.15466046333313e-06, -7.694587111473083e-06, -7.234513759613037e-06, -6.774440407752991e-06, -6.314367055892944e-06, -5.854293704032898e-06, -5.3942203521728516e-06, -4.934147000312805e-06, -4.474073648452759e-06, -4.014000296592712e-06, -3.553926944732666e-06, -3.0938535928726196e-06, -2.6337802410125732e-06, -2.173706889152527e-06, -1.7136335372924805e-06, -1.253560185432434e-06, -7.934868335723877e-07, -3.334134817123413e-07, 1.2665987014770508e-07, 5.867332220077515e-07, 1.0468065738677979e-06, 1.5068799257278442e-06, 1.9669532775878906e-06, 2.427026629447937e-06, 2.8870999813079834e-06, 3.3471733331680298e-06, 3.807246685028076e-06, 4.2673200368881226e-06, 4.727393388748169e-06, 5.187466740608215e-06, 5.647540092468262e-06, 6.107613444328308e-06, 6.5676867961883545e-06, 7.027760148048401e-06, 7.487833499908447e-06, 7.947906851768494e-06, 8.40798020362854e-06, 8.868053555488586e-06, 9.328126907348633e-06, 9.78820025920868e-06, 1.0248273611068726e-05, 1.0708346962928772e-05, 1.1168420314788818e-05, 1.1628493666648865e-05, 1.2088567018508911e-05, 1.2548640370368958e-05, 1.3008713722229004e-05, 1.346878707408905e-05, 1.3928860425949097e-05, 1.4388933777809143e-05, 1.484900712966919e-05, 1.5309080481529236e-05, 1.5769153833389282e-05, 1.622922718524933e-05, 1.6689300537109375e-05]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 5.0, 2.0, 11.0, 19.0, 17.0, 22.0, 19.0, 25.0, 29.0, 34.0, 27.0, 34.0, 34.0, 38.0, 48.0, 47.0, 42.0, 36.0, 41.0, 38.0, 41.0, 37.0, 32.0, 43.0, 40.0, 35.0, 28.0, 33.0, 34.0, 20.0, 23.0, 12.0, 13.0, 6.0, 6.0, 8.0, 3.0, 4.0, 10.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.24609375, -2.176483154296875, -2.10687255859375, -2.037261962890625, -1.9676513671875, -1.898040771484375, -1.82843017578125, -1.758819580078125, -1.689208984375, -1.619598388671875, -1.54998779296875, -1.480377197265625, -1.4107666015625, -1.341156005859375, -1.27154541015625, -1.201934814453125, -1.13232421875, -1.062713623046875, -0.99310302734375, -0.923492431640625, -0.8538818359375, -0.784271240234375, -0.71466064453125, -0.645050048828125, -0.575439453125, -0.505828857421875, -0.43621826171875, -0.366607666015625, -0.2969970703125, -0.227386474609375, -0.15777587890625, -0.088165283203125, -0.0185546875, 0.051055908203125, 0.12066650390625, 0.190277099609375, 0.2598876953125, 0.329498291015625, 0.39910888671875, 0.468719482421875, 0.538330078125, 0.607940673828125, 0.67755126953125, 0.747161865234375, 0.8167724609375, 0.886383056640625, 0.95599365234375, 1.025604248046875, 1.09521484375, 1.164825439453125, 1.23443603515625, 1.304046630859375, 1.3736572265625, 1.443267822265625, 1.51287841796875, 1.582489013671875, 1.652099609375, 1.721710205078125, 1.79132080078125, 1.860931396484375, 1.9305419921875, 2.000152587890625, 2.06976318359375, 2.139373779296875, 2.208984375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 12.0, 11.0, 10.0, 15.0, 38.0, 68.0, 47.0, 83.0, 138.0, 217.0, 287.0, 446.0, 662.0, 1107.0, 1735.0, 2820.0, 4858.0, 9347.0, 20790.0, 60237.0, 281753.0, 511617.0, 96291.0, 28876.0, 11954.0, 6092.0, 3398.0, 2029.0, 1245.0, 786.0, 505.0, 299.0, 237.0, 166.0, 118.0, 75.0, 56.0, 32.0, 31.0, 21.0, 12.0, 17.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.404296875, -3.291473388671875, -3.17864990234375, -3.065826416015625, -2.9530029296875, -2.840179443359375, -2.72735595703125, -2.614532470703125, -2.501708984375, -2.388885498046875, -2.27606201171875, -2.163238525390625, -2.0504150390625, -1.937591552734375, -1.82476806640625, -1.711944580078125, -1.59912109375, -1.486297607421875, -1.37347412109375, -1.260650634765625, -1.1478271484375, -1.035003662109375, -0.92218017578125, -0.809356689453125, -0.696533203125, -0.583709716796875, -0.47088623046875, -0.358062744140625, -0.2452392578125, -0.132415771484375, -0.01959228515625, 0.093231201171875, 0.2060546875, 0.318878173828125, 0.43170166015625, 0.544525146484375, 0.6573486328125, 0.770172119140625, 0.88299560546875, 0.995819091796875, 1.108642578125, 1.221466064453125, 1.33428955078125, 1.447113037109375, 1.5599365234375, 1.672760009765625, 1.78558349609375, 1.898406982421875, 2.01123046875, 2.124053955078125, 2.23687744140625, 2.349700927734375, 2.4625244140625, 2.575347900390625, 2.68817138671875, 2.800994873046875, 2.913818359375, 3.026641845703125, 3.13946533203125, 3.252288818359375, 3.3651123046875, 3.477935791015625, 3.59075927734375, 3.703582763671875, 3.81640625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 6.0, 5.0, 6.0, 9.0, 10.0, 18.0, 11.0, 9.0, 17.0, 21.0, 19.0, 31.0, 22.0, 46.0, 29.0, 44.0, 44.0, 54.0, 62.0, 133.0, 302.0, 1450.0, 181.0, 85.0, 67.0, 41.0, 37.0, 40.0, 39.0, 18.0, 24.0, 18.0, 29.0, 21.0, 19.0, 8.0, 11.0, 14.0, 15.0, 9.0, 5.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.1328125, -6.92431640625, -6.7158203125, -6.50732421875, -6.298828125, -6.09033203125, -5.8818359375, -5.67333984375, -5.46484375, -5.25634765625, -5.0478515625, -4.83935546875, -4.630859375, -4.42236328125, -4.2138671875, -4.00537109375, -3.796875, -3.58837890625, -3.3798828125, -3.17138671875, -2.962890625, -2.75439453125, -2.5458984375, -2.33740234375, -2.12890625, -1.92041015625, -1.7119140625, -1.50341796875, -1.294921875, -1.08642578125, -0.8779296875, -0.66943359375, -0.4609375, -0.25244140625, -0.0439453125, 0.16455078125, 0.373046875, 0.58154296875, 0.7900390625, 0.99853515625, 1.20703125, 1.41552734375, 1.6240234375, 1.83251953125, 2.041015625, 2.24951171875, 2.4580078125, 2.66650390625, 2.875, 3.08349609375, 3.2919921875, 3.50048828125, 3.708984375, 3.91748046875, 4.1259765625, 4.33447265625, 4.54296875, 4.75146484375, 4.9599609375, 5.16845703125, 5.376953125, 5.58544921875, 5.7939453125, 6.00244140625, 6.2109375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 8.0, 8.0, 13.0, 12.0, 12.0, 20.0, 23.0, 37.0, 33.0, 48.0, 63.0, 87.0, 126.0, 240.0, 466.0, 1472.0, 5267.0, 24012.0, 424810.0, 2615266.0, 59915.0, 9678.0, 2437.0, 733.0, 293.0, 167.0, 101.0, 79.0, 70.0, 41.0, 33.0, 22.0, 26.0, 16.0, 10.0, 13.0, 9.0, 6.0, 4.0, 5.0, 5.0, 5.0, 3.0, 5.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.2578125, -9.9183349609375, -9.578857421875, -9.2393798828125, -8.89990234375, -8.5604248046875, -8.220947265625, -7.8814697265625, -7.5419921875, -7.2025146484375, -6.863037109375, -6.5235595703125, -6.18408203125, -5.8446044921875, -5.505126953125, -5.1656494140625, -4.826171875, -4.4866943359375, -4.147216796875, -3.8077392578125, -3.46826171875, -3.1287841796875, -2.789306640625, -2.4498291015625, -2.1103515625, -1.7708740234375, -1.431396484375, -1.0919189453125, -0.75244140625, -0.4129638671875, -0.073486328125, 0.2659912109375, 0.60546875, 0.9449462890625, 1.284423828125, 1.6239013671875, 1.96337890625, 2.3028564453125, 2.642333984375, 2.9818115234375, 3.3212890625, 3.6607666015625, 4.000244140625, 4.3397216796875, 4.67919921875, 5.0186767578125, 5.358154296875, 5.6976318359375, 6.037109375, 6.3765869140625, 6.716064453125, 7.0555419921875, 7.39501953125, 7.7344970703125, 8.073974609375, 8.4134521484375, 8.7529296875, 9.0924072265625, 9.431884765625, 9.7713623046875, 10.11083984375, 10.4503173828125, 10.789794921875, 11.1292724609375, 11.46875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 15.0, 227.0, 500.0, 250.0, 23.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-120.93769836425781, -118.58816528320312, -116.23863983154297, -113.88910675048828, -111.5395736694336, -109.1900405883789, -106.84051513671875, -104.49098205566406, -102.14144897460938, -99.79191589355469, -97.44239044189453, -95.09285736083984, -92.74332427978516, -90.39379119873047, -88.04426574707031, -85.69473266601562, -83.34519958496094, -80.99566650390625, -78.6461410522461, -76.2966079711914, -73.94707489013672, -71.59754180908203, -69.24801635742188, -66.89848327636719, -64.54895782470703, -62.19942855834961, -59.84989547729492, -57.5003662109375, -55.15083312988281, -52.80130386352539, -50.45177459716797, -48.10224151611328, -45.75271224975586, -43.40318298339844, -41.05364990234375, -38.70412063598633, -36.35458755493164, -34.00505828857422, -31.655527114868164, -29.30599594116211, -26.956464767456055, -24.60693359375, -22.257402420043945, -19.90787124633789, -17.55834197998047, -15.208809852600098, -12.85927963256836, -10.509748458862305, -8.16021728515625, -5.810686111450195, -3.461155414581299, -1.1116247177124023, 1.2379064559936523, 3.587437629699707, 5.936967849731445, 8.2864990234375, 10.636030197143555, 12.98556137084961, 15.335092544555664, 17.68462371826172, 20.03415298461914, 22.383686065673828, 24.73321533203125, 27.082746505737305, 29.43227767944336]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 6.0, 3.0, 6.0, 7.0, 10.0, 9.0, 11.0, 12.0, 16.0, 21.0, 27.0, 24.0, 18.0, 23.0, 29.0, 40.0, 32.0, 34.0, 35.0, 29.0, 40.0, 33.0, 38.0, 51.0, 32.0, 36.0, 35.0, 32.0, 41.0, 33.0, 32.0, 34.0, 25.0, 20.0, 27.0, 16.0, 13.0, 14.0, 5.0, 11.0, 6.0, 5.0, 7.0, 5.0, 1.0, 4.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.849008560180664, -17.233322143554688, -16.61763572692871, -16.001949310302734, -15.386261940002441, -14.770575523376465, -14.154888153076172, -13.539201736450195, -12.923515319824219, -12.307828903198242, -11.692142486572266, -11.076455116271973, -10.460768699645996, -9.84508228302002, -9.229394912719727, -8.61370849609375, -7.998022079467773, -7.382335662841797, -6.766648769378662, -6.150961875915527, -5.535275459289551, -4.919589042663574, -4.3039021492004395, -3.6882152557373047, -3.072528839111328, -2.4568421840667725, -1.8411555290222168, -1.2254688739776611, -0.6097822189331055, 0.005904436111450195, 0.6215910911560059, 1.2372779846191406, 1.85296630859375, 2.4686529636383057, 3.0843396186828613, 3.700026273727417, 4.315712928771973, 4.931399345397949, 5.547086238861084, 6.162773132324219, 6.778459548950195, 7.394145965576172, 8.009832382202148, 8.625519752502441, 9.241206169128418, 9.856892585754395, 10.472579956054688, 11.088266372680664, 11.70395278930664, 12.319639205932617, 12.935325622558594, 13.551012992858887, 14.166699409484863, 14.78238582611084, 15.398073196411133, 16.01375961303711, 16.629446029663086, 17.245132446289062, 17.86081886291504, 18.476505279541016, 19.092193603515625, 19.7078800201416, 20.323566436767578, 20.939252853393555, 21.55493927001953]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 3.0, 7.0, 16.0, 18.0, 24.0, 20.0, 22.0, 28.0, 25.0, 38.0, 33.0, 40.0, 41.0, 49.0, 39.0, 55.0, 43.0, 38.0, 50.0, 42.0, 33.0, 32.0, 47.0, 33.0, 38.0, 41.0, 23.0, 29.0, 20.0, 14.0, 11.0, 7.0, 14.0, 3.0, 4.0, 4.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.33294677734375, -2.2576904296875, -2.18243408203125, -2.107177734375, -2.03192138671875, -1.9566650390625, -1.88140869140625, -1.80615234375, -1.73089599609375, -1.6556396484375, -1.58038330078125, -1.505126953125, -1.42987060546875, -1.3546142578125, -1.27935791015625, -1.2041015625, -1.12884521484375, -1.0535888671875, -0.97833251953125, -0.903076171875, -0.82781982421875, -0.7525634765625, -0.67730712890625, -0.60205078125, -0.52679443359375, -0.4515380859375, -0.37628173828125, -0.301025390625, -0.22576904296875, -0.1505126953125, -0.07525634765625, 0.0, 0.07525634765625, 0.1505126953125, 0.22576904296875, 0.301025390625, 0.37628173828125, 0.4515380859375, 0.52679443359375, 0.60205078125, 0.67730712890625, 0.7525634765625, 0.82781982421875, 0.903076171875, 0.97833251953125, 1.0535888671875, 1.12884521484375, 1.2041015625, 1.27935791015625, 1.3546142578125, 1.42987060546875, 1.505126953125, 1.58038330078125, 1.6556396484375, 1.73089599609375, 1.80615234375, 1.88140869140625, 1.9566650390625, 2.03192138671875, 2.107177734375, 2.18243408203125, 2.2576904296875, 2.33294677734375, 2.408203125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 7.0, 8.0, 15.0, 19.0, 19.0, 44.0, 56.0, 90.0, 124.0, 233.0, 380.0, 623.0, 1212.0, 2227.0, 4472.0, 9150.0, 20007.0, 47700.0, 122038.0, 365466.0, 1263476.0, 1585274.0, 505585.0, 159044.0, 59699.0, 24811.0, 11165.0, 5399.0, 2693.0, 1421.0, 758.0, 419.0, 240.0, 147.0, 95.0, 59.0, 40.0, 33.0, 7.0, 7.0, 10.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.498046875, -3.377960205078125, -3.25787353515625, -3.137786865234375, -3.0177001953125, -2.897613525390625, -2.77752685546875, -2.657440185546875, -2.537353515625, -2.417266845703125, -2.29718017578125, -2.177093505859375, -2.0570068359375, -1.936920166015625, -1.81683349609375, -1.696746826171875, -1.57666015625, -1.456573486328125, -1.33648681640625, -1.216400146484375, -1.0963134765625, -0.976226806640625, -0.85614013671875, -0.736053466796875, -0.615966796875, -0.495880126953125, -0.37579345703125, -0.255706787109375, -0.1356201171875, -0.015533447265625, 0.10455322265625, 0.224639892578125, 0.3447265625, 0.464813232421875, 0.58489990234375, 0.704986572265625, 0.8250732421875, 0.945159912109375, 1.06524658203125, 1.185333251953125, 1.305419921875, 1.425506591796875, 1.54559326171875, 1.665679931640625, 1.7857666015625, 1.905853271484375, 2.02593994140625, 2.146026611328125, 2.26611328125, 2.386199951171875, 2.50628662109375, 2.626373291015625, 2.7464599609375, 2.866546630859375, 2.98663330078125, 3.106719970703125, 3.226806640625, 3.346893310546875, 3.46697998046875, 3.587066650390625, 3.7071533203125, 3.827239990234375, 3.94732666015625, 4.067413330078125, 4.1875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 1.0, 4.0, 6.0, 5.0, 7.0, 13.0, 16.0, 40.0, 39.0, 50.0, 68.0, 94.0, 149.0, 211.0, 257.0, 367.0, 411.0, 504.0, 437.0, 370.0, 298.0, 190.0, 154.0, 112.0, 79.0, 53.0, 41.0, 25.0, 24.0, 16.0, 11.0, 7.0, 6.0, 3.0, 7.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66796875, -6.4630126953125, -6.258056640625, -6.0531005859375, -5.84814453125, -5.6431884765625, -5.438232421875, -5.2332763671875, -5.0283203125, -4.8233642578125, -4.618408203125, -4.4134521484375, -4.20849609375, -4.0035400390625, -3.798583984375, -3.5936279296875, -3.388671875, -3.1837158203125, -2.978759765625, -2.7738037109375, -2.56884765625, -2.3638916015625, -2.158935546875, -1.9539794921875, -1.7490234375, -1.5440673828125, -1.339111328125, -1.1341552734375, -0.92919921875, -0.7242431640625, -0.519287109375, -0.3143310546875, -0.109375, 0.0955810546875, 0.300537109375, 0.5054931640625, 0.71044921875, 0.9154052734375, 1.120361328125, 1.3253173828125, 1.5302734375, 1.7352294921875, 1.940185546875, 2.1451416015625, 2.35009765625, 2.5550537109375, 2.760009765625, 2.9649658203125, 3.169921875, 3.3748779296875, 3.579833984375, 3.7847900390625, 3.98974609375, 4.1947021484375, 4.399658203125, 4.6046142578125, 4.8095703125, 5.0145263671875, 5.219482421875, 5.4244384765625, 5.62939453125, 5.8343505859375, 6.039306640625, 6.2442626953125, 6.44921875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 13.0, 13.0, 15.0, 27.0, 31.0, 61.0, 106.0, 208.0, 461.0, 1055.0, 2663.0, 8353.0, 33597.0, 182698.0, 1314402.0, 2244530.0, 331306.0, 55776.0, 12783.0, 3572.0, 1351.0, 591.0, 287.0, 163.0, 83.0, 53.0, 20.0, 27.0, 14.0, 10.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.4296875, -12.0859375, -11.7421875, -11.3984375, -11.0546875, -10.7109375, -10.3671875, -10.0234375, -9.6796875, -9.3359375, -8.9921875, -8.6484375, -8.3046875, -7.9609375, -7.6171875, -7.2734375, -6.9296875, -6.5859375, -6.2421875, -5.8984375, -5.5546875, -5.2109375, -4.8671875, -4.5234375, -4.1796875, -3.8359375, -3.4921875, -3.1484375, -2.8046875, -2.4609375, -2.1171875, -1.7734375, -1.4296875, -1.0859375, -0.7421875, -0.3984375, -0.0546875, 0.2890625, 0.6328125, 0.9765625, 1.3203125, 1.6640625, 2.0078125, 2.3515625, 2.6953125, 3.0390625, 3.3828125, 3.7265625, 4.0703125, 4.4140625, 4.7578125, 5.1015625, 5.4453125, 5.7890625, 6.1328125, 6.4765625, 6.8203125, 7.1640625, 7.5078125, 7.8515625, 8.1953125, 8.5390625, 8.8828125, 9.2265625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 8.0, 8.0, 13.0, 21.0, 24.0, 24.0, 42.0, 54.0, 60.0, 49.0, 60.0, 89.0, 66.0, 64.0, 77.0, 56.0, 59.0, 48.0, 37.0, 31.0, 27.0, 19.0, 17.0, 14.0, 10.0, 4.0, 7.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.341407775878906, -26.509775161743164, -25.678144454956055, -24.846511840820312, -24.01487922668457, -23.18324851989746, -22.35161590576172, -21.51998519897461, -20.688352584838867, -19.856719970703125, -19.025089263916016, -18.193456649780273, -17.36182403564453, -16.530193328857422, -15.69856071472168, -14.866929054260254, -14.035296440124512, -13.203664779663086, -12.372032165527344, -11.540400505065918, -10.708768844604492, -9.87713623046875, -9.045504570007324, -8.213872909545898, -7.3822407722473145, -6.5506086349487305, -5.718976974487305, -4.887344837188721, -4.055712699890137, -3.224081039428711, -2.392448902130127, -1.5608172416687012, -0.7291851043701172, 0.10244685411453247, 0.9340788125991821, 1.7657108306884766, 2.5973427295684814, 3.4289746284484863, 4.26060676574707, 5.092238426208496, 5.92387056350708, 6.755502700805664, 7.58713436126709, 8.418766021728516, 9.250398635864258, 10.082030296325684, 10.91366195678711, 11.745294570922852, 12.576926231384277, 13.408557891845703, 14.240190505981445, 15.071822166442871, 15.903453826904297, 16.73508644104004, 17.56671905517578, 18.39834976196289, 19.229982376098633, 20.061614990234375, 20.893245697021484, 21.724878311157227, 22.55651092529297, 23.388141632080078, 24.21977424621582, 25.051406860351562, 25.883037567138672]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 8.0, 7.0, 9.0, 9.0, 7.0, 11.0, 11.0, 11.0, 14.0, 17.0, 14.0, 20.0, 20.0, 21.0, 24.0, 34.0, 40.0, 33.0, 39.0, 41.0, 30.0, 45.0, 36.0, 40.0, 49.0, 36.0, 32.0, 45.0, 39.0, 32.0, 31.0, 26.0, 19.0, 31.0, 29.0, 13.0, 10.0, 14.0, 8.0, 14.0, 4.0, 8.0, 3.0, 4.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-21.400039672851562, -20.789541244506836, -20.179040908813477, -19.56854248046875, -18.958044052124023, -18.347545623779297, -17.737045288085938, -17.12654685974121, -16.516048431396484, -15.905549049377441, -15.295050621032715, -14.684551239013672, -14.074052810668945, -13.463553428649902, -12.85305404663086, -12.242555618286133, -11.632055282592773, -11.02155590057373, -10.411057472229004, -9.800558090209961, -9.190059661865234, -8.579560279846191, -7.969060897827148, -7.358561992645264, -6.748063087463379, -6.137564182281494, -5.527065277099609, -4.916565895080566, -4.306066989898682, -3.695568084716797, -3.085068941116333, -2.474569797515869, -1.8640708923339844, -1.25357186794281, -0.6430728435516357, -0.032573819160461426, 0.5779252052307129, 1.1884241104125977, 1.7989232540130615, 2.4094223976135254, 3.01992130279541, 3.630420207977295, 4.24091911315918, 4.851418495178223, 5.461917400360107, 6.072416305541992, 6.682915687561035, 7.29341459274292, 7.903913497924805, 8.514412879943848, 9.124911308288574, 9.735410690307617, 10.345909118652344, 10.956408500671387, 11.56690788269043, 12.177406311035156, 12.7879056930542, 13.398405075073242, 14.008903503417969, 14.619402885437012, 15.229902267456055, 15.840400695800781, 16.450899124145508, 17.061399459838867, 17.671897888183594]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 2.0, 12.0, 12.0, 16.0, 15.0, 21.0, 26.0, 20.0, 20.0, 27.0, 34.0, 36.0, 32.0, 33.0, 38.0, 43.0, 45.0, 55.0, 46.0, 35.0, 46.0, 35.0, 35.0, 41.0, 35.0, 29.0, 29.0, 25.0, 27.0, 21.0, 25.0, 18.0, 10.0, 9.0, 10.0, 9.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.267578125, -2.19512939453125, -2.1226806640625, -2.05023193359375, -1.977783203125, -1.90533447265625, -1.8328857421875, -1.76043701171875, -1.68798828125, -1.61553955078125, -1.5430908203125, -1.47064208984375, -1.398193359375, -1.32574462890625, -1.2532958984375, -1.18084716796875, -1.1083984375, -1.03594970703125, -0.9635009765625, -0.89105224609375, -0.818603515625, -0.74615478515625, -0.6737060546875, -0.60125732421875, -0.52880859375, -0.45635986328125, -0.3839111328125, -0.31146240234375, -0.239013671875, -0.16656494140625, -0.0941162109375, -0.02166748046875, 0.05078125, 0.12322998046875, 0.1956787109375, 0.26812744140625, 0.340576171875, 0.41302490234375, 0.4854736328125, 0.55792236328125, 0.63037109375, 0.70281982421875, 0.7752685546875, 0.84771728515625, 0.920166015625, 0.99261474609375, 1.0650634765625, 1.13751220703125, 1.2099609375, 1.28240966796875, 1.3548583984375, 1.42730712890625, 1.499755859375, 1.57220458984375, 1.6446533203125, 1.71710205078125, 1.78955078125, 1.86199951171875, 1.9344482421875, 2.00689697265625, 2.079345703125, 2.15179443359375, 2.2242431640625, 2.29669189453125, 2.369140625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 22.0, 23.0, 38.0, 56.0, 95.0, 132.0, 199.0, 277.0, 483.0, 636.0, 956.0, 1478.0, 2168.0, 3211.0, 4951.0, 7612.0, 11968.0, 19147.0, 31132.0, 53828.0, 97711.0, 211319.0, 303350.0, 127681.0, 67365.0, 38632.0, 23085.0, 14464.0, 9053.0, 6021.0, 3885.0, 2480.0, 1707.0, 1128.0, 755.0, 496.0, 326.0, 231.0, 158.0, 99.0, 64.0, 45.0, 37.0, 12.0, 12.0, 8.0, 2.0, 6.0, 5.0, 2.0, 3.0], "bins": [-0.1104736328125, -0.10733509063720703, -0.10419654846191406, -0.1010580062866211, -0.09791946411132812, -0.09478092193603516, -0.09164237976074219, -0.08850383758544922, -0.08536529541015625, -0.08222675323486328, -0.07908821105957031, -0.07594966888427734, -0.07281112670898438, -0.0696725845336914, -0.06653404235839844, -0.06339550018310547, -0.0602569580078125, -0.05711841583251953, -0.05397987365722656, -0.050841331481933594, -0.047702789306640625, -0.044564247131347656, -0.04142570495605469, -0.03828716278076172, -0.03514862060546875, -0.03201007843017578, -0.028871536254882812, -0.025732994079589844, -0.022594451904296875, -0.019455909729003906, -0.016317367553710938, -0.013178825378417969, -0.010040283203125, -0.006901741027832031, -0.0037631988525390625, -0.0006246566772460938, 0.002513885498046875, 0.005652427673339844, 0.008790969848632812, 0.011929512023925781, 0.01506805419921875, 0.01820659637451172, 0.021345138549804688, 0.024483680725097656, 0.027622222900390625, 0.030760765075683594, 0.03389930725097656, 0.03703784942626953, 0.0401763916015625, 0.04331493377685547, 0.04645347595214844, 0.049592018127441406, 0.052730560302734375, 0.055869102478027344, 0.05900764465332031, 0.06214618682861328, 0.06528472900390625, 0.06842327117919922, 0.07156181335449219, 0.07470035552978516, 0.07783889770507812, 0.0809774398803711, 0.08411598205566406, 0.08725452423095703, 0.09039306640625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 7.0, 5.0, 5.0, 6.0, 9.0, 9.0, 6.0, 15.0, 13.0, 10.0, 16.0, 20.0, 23.0, 22.0, 25.0, 32.0, 27.0, 28.0, 29.0, 21.0, 38.0, 39.0, 39.0, 1063.0, 29.0, 39.0, 48.0, 37.0, 31.0, 32.0, 24.0, 22.0, 36.0, 26.0, 24.0, 17.0, 24.0, 13.0, 13.0, 12.0, 14.0, 11.0, 12.0, 16.0, 6.0, 7.0, 5.0, 3.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2287139892578125, -1.188873291015625, -1.1490325927734375, -1.10919189453125, -1.0693511962890625, -1.029510498046875, -0.9896697998046875, -0.9498291015625, -0.9099884033203125, -0.870147705078125, -0.8303070068359375, -0.79046630859375, -0.7506256103515625, -0.710784912109375, -0.6709442138671875, -0.631103515625, -0.5912628173828125, -0.551422119140625, -0.5115814208984375, -0.47174072265625, -0.4319000244140625, -0.392059326171875, -0.3522186279296875, -0.3123779296875, -0.2725372314453125, -0.232696533203125, -0.1928558349609375, -0.15301513671875, -0.1131744384765625, -0.073333740234375, -0.0334930419921875, 0.00634765625, 0.0461883544921875, 0.086029052734375, 0.1258697509765625, 0.16571044921875, 0.2055511474609375, 0.245391845703125, 0.2852325439453125, 0.3250732421875, 0.3649139404296875, 0.404754638671875, 0.4445953369140625, 0.48443603515625, 0.5242767333984375, 0.564117431640625, 0.6039581298828125, 0.643798828125, 0.6836395263671875, 0.723480224609375, 0.7633209228515625, 0.80316162109375, 0.8430023193359375, 0.882843017578125, 0.9226837158203125, 0.9625244140625, 1.0023651123046875, 1.042205810546875, 1.0820465087890625, 1.12188720703125, 1.1617279052734375, 1.201568603515625, 1.2414093017578125, 1.28125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 8.0, 11.0, 5.0, 28.0, 30.0, 63.0, 73.0, 113.0, 156.0, 246.0, 411.0, 541.0, 810.0, 1278.0, 1937.0, 2778.0, 4376.0, 6648.0, 10009.0, 16148.0, 25670.0, 41348.0, 70279.0, 127381.0, 1312341.0, 212728.0, 104914.0, 59422.0, 35353.0, 22073.0, 13913.0, 8887.0, 6000.0, 3745.0, 2460.0, 1689.0, 1092.0, 699.0, 484.0, 307.0, 232.0, 134.0, 104.0, 72.0, 44.0, 36.0, 12.0, 19.0, 5.0, 10.0, 6.0, 1.0, 5.0, 0.0, 3.0, 1.0], "bins": [-0.040374755859375, -0.039145469665527344, -0.03791618347167969, -0.03668689727783203, -0.035457611083984375, -0.03422832489013672, -0.03299903869628906, -0.031769752502441406, -0.03054046630859375, -0.029311180114746094, -0.028081893920898438, -0.02685260772705078, -0.025623321533203125, -0.02439403533935547, -0.023164749145507812, -0.021935462951660156, -0.0207061767578125, -0.019476890563964844, -0.018247604370117188, -0.01701831817626953, -0.015789031982421875, -0.014559745788574219, -0.013330459594726562, -0.012101173400878906, -0.01087188720703125, -0.009642601013183594, -0.008413314819335938, -0.007184028625488281, -0.005954742431640625, -0.004725456237792969, -0.0034961700439453125, -0.0022668838500976562, -0.00103759765625, 0.00019168853759765625, 0.0014209747314453125, 0.0026502609252929688, 0.003879547119140625, 0.005108833312988281, 0.0063381195068359375, 0.007567405700683594, 0.00879669189453125, 0.010025978088378906, 0.011255264282226562, 0.012484550476074219, 0.013713836669921875, 0.014943122863769531, 0.016172409057617188, 0.017401695251464844, 0.0186309814453125, 0.019860267639160156, 0.021089553833007812, 0.02231884002685547, 0.023548126220703125, 0.02477741241455078, 0.026006698608398438, 0.027235984802246094, 0.02846527099609375, 0.029694557189941406, 0.030923843383789062, 0.03215312957763672, 0.033382415771484375, 0.03461170196533203, 0.03584098815917969, 0.037070274353027344, 0.038299560546875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 5.0, 8.0, 8.0, 15.0, 13.0, 15.0, 28.0, 24.0, 54.0, 59.0, 95.0, 90.0, 87.0, 100.0, 95.0, 71.0, 43.0, 52.0, 36.0, 22.0, 13.0, 10.0, 8.0, 9.0, 10.0, 6.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.74913215637207e-05, -3.63178551197052e-05, -3.51443886756897e-05, -3.3970922231674194e-05, -3.279745578765869e-05, -3.162398934364319e-05, -3.0450522899627686e-05, -2.9277056455612183e-05, -2.810359001159668e-05, -2.6930123567581177e-05, -2.5756657123565674e-05, -2.458319067955017e-05, -2.3409724235534668e-05, -2.2236257791519165e-05, -2.1062791347503662e-05, -1.988932490348816e-05, -1.8715858459472656e-05, -1.7542392015457153e-05, -1.636892557144165e-05, -1.5195459127426147e-05, -1.4021992683410645e-05, -1.2848526239395142e-05, -1.1675059795379639e-05, -1.0501593351364136e-05, -9.328126907348633e-06, -8.15466046333313e-06, -6.981194019317627e-06, -5.807727575302124e-06, -4.634261131286621e-06, -3.460794687271118e-06, -2.2873282432556152e-06, -1.1138617992401123e-06, 5.960464477539063e-08, 1.2330710887908936e-06, 2.4065375328063965e-06, 3.5800039768218994e-06, 4.753470420837402e-06, 5.926936864852905e-06, 7.100403308868408e-06, 8.273869752883911e-06, 9.447336196899414e-06, 1.0620802640914917e-05, 1.179426908493042e-05, 1.2967735528945923e-05, 1.4141201972961426e-05, 1.531466841697693e-05, 1.648813486099243e-05, 1.7661601305007935e-05, 1.8835067749023438e-05, 2.000853419303894e-05, 2.1182000637054443e-05, 2.2355467081069946e-05, 2.352893352508545e-05, 2.4702399969100952e-05, 2.5875866413116455e-05, 2.7049332857131958e-05, 2.822279930114746e-05, 2.9396265745162964e-05, 3.056973218917847e-05, 3.174319863319397e-05, 3.291666507720947e-05, 3.4090131521224976e-05, 3.526359796524048e-05, 3.643706440925598e-05, 3.7610530853271484e-05]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 9.0, 10.0, 14.0, 9.0, 21.0, 24.0, 48.0, 64.0, 99.0, 152.0, 370.0, 4186.0, 1038539.0, 4133.0, 375.0, 167.0, 116.0, 55.0, 36.0, 27.0, 18.0, 16.0, 16.0, 9.0, 9.0, 7.0, 3.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008282661437988281, -0.0008019730448722839, -0.0007756799459457397, -0.0007493868470191956, -0.0007230937480926514, -0.0006968006491661072, -0.000670507550239563, -0.0006442144513130188, -0.0006179213523864746, -0.0005916282534599304, -0.0005653351545333862, -0.000539042055606842, -0.0005127489566802979, -0.00048645585775375366, -0.00046016275882720947, -0.0004338696599006653, -0.0004075765609741211, -0.0003812834620475769, -0.0003549903631210327, -0.0003286972641944885, -0.00030240416526794434, -0.00027611106634140015, -0.00024981796741485596, -0.00022352486848831177, -0.00019723176956176758, -0.0001709386706352234, -0.0001446455717086792, -0.00011835247278213501, -9.205937385559082e-05, -6.576627492904663e-05, -3.947317600250244e-05, -1.3180077075958252e-05, 1.3113021850585938e-05, 3.940612077713013e-05, 6.569921970367432e-05, 9.19923186302185e-05, 0.0001182854175567627, 0.00014457851648330688, 0.00017087161540985107, 0.00019716471433639526, 0.00022345781326293945, 0.00024975091218948364, 0.00027604401111602783, 0.000302337110042572, 0.0003286302089691162, 0.0003549233078956604, 0.0003812164068222046, 0.0004075095057487488, 0.00043380260467529297, 0.00046009570360183716, 0.00048638880252838135, 0.0005126819014549255, 0.0005389750003814697, 0.0005652680993080139, 0.0005915611982345581, 0.0006178542971611023, 0.0006441473960876465, 0.0006704404950141907, 0.0006967335939407349, 0.000723026692867279, 0.0007493197917938232, 0.0007756128907203674, 0.0008019059896469116, 0.0008281990885734558, 0.0008544921875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [955.0, 62.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0713695701269899e-05, 3.63301660399884e-06, 1.7979727999772877e-05, 3.232644303352572e-05, 4.667315442929976e-05, 6.10198694630526e-05, 7.536658085882664e-05, 8.971329225460067e-05, 0.00010406000365037471, 0.00011840671504614875, 0.00013275342644192278, 0.00014710014511365443, 0.00016144684923347086, 0.0001757935679052025, 0.00019014027202501893, 0.00020448699069675058, 0.000218833694816567, 0.00023318041348829865, 0.0002475271176081151, 0.0002618738217279315, 0.0002762205549515784, 0.0002905672590713948, 0.0003049139631912112, 0.0003192606964148581, 0.0003336074005346745, 0.00034795410465449095, 0.0003623008378781378, 0.00037664754199795425, 0.00039099424611777067, 0.00040534097934141755, 0.000419687683461234, 0.0004340343875810504, 0.0004483810917008668, 0.00046272779582068324, 0.0004770745290443301, 0.0004914212040603161, 0.000505767937283963, 0.0005201146705076098, 0.0005344613455235958, 0.0005488080787472427, 0.0005631548119708896, 0.0005775015451945364, 0.0005918482202105224, 0.0006061949534341693, 0.0006205416866578162, 0.0006348883616738021, 0.000649235094897449, 0.000663581769913435, 0.0006779285031370819, 0.0006922752363607287, 0.0007066219113767147, 0.0007209686446003616, 0.0007353153778240085, 0.0007496620528399944, 0.0007640087860636413, 0.0007783555192872882, 0.0007927021943032742, 0.000807048927526921, 0.000821395602542907, 0.0008357423357665539, 0.0008500890689902008, 0.0008644357440061867, 0.0008787824772298336, 0.0008931291522458196, 0.0009074758854694664]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 12.0, 9.0, 23.0, 29.0, 39.0, 49.0, 56.0, 43.0, 62.0, 68.0, 65.0, 77.0, 73.0, 75.0, 55.0, 55.0, 48.0, 37.0, 37.0, 20.0, 20.0, 17.0, 13.0, 10.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.892183303833008e-05, -3.7964433431625366e-05, -3.7007033824920654e-05, -3.604963421821594e-05, -3.509223461151123e-05, -3.413483500480652e-05, -3.317743539810181e-05, -3.2220035791397095e-05, -3.126263618469238e-05, -3.030523657798767e-05, -2.934783697128296e-05, -2.8390437364578247e-05, -2.7433037757873535e-05, -2.6475638151168823e-05, -2.551823854446411e-05, -2.45608389377594e-05, -2.3603439331054688e-05, -2.2646039724349976e-05, -2.1688640117645264e-05, -2.0731240510940552e-05, -1.977384090423584e-05, -1.8816441297531128e-05, -1.7859041690826416e-05, -1.6901642084121704e-05, -1.5944242477416992e-05, -1.498684287071228e-05, -1.4029443264007568e-05, -1.3072043657302856e-05, -1.2114644050598145e-05, -1.1157244443893433e-05, -1.019984483718872e-05, -9.242445230484009e-06, -8.285045623779297e-06, -7.327646017074585e-06, -6.370246410369873e-06, -5.412846803665161e-06, -4.455447196960449e-06, -3.4980475902557373e-06, -2.5406479835510254e-06, -1.5832483768463135e-06, -6.258487701416016e-07, 3.3155083656311035e-07, 1.2889504432678223e-06, 2.246350049972534e-06, 3.203749656677246e-06, 4.161149263381958e-06, 5.11854887008667e-06, 6.075948476791382e-06, 7.033348083496094e-06, 7.990747690200806e-06, 8.948147296905518e-06, 9.90554690361023e-06, 1.0862946510314941e-05, 1.1820346117019653e-05, 1.2777745723724365e-05, 1.3735145330429077e-05, 1.4692544937133789e-05, 1.56499445438385e-05, 1.6607344150543213e-05, 1.7564743757247925e-05, 1.8522143363952637e-05, 1.947954297065735e-05, 2.043694257736206e-05, 2.1394342184066772e-05, 2.2351741790771484e-05]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 2.0, 12.0, 12.0, 16.0, 15.0, 21.0, 26.0, 20.0, 20.0, 27.0, 34.0, 36.0, 32.0, 33.0, 38.0, 43.0, 45.0, 55.0, 46.0, 35.0, 46.0, 35.0, 35.0, 41.0, 35.0, 29.0, 29.0, 25.0, 27.0, 21.0, 25.0, 18.0, 10.0, 9.0, 10.0, 9.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.267578125, -2.19512939453125, -2.1226806640625, -2.05023193359375, -1.977783203125, -1.90533447265625, -1.8328857421875, -1.76043701171875, -1.68798828125, -1.61553955078125, -1.5430908203125, -1.47064208984375, -1.398193359375, -1.32574462890625, -1.2532958984375, -1.18084716796875, -1.1083984375, -1.03594970703125, -0.9635009765625, -0.89105224609375, -0.818603515625, -0.74615478515625, -0.6737060546875, -0.60125732421875, -0.52880859375, -0.45635986328125, -0.3839111328125, -0.31146240234375, -0.239013671875, -0.16656494140625, -0.0941162109375, -0.02166748046875, 0.05078125, 0.12322998046875, 0.1956787109375, 0.26812744140625, 0.340576171875, 0.41302490234375, 0.4854736328125, 0.55792236328125, 0.63037109375, 0.70281982421875, 0.7752685546875, 0.84771728515625, 0.920166015625, 0.99261474609375, 1.0650634765625, 1.13751220703125, 1.2099609375, 1.28240966796875, 1.3548583984375, 1.42730712890625, 1.499755859375, 1.57220458984375, 1.6446533203125, 1.71710205078125, 1.78955078125, 1.86199951171875, 1.9344482421875, 2.00689697265625, 2.079345703125, 2.15179443359375, 2.2242431640625, 2.29669189453125, 2.369140625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 21.0, 22.0, 35.0, 54.0, 94.0, 131.0, 219.0, 395.0, 691.0, 1210.0, 2051.0, 3558.0, 6312.0, 11930.0, 25728.0, 73615.0, 339205.0, 437799.0, 87243.0, 29311.0, 13032.0, 6804.0, 3755.0, 2190.0, 1288.0, 744.0, 448.0, 252.0, 143.0, 87.0, 63.0, 36.0, 28.0, 15.0, 12.0, 9.0, 9.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.759765625, -2.653900146484375, -2.54803466796875, -2.442169189453125, -2.3363037109375, -2.230438232421875, -2.12457275390625, -2.018707275390625, -1.912841796875, -1.806976318359375, -1.70111083984375, -1.595245361328125, -1.4893798828125, -1.383514404296875, -1.27764892578125, -1.171783447265625, -1.06591796875, -0.960052490234375, -0.85418701171875, -0.748321533203125, -0.6424560546875, -0.536590576171875, -0.43072509765625, -0.324859619140625, -0.218994140625, -0.113128662109375, -0.00726318359375, 0.098602294921875, 0.2044677734375, 0.310333251953125, 0.41619873046875, 0.522064208984375, 0.6279296875, 0.733795166015625, 0.83966064453125, 0.945526123046875, 1.0513916015625, 1.157257080078125, 1.26312255859375, 1.368988037109375, 1.474853515625, 1.580718994140625, 1.68658447265625, 1.792449951171875, 1.8983154296875, 2.004180908203125, 2.11004638671875, 2.215911865234375, 2.32177734375, 2.427642822265625, 2.53350830078125, 2.639373779296875, 2.7452392578125, 2.851104736328125, 2.95697021484375, 3.062835693359375, 3.168701171875, 3.274566650390625, 3.38043212890625, 3.486297607421875, 3.5921630859375, 3.698028564453125, 3.80389404296875, 3.909759521484375, 4.015625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 7.0, 7.0, 7.0, 6.0, 4.0, 5.0, 11.0, 7.0, 8.0, 6.0, 13.0, 23.0, 19.0, 18.0, 31.0, 27.0, 35.0, 41.0, 46.0, 44.0, 60.0, 72.0, 132.0, 1496.0, 363.0, 124.0, 67.0, 51.0, 35.0, 37.0, 39.0, 33.0, 33.0, 26.0, 11.0, 16.0, 12.0, 22.0, 12.0, 11.0, 14.0, 10.0, 4.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.62890625, -6.39129638671875, -6.1536865234375, -5.91607666015625, -5.678466796875, -5.44085693359375, -5.2032470703125, -4.96563720703125, -4.72802734375, -4.49041748046875, -4.2528076171875, -4.01519775390625, -3.777587890625, -3.53997802734375, -3.3023681640625, -3.06475830078125, -2.8271484375, -2.58953857421875, -2.3519287109375, -2.11431884765625, -1.876708984375, -1.63909912109375, -1.4014892578125, -1.16387939453125, -0.92626953125, -0.68865966796875, -0.4510498046875, -0.21343994140625, 0.024169921875, 0.26177978515625, 0.4993896484375, 0.73699951171875, 0.974609375, 1.21221923828125, 1.4498291015625, 1.68743896484375, 1.925048828125, 2.16265869140625, 2.4002685546875, 2.63787841796875, 2.87548828125, 3.11309814453125, 3.3507080078125, 3.58831787109375, 3.825927734375, 4.06353759765625, 4.3011474609375, 4.53875732421875, 4.7763671875, 5.01397705078125, 5.2515869140625, 5.48919677734375, 5.726806640625, 5.96441650390625, 6.2020263671875, 6.43963623046875, 6.67724609375, 6.91485595703125, 7.1524658203125, 7.39007568359375, 7.627685546875, 7.86529541015625, 8.1029052734375, 8.34051513671875, 8.578125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 4.0, 3.0, 11.0, 14.0, 17.0, 7.0, 21.0, 14.0, 26.0, 22.0, 50.0, 60.0, 92.0, 107.0, 156.0, 239.0, 592.0, 2684.0, 23163.0, 2679207.0, 425053.0, 11272.0, 1640.0, 454.0, 223.0, 147.0, 101.0, 67.0, 50.0, 43.0, 35.0, 38.0, 20.0, 9.0, 12.0, 3.0, 11.0, 6.0, 5.0, 5.0, 7.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-17.015625, -16.541015625, -16.06640625, -15.591796875, -15.1171875, -14.642578125, -14.16796875, -13.693359375, -13.21875, -12.744140625, -12.26953125, -11.794921875, -11.3203125, -10.845703125, -10.37109375, -9.896484375, -9.421875, -8.947265625, -8.47265625, -7.998046875, -7.5234375, -7.048828125, -6.57421875, -6.099609375, -5.625, -5.150390625, -4.67578125, -4.201171875, -3.7265625, -3.251953125, -2.77734375, -2.302734375, -1.828125, -1.353515625, -0.87890625, -0.404296875, 0.0703125, 0.544921875, 1.01953125, 1.494140625, 1.96875, 2.443359375, 2.91796875, 3.392578125, 3.8671875, 4.341796875, 4.81640625, 5.291015625, 5.765625, 6.240234375, 6.71484375, 7.189453125, 7.6640625, 8.138671875, 8.61328125, 9.087890625, 9.5625, 10.037109375, 10.51171875, 10.986328125, 11.4609375, 11.935546875, 12.41015625, 12.884765625, 13.359375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 34.0, 146.0, 295.0, 282.0, 164.0, 72.0, 11.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.8038444519043, -58.6097412109375, -57.4156379699707, -56.221534729003906, -55.02743148803711, -53.83332824707031, -52.63922119140625, -51.44511795043945, -50.251014709472656, -49.05691146850586, -47.86280822753906, -46.668704986572266, -45.47460174560547, -44.280494689941406, -43.086395263671875, -41.89228820800781, -40.69818878173828, -39.504085540771484, -38.30998229980469, -37.11587905883789, -35.921775817871094, -34.72766876220703, -33.5335693359375, -32.33946228027344, -31.14535903930664, -29.951255798339844, -28.757152557373047, -27.56304931640625, -26.36894416809082, -25.174840927124023, -23.980737686157227, -22.786632537841797, -21.592531204223633, -20.398427963256836, -19.20432472229004, -18.01021957397461, -16.816116333007812, -15.622013092041016, -14.427909851074219, -13.233805656433105, -12.039702415466309, -10.845599174499512, -9.651494979858398, -8.457391738891602, -7.2632880210876465, -6.069184303283691, -4.8750810623168945, -3.6809768676757812, -2.4868736267089844, -1.2927700281143188, -0.09866642951965332, 1.0954370498657227, 2.2895407676696777, 3.483644485473633, 4.67774772644043, 5.871851921081543, 7.06595516204834, 8.260058403015137, 9.45416259765625, 10.648265838623047, 11.842369079589844, 13.036473274230957, 14.230576515197754, 15.424680709838867, 16.618783950805664]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 3.0, 9.0, 9.0, 12.0, 13.0, 7.0, 18.0, 11.0, 10.0, 23.0, 29.0, 34.0, 32.0, 36.0, 35.0, 35.0, 47.0, 49.0, 42.0, 48.0, 43.0, 49.0, 38.0, 31.0, 49.0, 29.0, 43.0, 23.0, 31.0, 25.0, 20.0, 19.0, 20.0, 20.0, 17.0, 5.0, 16.0, 5.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.18801498413086, -17.513378143310547, -16.838741302490234, -16.164104461669922, -15.48946762084961, -14.814830780029297, -14.140193939208984, -13.465557098388672, -12.79092025756836, -12.116283416748047, -11.441646575927734, -10.767009735107422, -10.09237289428711, -9.417736053466797, -8.743099212646484, -8.068462371826172, -7.393826484680176, -6.719189643859863, -6.044552803039551, -5.369915962219238, -4.695279121398926, -4.020642280578613, -3.346005916595459, -2.6713690757751465, -1.996732234954834, -1.3220953941345215, -0.6474586725234985, 0.027178049087524414, 0.7018148899078369, 1.3764517307281494, 2.051088333129883, 2.7257251739501953, 3.400362014770508, 4.07499885559082, 4.749635696411133, 5.424272537231445, 6.098909378051758, 6.77354621887207, 7.448182582855225, 8.122819900512695, 8.797456741333008, 9.47209358215332, 10.146730422973633, 10.821367263793945, 11.496004104614258, 12.17064094543457, 12.845277786254883, 13.519914627075195, 14.194550514221191, 14.869187355041504, 15.543824195861816, 16.218460083007812, 16.893096923828125, 17.567733764648438, 18.24237060546875, 18.917007446289062, 19.591644287109375, 20.266281127929688, 20.94091796875, 21.615554809570312, 22.290191650390625, 22.964828491210938, 23.63946533203125, 24.314102172851562, 24.988739013671875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 13.0, 15.0, 19.0, 16.0, 17.0, 27.0, 26.0, 23.0, 30.0, 39.0, 34.0, 38.0, 34.0, 52.0, 54.0, 43.0, 48.0, 41.0, 42.0, 35.0, 50.0, 34.0, 34.0, 27.0, 31.0, 23.0, 27.0, 28.0, 18.0, 17.0, 14.0, 7.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.501953125, -2.424407958984375, -2.34686279296875, -2.269317626953125, -2.1917724609375, -2.114227294921875, -2.03668212890625, -1.959136962890625, -1.881591796875, -1.804046630859375, -1.72650146484375, -1.648956298828125, -1.5714111328125, -1.493865966796875, -1.41632080078125, -1.338775634765625, -1.26123046875, -1.183685302734375, -1.10614013671875, -1.028594970703125, -0.9510498046875, -0.873504638671875, -0.79595947265625, -0.718414306640625, -0.640869140625, -0.563323974609375, -0.48577880859375, -0.408233642578125, -0.3306884765625, -0.253143310546875, -0.17559814453125, -0.098052978515625, -0.0205078125, 0.057037353515625, 0.13458251953125, 0.212127685546875, 0.2896728515625, 0.367218017578125, 0.44476318359375, 0.522308349609375, 0.599853515625, 0.677398681640625, 0.75494384765625, 0.832489013671875, 0.9100341796875, 0.987579345703125, 1.06512451171875, 1.142669677734375, 1.22021484375, 1.297760009765625, 1.37530517578125, 1.452850341796875, 1.5303955078125, 1.607940673828125, 1.68548583984375, 1.763031005859375, 1.840576171875, 1.918121337890625, 1.99566650390625, 2.073211669921875, 2.1507568359375, 2.228302001953125, 2.30584716796875, 2.383392333984375, 2.4609375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 12.0, 9.0, 10.0, 18.0, 14.0, 25.0, 26.0, 31.0, 47.0, 79.0, 133.0, 294.0, 743.0, 1813.0, 5446.0, 20777.0, 103732.0, 781039.0, 2722584.0, 465591.0, 69581.0, 15149.0, 4376.0, 1517.0, 586.0, 249.0, 137.0, 63.0, 44.0, 33.0, 25.0, 32.0, 17.0, 3.0, 11.0, 6.0, 11.0, 4.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75, -6.5035400390625, -6.257080078125, -6.0106201171875, -5.76416015625, -5.5177001953125, -5.271240234375, -5.0247802734375, -4.7783203125, -4.5318603515625, -4.285400390625, -4.0389404296875, -3.79248046875, -3.5460205078125, -3.299560546875, -3.0531005859375, -2.806640625, -2.5601806640625, -2.313720703125, -2.0672607421875, -1.82080078125, -1.5743408203125, -1.327880859375, -1.0814208984375, -0.8349609375, -0.5885009765625, -0.342041015625, -0.0955810546875, 0.15087890625, 0.3973388671875, 0.643798828125, 0.8902587890625, 1.13671875, 1.3831787109375, 1.629638671875, 1.8760986328125, 2.12255859375, 2.3690185546875, 2.615478515625, 2.8619384765625, 3.1083984375, 3.3548583984375, 3.601318359375, 3.8477783203125, 4.09423828125, 4.3406982421875, 4.587158203125, 4.8336181640625, 5.080078125, 5.3265380859375, 5.572998046875, 5.8194580078125, 6.06591796875, 6.3123779296875, 6.558837890625, 6.8052978515625, 7.0517578125, 7.2982177734375, 7.544677734375, 7.7911376953125, 8.03759765625, 8.2840576171875, 8.530517578125, 8.7769775390625, 9.0234375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 9.0, 5.0, 19.0, 20.0, 36.0, 63.0, 88.0, 129.0, 182.0, 323.0, 465.0, 669.0, 647.0, 501.0, 331.0, 222.0, 149.0, 83.0, 53.0, 33.0, 19.0, 19.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.329345703125, -10.02587890625, -9.722412109375, -9.4189453125, -9.115478515625, -8.81201171875, -8.508544921875, -8.205078125, -7.901611328125, -7.59814453125, -7.294677734375, -6.9912109375, -6.687744140625, -6.38427734375, -6.080810546875, -5.77734375, -5.473876953125, -5.17041015625, -4.866943359375, -4.5634765625, -4.260009765625, -3.95654296875, -3.653076171875, -3.349609375, -3.046142578125, -2.74267578125, -2.439208984375, -2.1357421875, -1.832275390625, -1.52880859375, -1.225341796875, -0.921875, -0.618408203125, -0.31494140625, -0.011474609375, 0.2919921875, 0.595458984375, 0.89892578125, 1.202392578125, 1.505859375, 1.809326171875, 2.11279296875, 2.416259765625, 2.7197265625, 3.023193359375, 3.32666015625, 3.630126953125, 3.93359375, 4.237060546875, 4.54052734375, 4.843994140625, 5.1474609375, 5.450927734375, 5.75439453125, 6.057861328125, 6.361328125, 6.664794921875, 6.96826171875, 7.271728515625, 7.5751953125, 7.878662109375, 8.18212890625, 8.485595703125, 8.7890625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 16.0, 30.0, 53.0, 72.0, 151.0, 282.0, 711.0, 2693.0, 28642.0, 1244544.0, 2848604.0, 62517.0, 4323.0, 925.0, 341.0, 161.0, 103.0, 40.0, 36.0, 15.0, 9.0, 10.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.671875, -21.919189453125, -21.16650390625, -20.413818359375, -19.6611328125, -18.908447265625, -18.15576171875, -17.403076171875, -16.650390625, -15.897705078125, -15.14501953125, -14.392333984375, -13.6396484375, -12.886962890625, -12.13427734375, -11.381591796875, -10.62890625, -9.876220703125, -9.12353515625, -8.370849609375, -7.6181640625, -6.865478515625, -6.11279296875, -5.360107421875, -4.607421875, -3.854736328125, -3.10205078125, -2.349365234375, -1.5966796875, -0.843994140625, -0.09130859375, 0.661376953125, 1.4140625, 2.166748046875, 2.91943359375, 3.672119140625, 4.4248046875, 5.177490234375, 5.93017578125, 6.682861328125, 7.435546875, 8.188232421875, 8.94091796875, 9.693603515625, 10.4462890625, 11.198974609375, 11.95166015625, 12.704345703125, 13.45703125, 14.209716796875, 14.96240234375, 15.715087890625, 16.4677734375, 17.220458984375, 17.97314453125, 18.725830078125, 19.478515625, 20.231201171875, 20.98388671875, 21.736572265625, 22.4892578125, 23.241943359375, 23.99462890625, 24.747314453125, 25.5]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 9.0, 8.0, 12.0, 26.0, 25.0, 31.0, 52.0, 74.0, 88.0, 87.0, 93.0, 92.0, 79.0, 78.0, 64.0, 47.0, 46.0, 36.0, 15.0, 22.0, 9.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.207744598388672, -19.151086807250977, -18.094430923461914, -17.03777313232422, -15.981117248535156, -14.924459457397461, -13.867802619934082, -12.811145782470703, -11.754488945007324, -10.697832107543945, -9.641175270080566, -8.584518432617188, -7.52786111831665, -6.4712042808532715, -5.414546966552734, -4.3578901290893555, -3.3012332916259766, -2.2445764541625977, -1.1879193782806396, -0.13126230239868164, 0.9253945350646973, 1.9820513725280762, 3.0387086868286133, 4.095365524291992, 5.152022361755371, 6.20867919921875, 7.265336036682129, 8.321992874145508, 9.378650665283203, 10.435306549072266, 11.491964340209961, 12.54862117767334, 13.605278015136719, 14.661934852600098, 15.718591690063477, 16.775249481201172, 17.831905364990234, 18.88856315612793, 19.945220947265625, 21.001876831054688, 22.05853271484375, 23.115190505981445, 24.171846389770508, 25.228504180908203, 26.285160064697266, 27.34181785583496, 28.398475646972656, 29.45513153076172, 30.511789321899414, 31.56844711303711, 32.62510299682617, 33.681758880615234, 34.73841857910156, 35.795074462890625, 36.85173034667969, 37.90838623046875, 38.96504592895508, 40.02170181274414, 41.07836151123047, 42.13501739501953, 43.191673278808594, 44.248329162597656, 45.304988861083984, 46.36164474487305, 47.41830062866211]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 8.0, 16.0, 5.0, 11.0, 10.0, 17.0, 20.0, 17.0, 23.0, 27.0, 29.0, 34.0, 26.0, 43.0, 36.0, 32.0, 29.0, 46.0, 31.0, 35.0, 31.0, 36.0, 50.0, 43.0, 39.0, 41.0, 35.0, 23.0, 25.0, 20.0, 20.0, 24.0, 18.0, 12.0, 12.0, 12.0, 14.0, 14.0, 5.0, 4.0, 4.0, 2.0, 1.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.431793212890625, -19.750713348388672, -19.06963348388672, -18.3885555267334, -17.707475662231445, -17.026395797729492, -16.34531593322754, -15.664237022399902, -14.983158111572266, -14.302078247070312, -13.620999336242676, -12.939919471740723, -12.258840560913086, -11.577760696411133, -10.89668083190918, -10.215601921081543, -9.53452205657959, -8.853442192077637, -8.17236328125, -7.491283416748047, -6.81020450592041, -6.129124641418457, -5.448045253753662, -4.766965866088867, -4.085886478424072, -3.4048070907592773, -2.7237277030944824, -2.0426480770111084, -1.3615686893463135, -0.6804893016815186, 0.0005903244018554688, 0.6816697120666504, 1.3627490997314453, 2.0438284873962402, 2.724907875061035, 3.405987501144409, 4.087066650390625, 4.768146514892578, 5.449225902557373, 6.130305290222168, 6.811384677886963, 7.492464065551758, 8.173543930053711, 8.854622840881348, 9.5357027053833, 10.216781616210938, 10.89786148071289, 11.578941345214844, 12.26002025604248, 12.941100120544434, 13.62217903137207, 14.303258895874023, 14.98433780670166, 15.665417671203613, 16.34649658203125, 17.027576446533203, 17.708656311035156, 18.38973617553711, 19.070816040039062, 19.751893997192383, 20.432973861694336, 21.11405372619629, 21.795133590698242, 22.476211547851562, 23.157291412353516]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 9.0, 8.0, 7.0, 9.0, 15.0, 16.0, 23.0, 20.0, 17.0, 25.0, 27.0, 41.0, 32.0, 38.0, 29.0, 39.0, 39.0, 43.0, 52.0, 49.0, 37.0, 41.0, 47.0, 38.0, 22.0, 33.0, 26.0, 25.0, 24.0, 26.0, 20.0, 18.0, 23.0, 19.0, 13.0, 8.0, 4.0, 7.0, 10.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0], "bins": [-2.48828125, -2.413909912109375, -2.33953857421875, -2.265167236328125, -2.1907958984375, -2.116424560546875, -2.04205322265625, -1.967681884765625, -1.893310546875, -1.818939208984375, -1.74456787109375, -1.670196533203125, -1.5958251953125, -1.521453857421875, -1.44708251953125, -1.372711181640625, -1.29833984375, -1.223968505859375, -1.14959716796875, -1.075225830078125, -1.0008544921875, -0.926483154296875, -0.85211181640625, -0.777740478515625, -0.703369140625, -0.628997802734375, -0.55462646484375, -0.480255126953125, -0.4058837890625, -0.331512451171875, -0.25714111328125, -0.182769775390625, -0.1083984375, -0.034027099609375, 0.04034423828125, 0.114715576171875, 0.1890869140625, 0.263458251953125, 0.33782958984375, 0.412200927734375, 0.486572265625, 0.560943603515625, 0.63531494140625, 0.709686279296875, 0.7840576171875, 0.858428955078125, 0.93280029296875, 1.007171630859375, 1.08154296875, 1.155914306640625, 1.23028564453125, 1.304656982421875, 1.3790283203125, 1.453399658203125, 1.52777099609375, 1.602142333984375, 1.676513671875, 1.750885009765625, 1.82525634765625, 1.899627685546875, 1.9739990234375, 2.048370361328125, 2.12274169921875, 2.197113037109375, 2.271484375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 13.0, 14.0, 14.0, 33.0, 54.0, 60.0, 105.0, 144.0, 262.0, 420.0, 670.0, 1170.0, 1827.0, 2982.0, 5145.0, 8605.0, 14532.0, 25764.0, 46869.0, 88616.0, 195408.0, 356782.0, 141814.0, 69047.0, 37174.0, 21357.0, 12155.0, 7009.0, 4060.0, 2497.0, 1461.0, 927.0, 604.0, 355.0, 212.0, 142.0, 93.0, 50.0, 45.0, 15.0, 16.0, 10.0, 6.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.131103515625, -0.1270465850830078, -0.12298965454101562, -0.11893272399902344, -0.11487579345703125, -0.11081886291503906, -0.10676193237304688, -0.10270500183105469, -0.0986480712890625, -0.09459114074707031, -0.09053421020507812, -0.08647727966308594, -0.08242034912109375, -0.07836341857910156, -0.07430648803710938, -0.07024955749511719, -0.066192626953125, -0.06213569641113281, -0.058078765869140625, -0.05402183532714844, -0.04996490478515625, -0.04590797424316406, -0.041851043701171875, -0.03779411315917969, -0.0337371826171875, -0.029680252075195312, -0.025623321533203125, -0.021566390991210938, -0.01750946044921875, -0.013452529907226562, -0.009395599365234375, -0.0053386688232421875, -0.00128173828125, 0.0027751922607421875, 0.006832122802734375, 0.010889053344726562, 0.01494598388671875, 0.019002914428710938, 0.023059844970703125, 0.027116775512695312, 0.0311737060546875, 0.03523063659667969, 0.039287567138671875, 0.04334449768066406, 0.04740142822265625, 0.05145835876464844, 0.055515289306640625, 0.05957221984863281, 0.063629150390625, 0.06768608093261719, 0.07174301147460938, 0.07579994201660156, 0.07985687255859375, 0.08391380310058594, 0.08797073364257812, 0.09202766418457031, 0.0960845947265625, 0.10014152526855469, 0.10419845581054688, 0.10825538635253906, 0.11231231689453125, 0.11636924743652344, 0.12042617797851562, 0.12448310852050781, 0.1285400390625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 3.0, 8.0, 8.0, 15.0, 10.0, 11.0, 9.0, 18.0, 14.0, 20.0, 21.0, 19.0, 33.0, 27.0, 34.0, 27.0, 29.0, 52.0, 40.0, 40.0, 43.0, 1063.0, 35.0, 44.0, 28.0, 32.0, 43.0, 41.0, 37.0, 25.0, 20.0, 25.0, 27.0, 14.0, 14.0, 20.0, 13.0, 16.0, 9.0, 4.0, 6.0, 4.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5400390625, -1.4920501708984375, -1.444061279296875, -1.3960723876953125, -1.34808349609375, -1.3000946044921875, -1.252105712890625, -1.2041168212890625, -1.1561279296875, -1.1081390380859375, -1.060150146484375, -1.0121612548828125, -0.96417236328125, -0.9161834716796875, -0.868194580078125, -0.8202056884765625, -0.772216796875, -0.7242279052734375, -0.676239013671875, -0.6282501220703125, -0.58026123046875, -0.5322723388671875, -0.484283447265625, -0.4362945556640625, -0.3883056640625, -0.3403167724609375, -0.292327880859375, -0.2443389892578125, -0.19635009765625, -0.1483612060546875, -0.100372314453125, -0.0523834228515625, -0.00439453125, 0.0435943603515625, 0.091583251953125, 0.1395721435546875, 0.18756103515625, 0.2355499267578125, 0.283538818359375, 0.3315277099609375, 0.3795166015625, 0.4275054931640625, 0.475494384765625, 0.5234832763671875, 0.57147216796875, 0.6194610595703125, 0.667449951171875, 0.7154388427734375, 0.763427734375, 0.8114166259765625, 0.859405517578125, 0.9073944091796875, 0.95538330078125, 1.0033721923828125, 1.051361083984375, 1.0993499755859375, 1.1473388671875, 1.1953277587890625, 1.243316650390625, 1.2913055419921875, 1.33929443359375, 1.3872833251953125, 1.435272216796875, 1.4832611083984375, 1.53125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 14.0, 9.0, 24.0, 36.0, 40.0, 72.0, 104.0, 169.0, 232.0, 368.0, 531.0, 914.0, 1375.0, 2094.0, 3313.0, 5377.0, 8292.0, 13588.0, 22161.0, 36948.0, 62961.0, 114923.0, 239377.0, 1300048.0, 119854.0, 65508.0, 38056.0, 22918.0, 14222.0, 8409.0, 5529.0, 3494.0, 2208.0, 1367.0, 921.0, 601.0, 366.0, 222.0, 183.0, 102.0, 78.0, 41.0, 30.0, 22.0, 12.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.044952392578125, -0.0435490608215332, -0.042145729064941406, -0.04074239730834961, -0.03933906555175781, -0.037935733795166016, -0.03653240203857422, -0.03512907028198242, -0.033725738525390625, -0.03232240676879883, -0.03091907501220703, -0.029515743255615234, -0.028112411499023438, -0.02670907974243164, -0.025305747985839844, -0.023902416229248047, -0.02249908447265625, -0.021095752716064453, -0.019692420959472656, -0.01828908920288086, -0.016885757446289062, -0.015482425689697266, -0.014079093933105469, -0.012675762176513672, -0.011272430419921875, -0.009869098663330078, -0.008465766906738281, -0.007062435150146484, -0.0056591033935546875, -0.004255771636962891, -0.0028524398803710938, -0.0014491081237792969, -4.57763671875e-05, 0.0013575553894042969, 0.0027608871459960938, 0.004164218902587891, 0.0055675506591796875, 0.006970882415771484, 0.008374214172363281, 0.009777545928955078, 0.011180877685546875, 0.012584209442138672, 0.013987541198730469, 0.015390872955322266, 0.016794204711914062, 0.01819753646850586, 0.019600868225097656, 0.021004199981689453, 0.02240753173828125, 0.023810863494873047, 0.025214195251464844, 0.02661752700805664, 0.028020858764648438, 0.029424190521240234, 0.03082752227783203, 0.03223085403442383, 0.033634185791015625, 0.03503751754760742, 0.03644084930419922, 0.037844181060791016, 0.03924751281738281, 0.04065084457397461, 0.042054176330566406, 0.0434575080871582, 0.04486083984375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 2.0, 10.0, 8.0, 10.0, 12.0, 12.0, 16.0, 22.0, 24.0, 23.0, 21.0, 39.0, 37.0, 49.0, 69.0, 76.0, 97.0, 73.0, 69.0, 50.0, 58.0, 33.0, 35.0, 33.0, 19.0, 10.0, 17.0, 12.0, 11.0, 8.0, 6.0, 3.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 4.0, 1.0], "bins": [-3.039836883544922e-05, -2.954527735710144e-05, -2.8692185878753662e-05, -2.7839094400405884e-05, -2.6986002922058105e-05, -2.6132911443710327e-05, -2.527981996536255e-05, -2.442672848701477e-05, -2.3573637008666992e-05, -2.2720545530319214e-05, -2.1867454051971436e-05, -2.1014362573623657e-05, -2.016127109527588e-05, -1.93081796169281e-05, -1.8455088138580322e-05, -1.7601996660232544e-05, -1.6748905181884766e-05, -1.5895813703536987e-05, -1.5042722225189209e-05, -1.418963074684143e-05, -1.3336539268493652e-05, -1.2483447790145874e-05, -1.1630356311798096e-05, -1.0777264833450317e-05, -9.924173355102539e-06, -9.07108187675476e-06, -8.217990398406982e-06, -7.364898920059204e-06, -6.511807441711426e-06, -5.6587159633636475e-06, -4.805624485015869e-06, -3.952533006668091e-06, -3.0994415283203125e-06, -2.246350049972534e-06, -1.3932585716247559e-06, -5.401670932769775e-07, 3.129243850708008e-07, 1.166015863418579e-06, 2.0191073417663574e-06, 2.8721988201141357e-06, 3.725290298461914e-06, 4.578381776809692e-06, 5.431473255157471e-06, 6.284564733505249e-06, 7.137656211853027e-06, 7.990747690200806e-06, 8.843839168548584e-06, 9.696930646896362e-06, 1.055002212524414e-05, 1.1403113603591919e-05, 1.2256205081939697e-05, 1.3109296560287476e-05, 1.3962388038635254e-05, 1.4815479516983032e-05, 1.566857099533081e-05, 1.652166247367859e-05, 1.7374753952026367e-05, 1.8227845430374146e-05, 1.9080936908721924e-05, 1.9934028387069702e-05, 2.078711986541748e-05, 2.164021134376526e-05, 2.2493302822113037e-05, 2.3346394300460815e-05, 2.4199485778808594e-05]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 5.0, 7.0, 3.0, 6.0, 7.0, 12.0, 13.0, 14.0, 20.0, 16.0, 33.0, 41.0, 40.0, 82.0, 122.0, 355.0, 2336.0, 980555.0, 63506.0, 800.0, 211.0, 80.0, 65.0, 36.0, 30.0, 26.0, 20.0, 22.0, 12.0, 14.0, 15.0, 10.0, 4.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000629425048828125, -0.000608980655670166, -0.000588536262512207, -0.000568091869354248, -0.0005476474761962891, -0.0005272030830383301, -0.0005067586898803711, -0.0004863142967224121, -0.0004658699035644531, -0.00044542551040649414, -0.00042498111724853516, -0.00040453672409057617, -0.0003840923309326172, -0.0003636479377746582, -0.0003432035446166992, -0.00032275915145874023, -0.00030231475830078125, -0.00028187036514282227, -0.0002614259719848633, -0.0002409815788269043, -0.0002205371856689453, -0.00020009279251098633, -0.00017964839935302734, -0.00015920400619506836, -0.00013875961303710938, -0.00011831521987915039, -9.78708267211914e-05, -7.742643356323242e-05, -5.698204040527344e-05, -3.653764724731445e-05, -1.609325408935547e-05, 4.351139068603516e-06, 2.47955322265625e-05, 4.5239925384521484e-05, 6.568431854248047e-05, 8.612871170043945e-05, 0.00010657310485839844, 0.00012701749801635742, 0.0001474618911743164, 0.0001679062843322754, 0.00018835067749023438, 0.00020879507064819336, 0.00022923946380615234, 0.00024968385696411133, 0.0002701282501220703, 0.0002905726432800293, 0.0003110170364379883, 0.00033146142959594727, 0.00035190582275390625, 0.00037235021591186523, 0.0003927946090698242, 0.0004132390022277832, 0.0004336833953857422, 0.00045412778854370117, 0.00047457218170166016, 0.0004950165748596191, 0.0005154609680175781, 0.0005359053611755371, 0.0005563497543334961, 0.0005767941474914551, 0.0005972385406494141, 0.000617682933807373, 0.000638127326965332, 0.000658571720123291, 0.00067901611328125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 709.0, 301.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.764181797625497e-05, -8.37785773910582e-06, 8.861024980433285e-07, 1.0150062735192478e-05, 1.9414022972341627e-05, 2.8677983209490776e-05, 3.7941943446639925e-05, 4.7205903683789074e-05, 5.6469863920938224e-05, 6.573382415808737e-05, 7.499778439523652e-05, 8.426174463238567e-05, 9.352570486953482e-05, 0.00010278966510668397, 0.00011205362534383312, 0.00012131758558098227, 0.00013058155309408903, 0.00013984550605528057, 0.00014910947356838733, 0.0001583734410814941, 0.00016763739404268563, 0.00017690134700387716, 0.00018616531451698393, 0.0001954292820300907, 0.00020469323499128222, 0.00021395718795247376, 0.00022322115546558052, 0.00023248512297868729, 0.00024174907593987882, 0.00025101302890107036, 0.00026027701096609235, 0.0002695409639272839, 0.0002788049168884754, 0.00028806886984966695, 0.0002973328228108585, 0.0003065968048758805, 0.000315860757837072, 0.00032512471079826355, 0.00033438869286328554, 0.0003436526458244771, 0.0003529165987856686, 0.00036218055174686015, 0.0003714445047080517, 0.0003807084867730737, 0.0003899724397342652, 0.00039923639269545674, 0.00040850037476047873, 0.00041776432772167027, 0.0004270282806828618, 0.00043629223364405334, 0.0004455561866052449, 0.00045482016867026687, 0.0004640841216314584, 0.00047334807459264994, 0.00048261205665767193, 0.000491875980515033, 0.000501139962580055, 0.000510403944645077, 0.0005196678685024381, 0.0005289318505674601, 0.000538195832632482, 0.0005474597564898431, 0.0005567237385548651, 0.0005659876624122262, 0.0005752516444772482]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 7.0, 10.0, 11.0, 15.0, 19.0, 22.0, 24.0, 34.0, 31.0, 48.0, 42.0, 45.0, 57.0, 50.0, 54.0, 59.0, 49.0, 54.0, 58.0, 45.0, 34.0, 42.0, 36.0, 35.0, 25.0, 27.0, 14.0, 11.0, 10.0, 11.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2470951080322266e-05, -2.1778978407382965e-05, -2.1087005734443665e-05, -2.0395033061504364e-05, -1.9703060388565063e-05, -1.9011087715625763e-05, -1.8319115042686462e-05, -1.7627142369747162e-05, -1.693516969680786e-05, -1.624319702386856e-05, -1.555122435092926e-05, -1.485925167798996e-05, -1.416727900505066e-05, -1.3475306332111359e-05, -1.2783333659172058e-05, -1.2091360986232758e-05, -1.1399388313293457e-05, -1.0707415640354156e-05, -1.0015442967414856e-05, -9.323470294475555e-06, -8.631497621536255e-06, -7.939524948596954e-06, -7.247552275657654e-06, -6.555579602718353e-06, -5.863606929779053e-06, -5.171634256839752e-06, -4.479661583900452e-06, -3.787688910961151e-06, -3.0957162380218506e-06, -2.40374356508255e-06, -1.7117708921432495e-06, -1.019798219203949e-06, -3.2782554626464844e-07, 3.641471266746521e-07, 1.0561197996139526e-06, 1.7480924725532532e-06, 2.4400651454925537e-06, 3.1320378184318542e-06, 3.824010491371155e-06, 4.515983164310455e-06, 5.207955837249756e-06, 5.899928510189056e-06, 6.591901183128357e-06, 7.2838738560676575e-06, 7.975846529006958e-06, 8.667819201946259e-06, 9.359791874885559e-06, 1.005176454782486e-05, 1.074373722076416e-05, 1.143570989370346e-05, 1.2127682566642761e-05, 1.2819655239582062e-05, 1.3511627912521362e-05, 1.4203600585460663e-05, 1.4895573258399963e-05, 1.5587545931339264e-05, 1.6279518604278564e-05, 1.6971491277217865e-05, 1.7663463950157166e-05, 1.8355436623096466e-05, 1.9047409296035767e-05, 1.9739381968975067e-05, 2.0431354641914368e-05, 2.1123327314853668e-05, 2.181529998779297e-05]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 9.0, 8.0, 7.0, 9.0, 15.0, 16.0, 23.0, 20.0, 17.0, 25.0, 27.0, 41.0, 32.0, 38.0, 29.0, 39.0, 39.0, 43.0, 52.0, 49.0, 37.0, 41.0, 47.0, 38.0, 22.0, 33.0, 26.0, 25.0, 24.0, 26.0, 20.0, 18.0, 23.0, 19.0, 13.0, 8.0, 4.0, 7.0, 10.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0], "bins": [-2.48828125, -2.413909912109375, -2.33953857421875, -2.265167236328125, -2.1907958984375, -2.116424560546875, -2.04205322265625, -1.967681884765625, -1.893310546875, -1.818939208984375, -1.74456787109375, -1.670196533203125, -1.5958251953125, -1.521453857421875, -1.44708251953125, -1.372711181640625, -1.29833984375, -1.223968505859375, -1.14959716796875, -1.075225830078125, -1.0008544921875, -0.926483154296875, -0.85211181640625, -0.777740478515625, -0.703369140625, -0.628997802734375, -0.55462646484375, -0.480255126953125, -0.4058837890625, -0.331512451171875, -0.25714111328125, -0.182769775390625, -0.1083984375, -0.034027099609375, 0.04034423828125, 0.114715576171875, 0.1890869140625, 0.263458251953125, 0.33782958984375, 0.412200927734375, 0.486572265625, 0.560943603515625, 0.63531494140625, 0.709686279296875, 0.7840576171875, 0.858428955078125, 0.93280029296875, 1.007171630859375, 1.08154296875, 1.155914306640625, 1.23028564453125, 1.304656982421875, 1.3790283203125, 1.453399658203125, 1.52777099609375, 1.602142333984375, 1.676513671875, 1.750885009765625, 1.82525634765625, 1.899627685546875, 1.9739990234375, 2.048370361328125, 2.12274169921875, 2.197113037109375, 2.271484375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 10.0, 6.0, 11.0, 13.0, 23.0, 33.0, 55.0, 73.0, 130.0, 184.0, 311.0, 463.0, 749.0, 1186.0, 2055.0, 3516.0, 6418.0, 11873.0, 23216.0, 48241.0, 113769.0, 376519.0, 283912.0, 91983.0, 40485.0, 19716.0, 10216.0, 5604.0, 3162.0, 1693.0, 1049.0, 711.0, 431.0, 251.0, 182.0, 102.0, 76.0, 62.0, 26.0, 16.0, 15.0, 11.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.568359375, -3.47161865234375, -3.3748779296875, -3.27813720703125, -3.181396484375, -3.08465576171875, -2.9879150390625, -2.89117431640625, -2.79443359375, -2.69769287109375, -2.6009521484375, -2.50421142578125, -2.407470703125, -2.31072998046875, -2.2139892578125, -2.11724853515625, -2.0205078125, -1.92376708984375, -1.8270263671875, -1.73028564453125, -1.633544921875, -1.53680419921875, -1.4400634765625, -1.34332275390625, -1.24658203125, -1.14984130859375, -1.0531005859375, -0.95635986328125, -0.859619140625, -0.76287841796875, -0.6661376953125, -0.56939697265625, -0.47265625, -0.37591552734375, -0.2791748046875, -0.18243408203125, -0.085693359375, 0.01104736328125, 0.1077880859375, 0.20452880859375, 0.30126953125, 0.39801025390625, 0.4947509765625, 0.59149169921875, 0.688232421875, 0.78497314453125, 0.8817138671875, 0.97845458984375, 1.0751953125, 1.17193603515625, 1.2686767578125, 1.36541748046875, 1.462158203125, 1.55889892578125, 1.6556396484375, 1.75238037109375, 1.84912109375, 1.94586181640625, 2.0426025390625, 2.13934326171875, 2.236083984375, 2.33282470703125, 2.4295654296875, 2.52630615234375, 2.623046875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 7.0, 8.0, 14.0, 17.0, 15.0, 22.0, 24.0, 19.0, 32.0, 33.0, 38.0, 39.0, 55.0, 68.0, 103.0, 207.0, 1622.0, 216.0, 97.0, 53.0, 46.0, 42.0, 52.0, 41.0, 24.0, 33.0, 26.0, 20.0, 9.0, 10.0, 8.0, 12.0, 3.0, 5.0, 7.0, 4.0, 3.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-11.015625, -10.7144775390625, -10.413330078125, -10.1121826171875, -9.81103515625, -9.5098876953125, -9.208740234375, -8.9075927734375, -8.6064453125, -8.3052978515625, -8.004150390625, -7.7030029296875, -7.40185546875, -7.1007080078125, -6.799560546875, -6.4984130859375, -6.197265625, -5.8961181640625, -5.594970703125, -5.2938232421875, -4.99267578125, -4.6915283203125, -4.390380859375, -4.0892333984375, -3.7880859375, -3.4869384765625, -3.185791015625, -2.8846435546875, -2.58349609375, -2.2823486328125, -1.981201171875, -1.6800537109375, -1.37890625, -1.0777587890625, -0.776611328125, -0.4754638671875, -0.17431640625, 0.1268310546875, 0.427978515625, 0.7291259765625, 1.0302734375, 1.3314208984375, 1.632568359375, 1.9337158203125, 2.23486328125, 2.5360107421875, 2.837158203125, 3.1383056640625, 3.439453125, 3.7406005859375, 4.041748046875, 4.3428955078125, 4.64404296875, 4.9451904296875, 5.246337890625, 5.5474853515625, 5.8486328125, 6.1497802734375, 6.450927734375, 6.7520751953125, 7.05322265625, 7.3543701171875, 7.655517578125, 7.9566650390625, 8.2578125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 7.0, 4.0, 4.0, 7.0, 8.0, 7.0, 15.0, 12.0, 35.0, 27.0, 63.0, 67.0, 88.0, 107.0, 164.0, 263.0, 536.0, 2105.0, 16781.0, 458569.0, 2614086.0, 46518.0, 4327.0, 855.0, 309.0, 214.0, 125.0, 91.0, 63.0, 60.0, 34.0, 41.0, 20.0, 26.0, 15.0, 13.0, 13.0, 9.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.5234375, -12.0628662109375, -11.602294921875, -11.1417236328125, -10.68115234375, -10.2205810546875, -9.760009765625, -9.2994384765625, -8.8388671875, -8.3782958984375, -7.917724609375, -7.4571533203125, -6.99658203125, -6.5360107421875, -6.075439453125, -5.6148681640625, -5.154296875, -4.6937255859375, -4.233154296875, -3.7725830078125, -3.31201171875, -2.8514404296875, -2.390869140625, -1.9302978515625, -1.4697265625, -1.0091552734375, -0.548583984375, -0.0880126953125, 0.37255859375, 0.8331298828125, 1.293701171875, 1.7542724609375, 2.21484375, 2.6754150390625, 3.135986328125, 3.5965576171875, 4.05712890625, 4.5177001953125, 4.978271484375, 5.4388427734375, 5.8994140625, 6.3599853515625, 6.820556640625, 7.2811279296875, 7.74169921875, 8.2022705078125, 8.662841796875, 9.1234130859375, 9.583984375, 10.0445556640625, 10.505126953125, 10.9656982421875, 11.42626953125, 11.8868408203125, 12.347412109375, 12.8079833984375, 13.2685546875, 13.7291259765625, 14.189697265625, 14.6502685546875, 15.11083984375, 15.5714111328125, 16.031982421875, 16.4925537109375, 16.953125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 68.0, 284.0, 455.0, 176.0, 24.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.61382293701172, -100.4881820678711, -98.36254119873047, -96.23690032958984, -94.11125183105469, -91.98561096191406, -89.85997009277344, -87.73432922363281, -85.60868835449219, -83.48304748535156, -81.35740661621094, -79.23176574707031, -77.10612487792969, -74.98047637939453, -72.8548355102539, -70.72919464111328, -68.60355377197266, -66.47791290283203, -64.3522720336914, -62.226627349853516, -60.10098648071289, -57.975345611572266, -55.849700927734375, -53.72406005859375, -51.598419189453125, -49.4727783203125, -47.347137451171875, -45.221492767333984, -43.09585189819336, -40.970211029052734, -38.844566345214844, -36.71892547607422, -34.59328842163086, -32.467647552490234, -30.342004776000977, -28.21636199951172, -26.090721130371094, -23.96508026123047, -21.83943748474121, -19.713794708251953, -17.588153839111328, -15.462512016296387, -13.336870193481445, -11.211228370666504, -9.085586547851562, -6.959944725036621, -4.83430290222168, -2.7086610794067383, -0.5830192565917969, 1.5426225662231445, 3.668264389038086, 5.793906211853027, 7.919548034667969, 10.04518985748291, 12.170831680297852, 14.296473503112793, 16.422115325927734, 18.54775619506836, 20.673398971557617, 22.799041748046875, 24.9246826171875, 27.050323486328125, 29.175966262817383, 31.30160903930664, 33.427249908447266]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 8.0, 2.0, 8.0, 9.0, 9.0, 12.0, 17.0, 15.0, 24.0, 21.0, 25.0, 29.0, 28.0, 32.0, 35.0, 41.0, 35.0, 31.0, 40.0, 43.0, 34.0, 37.0, 33.0, 46.0, 47.0, 45.0, 29.0, 31.0, 30.0, 34.0, 25.0, 20.0, 22.0, 15.0, 13.0, 13.0, 15.0, 11.0, 7.0, 6.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-25.032007217407227, -24.260358810424805, -23.488710403442383, -22.717063903808594, -21.945415496826172, -21.17376708984375, -20.402118682861328, -19.630470275878906, -18.858821868896484, -18.087173461914062, -17.31552505493164, -16.54387664794922, -15.77223014831543, -15.000581741333008, -14.228933334350586, -13.457284927368164, -12.685638427734375, -11.913990020751953, -11.142342567443848, -10.370694160461426, -9.59904670715332, -8.827398300170898, -8.055749893188477, -7.284101963043213, -6.512454032897949, -5.7408061027526855, -4.969158172607422, -4.197509765625, -3.4258618354797363, -2.6542139053344727, -1.8825654983520508, -1.110917568206787, -0.33927154541015625, 0.432376503944397, 1.2040245532989502, 1.975672721862793, 2.7473206520080566, 3.5189685821533203, 4.290616989135742, 5.062264919281006, 5.8339128494262695, 6.605560779571533, 7.377208709716797, 8.148857116699219, 8.92050552368164, 9.692152976989746, 10.463801383972168, 11.235448837280273, 12.007097244262695, 12.778745651245117, 13.550393104553223, 14.322041511535645, 15.09368896484375, 15.865337371826172, 16.636985778808594, 17.408634185791016, 18.180282592773438, 18.95193099975586, 19.72357940673828, 20.495227813720703, 21.266874313354492, 22.038522720336914, 22.810171127319336, 23.581819534301758, 24.353466033935547]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 7.0, 5.0, 9.0, 17.0, 19.0, 19.0, 21.0, 19.0, 31.0, 44.0, 44.0, 26.0, 31.0, 29.0, 37.0, 39.0, 57.0, 48.0, 52.0, 42.0, 30.0, 42.0, 32.0, 30.0, 33.0, 27.0, 25.0, 24.0, 26.0, 20.0, 22.0, 22.0, 10.0, 12.0, 8.0, 6.0, 8.0, 6.0, 1.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.63671875, -2.556732177734375, -2.47674560546875, -2.396759033203125, -2.3167724609375, -2.236785888671875, -2.15679931640625, -2.076812744140625, -1.996826171875, -1.916839599609375, -1.83685302734375, -1.756866455078125, -1.6768798828125, -1.596893310546875, -1.51690673828125, -1.436920166015625, -1.35693359375, -1.276947021484375, -1.19696044921875, -1.116973876953125, -1.0369873046875, -0.957000732421875, -0.87701416015625, -0.797027587890625, -0.717041015625, -0.637054443359375, -0.55706787109375, -0.477081298828125, -0.3970947265625, -0.317108154296875, -0.23712158203125, -0.157135009765625, -0.0771484375, 0.002838134765625, 0.08282470703125, 0.162811279296875, 0.2427978515625, 0.322784423828125, 0.40277099609375, 0.482757568359375, 0.562744140625, 0.642730712890625, 0.72271728515625, 0.802703857421875, 0.8826904296875, 0.962677001953125, 1.04266357421875, 1.122650146484375, 1.20263671875, 1.282623291015625, 1.36260986328125, 1.442596435546875, 1.5225830078125, 1.602569580078125, 1.68255615234375, 1.762542724609375, 1.842529296875, 1.922515869140625, 2.00250244140625, 2.082489013671875, 2.1624755859375, 2.242462158203125, 2.32244873046875, 2.402435302734375, 2.482421875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 6.0, 5.0, 8.0, 7.0, 8.0, 14.0, 30.0, 41.0, 49.0, 76.0, 115.0, 181.0, 255.0, 430.0, 649.0, 1090.0, 1729.0, 3255.0, 6001.0, 11987.0, 26769.0, 60552.0, 151239.0, 440919.0, 1255865.0, 1413774.0, 518900.0, 173594.0, 68200.0, 29595.0, 13718.0, 6633.0, 3544.0, 1902.0, 1149.0, 695.0, 419.0, 257.0, 189.0, 135.0, 92.0, 60.0, 42.0, 46.0, 21.0, 16.0, 16.0, 11.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.865234375, -3.744720458984375, -3.62420654296875, -3.503692626953125, -3.3831787109375, -3.262664794921875, -3.14215087890625, -3.021636962890625, -2.901123046875, -2.780609130859375, -2.66009521484375, -2.539581298828125, -2.4190673828125, -2.298553466796875, -2.17803955078125, -2.057525634765625, -1.93701171875, -1.816497802734375, -1.69598388671875, -1.575469970703125, -1.4549560546875, -1.334442138671875, -1.21392822265625, -1.093414306640625, -0.972900390625, -0.852386474609375, -0.73187255859375, -0.611358642578125, -0.4908447265625, -0.370330810546875, -0.24981689453125, -0.129302978515625, -0.0087890625, 0.111724853515625, 0.23223876953125, 0.352752685546875, 0.4732666015625, 0.593780517578125, 0.71429443359375, 0.834808349609375, 0.955322265625, 1.075836181640625, 1.19635009765625, 1.316864013671875, 1.4373779296875, 1.557891845703125, 1.67840576171875, 1.798919677734375, 1.91943359375, 2.039947509765625, 2.16046142578125, 2.280975341796875, 2.4014892578125, 2.522003173828125, 2.64251708984375, 2.763031005859375, 2.883544921875, 3.004058837890625, 3.12457275390625, 3.245086669921875, 3.3656005859375, 3.486114501953125, 3.60662841796875, 3.727142333984375, 3.84765625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 4.0, 7.0, 10.0, 23.0, 24.0, 38.0, 51.0, 66.0, 103.0, 118.0, 131.0, 246.0, 301.0, 418.0, 460.0, 450.0, 415.0, 323.0, 222.0, 189.0, 133.0, 108.0, 69.0, 48.0, 37.0, 26.0, 12.0, 7.0, 9.0, 7.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.94921875, -6.7325439453125, -6.515869140625, -6.2991943359375, -6.08251953125, -5.8658447265625, -5.649169921875, -5.4324951171875, -5.2158203125, -4.9991455078125, -4.782470703125, -4.5657958984375, -4.34912109375, -4.1324462890625, -3.915771484375, -3.6990966796875, -3.482421875, -3.2657470703125, -3.049072265625, -2.8323974609375, -2.61572265625, -2.3990478515625, -2.182373046875, -1.9656982421875, -1.7490234375, -1.5323486328125, -1.315673828125, -1.0989990234375, -0.88232421875, -0.6656494140625, -0.448974609375, -0.2322998046875, -0.015625, 0.2010498046875, 0.417724609375, 0.6343994140625, 0.85107421875, 1.0677490234375, 1.284423828125, 1.5010986328125, 1.7177734375, 1.9344482421875, 2.151123046875, 2.3677978515625, 2.58447265625, 2.8011474609375, 3.017822265625, 3.2344970703125, 3.451171875, 3.6678466796875, 3.884521484375, 4.1011962890625, 4.31787109375, 4.5345458984375, 4.751220703125, 4.9678955078125, 5.1845703125, 5.4012451171875, 5.617919921875, 5.8345947265625, 6.05126953125, 6.2679443359375, 6.484619140625, 6.7012939453125, 6.91796875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 7.0, 4.0, 13.0, 13.0, 24.0, 26.0, 49.0, 61.0, 87.0, 157.0, 294.0, 611.0, 1341.0, 4383.0, 19602.0, 123650.0, 1042918.0, 2562754.0, 374132.0, 50361.0, 9410.0, 2452.0, 862.0, 412.0, 192.0, 153.0, 89.0, 66.0, 44.0, 27.0, 17.0, 16.0, 9.0, 13.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.671875, -11.2862548828125, -10.900634765625, -10.5150146484375, -10.12939453125, -9.7437744140625, -9.358154296875, -8.9725341796875, -8.5869140625, -8.2012939453125, -7.815673828125, -7.4300537109375, -7.04443359375, -6.6588134765625, -6.273193359375, -5.8875732421875, -5.501953125, -5.1163330078125, -4.730712890625, -4.3450927734375, -3.95947265625, -3.5738525390625, -3.188232421875, -2.8026123046875, -2.4169921875, -2.0313720703125, -1.645751953125, -1.2601318359375, -0.87451171875, -0.4888916015625, -0.103271484375, 0.2823486328125, 0.66796875, 1.0535888671875, 1.439208984375, 1.8248291015625, 2.21044921875, 2.5960693359375, 2.981689453125, 3.3673095703125, 3.7529296875, 4.1385498046875, 4.524169921875, 4.9097900390625, 5.29541015625, 5.6810302734375, 6.066650390625, 6.4522705078125, 6.837890625, 7.2235107421875, 7.609130859375, 7.9947509765625, 8.38037109375, 8.7659912109375, 9.151611328125, 9.5372314453125, 9.9228515625, 10.3084716796875, 10.694091796875, 11.0797119140625, 11.46533203125, 11.8509521484375, 12.236572265625, 12.6221923828125, 13.0078125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 11.0, 32.0, 28.0, 55.0, 55.0, 91.0, 97.0, 103.0, 101.0, 107.0, 86.0, 69.0, 54.0, 38.0, 27.0, 20.0, 13.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-55.894630432128906, -54.689579010009766, -53.48453140258789, -52.27947998046875, -51.074432373046875, -49.869380950927734, -48.66433334350586, -47.45928192138672, -46.254234313964844, -45.0491828918457, -43.84413528442383, -42.63908386230469, -41.43403625488281, -40.22898483276367, -39.0239372253418, -37.818885803222656, -36.613834381103516, -35.408782958984375, -34.2037353515625, -32.99868392944336, -31.793636322021484, -30.588584899902344, -29.383535385131836, -28.178485870361328, -26.97343635559082, -25.768386840820312, -24.563337326049805, -23.358287811279297, -22.153236389160156, -20.94818878173828, -19.74313735961914, -18.538087844848633, -17.33303451538086, -16.12798500061035, -14.922935485839844, -13.71788501739502, -12.512835502624512, -11.307785987854004, -10.10273551940918, -8.897686004638672, -7.692636489868164, -6.487586975097656, -5.28253698348999, -4.077486991882324, -2.8724374771118164, -1.6673879623413086, -0.4623379707336426, 0.7427120208740234, 1.9477615356445312, 3.152811288833618, 4.357861042022705, 5.562911033630371, 6.767960548400879, 7.973010063171387, 9.178060531616211, 10.383110046386719, 11.588159561157227, 12.793209075927734, 13.998258590698242, 15.203309059143066, 16.40835952758789, 17.613407135009766, 18.818458557128906, 20.023508071899414, 21.228557586669922]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 15.0, 12.0, 16.0, 10.0, 18.0, 14.0, 26.0, 22.0, 27.0, 28.0, 32.0, 52.0, 34.0, 43.0, 40.0, 56.0, 52.0, 47.0, 46.0, 41.0, 50.0, 33.0, 34.0, 43.0, 33.0, 30.0, 32.0, 20.0, 12.0, 18.0, 19.0, 9.0, 9.0, 5.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.433258056640625, -22.67607307434082, -21.91888999938965, -21.161705017089844, -20.40452003479004, -19.647335052490234, -18.890151977539062, -18.132966995239258, -17.375782012939453, -16.61859703063965, -15.86141300201416, -15.104228973388672, -14.347043991088867, -13.589859962463379, -12.83267593383789, -12.075490951538086, -11.318307876586914, -10.561123847961426, -9.803938865661621, -9.046754837036133, -8.289569854736328, -7.53238582611084, -6.775201797485352, -6.018017292022705, -5.260832786560059, -4.503648281097412, -3.7464640140533447, -2.9892797470092773, -2.232095241546631, -1.4749107360839844, -0.7177267074584961, 0.03945779800415039, 0.7966423034667969, 1.5538266897201538, 2.3110110759735107, 3.068195343017578, 3.8253798484802246, 4.582564353942871, 5.339748382568359, 6.096932888031006, 6.854117393493652, 7.611301898956299, 8.368486404418945, 9.125670433044434, 9.882854461669922, 10.640039443969727, 11.397223472595215, 12.154407501220703, 12.911592483520508, 13.668776512145996, 14.4259614944458, 15.183145523071289, 15.940330505371094, 16.697513580322266, 17.45469856262207, 18.211883544921875, 18.969066619873047, 19.72625160217285, 20.483434677124023, 21.240619659423828, 21.997804641723633, 22.754989624023438, 23.51217269897461, 24.269357681274414, 25.02654266357422]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 7.0, 12.0, 10.0, 20.0, 22.0, 19.0, 24.0, 27.0, 25.0, 29.0, 39.0, 35.0, 32.0, 51.0, 43.0, 49.0, 51.0, 41.0, 38.0, 37.0, 34.0, 45.0, 38.0, 26.0, 27.0, 24.0, 26.0, 29.0, 21.0, 14.0, 15.0, 14.0, 14.0, 16.0, 6.0, 10.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.517578125, -2.43463134765625, -2.3516845703125, -2.26873779296875, -2.185791015625, -2.10284423828125, -2.0198974609375, -1.93695068359375, -1.85400390625, -1.77105712890625, -1.6881103515625, -1.60516357421875, -1.522216796875, -1.43927001953125, -1.3563232421875, -1.27337646484375, -1.1904296875, -1.10748291015625, -1.0245361328125, -0.94158935546875, -0.858642578125, -0.77569580078125, -0.6927490234375, -0.60980224609375, -0.52685546875, -0.44390869140625, -0.3609619140625, -0.27801513671875, -0.195068359375, -0.11212158203125, -0.0291748046875, 0.05377197265625, 0.13671875, 0.21966552734375, 0.3026123046875, 0.38555908203125, 0.468505859375, 0.55145263671875, 0.6343994140625, 0.71734619140625, 0.80029296875, 0.88323974609375, 0.9661865234375, 1.04913330078125, 1.132080078125, 1.21502685546875, 1.2979736328125, 1.38092041015625, 1.4638671875, 1.54681396484375, 1.6297607421875, 1.71270751953125, 1.795654296875, 1.87860107421875, 1.9615478515625, 2.04449462890625, 2.12744140625, 2.21038818359375, 2.2933349609375, 2.37628173828125, 2.459228515625, 2.54217529296875, 2.6251220703125, 2.70806884765625, 2.791015625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 9.0, 8.0, 11.0, 17.0, 23.0, 36.0, 50.0, 60.0, 113.0, 172.0, 244.0, 432.0, 661.0, 1085.0, 1667.0, 2722.0, 4388.0, 7014.0, 11617.0, 19501.0, 32889.0, 58034.0, 109740.0, 265367.0, 276260.0, 112881.0, 59479.0, 33526.0, 19654.0, 11701.0, 7294.0, 4410.0, 2776.0, 1720.0, 1117.0, 693.0, 419.0, 285.0, 184.0, 103.0, 77.0, 39.0, 34.0, 22.0, 16.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.131103515625, -0.1268768310546875, -0.122650146484375, -0.1184234619140625, -0.11419677734375, -0.1099700927734375, -0.105743408203125, -0.1015167236328125, -0.0972900390625, -0.0930633544921875, -0.088836669921875, -0.0846099853515625, -0.08038330078125, -0.0761566162109375, -0.071929931640625, -0.0677032470703125, -0.0634765625, -0.0592498779296875, -0.055023193359375, -0.0507965087890625, -0.04656982421875, -0.0423431396484375, -0.038116455078125, -0.0338897705078125, -0.0296630859375, -0.0254364013671875, -0.021209716796875, -0.0169830322265625, -0.01275634765625, -0.0085296630859375, -0.004302978515625, -7.62939453125e-05, 0.004150390625, 0.0083770751953125, 0.012603759765625, 0.0168304443359375, 0.02105712890625, 0.0252838134765625, 0.029510498046875, 0.0337371826171875, 0.0379638671875, 0.0421905517578125, 0.046417236328125, 0.0506439208984375, 0.05487060546875, 0.0590972900390625, 0.063323974609375, 0.0675506591796875, 0.07177734375, 0.0760040283203125, 0.080230712890625, 0.0844573974609375, 0.08868408203125, 0.0929107666015625, 0.097137451171875, 0.1013641357421875, 0.1055908203125, 0.1098175048828125, 0.114044189453125, 0.1182708740234375, 0.12249755859375, 0.1267242431640625, 0.130950927734375, 0.1351776123046875, 0.139404296875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 9.0, 7.0, 7.0, 8.0, 9.0, 10.0, 17.0, 21.0, 24.0, 20.0, 15.0, 34.0, 31.0, 32.0, 50.0, 29.0, 38.0, 35.0, 48.0, 56.0, 1076.0, 50.0, 36.0, 41.0, 41.0, 29.0, 36.0, 27.0, 34.0, 21.0, 30.0, 17.0, 22.0, 17.0, 9.0, 7.0, 4.0, 8.0, 6.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7802734375, -1.7191925048828125, -1.658111572265625, -1.5970306396484375, -1.53594970703125, -1.4748687744140625, -1.413787841796875, -1.3527069091796875, -1.2916259765625, -1.2305450439453125, -1.169464111328125, -1.1083831787109375, -1.04730224609375, -0.9862213134765625, -0.925140380859375, -0.8640594482421875, -0.802978515625, -0.7418975830078125, -0.680816650390625, -0.6197357177734375, -0.55865478515625, -0.4975738525390625, -0.436492919921875, -0.3754119873046875, -0.3143310546875, -0.2532501220703125, -0.192169189453125, -0.1310882568359375, -0.07000732421875, -0.0089263916015625, 0.052154541015625, 0.1132354736328125, 0.17431640625, 0.2353973388671875, 0.296478271484375, 0.3575592041015625, 0.41864013671875, 0.4797210693359375, 0.540802001953125, 0.6018829345703125, 0.6629638671875, 0.7240447998046875, 0.785125732421875, 0.8462066650390625, 0.90728759765625, 0.9683685302734375, 1.029449462890625, 1.0905303955078125, 1.151611328125, 1.2126922607421875, 1.273773193359375, 1.3348541259765625, 1.39593505859375, 1.4570159912109375, 1.518096923828125, 1.5791778564453125, 1.6402587890625, 1.7013397216796875, 1.762420654296875, 1.8235015869140625, 1.88458251953125, 1.9456634521484375, 2.006744384765625, 2.0678253173828125, 2.12890625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 2.0, 7.0, 10.0, 7.0, 11.0, 23.0, 31.0, 60.0, 80.0, 121.0, 145.0, 225.0, 348.0, 530.0, 690.0, 1030.0, 1506.0, 2156.0, 3144.0, 4727.0, 6935.0, 10367.0, 15402.0, 24168.0, 37588.0, 62197.0, 108078.0, 207715.0, 1291576.0, 125376.0, 70828.0, 42802.0, 26699.0, 17319.0, 11104.0, 7625.0, 5221.0, 3593.0, 2354.0, 1689.0, 1155.0, 778.0, 532.0, 390.0, 254.0, 178.0, 105.0, 100.0, 56.0, 34.0, 15.0, 22.0, 8.0, 10.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0], "bins": [-0.0433349609375, -0.04198598861694336, -0.04063701629638672, -0.03928804397583008, -0.03793907165527344, -0.0365900993347168, -0.035241127014160156, -0.033892154693603516, -0.032543182373046875, -0.031194210052490234, -0.029845237731933594, -0.028496265411376953, -0.027147293090820312, -0.025798320770263672, -0.02444934844970703, -0.02310037612915039, -0.02175140380859375, -0.02040243148803711, -0.01905345916748047, -0.017704486846923828, -0.016355514526367188, -0.015006542205810547, -0.013657569885253906, -0.012308597564697266, -0.010959625244140625, -0.009610652923583984, -0.008261680603027344, -0.006912708282470703, -0.0055637359619140625, -0.004214763641357422, -0.0028657913208007812, -0.0015168190002441406, -0.0001678466796875, 0.0011811256408691406, 0.0025300979614257812, 0.003879070281982422, 0.0052280426025390625, 0.006577014923095703, 0.007925987243652344, 0.009274959564208984, 0.010623931884765625, 0.011972904205322266, 0.013321876525878906, 0.014670848846435547, 0.016019821166992188, 0.017368793487548828, 0.01871776580810547, 0.02006673812866211, 0.02141571044921875, 0.02276468276977539, 0.02411365509033203, 0.025462627410888672, 0.026811599731445312, 0.028160572052001953, 0.029509544372558594, 0.030858516693115234, 0.032207489013671875, 0.033556461334228516, 0.034905433654785156, 0.0362544059753418, 0.03760337829589844, 0.03895235061645508, 0.04030132293701172, 0.04165029525756836, 0.042999267578125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 7.0, 4.0, 1.0, 7.0, 8.0, 14.0, 16.0, 21.0, 16.0, 20.0, 18.0, 46.0, 64.0, 76.0, 132.0, 140.0, 97.0, 81.0, 53.0, 42.0, 22.0, 29.0, 16.0, 6.0, 12.0, 12.0, 10.0, 5.0, 11.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8014183044433594e-05, -2.7145259082317352e-05, -2.627633512020111e-05, -2.540741115808487e-05, -2.4538487195968628e-05, -2.3669563233852386e-05, -2.2800639271736145e-05, -2.1931715309619904e-05, -2.1062791347503662e-05, -2.019386738538742e-05, -1.932494342327118e-05, -1.8456019461154938e-05, -1.7587095499038696e-05, -1.6718171536922455e-05, -1.5849247574806213e-05, -1.4980323612689972e-05, -1.411139965057373e-05, -1.3242475688457489e-05, -1.2373551726341248e-05, -1.1504627764225006e-05, -1.0635703802108765e-05, -9.766779839992523e-06, -8.897855877876282e-06, -8.02893191576004e-06, -7.160007953643799e-06, -6.291083991527557e-06, -5.422160029411316e-06, -4.5532360672950745e-06, -3.684312105178833e-06, -2.8153881430625916e-06, -1.94646418094635e-06, -1.0775402188301086e-06, -2.086162567138672e-07, 6.603077054023743e-07, 1.5292316675186157e-06, 2.398155629634857e-06, 3.2670795917510986e-06, 4.13600355386734e-06, 5.0049275159835815e-06, 5.873851478099823e-06, 6.7427754402160645e-06, 7.611699402332306e-06, 8.480623364448547e-06, 9.349547326564789e-06, 1.021847128868103e-05, 1.1087395250797272e-05, 1.1956319212913513e-05, 1.2825243175029755e-05, 1.3694167137145996e-05, 1.4563091099262238e-05, 1.543201506137848e-05, 1.630093902349472e-05, 1.7169862985610962e-05, 1.8038786947727203e-05, 1.8907710909843445e-05, 1.9776634871959686e-05, 2.0645558834075928e-05, 2.151448279619217e-05, 2.238340675830841e-05, 2.3252330720424652e-05, 2.4121254682540894e-05, 2.4990178644657135e-05, 2.5859102606773376e-05, 2.6728026568889618e-05, 2.759695053100586e-05]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 2.0, 3.0, 10.0, 7.0, 11.0, 11.0, 10.0, 19.0, 24.0, 32.0, 41.0, 49.0, 113.0, 242.0, 3269.0, 1016475.0, 27421.0, 422.0, 149.0, 71.0, 28.0, 26.0, 22.0, 21.0, 16.0, 18.0, 11.0, 5.0, 4.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006861686706542969, -0.0006645023822784424, -0.0006428360939025879, -0.0006211698055267334, -0.0005995035171508789, -0.0005778372287750244, -0.0005561709403991699, -0.0005345046520233154, -0.0005128383636474609, -0.0004911720752716064, -0.00046950578689575195, -0.00044783949851989746, -0.00042617321014404297, -0.0004045069217681885, -0.000382840633392334, -0.0003611743450164795, -0.000339508056640625, -0.0003178417682647705, -0.000296175479888916, -0.0002745091915130615, -0.00025284290313720703, -0.00023117661476135254, -0.00020951032638549805, -0.00018784403800964355, -0.00016617774963378906, -0.00014451146125793457, -0.00012284517288208008, -0.00010117888450622559, -7.95125961303711e-05, -5.78463077545166e-05, -3.618001937866211e-05, -1.4513731002807617e-05, 7.152557373046875e-06, 2.8818845748901367e-05, 5.048513412475586e-05, 7.215142250061035e-05, 9.381771087646484e-05, 0.00011548399925231934, 0.00013715028762817383, 0.00015881657600402832, 0.0001804828643798828, 0.0002021491527557373, 0.0002238154411315918, 0.0002454817295074463, 0.0002671480178833008, 0.0002888143062591553, 0.00031048059463500977, 0.00033214688301086426, 0.00035381317138671875, 0.00037547945976257324, 0.00039714574813842773, 0.0004188120365142822, 0.0004404783248901367, 0.0004621446132659912, 0.0004838109016418457, 0.0005054771900177002, 0.0005271434783935547, 0.0005488097667694092, 0.0005704760551452637, 0.0005921423435211182, 0.0006138086318969727, 0.0006354749202728271, 0.0006571412086486816, 0.0006788074970245361, 0.0007004737854003906]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [30.0, 955.0, 33.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4839413779554889e-05, -4.97347537020687e-06, 4.892463039141148e-06, 1.4758401448489167e-05, 2.4624339857837185e-05, 3.44902764481958e-05, 4.435621667653322e-05, 5.4222156904870644e-05, 6.408808985725045e-05, 7.395402644760907e-05, 8.381996303796768e-05, 9.368590690428391e-05, 0.00010355184349464253, 0.00011341778008500114, 0.00012328372395131737, 0.00013314966054167598, 0.0001430155971320346, 0.00015288153372239321, 0.00016274747031275183, 0.00017261340690311044, 0.0001824793580453843, 0.0001923452946357429, 0.00020221123122610152, 0.00021207716781646013, 0.00022194310440681875, 0.00023180904099717736, 0.00024167497758753598, 0.0002515409141778946, 0.0002614068507682532, 0.0002712727873586118, 0.00028113872394897044, 0.00029100466053932905, 0.0003008706262335181, 0.00031073656282387674, 0.00032060249941423535, 0.00033046843600459397, 0.0003403343725949526, 0.0003502003091853112, 0.0003600662457756698, 0.0003699322114698589, 0.00037979811895638704, 0.00038966405554674566, 0.00039952999213710427, 0.0004093959287274629, 0.0004192618653178215, 0.0004291278019081801, 0.00043899373849853873, 0.0004488597041927278, 0.0004587256407830864, 0.00046859157737344503, 0.00047845751396380365, 0.0004883234505541623, 0.0004981894162483513, 0.0005080553237348795, 0.0005179212894290686, 0.0005277871969155967, 0.0005376531626097858, 0.0005475191283039749, 0.000557385035790503, 0.0005672510014846921, 0.0005771169089712203, 0.0005869828746654093, 0.0005968487821519375, 0.0006067147478461266, 0.0006165806553326547]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 11.0, 2.0, 10.0, 15.0, 8.0, 15.0, 28.0, 22.0, 27.0, 28.0, 41.0, 36.0, 42.0, 45.0, 47.0, 43.0, 59.0, 47.0, 49.0, 56.0, 54.0, 57.0, 51.0, 45.0, 23.0, 36.0, 31.0, 21.0, 12.0, 14.0, 7.0, 10.0, 4.0, 7.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09808349609375e-05, -2.04332172870636e-05, -1.9885599613189697e-05, -1.9337981939315796e-05, -1.8790364265441895e-05, -1.8242746591567993e-05, -1.7695128917694092e-05, -1.714751124382019e-05, -1.659989356994629e-05, -1.6052275896072388e-05, -1.5504658222198486e-05, -1.4957040548324585e-05, -1.4409422874450684e-05, -1.3861805200576782e-05, -1.3314187526702881e-05, -1.276656985282898e-05, -1.2218952178955078e-05, -1.1671334505081177e-05, -1.1123716831207275e-05, -1.0576099157333374e-05, -1.0028481483459473e-05, -9.480863809585571e-06, -8.93324613571167e-06, -8.385628461837769e-06, -7.838010787963867e-06, -7.290393114089966e-06, -6.7427754402160645e-06, -6.195157766342163e-06, -5.647540092468262e-06, -5.09992241859436e-06, -4.552304744720459e-06, -4.004687070846558e-06, -3.4570693969726562e-06, -2.909451723098755e-06, -2.3618340492248535e-06, -1.8142163753509521e-06, -1.2665987014770508e-06, -7.189810276031494e-07, -1.7136335372924805e-07, 3.762543201446533e-07, 9.238719940185547e-07, 1.471489667892456e-06, 2.0191073417663574e-06, 2.566725015640259e-06, 3.11434268951416e-06, 3.6619603633880615e-06, 4.209578037261963e-06, 4.757195711135864e-06, 5.304813385009766e-06, 5.852431058883667e-06, 6.400048732757568e-06, 6.94766640663147e-06, 7.495284080505371e-06, 8.042901754379272e-06, 8.590519428253174e-06, 9.138137102127075e-06, 9.685754776000977e-06, 1.0233372449874878e-05, 1.078099012374878e-05, 1.132860779762268e-05, 1.1876225471496582e-05, 1.2423843145370483e-05, 1.2971460819244385e-05, 1.3519078493118286e-05, 1.4066696166992188e-05]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 7.0, 12.0, 10.0, 20.0, 22.0, 19.0, 24.0, 27.0, 25.0, 29.0, 39.0, 35.0, 32.0, 51.0, 43.0, 49.0, 51.0, 41.0, 38.0, 37.0, 34.0, 45.0, 38.0, 26.0, 27.0, 24.0, 26.0, 29.0, 21.0, 14.0, 15.0, 14.0, 14.0, 16.0, 6.0, 10.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.517578125, -2.43463134765625, -2.3516845703125, -2.26873779296875, -2.185791015625, -2.10284423828125, -2.0198974609375, -1.93695068359375, -1.85400390625, -1.77105712890625, -1.6881103515625, -1.60516357421875, -1.522216796875, -1.43927001953125, -1.3563232421875, -1.27337646484375, -1.1904296875, -1.10748291015625, -1.0245361328125, -0.94158935546875, -0.858642578125, -0.77569580078125, -0.6927490234375, -0.60980224609375, -0.52685546875, -0.44390869140625, -0.3609619140625, -0.27801513671875, -0.195068359375, -0.11212158203125, -0.0291748046875, 0.05377197265625, 0.13671875, 0.21966552734375, 0.3026123046875, 0.38555908203125, 0.468505859375, 0.55145263671875, 0.6343994140625, 0.71734619140625, 0.80029296875, 0.88323974609375, 0.9661865234375, 1.04913330078125, 1.132080078125, 1.21502685546875, 1.2979736328125, 1.38092041015625, 1.4638671875, 1.54681396484375, 1.6297607421875, 1.71270751953125, 1.795654296875, 1.87860107421875, 1.9615478515625, 2.04449462890625, 2.12744140625, 2.21038818359375, 2.2933349609375, 2.37628173828125, 2.459228515625, 2.54217529296875, 2.6251220703125, 2.70806884765625, 2.791015625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 12.0, 18.0, 35.0, 64.0, 126.0, 197.0, 332.0, 562.0, 1018.0, 1805.0, 3472.0, 6530.0, 13559.0, 29686.0, 72676.0, 199038.0, 413218.0, 184579.0, 67809.0, 27433.0, 12648.0, 6370.0, 3206.0, 1848.0, 963.0, 591.0, 318.0, 205.0, 99.0, 63.0, 26.0, 13.0, 17.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.1953125, -4.073577880859375, -3.95184326171875, -3.830108642578125, -3.7083740234375, -3.586639404296875, -3.46490478515625, -3.343170166015625, -3.221435546875, -3.099700927734375, -2.97796630859375, -2.856231689453125, -2.7344970703125, -2.612762451171875, -2.49102783203125, -2.369293212890625, -2.24755859375, -2.125823974609375, -2.00408935546875, -1.882354736328125, -1.7606201171875, -1.638885498046875, -1.51715087890625, -1.395416259765625, -1.273681640625, -1.151947021484375, -1.03021240234375, -0.908477783203125, -0.7867431640625, -0.665008544921875, -0.54327392578125, -0.421539306640625, -0.2998046875, -0.178070068359375, -0.05633544921875, 0.065399169921875, 0.1871337890625, 0.308868408203125, 0.43060302734375, 0.552337646484375, 0.674072265625, 0.795806884765625, 0.91754150390625, 1.039276123046875, 1.1610107421875, 1.282745361328125, 1.40447998046875, 1.526214599609375, 1.64794921875, 1.769683837890625, 1.89141845703125, 2.013153076171875, 2.1348876953125, 2.256622314453125, 2.37835693359375, 2.500091552734375, 2.621826171875, 2.743560791015625, 2.86529541015625, 2.987030029296875, 3.1087646484375, 3.230499267578125, 3.35223388671875, 3.473968505859375, 3.595703125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 7.0, 4.0, 8.0, 5.0, 12.0, 8.0, 9.0, 16.0, 18.0, 13.0, 18.0, 29.0, 32.0, 33.0, 49.0, 32.0, 57.0, 73.0, 104.0, 221.0, 1469.0, 272.0, 129.0, 83.0, 55.0, 41.0, 36.0, 36.0, 35.0, 26.0, 23.0, 16.0, 18.0, 16.0, 12.0, 7.0, 6.0, 7.0, 6.0, 7.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.359375, -10.0421142578125, -9.724853515625, -9.4075927734375, -9.09033203125, -8.7730712890625, -8.455810546875, -8.1385498046875, -7.8212890625, -7.5040283203125, -7.186767578125, -6.8695068359375, -6.55224609375, -6.2349853515625, -5.917724609375, -5.6004638671875, -5.283203125, -4.9659423828125, -4.648681640625, -4.3314208984375, -4.01416015625, -3.6968994140625, -3.379638671875, -3.0623779296875, -2.7451171875, -2.4278564453125, -2.110595703125, -1.7933349609375, -1.47607421875, -1.1588134765625, -0.841552734375, -0.5242919921875, -0.20703125, 0.1102294921875, 0.427490234375, 0.7447509765625, 1.06201171875, 1.3792724609375, 1.696533203125, 2.0137939453125, 2.3310546875, 2.6483154296875, 2.965576171875, 3.2828369140625, 3.60009765625, 3.9173583984375, 4.234619140625, 4.5518798828125, 4.869140625, 5.1864013671875, 5.503662109375, 5.8209228515625, 6.13818359375, 6.4554443359375, 6.772705078125, 7.0899658203125, 7.4072265625, 7.7244873046875, 8.041748046875, 8.3590087890625, 8.67626953125, 8.9935302734375, 9.310791015625, 9.6280517578125, 9.9453125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 12.0, 11.0, 22.0, 16.0, 26.0, 40.0, 63.0, 82.0, 95.0, 143.0, 203.0, 320.0, 872.0, 6196.0, 205135.0, 2861400.0, 66174.0, 3266.0, 650.0, 257.0, 172.0, 127.0, 108.0, 71.0, 47.0, 45.0, 26.0, 27.0, 15.0, 14.0, 14.0, 11.0, 10.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.546875, -17.95556640625, -17.3642578125, -16.77294921875, -16.181640625, -15.59033203125, -14.9990234375, -14.40771484375, -13.81640625, -13.22509765625, -12.6337890625, -12.04248046875, -11.451171875, -10.85986328125, -10.2685546875, -9.67724609375, -9.0859375, -8.49462890625, -7.9033203125, -7.31201171875, -6.720703125, -6.12939453125, -5.5380859375, -4.94677734375, -4.35546875, -3.76416015625, -3.1728515625, -2.58154296875, -1.990234375, -1.39892578125, -0.8076171875, -0.21630859375, 0.375, 0.96630859375, 1.5576171875, 2.14892578125, 2.740234375, 3.33154296875, 3.9228515625, 4.51416015625, 5.10546875, 5.69677734375, 6.2880859375, 6.87939453125, 7.470703125, 8.06201171875, 8.6533203125, 9.24462890625, 9.8359375, 10.42724609375, 11.0185546875, 11.60986328125, 12.201171875, 12.79248046875, 13.3837890625, 13.97509765625, 14.56640625, 15.15771484375, 15.7490234375, 16.34033203125, 16.931640625, 17.52294921875, 18.1142578125, 18.70556640625, 19.296875]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 43.0, 131.0, 270.0, 307.0, 184.0, 61.0, 10.0, 6.0], "bins": [-102.04620361328125, -100.3194808959961, -98.5927505493164, -96.86602783203125, -95.1393051147461, -93.41258239746094, -91.68585205078125, -89.9591293334961, -88.23240661621094, -86.50568389892578, -84.7789535522461, -83.05223083496094, -81.32550811767578, -79.59878540039062, -77.87205505371094, -76.14533233642578, -74.4186019897461, -72.69187927246094, -70.96514892578125, -69.2384262084961, -67.51170349121094, -65.78497314453125, -64.0582504272461, -62.33152770996094, -60.60480499267578, -58.87807846069336, -57.1513557434082, -55.42462921142578, -53.697906494140625, -51.9711799621582, -50.24445343017578, -48.517730712890625, -46.7910041809082, -45.06427764892578, -43.337554931640625, -41.6108283996582, -39.88410568237305, -38.157379150390625, -36.43065643310547, -34.70392990112305, -32.977203369140625, -31.250478744506836, -29.523754119873047, -27.797027587890625, -26.070302963256836, -24.343578338623047, -22.616853713989258, -20.89012908935547, -19.163402557373047, -17.436677932739258, -15.709952354431152, -13.983227729797363, -12.256502151489258, -10.529777526855469, -8.80305290222168, -7.076327323913574, -5.349603652954102, -3.6228785514831543, -1.8961536884307861, -0.16942882537841797, 1.5572962760925293, 3.2840213775634766, 5.010746002197266, 6.737471580505371, 8.46419620513916]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 5.0, 2.0, 9.0, 8.0, 8.0, 9.0, 17.0, 15.0, 17.0, 19.0, 18.0, 24.0, 22.0, 30.0, 31.0, 22.0, 29.0, 31.0, 39.0, 36.0, 35.0, 34.0, 37.0, 40.0, 41.0, 29.0, 41.0, 46.0, 40.0, 36.0, 21.0, 21.0, 15.0, 11.0, 21.0, 21.0, 17.0, 15.0, 15.0, 16.0, 14.0, 5.0, 8.0, 7.0, 10.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0], "bins": [-20.136947631835938, -19.537351608276367, -18.937753677368164, -18.338157653808594, -17.73855972290039, -17.13896369934082, -16.53936767578125, -15.939769744873047, -15.340173721313477, -14.74057674407959, -14.140979766845703, -13.541383743286133, -12.941786766052246, -12.34218978881836, -11.742592811584473, -11.142995834350586, -10.5433988571167, -9.943801879882812, -9.344204902648926, -8.744607925415039, -8.145011901855469, -7.545414924621582, -6.945817947387695, -6.346221446990967, -5.74662446975708, -5.147027492523193, -4.547430992126465, -3.947834014892578, -3.3482372760772705, -2.748640537261963, -2.149043560028076, -1.5494470596313477, -0.9498500823974609, -0.35025328397750854, 0.24934351444244385, 0.848940372467041, 1.4485371112823486, 2.0481338500976562, 2.647730827331543, 3.2473273277282715, 3.846924304962158, 4.446521282196045, 5.046117782592773, 5.64571475982666, 6.245311737060547, 6.844908237457275, 7.444505214691162, 8.04410171508789, 8.643698692321777, 9.243295669555664, 9.84289264678955, 10.442489624023438, 11.042085647583008, 11.641682624816895, 12.241279602050781, 12.840875625610352, 13.440473556518555, 14.040070533752441, 14.639667510986328, 15.239263534545898, 15.838860511779785, 16.438457489013672, 17.038055419921875, 17.637651443481445, 18.237247467041016]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 7.0, 11.0, 8.0, 13.0, 15.0, 15.0, 20.0, 30.0, 21.0, 27.0, 21.0, 33.0, 41.0, 40.0, 39.0, 43.0, 49.0, 48.0, 48.0, 42.0, 45.0, 26.0, 36.0, 39.0, 27.0, 29.0, 26.0, 25.0, 20.0, 31.0, 14.0, 20.0, 17.0, 14.0, 14.0, 8.0, 5.0, 8.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.66796875, -2.583740234375, -2.49951171875, -2.415283203125, -2.3310546875, -2.246826171875, -2.16259765625, -2.078369140625, -1.994140625, -1.909912109375, -1.82568359375, -1.741455078125, -1.6572265625, -1.572998046875, -1.48876953125, -1.404541015625, -1.3203125, -1.236083984375, -1.15185546875, -1.067626953125, -0.9833984375, -0.899169921875, -0.81494140625, -0.730712890625, -0.646484375, -0.562255859375, -0.47802734375, -0.393798828125, -0.3095703125, -0.225341796875, -0.14111328125, -0.056884765625, 0.02734375, 0.111572265625, 0.19580078125, 0.280029296875, 0.3642578125, 0.448486328125, 0.53271484375, 0.616943359375, 0.701171875, 0.785400390625, 0.86962890625, 0.953857421875, 1.0380859375, 1.122314453125, 1.20654296875, 1.290771484375, 1.375, 1.459228515625, 1.54345703125, 1.627685546875, 1.7119140625, 1.796142578125, 1.88037109375, 1.964599609375, 2.048828125, 2.133056640625, 2.21728515625, 2.301513671875, 2.3857421875, 2.469970703125, 2.55419921875, 2.638427734375, 2.72265625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 8.0, 11.0, 12.0, 9.0, 16.0, 14.0, 23.0, 28.0, 26.0, 50.0, 103.0, 174.0, 435.0, 1093.0, 3644.0, 16394.0, 104634.0, 1045592.0, 2634402.0, 334408.0, 41946.0, 7901.0, 2026.0, 663.0, 276.0, 117.0, 73.0, 37.0, 42.0, 19.0, 19.0, 17.0, 7.0, 14.0, 11.0, 14.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.609375, -7.3197021484375, -7.030029296875, -6.7403564453125, -6.45068359375, -6.1610107421875, -5.871337890625, -5.5816650390625, -5.2919921875, -5.0023193359375, -4.712646484375, -4.4229736328125, -4.13330078125, -3.8436279296875, -3.553955078125, -3.2642822265625, -2.974609375, -2.6849365234375, -2.395263671875, -2.1055908203125, -1.81591796875, -1.5262451171875, -1.236572265625, -0.9468994140625, -0.6572265625, -0.3675537109375, -0.077880859375, 0.2117919921875, 0.50146484375, 0.7911376953125, 1.080810546875, 1.3704833984375, 1.66015625, 1.9498291015625, 2.239501953125, 2.5291748046875, 2.81884765625, 3.1085205078125, 3.398193359375, 3.6878662109375, 3.9775390625, 4.2672119140625, 4.556884765625, 4.8465576171875, 5.13623046875, 5.4259033203125, 5.715576171875, 6.0052490234375, 6.294921875, 6.5845947265625, 6.874267578125, 7.1639404296875, 7.45361328125, 7.7432861328125, 8.032958984375, 8.3226318359375, 8.6123046875, 8.9019775390625, 9.191650390625, 9.4813232421875, 9.77099609375, 10.0606689453125, 10.350341796875, 10.6400146484375, 10.9296875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 8.0, 9.0, 14.0, 27.0, 26.0, 38.0, 77.0, 78.0, 96.0, 121.0, 176.0, 253.0, 320.0, 369.0, 389.0, 407.0, 387.0, 289.0, 252.0, 200.0, 157.0, 104.0, 69.0, 67.0, 42.0, 26.0, 21.0, 15.0, 8.0, 9.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53125, -6.333251953125, -6.13525390625, -5.937255859375, -5.7392578125, -5.541259765625, -5.34326171875, -5.145263671875, -4.947265625, -4.749267578125, -4.55126953125, -4.353271484375, -4.1552734375, -3.957275390625, -3.75927734375, -3.561279296875, -3.36328125, -3.165283203125, -2.96728515625, -2.769287109375, -2.5712890625, -2.373291015625, -2.17529296875, -1.977294921875, -1.779296875, -1.581298828125, -1.38330078125, -1.185302734375, -0.9873046875, -0.789306640625, -0.59130859375, -0.393310546875, -0.1953125, 0.002685546875, 0.20068359375, 0.398681640625, 0.5966796875, 0.794677734375, 0.99267578125, 1.190673828125, 1.388671875, 1.586669921875, 1.78466796875, 1.982666015625, 2.1806640625, 2.378662109375, 2.57666015625, 2.774658203125, 2.97265625, 3.170654296875, 3.36865234375, 3.566650390625, 3.7646484375, 3.962646484375, 4.16064453125, 4.358642578125, 4.556640625, 4.754638671875, 4.95263671875, 5.150634765625, 5.3486328125, 5.546630859375, 5.74462890625, 5.942626953125, 6.140625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 9.0, 15.0, 20.0, 26.0, 54.0, 82.0, 140.0, 237.0, 511.0, 1497.0, 8097.0, 100168.0, 2038850.0, 1939721.0, 94514.0, 7800.0, 1412.0, 502.0, 234.0, 141.0, 89.0, 57.0, 27.0, 30.0, 19.0, 8.0, 7.0, 12.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.484375, -18.9429931640625, -18.401611328125, -17.8602294921875, -17.31884765625, -16.7774658203125, -16.236083984375, -15.6947021484375, -15.1533203125, -14.6119384765625, -14.070556640625, -13.5291748046875, -12.98779296875, -12.4464111328125, -11.905029296875, -11.3636474609375, -10.822265625, -10.2808837890625, -9.739501953125, -9.1981201171875, -8.65673828125, -8.1153564453125, -7.573974609375, -7.0325927734375, -6.4912109375, -5.9498291015625, -5.408447265625, -4.8670654296875, -4.32568359375, -3.7843017578125, -3.242919921875, -2.7015380859375, -2.16015625, -1.6187744140625, -1.077392578125, -0.5360107421875, 0.00537109375, 0.5467529296875, 1.088134765625, 1.6295166015625, 2.1708984375, 2.7122802734375, 3.253662109375, 3.7950439453125, 4.33642578125, 4.8778076171875, 5.419189453125, 5.9605712890625, 6.501953125, 7.0433349609375, 7.584716796875, 8.1260986328125, 8.66748046875, 9.2088623046875, 9.750244140625, 10.2916259765625, 10.8330078125, 11.3743896484375, 11.915771484375, 12.4571533203125, 12.99853515625, 13.5399169921875, 14.081298828125, 14.6226806640625, 15.1640625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 3.0, 8.0, 22.0, 28.0, 72.0, 106.0, 173.0, 189.0, 177.0, 124.0, 68.0, 25.0, 16.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.0894775390625, -16.858539581298828, -14.627601623535156, -12.396663665771484, -10.165725708007812, -7.934787750244141, -5.703849792480469, -3.472911834716797, -1.241973876953125, 0.9889640808105469, 3.2199020385742188, 5.450839996337891, 7.6817779541015625, 9.912715911865234, 12.143653869628906, 14.374591827392578, 16.60552978515625, 18.836467742919922, 21.067405700683594, 23.298343658447266, 25.529281616210938, 27.76021957397461, 29.99115753173828, 32.22209548950195, 34.453033447265625, 36.6839714050293, 38.91490936279297, 41.14584732055664, 43.37678527832031, 45.607723236083984, 47.838661193847656, 50.06959915161133, 52.30054473876953, 54.5314826965332, 56.762420654296875, 58.99335861206055, 61.22429656982422, 63.45523452758789, 65.68617248535156, 67.9171142578125, 70.1480484008789, 72.37898254394531, 74.60992431640625, 76.84086608886719, 79.0718002319336, 81.302734375, 83.53367614746094, 85.76461791992188, 87.99555206298828, 90.22648620605469, 92.45742797851562, 94.68836975097656, 96.91930389404297, 99.15023803710938, 101.38117980957031, 103.61212158203125, 105.84305572509766, 108.07398986816406, 110.304931640625, 112.53587341308594, 114.76680755615234, 116.99774169921875, 119.22868347167969, 121.45962524414062, 123.69055938720703]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 7.0, 10.0, 14.0, 10.0, 17.0, 17.0, 13.0, 19.0, 33.0, 27.0, 39.0, 30.0, 44.0, 32.0, 48.0, 47.0, 51.0, 68.0, 53.0, 49.0, 40.0, 39.0, 45.0, 34.0, 28.0, 29.0, 35.0, 17.0, 19.0, 17.0, 13.0, 9.0, 3.0, 15.0, 11.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.97484588623047, -24.227624893188477, -23.48040199279785, -22.73318099975586, -21.985960006713867, -21.238739013671875, -20.49151611328125, -19.744295120239258, -18.997074127197266, -18.249853134155273, -17.50263023376465, -16.755409240722656, -16.008188247680664, -15.260966300964355, -14.513744354248047, -13.766523361206055, -13.01930046081543, -12.272078514099121, -11.524857521057129, -10.77763557434082, -10.030414581298828, -9.28319263458252, -8.535970687866211, -7.7887492179870605, -7.04152774810791, -6.29430627822876, -5.547084808349609, -4.799862861633301, -4.05264139175415, -3.305419921875, -2.5581979751586914, -1.810976505279541, -1.0637550354003906, -0.3165334463119507, 0.43068814277648926, 1.1779098510742188, 1.9251313209533691, 2.6723527908325195, 3.419574737548828, 4.1667962074279785, 4.914017677307129, 5.661239147186279, 6.40846061706543, 7.155682563781738, 7.902904033660889, 8.650125503540039, 9.397347450256348, 10.144569396972656, 10.891790390014648, 11.639012336730957, 12.38623332977295, 13.133455276489258, 13.88067626953125, 14.627898216247559, 15.375120162963867, 16.12234115600586, 16.869564056396484, 17.616785049438477, 18.3640079498291, 19.111228942871094, 19.858449935913086, 20.605670928955078, 21.352893829345703, 22.100114822387695, 22.847335815429688]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 8.0, 6.0, 4.0, 6.0, 15.0, 17.0, 13.0, 27.0, 20.0, 25.0, 33.0, 31.0, 32.0, 29.0, 35.0, 38.0, 33.0, 35.0, 52.0, 45.0, 52.0, 33.0, 46.0, 29.0, 27.0, 35.0, 31.0, 31.0, 26.0, 25.0, 17.0, 22.0, 15.0, 17.0, 17.0, 11.0, 15.0, 12.0, 3.0, 7.0, 1.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.37890625, -2.296844482421875, -2.21478271484375, -2.132720947265625, -2.0506591796875, -1.968597412109375, -1.88653564453125, -1.804473876953125, -1.722412109375, -1.640350341796875, -1.55828857421875, -1.476226806640625, -1.3941650390625, -1.312103271484375, -1.23004150390625, -1.147979736328125, -1.06591796875, -0.983856201171875, -0.90179443359375, -0.819732666015625, -0.7376708984375, -0.655609130859375, -0.57354736328125, -0.491485595703125, -0.409423828125, -0.327362060546875, -0.24530029296875, -0.163238525390625, -0.0811767578125, 0.000885009765625, 0.08294677734375, 0.165008544921875, 0.2470703125, 0.329132080078125, 0.41119384765625, 0.493255615234375, 0.5753173828125, 0.657379150390625, 0.73944091796875, 0.821502685546875, 0.903564453125, 0.985626220703125, 1.06768798828125, 1.149749755859375, 1.2318115234375, 1.313873291015625, 1.39593505859375, 1.477996826171875, 1.56005859375, 1.642120361328125, 1.72418212890625, 1.806243896484375, 1.8883056640625, 1.970367431640625, 2.05242919921875, 2.134490966796875, 2.216552734375, 2.298614501953125, 2.38067626953125, 2.462738037109375, 2.5447998046875, 2.626861572265625, 2.70892333984375, 2.790985107421875, 2.873046875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 8.0, 10.0, 19.0, 33.0, 43.0, 66.0, 73.0, 128.0, 167.0, 326.0, 484.0, 739.0, 1142.0, 1665.0, 2529.0, 3890.0, 5951.0, 9042.0, 14509.0, 23912.0, 39976.0, 71395.0, 141204.0, 338729.0, 184302.0, 86256.0, 47479.0, 27617.0, 16854.0, 10500.0, 6713.0, 4397.0, 2821.0, 1862.0, 1336.0, 844.0, 534.0, 335.0, 220.0, 148.0, 96.0, 69.0, 42.0, 25.0, 13.0, 17.0, 9.0, 11.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1358642578125, -0.13143157958984375, -0.1269989013671875, -0.12256622314453125, -0.118133544921875, -0.11370086669921875, -0.1092681884765625, -0.10483551025390625, -0.10040283203125, -0.09597015380859375, -0.0915374755859375, -0.08710479736328125, -0.082672119140625, -0.07823944091796875, -0.0738067626953125, -0.06937408447265625, -0.06494140625, -0.06050872802734375, -0.0560760498046875, -0.05164337158203125, -0.047210693359375, -0.04277801513671875, -0.0383453369140625, -0.03391265869140625, -0.02947998046875, -0.02504730224609375, -0.0206146240234375, -0.01618194580078125, -0.011749267578125, -0.00731658935546875, -0.0028839111328125, 0.00154876708984375, 0.0059814453125, 0.01041412353515625, 0.0148468017578125, 0.01927947998046875, 0.023712158203125, 0.02814483642578125, 0.0325775146484375, 0.03701019287109375, 0.04144287109375, 0.04587554931640625, 0.0503082275390625, 0.05474090576171875, 0.059173583984375, 0.06360626220703125, 0.0680389404296875, 0.07247161865234375, 0.076904296875, 0.08133697509765625, 0.0857696533203125, 0.09020233154296875, 0.094635009765625, 0.09906768798828125, 0.1035003662109375, 0.10793304443359375, 0.11236572265625, 0.11679840087890625, 0.1212310791015625, 0.12566375732421875, 0.130096435546875, 0.13452911376953125, 0.1389617919921875, 0.14339447021484375, 0.1478271484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 4.0, 9.0, 7.0, 8.0, 14.0, 22.0, 16.0, 28.0, 22.0, 31.0, 28.0, 36.0, 30.0, 51.0, 48.0, 55.0, 37.0, 55.0, 1077.0, 38.0, 44.0, 49.0, 39.0, 41.0, 37.0, 35.0, 22.0, 24.0, 17.0, 25.0, 15.0, 17.0, 15.0, 8.0, 13.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.36328125, -2.296234130859375, -2.22918701171875, -2.162139892578125, -2.0950927734375, -2.028045654296875, -1.96099853515625, -1.893951416015625, -1.826904296875, -1.759857177734375, -1.69281005859375, -1.625762939453125, -1.5587158203125, -1.491668701171875, -1.42462158203125, -1.357574462890625, -1.29052734375, -1.223480224609375, -1.15643310546875, -1.089385986328125, -1.0223388671875, -0.955291748046875, -0.88824462890625, -0.821197509765625, -0.754150390625, -0.687103271484375, -0.62005615234375, -0.553009033203125, -0.4859619140625, -0.418914794921875, -0.35186767578125, -0.284820556640625, -0.2177734375, -0.150726318359375, -0.08367919921875, -0.016632080078125, 0.0504150390625, 0.117462158203125, 0.18450927734375, 0.251556396484375, 0.318603515625, 0.385650634765625, 0.45269775390625, 0.519744873046875, 0.5867919921875, 0.653839111328125, 0.72088623046875, 0.787933349609375, 0.85498046875, 0.922027587890625, 0.98907470703125, 1.056121826171875, 1.1231689453125, 1.190216064453125, 1.25726318359375, 1.324310302734375, 1.391357421875, 1.458404541015625, 1.52545166015625, 1.592498779296875, 1.6595458984375, 1.726593017578125, 1.79364013671875, 1.860687255859375, 1.927734375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 3.0, 9.0, 15.0, 21.0, 26.0, 46.0, 55.0, 103.0, 117.0, 192.0, 322.0, 495.0, 686.0, 1142.0, 1798.0, 2795.0, 4393.0, 7320.0, 11905.0, 19733.0, 34473.0, 63351.0, 125056.0, 1315478.0, 249927.0, 116613.0, 59419.0, 32579.0, 18973.0, 11315.0, 6938.0, 4384.0, 2636.0, 1652.0, 1115.0, 699.0, 450.0, 299.0, 193.0, 142.0, 95.0, 55.0, 37.0, 17.0, 20.0, 14.0, 14.0, 3.0, 4.0, 4.0, 2.0, 3.0], "bins": [-0.06121826171875, -0.05951547622680664, -0.05781269073486328, -0.05610990524291992, -0.05440711975097656, -0.0527043342590332, -0.051001548767089844, -0.049298763275146484, -0.047595977783203125, -0.045893192291259766, -0.044190406799316406, -0.04248762130737305, -0.04078483581542969, -0.03908205032348633, -0.03737926483154297, -0.03567647933959961, -0.03397369384765625, -0.03227090835571289, -0.03056812286376953, -0.028865337371826172, -0.027162551879882812, -0.025459766387939453, -0.023756980895996094, -0.022054195404052734, -0.020351409912109375, -0.018648624420166016, -0.016945838928222656, -0.015243053436279297, -0.013540267944335938, -0.011837482452392578, -0.010134696960449219, -0.00843191146850586, -0.0067291259765625, -0.005026340484619141, -0.0033235549926757812, -0.0016207695007324219, 8.20159912109375e-05, 0.0017848014831542969, 0.0034875869750976562, 0.005190372467041016, 0.006893157958984375, 0.008595943450927734, 0.010298728942871094, 0.012001514434814453, 0.013704299926757812, 0.015407085418701172, 0.01710987091064453, 0.01881265640258789, 0.02051544189453125, 0.02221822738647461, 0.02392101287841797, 0.025623798370361328, 0.027326583862304688, 0.029029369354248047, 0.030732154846191406, 0.032434940338134766, 0.034137725830078125, 0.035840511322021484, 0.037543296813964844, 0.0392460823059082, 0.04094886779785156, 0.04265165328979492, 0.04435443878173828, 0.04605722427368164, 0.047760009765625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 12.0, 6.0, 6.0, 7.0, 8.0, 16.0, 21.0, 22.0, 27.0, 26.0, 34.0, 40.0, 51.0, 60.0, 75.0, 67.0, 54.0, 66.0, 54.0, 58.0, 39.0, 46.0, 27.0, 29.0, 22.0, 14.0, 19.0, 15.0, 11.0, 8.0, 4.0, 10.0, 3.0, 11.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 4.0], "bins": [-1.239776611328125e-05, -1.2014992535114288e-05, -1.1632218956947327e-05, -1.1249445378780365e-05, -1.0866671800613403e-05, -1.0483898222446442e-05, -1.010112464427948e-05, -9.718351066112518e-06, -9.335577487945557e-06, -8.952803909778595e-06, -8.570030331611633e-06, -8.187256753444672e-06, -7.80448317527771e-06, -7.421709597110748e-06, -7.038936018943787e-06, -6.656162440776825e-06, -6.273388862609863e-06, -5.890615284442902e-06, -5.50784170627594e-06, -5.125068128108978e-06, -4.742294549942017e-06, -4.359520971775055e-06, -3.976747393608093e-06, -3.5939738154411316e-06, -3.21120023727417e-06, -2.8284266591072083e-06, -2.4456530809402466e-06, -2.062879502773285e-06, -1.6801059246063232e-06, -1.2973323464393616e-06, -9.145587682723999e-07, -5.317851901054382e-07, -1.4901161193847656e-07, 2.337619662284851e-07, 6.165355443954468e-07, 9.993091225624084e-07, 1.3820827007293701e-06, 1.7648562788963318e-06, 2.1476298570632935e-06, 2.530403435230255e-06, 2.913177013397217e-06, 3.2959505915641785e-06, 3.67872416973114e-06, 4.061497747898102e-06, 4.4442713260650635e-06, 4.827044904232025e-06, 5.209818482398987e-06, 5.5925920605659485e-06, 5.97536563873291e-06, 6.358139216899872e-06, 6.7409127950668335e-06, 7.123686373233795e-06, 7.506459951400757e-06, 7.889233529567719e-06, 8.27200710773468e-06, 8.654780685901642e-06, 9.037554264068604e-06, 9.420327842235565e-06, 9.803101420402527e-06, 1.0185874998569489e-05, 1.056864857673645e-05, 1.0951422154903412e-05, 1.1334195733070374e-05, 1.1716969311237335e-05, 1.2099742889404297e-05]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 1.0, 11.0, 5.0, 7.0, 9.0, 11.0, 11.0, 28.0, 25.0, 41.0, 50.0, 91.0, 165.0, 279.0, 766.0, 3846.0, 31356.0, 587518.0, 396234.0, 23853.0, 2956.0, 570.0, 267.0, 127.0, 86.0, 73.0, 39.0, 32.0, 27.0, 8.0, 13.0, 10.0, 5.0, 9.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0002491474151611328, -0.00024134665727615356, -0.00023354589939117432, -0.00022574514150619507, -0.00021794438362121582, -0.00021014362573623657, -0.00020234286785125732, -0.00019454210996627808, -0.00018674135208129883, -0.00017894059419631958, -0.00017113983631134033, -0.00016333907842636108, -0.00015553832054138184, -0.0001477375626564026, -0.00013993680477142334, -0.0001321360468864441, -0.00012433528900146484, -0.0001165345311164856, -0.00010873377323150635, -0.0001009330153465271, -9.313225746154785e-05, -8.53314995765686e-05, -7.753074169158936e-05, -6.972998380661011e-05, -6.192922592163086e-05, -5.412846803665161e-05, -4.632771015167236e-05, -3.8526952266693115e-05, -3.072619438171387e-05, -2.292543649673462e-05, -1.5124678611755371e-05, -7.323920726776123e-06, 4.76837158203125e-07, 8.277595043182373e-06, 1.607835292816162e-05, 2.387911081314087e-05, 3.167986869812012e-05, 3.9480626583099365e-05, 4.728138446807861e-05, 5.508214235305786e-05, 6.288290023803711e-05, 7.068365812301636e-05, 7.84844160079956e-05, 8.628517389297485e-05, 9.40859317779541e-05, 0.00010188668966293335, 0.0001096874475479126, 0.00011748820543289185, 0.0001252889633178711, 0.00013308972120285034, 0.0001408904790878296, 0.00014869123697280884, 0.00015649199485778809, 0.00016429275274276733, 0.00017209351062774658, 0.00017989426851272583, 0.00018769502639770508, 0.00019549578428268433, 0.00020329654216766357, 0.00021109730005264282, 0.00021889805793762207, 0.00022669881582260132, 0.00023449957370758057, 0.00024230033159255981, 0.00025010108947753906]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 11.0, 37.0, 131.0, 409.0, 305.0, 75.0, 29.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.734465958084911e-05, -5.471585609484464e-05, -5.2087056246818975e-05, -4.94582527608145e-05, -4.682945291278884e-05, -4.4200649426784366e-05, -4.1571845940779895e-05, -3.894304245477542e-05, -3.631424260674976e-05, -3.3685439120745286e-05, -3.105663927271962e-05, -2.842783578671515e-05, -2.579903411970008e-05, -2.3170232452685013e-05, -2.054142896668054e-05, -1.7912627299665473e-05, -1.5283825632650405e-05, -1.2655023965635337e-05, -1.0026221389125567e-05, -7.397418812615797e-06, -4.768617145600729e-06, -2.1398154785856605e-06, 4.889880074188113e-07, 3.1177896744338796e-06, 5.746591341448948e-06, 8.375393008464016e-06, 1.1004195584973786e-05, 1.3632998161483556e-05, 1.6261799828498624e-05, 1.8890601495513692e-05, 2.1519404981518164e-05, 2.4148206648533233e-05, 2.67770083155483e-05, 2.940580998256337e-05, 3.203461164957844e-05, 3.466341513558291e-05, 3.7292214983608574e-05, 3.9921018469613045e-05, 4.254982195561752e-05, 4.517862544162199e-05, 4.7807425289647654e-05, 5.0436228775652125e-05, 5.306502862367779e-05, 5.569383210968226e-05, 5.8322635595686734e-05, 6.09514354437124e-05, 6.358024256769568e-05, 6.620903877774253e-05, 6.8837842263747e-05, 7.146664574975148e-05, 7.409544923575595e-05, 7.672424544580281e-05, 7.935304893180728e-05, 8.198185241781175e-05, 8.461065590381622e-05, 8.72394593898207e-05, 8.986826287582517e-05, 9.249706636182964e-05, 9.512586984783411e-05, 9.775467333383858e-05, 0.00010038346954388544, 0.00010301227302988991, 0.00010564107651589438, 0.00010826988000189885, 0.00011089867621194571]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 7.0, 8.0, 12.0, 5.0, 15.0, 18.0, 18.0, 19.0, 25.0, 20.0, 33.0, 35.0, 38.0, 34.0, 27.0, 44.0, 39.0, 36.0, 38.0, 35.0, 49.0, 39.0, 34.0, 44.0, 32.0, 30.0, 35.0, 30.0, 21.0, 23.0, 24.0, 32.0, 16.0, 20.0, 13.0, 13.0, 7.0, 6.0, 10.0, 4.0, 6.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.794929504394531e-06, -6.557442247867584e-06, -6.319954991340637e-06, -6.08246773481369e-06, -5.844980478286743e-06, -5.607493221759796e-06, -5.370005965232849e-06, -5.132518708705902e-06, -4.895031452178955e-06, -4.657544195652008e-06, -4.420056939125061e-06, -4.182569682598114e-06, -3.945082426071167e-06, -3.70759516954422e-06, -3.470107913017273e-06, -3.232620656490326e-06, -2.995133399963379e-06, -2.757646143436432e-06, -2.520158886909485e-06, -2.282671630382538e-06, -2.045184373855591e-06, -1.8076971173286438e-06, -1.5702098608016968e-06, -1.3327226042747498e-06, -1.0952353477478027e-06, -8.577480912208557e-07, -6.202608346939087e-07, -3.8277357816696167e-07, -1.4528632164001465e-07, 9.220093488693237e-08, 3.296881914138794e-07, 5.671754479408264e-07, 8.046627044677734e-07, 1.0421499609947205e-06, 1.2796372175216675e-06, 1.5171244740486145e-06, 1.7546117305755615e-06, 1.9920989871025085e-06, 2.2295862436294556e-06, 2.4670735001564026e-06, 2.7045607566833496e-06, 2.9420480132102966e-06, 3.1795352697372437e-06, 3.4170225262641907e-06, 3.6545097827911377e-06, 3.891997039318085e-06, 4.129484295845032e-06, 4.366971552371979e-06, 4.604458808898926e-06, 4.841946065425873e-06, 5.07943332195282e-06, 5.316920578479767e-06, 5.554407835006714e-06, 5.791895091533661e-06, 6.029382348060608e-06, 6.266869604587555e-06, 6.504356861114502e-06, 6.741844117641449e-06, 6.979331374168396e-06, 7.216818630695343e-06, 7.45430588722229e-06, 7.691793143749237e-06, 7.929280400276184e-06, 8.166767656803131e-06, 8.404254913330078e-06]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 8.0, 6.0, 4.0, 6.0, 15.0, 17.0, 13.0, 27.0, 20.0, 25.0, 33.0, 31.0, 32.0, 29.0, 35.0, 38.0, 33.0, 35.0, 52.0, 45.0, 52.0, 33.0, 46.0, 29.0, 27.0, 35.0, 31.0, 31.0, 26.0, 25.0, 17.0, 22.0, 15.0, 17.0, 17.0, 11.0, 15.0, 12.0, 3.0, 7.0, 1.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.37890625, -2.296844482421875, -2.21478271484375, -2.132720947265625, -2.0506591796875, -1.968597412109375, -1.88653564453125, -1.804473876953125, -1.722412109375, -1.640350341796875, -1.55828857421875, -1.476226806640625, -1.3941650390625, -1.312103271484375, -1.23004150390625, -1.147979736328125, -1.06591796875, -0.983856201171875, -0.90179443359375, -0.819732666015625, -0.7376708984375, -0.655609130859375, -0.57354736328125, -0.491485595703125, -0.409423828125, -0.327362060546875, -0.24530029296875, -0.163238525390625, -0.0811767578125, 0.000885009765625, 0.08294677734375, 0.165008544921875, 0.2470703125, 0.329132080078125, 0.41119384765625, 0.493255615234375, 0.5753173828125, 0.657379150390625, 0.73944091796875, 0.821502685546875, 0.903564453125, 0.985626220703125, 1.06768798828125, 1.149749755859375, 1.2318115234375, 1.313873291015625, 1.39593505859375, 1.477996826171875, 1.56005859375, 1.642120361328125, 1.72418212890625, 1.806243896484375, 1.8883056640625, 1.970367431640625, 2.05242919921875, 2.134490966796875, 2.216552734375, 2.298614501953125, 2.38067626953125, 2.462738037109375, 2.5447998046875, 2.626861572265625, 2.70892333984375, 2.790985107421875, 2.873046875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 10.0, 11.0, 15.0, 25.0, 48.0, 75.0, 113.0, 198.0, 291.0, 491.0, 807.0, 1294.0, 2084.0, 3315.0, 5360.0, 8955.0, 16405.0, 33997.0, 88092.0, 311627.0, 388909.0, 104745.0, 38504.0, 18107.0, 10018.0, 5798.0, 3436.0, 2160.0, 1371.0, 821.0, 487.0, 364.0, 227.0, 130.0, 88.0, 54.0, 31.0, 30.0, 19.0, 14.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.15234375, -4.02288818359375, -3.8934326171875, -3.76397705078125, -3.634521484375, -3.50506591796875, -3.3756103515625, -3.24615478515625, -3.11669921875, -2.98724365234375, -2.8577880859375, -2.72833251953125, -2.598876953125, -2.46942138671875, -2.3399658203125, -2.21051025390625, -2.0810546875, -1.95159912109375, -1.8221435546875, -1.69268798828125, -1.563232421875, -1.43377685546875, -1.3043212890625, -1.17486572265625, -1.04541015625, -0.91595458984375, -0.7864990234375, -0.65704345703125, -0.527587890625, -0.39813232421875, -0.2686767578125, -0.13922119140625, -0.009765625, 0.11968994140625, 0.2491455078125, 0.37860107421875, 0.508056640625, 0.63751220703125, 0.7669677734375, 0.89642333984375, 1.02587890625, 1.15533447265625, 1.2847900390625, 1.41424560546875, 1.543701171875, 1.67315673828125, 1.8026123046875, 1.93206787109375, 2.0615234375, 2.19097900390625, 2.3204345703125, 2.44989013671875, 2.579345703125, 2.70880126953125, 2.8382568359375, 2.96771240234375, 3.09716796875, 3.22662353515625, 3.3560791015625, 3.48553466796875, 3.614990234375, 3.74444580078125, 3.8739013671875, 4.00335693359375, 4.1328125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 8.0, 1.0, 9.0, 6.0, 7.0, 10.0, 15.0, 14.0, 14.0, 21.0, 17.0, 15.0, 11.0, 26.0, 25.0, 24.0, 39.0, 36.0, 36.0, 57.0, 78.0, 131.0, 256.0, 1439.0, 194.0, 103.0, 73.0, 44.0, 45.0, 33.0, 30.0, 23.0, 34.0, 23.0, 24.0, 23.0, 16.0, 14.0, 18.0, 14.0, 6.0, 10.0, 8.0, 3.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.5390625, -7.2816162109375, -7.024169921875, -6.7667236328125, -6.50927734375, -6.2518310546875, -5.994384765625, -5.7369384765625, -5.4794921875, -5.2220458984375, -4.964599609375, -4.7071533203125, -4.44970703125, -4.1922607421875, -3.934814453125, -3.6773681640625, -3.419921875, -3.1624755859375, -2.905029296875, -2.6475830078125, -2.39013671875, -2.1326904296875, -1.875244140625, -1.6177978515625, -1.3603515625, -1.1029052734375, -0.845458984375, -0.5880126953125, -0.33056640625, -0.0731201171875, 0.184326171875, 0.4417724609375, 0.69921875, 0.9566650390625, 1.214111328125, 1.4715576171875, 1.72900390625, 1.9864501953125, 2.243896484375, 2.5013427734375, 2.7587890625, 3.0162353515625, 3.273681640625, 3.5311279296875, 3.78857421875, 4.0460205078125, 4.303466796875, 4.5609130859375, 4.818359375, 5.0758056640625, 5.333251953125, 5.5906982421875, 5.84814453125, 6.1055908203125, 6.363037109375, 6.6204833984375, 6.8779296875, 7.1353759765625, 7.392822265625, 7.6502685546875, 7.90771484375, 8.1651611328125, 8.422607421875, 8.6800537109375, 8.9375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 0.0, 5.0, 6.0, 6.0, 8.0, 11.0, 13.0, 21.0, 18.0, 19.0, 28.0, 33.0, 44.0, 51.0, 70.0, 85.0, 98.0, 157.0, 207.0, 362.0, 1178.0, 5613.0, 56407.0, 2640493.0, 419546.0, 17075.0, 2508.0, 595.0, 282.0, 147.0, 131.0, 79.0, 91.0, 65.0, 47.0, 33.0, 23.0, 25.0, 20.0, 23.0, 16.0, 16.0, 10.0, 6.0, 5.0, 7.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0], "bins": [-16.875, -16.3896484375, -15.904296875, -15.4189453125, -14.93359375, -14.4482421875, -13.962890625, -13.4775390625, -12.9921875, -12.5068359375, -12.021484375, -11.5361328125, -11.05078125, -10.5654296875, -10.080078125, -9.5947265625, -9.109375, -8.6240234375, -8.138671875, -7.6533203125, -7.16796875, -6.6826171875, -6.197265625, -5.7119140625, -5.2265625, -4.7412109375, -4.255859375, -3.7705078125, -3.28515625, -2.7998046875, -2.314453125, -1.8291015625, -1.34375, -0.8583984375, -0.373046875, 0.1123046875, 0.59765625, 1.0830078125, 1.568359375, 2.0537109375, 2.5390625, 3.0244140625, 3.509765625, 3.9951171875, 4.48046875, 4.9658203125, 5.451171875, 5.9365234375, 6.421875, 6.9072265625, 7.392578125, 7.8779296875, 8.36328125, 8.8486328125, 9.333984375, 9.8193359375, 10.3046875, 10.7900390625, 11.275390625, 11.7607421875, 12.24609375, 12.7314453125, 13.216796875, 13.7021484375, 14.1875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 14.0, 17.0, 39.0, 73.0, 130.0, 163.0, 166.0, 160.0, 120.0, 70.0, 32.0, 16.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.771941184997559, -7.921891212463379, -7.071841239929199, -6.2217912673950195, -5.37174129486084, -4.52169132232666, -3.6716413497924805, -2.821591377258301, -1.971541404724121, -1.1214914321899414, -0.2714414596557617, 0.578608512878418, 1.4286584854125977, 2.2787084579467773, 3.128758430480957, 3.9788084030151367, 4.828858375549316, 5.678908348083496, 6.528958320617676, 7.3790082931518555, 8.229058265686035, 9.079108238220215, 9.929158210754395, 10.779208183288574, 11.629258155822754, 12.479308128356934, 13.329358100891113, 14.179408073425293, 15.029458045959473, 15.879508018493652, 16.729557037353516, 17.579608917236328, 18.429656982421875, 19.279706954956055, 20.129756927490234, 20.979806900024414, 21.829856872558594, 22.679906845092773, 23.529956817626953, 24.380006790161133, 25.230056762695312, 26.080106735229492, 26.930156707763672, 27.78020668029785, 28.63025665283203, 29.48030662536621, 30.33035659790039, 31.18040657043457, 32.03045654296875, 32.88050842285156, 33.73055648803711, 34.580604553222656, 35.43065643310547, 36.28070831298828, 37.13075637817383, 37.980804443359375, 38.83085632324219, 39.680908203125, 40.53095626831055, 41.381004333496094, 42.231056213378906, 43.08110809326172, 43.931156158447266, 44.78120422363281, 45.631256103515625]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 4.0, 8.0, 8.0, 6.0, 18.0, 13.0, 21.0, 28.0, 31.0, 24.0, 40.0, 40.0, 43.0, 47.0, 43.0, 51.0, 45.0, 51.0, 43.0, 49.0, 54.0, 32.0, 50.0, 38.0, 29.0, 33.0, 29.0, 19.0, 14.0, 22.0, 14.0, 7.0, 9.0, 9.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.64198303222656, -33.681304931640625, -32.72062683105469, -31.75994873046875, -30.799270629882812, -29.838592529296875, -28.877914428710938, -27.917236328125, -26.956558227539062, -25.995880126953125, -25.035202026367188, -24.07452392578125, -23.113845825195312, -22.153167724609375, -21.192489624023438, -20.2318115234375, -19.27113151550293, -18.310453414916992, -17.349775314331055, -16.389097213745117, -15.42841911315918, -14.467741012573242, -13.507061958312988, -12.54638385772705, -11.585705757141113, -10.625027656555176, -9.664349555969238, -8.703670501708984, -7.742992877960205, -6.782314777374268, -5.821636199951172, -4.860958099365234, -3.900278091430664, -2.9395999908447266, -1.97892165184021, -1.0182433128356934, -0.05756521224975586, 0.9031128883361816, 1.8637914657592773, 2.824469566345215, 3.7851476669311523, 4.74582576751709, 5.706503868103027, 6.667182445526123, 7.6278605461120605, 8.588539123535156, 9.549217224121094, 10.509895324707031, 11.470573425292969, 12.431251525878906, 13.391929626464844, 14.352607727050781, 15.313285827636719, 16.273963928222656, 17.234642028808594, 18.19532012939453, 19.15599822998047, 20.116676330566406, 21.077354431152344, 22.03803253173828, 22.99871063232422, 23.959388732910156, 24.920066833496094, 25.88074493408203, 26.8414249420166]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 8.0, 3.0, 8.0, 13.0, 14.0, 16.0, 16.0, 23.0, 19.0, 23.0, 25.0, 34.0, 26.0, 27.0, 33.0, 30.0, 34.0, 32.0, 41.0, 50.0, 35.0, 45.0, 47.0, 38.0, 30.0, 32.0, 30.0, 30.0, 33.0, 19.0, 25.0, 13.0, 26.0, 16.0, 19.0, 18.0, 15.0, 12.0, 6.0, 7.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.5625, -2.478668212890625, -2.39483642578125, -2.311004638671875, -2.2271728515625, -2.143341064453125, -2.05950927734375, -1.975677490234375, -1.891845703125, -1.808013916015625, -1.72418212890625, -1.640350341796875, -1.5565185546875, -1.472686767578125, -1.38885498046875, -1.305023193359375, -1.22119140625, -1.137359619140625, -1.05352783203125, -0.969696044921875, -0.8858642578125, -0.802032470703125, -0.71820068359375, -0.634368896484375, -0.550537109375, -0.466705322265625, -0.38287353515625, -0.299041748046875, -0.2152099609375, -0.131378173828125, -0.04754638671875, 0.036285400390625, 0.1201171875, 0.203948974609375, 0.28778076171875, 0.371612548828125, 0.4554443359375, 0.539276123046875, 0.62310791015625, 0.706939697265625, 0.790771484375, 0.874603271484375, 0.95843505859375, 1.042266845703125, 1.1260986328125, 1.209930419921875, 1.29376220703125, 1.377593994140625, 1.46142578125, 1.545257568359375, 1.62908935546875, 1.712921142578125, 1.7967529296875, 1.880584716796875, 1.96441650390625, 2.048248291015625, 2.132080078125, 2.215911865234375, 2.29974365234375, 2.383575439453125, 2.4674072265625, 2.551239013671875, 2.63507080078125, 2.718902587890625, 2.802734375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 5.0, 10.0, 8.0, 18.0, 13.0, 30.0, 31.0, 40.0, 63.0, 87.0, 101.0, 225.0, 377.0, 947.0, 3092.0, 12744.0, 73183.0, 646197.0, 2775582.0, 596025.0, 68374.0, 12291.0, 2955.0, 922.0, 366.0, 183.0, 109.0, 59.0, 61.0, 45.0, 35.0, 28.0, 22.0, 11.0, 8.0, 10.0, 6.0, 7.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.51171875, -7.22808837890625, -6.9444580078125, -6.66082763671875, -6.377197265625, -6.09356689453125, -5.8099365234375, -5.52630615234375, -5.24267578125, -4.95904541015625, -4.6754150390625, -4.39178466796875, -4.108154296875, -3.82452392578125, -3.5408935546875, -3.25726318359375, -2.9736328125, -2.69000244140625, -2.4063720703125, -2.12274169921875, -1.839111328125, -1.55548095703125, -1.2718505859375, -0.98822021484375, -0.70458984375, -0.42095947265625, -0.1373291015625, 0.14630126953125, 0.429931640625, 0.71356201171875, 0.9971923828125, 1.28082275390625, 1.564453125, 1.84808349609375, 2.1317138671875, 2.41534423828125, 2.698974609375, 2.98260498046875, 3.2662353515625, 3.54986572265625, 3.83349609375, 4.11712646484375, 4.4007568359375, 4.68438720703125, 4.968017578125, 5.25164794921875, 5.5352783203125, 5.81890869140625, 6.1025390625, 6.38616943359375, 6.6697998046875, 6.95343017578125, 7.237060546875, 7.52069091796875, 7.8043212890625, 8.08795166015625, 8.37158203125, 8.65521240234375, 8.9388427734375, 9.22247314453125, 9.506103515625, 9.78973388671875, 10.0733642578125, 10.35699462890625, 10.640625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 12.0, 15.0, 23.0, 31.0, 33.0, 53.0, 65.0, 68.0, 98.0, 142.0, 157.0, 194.0, 272.0, 297.0, 374.0, 339.0, 352.0, 317.0, 274.0, 211.0, 172.0, 119.0, 106.0, 70.0, 69.0, 46.0, 52.0, 22.0, 20.0, 20.0, 14.0, 9.0, 4.0, 1.0, 6.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-6.6328125, -6.4603271484375, -6.287841796875, -6.1153564453125, -5.94287109375, -5.7703857421875, -5.597900390625, -5.4254150390625, -5.2529296875, -5.0804443359375, -4.907958984375, -4.7354736328125, -4.56298828125, -4.3905029296875, -4.218017578125, -4.0455322265625, -3.873046875, -3.7005615234375, -3.528076171875, -3.3555908203125, -3.18310546875, -3.0106201171875, -2.838134765625, -2.6656494140625, -2.4931640625, -2.3206787109375, -2.148193359375, -1.9757080078125, -1.80322265625, -1.6307373046875, -1.458251953125, -1.2857666015625, -1.11328125, -0.9407958984375, -0.768310546875, -0.5958251953125, -0.42333984375, -0.2508544921875, -0.078369140625, 0.0941162109375, 0.2666015625, 0.4390869140625, 0.611572265625, 0.7840576171875, 0.95654296875, 1.1290283203125, 1.301513671875, 1.4739990234375, 1.646484375, 1.8189697265625, 1.991455078125, 2.1639404296875, 2.33642578125, 2.5089111328125, 2.681396484375, 2.8538818359375, 3.0263671875, 3.1988525390625, 3.371337890625, 3.5438232421875, 3.71630859375, 3.8887939453125, 4.061279296875, 4.2337646484375, 4.40625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 10.0, 3.0, 18.0, 23.0, 27.0, 32.0, 47.0, 65.0, 79.0, 85.0, 140.0, 199.0, 310.0, 633.0, 2220.0, 19057.0, 381558.0, 3349423.0, 416009.0, 20414.0, 2291.0, 585.0, 313.0, 193.0, 145.0, 97.0, 80.0, 65.0, 56.0, 25.0, 19.0, 24.0, 14.0, 6.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1171875, -14.5469970703125, -13.976806640625, -13.4066162109375, -12.83642578125, -12.2662353515625, -11.696044921875, -11.1258544921875, -10.5556640625, -9.9854736328125, -9.415283203125, -8.8450927734375, -8.27490234375, -7.7047119140625, -7.134521484375, -6.5643310546875, -5.994140625, -5.4239501953125, -4.853759765625, -4.2835693359375, -3.71337890625, -3.1431884765625, -2.572998046875, -2.0028076171875, -1.4326171875, -0.8624267578125, -0.292236328125, 0.2779541015625, 0.84814453125, 1.4183349609375, 1.988525390625, 2.5587158203125, 3.12890625, 3.6990966796875, 4.269287109375, 4.8394775390625, 5.40966796875, 5.9798583984375, 6.550048828125, 7.1202392578125, 7.6904296875, 8.2606201171875, 8.830810546875, 9.4010009765625, 9.97119140625, 10.5413818359375, 11.111572265625, 11.6817626953125, 12.251953125, 12.8221435546875, 13.392333984375, 13.9625244140625, 14.53271484375, 15.1029052734375, 15.673095703125, 16.2432861328125, 16.8134765625, 17.3836669921875, 17.953857421875, 18.5240478515625, 19.09423828125, 19.6644287109375, 20.234619140625, 20.8048095703125, 21.375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 47.0, 81.0, 181.0, 224.0, 188.0, 160.0, 66.0, 32.0, 18.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.864017486572266, -38.301151275634766, -35.73828125, -33.1754150390625, -30.612548828125, -28.0496826171875, -25.486814498901367, -22.923946380615234, -20.361080169677734, -17.798213958740234, -15.235345840454102, -12.672478675842285, -10.109611511230469, -7.546744346618652, -4.983877182006836, -2.421009063720703, 0.14185714721679688, 2.7047243118286133, 5.26759147644043, 7.830458641052246, 10.393325805664062, 12.956192970275879, 15.519060134887695, 18.081928253173828, 20.644794464111328, 23.207660675048828, 25.77052879333496, 28.333396911621094, 30.896263122558594, 33.459129333496094, 36.021995544433594, 38.58486557006836, 41.147735595703125, 43.710601806640625, 46.273468017578125, 48.83633804321289, 51.39920425415039, 53.96207046508789, 56.524940490722656, 59.087806701660156, 61.650672912597656, 64.21353912353516, 66.77640533447266, 69.33927154541016, 71.90214538574219, 74.46501159667969, 77.02787780761719, 79.59074401855469, 82.15361022949219, 84.71647644042969, 87.27934265136719, 89.84220886230469, 92.40507507324219, 94.96794891357422, 97.53081512451172, 100.09368133544922, 102.65654754638672, 105.21941375732422, 107.78227996826172, 110.34514617919922, 112.90802001953125, 115.47088623046875, 118.03375244140625, 120.59661865234375, 123.15948486328125]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [4.0, 4.0, 3.0, 7.0, 7.0, 5.0, 5.0, 5.0, 10.0, 6.0, 8.0, 8.0, 14.0, 15.0, 17.0, 20.0, 29.0, 27.0, 28.0, 33.0, 29.0, 26.0, 23.0, 25.0, 32.0, 35.0, 50.0, 31.0, 37.0, 43.0, 46.0, 39.0, 32.0, 33.0, 32.0, 31.0, 30.0, 15.0, 24.0, 16.0, 15.0, 15.0, 20.0, 18.0, 8.0, 18.0, 10.0, 6.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.103111267089844, -15.531569480895996, -14.960027694702148, -14.388484954833984, -13.816943168640137, -13.245401382446289, -12.673858642578125, -12.102316856384277, -11.53077507019043, -10.959233283996582, -10.387691497802734, -9.81614875793457, -9.244606971740723, -8.673065185546875, -8.101522445678711, -7.529980659484863, -6.958438873291016, -6.386897087097168, -5.815354824066162, -5.243812561035156, -4.672270774841309, -4.100728988647461, -3.529186725616455, -2.957644462585449, -2.3861026763916016, -1.8145606517791748, -1.243018627166748, -0.6714766025543213, -0.09993457794189453, 0.4716074466705322, 1.043149471282959, 1.6146917343139648, 2.1862335205078125, 2.7577755451202393, 3.329317569732666, 3.9008595943450928, 4.4724016189575195, 5.043943405151367, 5.615485668182373, 6.187027931213379, 6.758569717407227, 7.330111503601074, 7.90165376663208, 8.473196029663086, 9.044737815856934, 9.616279602050781, 10.187822341918945, 10.759364128112793, 11.33090591430664, 11.902447700500488, 12.473989486694336, 13.0455322265625, 13.617074012756348, 14.188615798950195, 14.76015853881836, 15.331700325012207, 15.903242111206055, 16.47478485107422, 17.04632568359375, 17.617868423461914, 18.189411163330078, 18.76095199584961, 19.332494735717773, 19.904037475585938, 20.47557830810547]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 8.0, 9.0, 3.0, 7.0, 8.0, 14.0, 13.0, 18.0, 22.0, 16.0, 22.0, 29.0, 24.0, 35.0, 36.0, 32.0, 40.0, 28.0, 33.0, 47.0, 42.0, 31.0, 44.0, 43.0, 36.0, 45.0, 34.0, 36.0, 22.0, 31.0, 20.0, 15.0, 16.0, 21.0, 18.0, 17.0, 18.0, 18.0, 10.0, 13.0, 6.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.625, -2.539154052734375, -2.45330810546875, -2.367462158203125, -2.2816162109375, -2.195770263671875, -2.10992431640625, -2.024078369140625, -1.938232421875, -1.852386474609375, -1.76654052734375, -1.680694580078125, -1.5948486328125, -1.509002685546875, -1.42315673828125, -1.337310791015625, -1.25146484375, -1.165618896484375, -1.07977294921875, -0.993927001953125, -0.9080810546875, -0.822235107421875, -0.73638916015625, -0.650543212890625, -0.564697265625, -0.478851318359375, -0.39300537109375, -0.307159423828125, -0.2213134765625, -0.135467529296875, -0.04962158203125, 0.036224365234375, 0.1220703125, 0.207916259765625, 0.29376220703125, 0.379608154296875, 0.4654541015625, 0.551300048828125, 0.63714599609375, 0.722991943359375, 0.808837890625, 0.894683837890625, 0.98052978515625, 1.066375732421875, 1.1522216796875, 1.238067626953125, 1.32391357421875, 1.409759521484375, 1.49560546875, 1.581451416015625, 1.66729736328125, 1.753143310546875, 1.8389892578125, 1.924835205078125, 2.01068115234375, 2.096527099609375, 2.182373046875, 2.268218994140625, 2.35406494140625, 2.439910888671875, 2.5257568359375, 2.611602783203125, 2.69744873046875, 2.783294677734375, 2.869140625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 8.0, 15.0, 24.0, 30.0, 49.0, 69.0, 99.0, 180.0, 295.0, 480.0, 833.0, 1355.0, 2510.0, 4313.0, 7969.0, 14938.0, 29643.0, 62531.0, 150434.0, 416343.0, 202359.0, 78497.0, 35915.0, 18064.0, 9536.0, 5136.0, 2914.0, 1585.0, 946.0, 573.0, 352.0, 200.0, 106.0, 92.0, 49.0, 34.0, 30.0, 13.0, 11.0, 7.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20947265625, -0.2028522491455078, -0.19623184204101562, -0.18961143493652344, -0.18299102783203125, -0.17637062072753906, -0.16975021362304688, -0.1631298065185547, -0.1565093994140625, -0.1498889923095703, -0.14326858520507812, -0.13664817810058594, -0.13002777099609375, -0.12340736389160156, -0.11678695678710938, -0.11016654968261719, -0.103546142578125, -0.09692573547363281, -0.09030532836914062, -0.08368492126464844, -0.07706451416015625, -0.07044410705566406, -0.06382369995117188, -0.05720329284667969, -0.0505828857421875, -0.04396247863769531, -0.037342071533203125, -0.030721664428710938, -0.02410125732421875, -0.017480850219726562, -0.010860443115234375, -0.0042400360107421875, 0.00238037109375, 0.009000778198242188, 0.015621185302734375, 0.022241592407226562, 0.02886199951171875, 0.03548240661621094, 0.042102813720703125, 0.04872322082519531, 0.0553436279296875, 0.06196403503417969, 0.06858444213867188, 0.07520484924316406, 0.08182525634765625, 0.08844566345214844, 0.09506607055664062, 0.10168647766113281, 0.108306884765625, 0.11492729187011719, 0.12154769897460938, 0.12816810607910156, 0.13478851318359375, 0.14140892028808594, 0.14802932739257812, 0.1546497344970703, 0.1612701416015625, 0.1678905487060547, 0.17451095581054688, 0.18113136291503906, 0.18775177001953125, 0.19437217712402344, 0.20099258422851562, 0.2076129913330078, 0.2142333984375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 7.0, 3.0, 11.0, 13.0, 10.0, 25.0, 8.0, 19.0, 17.0, 27.0, 20.0, 29.0, 33.0, 29.0, 38.0, 43.0, 50.0, 42.0, 32.0, 1071.0, 57.0, 37.0, 38.0, 36.0, 40.0, 35.0, 29.0, 31.0, 29.0, 21.0, 31.0, 10.0, 19.0, 19.0, 14.0, 12.0, 4.0, 17.0, 3.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.130859375, -2.067626953125, -2.00439453125, -1.941162109375, -1.8779296875, -1.814697265625, -1.75146484375, -1.688232421875, -1.625, -1.561767578125, -1.49853515625, -1.435302734375, -1.3720703125, -1.308837890625, -1.24560546875, -1.182373046875, -1.119140625, -1.055908203125, -0.99267578125, -0.929443359375, -0.8662109375, -0.802978515625, -0.73974609375, -0.676513671875, -0.61328125, -0.550048828125, -0.48681640625, -0.423583984375, -0.3603515625, -0.297119140625, -0.23388671875, -0.170654296875, -0.107421875, -0.044189453125, 0.01904296875, 0.082275390625, 0.1455078125, 0.208740234375, 0.27197265625, 0.335205078125, 0.3984375, 0.461669921875, 0.52490234375, 0.588134765625, 0.6513671875, 0.714599609375, 0.77783203125, 0.841064453125, 0.904296875, 0.967529296875, 1.03076171875, 1.093994140625, 1.1572265625, 1.220458984375, 1.28369140625, 1.346923828125, 1.41015625, 1.473388671875, 1.53662109375, 1.599853515625, 1.6630859375, 1.726318359375, 1.78955078125, 1.852783203125, 1.916015625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 14.0, 15.0, 16.0, 33.0, 47.0, 66.0, 101.0, 165.0, 263.0, 405.0, 718.0, 1082.0, 1880.0, 3030.0, 5262.0, 8851.0, 15469.0, 28340.0, 53155.0, 104887.0, 237256.0, 1358716.0, 133324.0, 65002.0, 34295.0, 18931.0, 10533.0, 6078.0, 3663.0, 2079.0, 1320.0, 798.0, 479.0, 302.0, 161.0, 151.0, 86.0, 54.0, 35.0, 19.0, 17.0, 18.0, 8.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063232421875, -0.0612030029296875, -0.059173583984375, -0.0571441650390625, -0.05511474609375, -0.0530853271484375, -0.051055908203125, -0.0490264892578125, -0.0469970703125, -0.0449676513671875, -0.042938232421875, -0.0409088134765625, -0.03887939453125, -0.0368499755859375, -0.034820556640625, -0.0327911376953125, -0.03076171875, -0.0287322998046875, -0.026702880859375, -0.0246734619140625, -0.02264404296875, -0.0206146240234375, -0.018585205078125, -0.0165557861328125, -0.0145263671875, -0.0124969482421875, -0.010467529296875, -0.0084381103515625, -0.00640869140625, -0.0043792724609375, -0.002349853515625, -0.0003204345703125, 0.001708984375, 0.0037384033203125, 0.005767822265625, 0.0077972412109375, 0.00982666015625, 0.0118560791015625, 0.013885498046875, 0.0159149169921875, 0.0179443359375, 0.0199737548828125, 0.022003173828125, 0.0240325927734375, 0.02606201171875, 0.0280914306640625, 0.030120849609375, 0.0321502685546875, 0.0341796875, 0.0362091064453125, 0.038238525390625, 0.0402679443359375, 0.04229736328125, 0.0443267822265625, 0.046356201171875, 0.0483856201171875, 0.0504150390625, 0.0524444580078125, 0.054473876953125, 0.0565032958984375, 0.05853271484375, 0.0605621337890625, 0.062591552734375, 0.0646209716796875, 0.066650390625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 3.0, 8.0, 5.0, 3.0, 6.0, 10.0, 6.0, 14.0, 22.0, 29.0, 44.0, 50.0, 55.0, 99.0, 117.0, 134.0, 91.0, 86.0, 73.0, 43.0, 40.0, 14.0, 16.0, 12.0, 7.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3066997528076172e-05, -2.242904156446457e-05, -2.1791085600852966e-05, -2.1153129637241364e-05, -2.051517367362976e-05, -1.9877217710018158e-05, -1.9239261746406555e-05, -1.8601305782794952e-05, -1.796334981918335e-05, -1.7325393855571747e-05, -1.6687437891960144e-05, -1.604948192834854e-05, -1.541152596473694e-05, -1.4773570001125336e-05, -1.4135614037513733e-05, -1.349765807390213e-05, -1.2859702110290527e-05, -1.2221746146678925e-05, -1.1583790183067322e-05, -1.0945834219455719e-05, -1.0307878255844116e-05, -9.669922292232513e-06, -9.03196632862091e-06, -8.394010365009308e-06, -7.756054401397705e-06, -7.118098437786102e-06, -6.4801424741744995e-06, -5.842186510562897e-06, -5.204230546951294e-06, -4.566274583339691e-06, -3.928318619728088e-06, -3.2903626561164856e-06, -2.652406692504883e-06, -2.01445072889328e-06, -1.3764947652816772e-06, -7.385388016700745e-07, -1.0058283805847168e-07, 5.373731255531311e-07, 1.1753290891647339e-06, 1.8132850527763367e-06, 2.4512410163879395e-06, 3.0891969799995422e-06, 3.727152943611145e-06, 4.365108907222748e-06, 5.003064870834351e-06, 5.641020834445953e-06, 6.278976798057556e-06, 6.916932761669159e-06, 7.554888725280762e-06, 8.192844688892365e-06, 8.830800652503967e-06, 9.46875661611557e-06, 1.0106712579727173e-05, 1.0744668543338776e-05, 1.1382624506950378e-05, 1.2020580470561981e-05, 1.2658536434173584e-05, 1.3296492397785187e-05, 1.393444836139679e-05, 1.4572404325008392e-05, 1.5210360288619995e-05, 1.5848316252231598e-05, 1.64862722158432e-05, 1.7124228179454803e-05, 1.7762184143066406e-05]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 7.0, 7.0, 14.0, 8.0, 10.0, 29.0, 36.0, 43.0, 80.0, 125.0, 254.0, 678.0, 3376.0, 27527.0, 669193.0, 325245.0, 18331.0, 2487.0, 541.0, 222.0, 117.0, 51.0, 50.0, 24.0, 27.0, 10.0, 16.0, 17.0, 6.0, 3.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002856254577636719, -0.000275392085313797, -0.0002651587128639221, -0.00025492534041404724, -0.00024469196796417236, -0.00023445859551429749, -0.0002242252230644226, -0.00021399185061454773, -0.00020375847816467285, -0.00019352510571479797, -0.0001832917332649231, -0.00017305836081504822, -0.00016282498836517334, -0.00015259161591529846, -0.00014235824346542358, -0.0001321248710155487, -0.00012189149856567383, -0.00011165812611579895, -0.00010142475366592407, -9.11913812160492e-05, -8.095800876617432e-05, -7.072463631629944e-05, -6.049126386642456e-05, -5.025789141654968e-05, -4.0024518966674805e-05, -2.9791146516799927e-05, -1.955777406692505e-05, -9.324401617050171e-06, 9.08970832824707e-07, 1.1142343282699585e-05, 2.1375715732574463e-05, 3.160908818244934e-05, 4.184246063232422e-05, 5.20758330821991e-05, 6.230920553207397e-05, 7.254257798194885e-05, 8.277595043182373e-05, 9.300932288169861e-05, 0.00010324269533157349, 0.00011347606778144836, 0.00012370944023132324, 0.00013394281268119812, 0.000144176185131073, 0.00015440955758094788, 0.00016464293003082275, 0.00017487630248069763, 0.0001851096749305725, 0.0001953430473804474, 0.00020557641983032227, 0.00021580979228019714, 0.00022604316473007202, 0.0002362765371799469, 0.0002465099096298218, 0.00025674328207969666, 0.00026697665452957153, 0.0002772100269794464, 0.0002874433994293213, 0.00029767677187919617, 0.00030791014432907104, 0.0003181435167789459, 0.0003283768892288208, 0.0003386102616786957, 0.00034884363412857056, 0.00035907700657844543, 0.0003693103790283203]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 18.0, 130.0, 595.0, 226.0, 34.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.311251778854057e-05, -8.837796485750005e-05, -8.364341192645952e-05, -7.8908858995419e-05, -7.417431334033608e-05, -6.943976040929556e-05, -6.470520747825503e-05, -5.997065454721451e-05, -5.523610161617398e-05, -5.050154868513346e-05, -4.576699575409293e-05, -4.1032446461031213e-05, -3.629789352999069e-05, -3.156334059895016e-05, -2.682878948689904e-05, -2.209423837484792e-05, -1.7359685443807393e-05, -1.262513342226157e-05, -7.890581400715746e-06, -3.1560293791699223e-06, 1.5785226423759013e-06, 6.313075573416427e-06, 1.1047626685467549e-05, 1.578217779751867e-05, 2.0516730728559196e-05, 2.525128365959972e-05, 2.9985834771650843e-05, 3.4720385883701965e-05, 3.945493881474249e-05, 4.4189491745783016e-05, 4.8924041038844734e-05, 5.365859396988526e-05, 5.83931541768834e-05, 6.312770710792392e-05, 6.786226003896445e-05, 7.259681297000498e-05, 7.73313659010455e-05, 8.206591883208603e-05, 8.680046448716894e-05, 9.153501741820946e-05, 9.626957034924999e-05, 0.00010100412328029051, 0.00010573867621133104, 0.00011047322914237157, 0.00011520777479745448, 0.000119942327728495, 0.00012467688065953553, 0.00012941143359057605, 0.00013414598652161658, 0.0001388805394526571, 0.00014361509238369763, 0.00014834964531473815, 0.00015308419824577868, 0.0001578187511768192, 0.00016255330410785973, 0.00016728785703890026, 0.00017202240996994078, 0.0001767569629009813, 0.00018149151583202183, 0.00018622606876306236, 0.00019096062169410288, 0.0001956951746251434, 0.00020042972755618393, 0.00020516428048722446, 0.00020989881886634976]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 10.0, 6.0, 11.0, 20.0, 10.0, 30.0, 16.0, 21.0, 26.0, 43.0, 35.0, 37.0, 33.0, 39.0, 45.0, 38.0, 44.0, 48.0, 69.0, 44.0, 43.0, 40.0, 31.0, 31.0, 32.0, 25.0, 31.0, 30.0, 22.0, 17.0, 18.0, 9.0, 12.0, 8.0, 10.0, 8.0, 6.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.556510925292969e-06, -6.311573088169098e-06, -6.066635251045227e-06, -5.821697413921356e-06, -5.576759576797485e-06, -5.3318217396736145e-06, -5.086883902549744e-06, -4.841946065425873e-06, -4.597008228302002e-06, -4.352070391178131e-06, -4.10713255405426e-06, -3.862194716930389e-06, -3.6172568798065186e-06, -3.3723190426826477e-06, -3.127381205558777e-06, -2.882443368434906e-06, -2.637505531311035e-06, -2.3925676941871643e-06, -2.1476298570632935e-06, -1.9026920199394226e-06, -1.6577541828155518e-06, -1.412816345691681e-06, -1.16787850856781e-06, -9.229406714439392e-07, -6.780028343200684e-07, -4.330649971961975e-07, -1.8812716007232666e-07, 5.681067705154419e-08, 3.0174851417541504e-07, 5.466863512992859e-07, 7.916241884231567e-07, 1.0365620255470276e-06, 1.2814998626708984e-06, 1.5264376997947693e-06, 1.7713755369186401e-06, 2.016313374042511e-06, 2.261251211166382e-06, 2.5061890482902527e-06, 2.7511268854141235e-06, 2.9960647225379944e-06, 3.2410025596618652e-06, 3.485940396785736e-06, 3.730878233909607e-06, 3.975816071033478e-06, 4.220753908157349e-06, 4.4656917452812195e-06, 4.71062958240509e-06, 4.955567419528961e-06, 5.200505256652832e-06, 5.445443093776703e-06, 5.690380930900574e-06, 5.935318768024445e-06, 6.1802566051483154e-06, 6.425194442272186e-06, 6.670132279396057e-06, 6.915070116519928e-06, 7.160007953643799e-06, 7.40494579076767e-06, 7.64988362789154e-06, 7.894821465015411e-06, 8.139759302139282e-06, 8.384697139263153e-06, 8.629634976387024e-06, 8.874572813510895e-06, 9.119510650634766e-06]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 8.0, 9.0, 3.0, 7.0, 8.0, 14.0, 13.0, 18.0, 22.0, 16.0, 22.0, 29.0, 24.0, 35.0, 36.0, 32.0, 40.0, 28.0, 33.0, 47.0, 42.0, 31.0, 44.0, 43.0, 36.0, 45.0, 34.0, 36.0, 22.0, 31.0, 20.0, 15.0, 16.0, 21.0, 18.0, 17.0, 18.0, 18.0, 10.0, 13.0, 6.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.625, -2.539154052734375, -2.45330810546875, -2.367462158203125, -2.2816162109375, -2.195770263671875, -2.10992431640625, -2.024078369140625, -1.938232421875, -1.852386474609375, -1.76654052734375, -1.680694580078125, -1.5948486328125, -1.509002685546875, -1.42315673828125, -1.337310791015625, -1.25146484375, -1.165618896484375, -1.07977294921875, -0.993927001953125, -0.9080810546875, -0.822235107421875, -0.73638916015625, -0.650543212890625, -0.564697265625, -0.478851318359375, -0.39300537109375, -0.307159423828125, -0.2213134765625, -0.135467529296875, -0.04962158203125, 0.036224365234375, 0.1220703125, 0.207916259765625, 0.29376220703125, 0.379608154296875, 0.4654541015625, 0.551300048828125, 0.63714599609375, 0.722991943359375, 0.808837890625, 0.894683837890625, 0.98052978515625, 1.066375732421875, 1.1522216796875, 1.238067626953125, 1.32391357421875, 1.409759521484375, 1.49560546875, 1.581451416015625, 1.66729736328125, 1.753143310546875, 1.8389892578125, 1.924835205078125, 2.01068115234375, 2.096527099609375, 2.182373046875, 2.268218994140625, 2.35406494140625, 2.439910888671875, 2.5257568359375, 2.611602783203125, 2.69744873046875, 2.783294677734375, 2.869140625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 10.0, 10.0, 22.0, 45.0, 81.0, 147.0, 270.0, 507.0, 1025.0, 2178.0, 4584.0, 9499.0, 21067.0, 53720.0, 188220.0, 526028.0, 157992.0, 47163.0, 19174.0, 8722.0, 4152.0, 1993.0, 942.0, 493.0, 251.0, 111.0, 60.0, 34.0, 18.0, 20.0, 8.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.882568359375, -4.72216796875, -4.561767578125, -4.4013671875, -4.240966796875, -4.08056640625, -3.920166015625, -3.759765625, -3.599365234375, -3.43896484375, -3.278564453125, -3.1181640625, -2.957763671875, -2.79736328125, -2.636962890625, -2.4765625, -2.316162109375, -2.15576171875, -1.995361328125, -1.8349609375, -1.674560546875, -1.51416015625, -1.353759765625, -1.193359375, -1.032958984375, -0.87255859375, -0.712158203125, -0.5517578125, -0.391357421875, -0.23095703125, -0.070556640625, 0.08984375, 0.250244140625, 0.41064453125, 0.571044921875, 0.7314453125, 0.891845703125, 1.05224609375, 1.212646484375, 1.373046875, 1.533447265625, 1.69384765625, 1.854248046875, 2.0146484375, 2.175048828125, 2.33544921875, 2.495849609375, 2.65625, 2.816650390625, 2.97705078125, 3.137451171875, 3.2978515625, 3.458251953125, 3.61865234375, 3.779052734375, 3.939453125, 4.099853515625, 4.26025390625, 4.420654296875, 4.5810546875, 4.741455078125, 4.90185546875, 5.062255859375, 5.22265625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 11.0, 6.0, 8.0, 16.0, 20.0, 13.0, 24.0, 23.0, 19.0, 30.0, 26.0, 37.0, 44.0, 46.0, 80.0, 98.0, 150.0, 355.0, 1398.0, 167.0, 87.0, 65.0, 51.0, 41.0, 28.0, 30.0, 28.0, 33.0, 18.0, 12.0, 17.0, 17.0, 6.0, 16.0, 8.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.2265625, -10.906005859375, -10.58544921875, -10.264892578125, -9.9443359375, -9.623779296875, -9.30322265625, -8.982666015625, -8.662109375, -8.341552734375, -8.02099609375, -7.700439453125, -7.3798828125, -7.059326171875, -6.73876953125, -6.418212890625, -6.09765625, -5.777099609375, -5.45654296875, -5.135986328125, -4.8154296875, -4.494873046875, -4.17431640625, -3.853759765625, -3.533203125, -3.212646484375, -2.89208984375, -2.571533203125, -2.2509765625, -1.930419921875, -1.60986328125, -1.289306640625, -0.96875, -0.648193359375, -0.32763671875, -0.007080078125, 0.3134765625, 0.634033203125, 0.95458984375, 1.275146484375, 1.595703125, 1.916259765625, 2.23681640625, 2.557373046875, 2.8779296875, 3.198486328125, 3.51904296875, 3.839599609375, 4.16015625, 4.480712890625, 4.80126953125, 5.121826171875, 5.4423828125, 5.762939453125, 6.08349609375, 6.404052734375, 6.724609375, 7.045166015625, 7.36572265625, 7.686279296875, 8.0068359375, 8.327392578125, 8.64794921875, 8.968505859375, 9.2890625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 8.0, 4.0, 15.0, 12.0, 20.0, 20.0, 35.0, 39.0, 37.0, 57.0, 87.0, 112.0, 114.0, 135.0, 219.0, 275.0, 679.0, 3301.0, 35038.0, 2317201.0, 766149.0, 18279.0, 2171.0, 555.0, 287.0, 175.0, 143.0, 117.0, 82.0, 63.0, 55.0, 46.0, 38.0, 37.0, 25.0, 21.0, 17.0, 12.0, 8.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.8359375, -15.3060302734375, -14.776123046875, -14.2462158203125, -13.71630859375, -13.1864013671875, -12.656494140625, -12.1265869140625, -11.5966796875, -11.0667724609375, -10.536865234375, -10.0069580078125, -9.47705078125, -8.9471435546875, -8.417236328125, -7.8873291015625, -7.357421875, -6.8275146484375, -6.297607421875, -5.7677001953125, -5.23779296875, -4.7078857421875, -4.177978515625, -3.6480712890625, -3.1181640625, -2.5882568359375, -2.058349609375, -1.5284423828125, -0.99853515625, -0.4686279296875, 0.061279296875, 0.5911865234375, 1.12109375, 1.6510009765625, 2.180908203125, 2.7108154296875, 3.24072265625, 3.7706298828125, 4.300537109375, 4.8304443359375, 5.3603515625, 5.8902587890625, 6.420166015625, 6.9500732421875, 7.47998046875, 8.0098876953125, 8.539794921875, 9.0697021484375, 9.599609375, 10.1295166015625, 10.659423828125, 11.1893310546875, 11.71923828125, 12.2491455078125, 12.779052734375, 13.3089599609375, 13.8388671875, 14.3687744140625, 14.898681640625, 15.4285888671875, 15.95849609375, 16.4884033203125, 17.018310546875, 17.5482177734375, 18.078125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 9.0, 10.0, 30.0, 41.0, 62.0, 94.0, 104.0, 134.0, 132.0, 120.0, 112.0, 65.0, 40.0, 18.0, 14.0, 10.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.063336372375488, -9.390031814575195, -8.716727256774902, -8.04342269897461, -7.370118618011475, -6.696814060211182, -6.023509979248047, -5.350205421447754, -4.676900863647461, -4.003596305847168, -3.330291986465454, -2.6569876670837402, -1.9836831092834473, -1.3103785514831543, -0.6370744705200195, 0.03623008728027344, 0.7095346450805664, 1.3828390836715698, 2.0561435222625732, 2.729447841644287, 3.40275239944458, 4.076056957244873, 4.749361038208008, 5.422665596008301, 6.095970153808594, 6.769274711608887, 7.44257926940918, 8.115882873535156, 8.789188385009766, 9.462491989135742, 10.135796546936035, 10.809101104736328, 11.482406616210938, 12.15571117401123, 12.829015731811523, 13.5023193359375, 14.17562484741211, 14.848928451538086, 15.522233009338379, 16.195537567138672, 16.86884307861328, 17.542146682739258, 18.215452194213867, 18.888755798339844, 19.562061309814453, 20.23536491394043, 20.908668518066406, 21.581974029541016, 22.255277633666992, 22.92858123779297, 23.601886749267578, 24.275190353393555, 24.948495864868164, 25.62179946899414, 26.29510498046875, 26.968408584594727, 27.641712188720703, 28.31501579284668, 28.98832130432129, 29.661624908447266, 30.334930419921875, 31.00823402404785, 31.681537628173828, 32.35484313964844, 33.02814865112305]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 5.0, 4.0, 6.0, 4.0, 7.0, 12.0, 12.0, 13.0, 17.0, 21.0, 29.0, 18.0, 27.0, 21.0, 30.0, 26.0, 28.0, 26.0, 35.0, 38.0, 42.0, 40.0, 27.0, 28.0, 26.0, 41.0, 38.0, 30.0, 43.0, 27.0, 39.0, 33.0, 34.0, 19.0, 22.0, 28.0, 16.0, 15.0, 12.0, 16.0, 8.0, 7.0, 6.0, 8.0, 8.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.034652709960938, -23.262086868286133, -22.489521026611328, -21.716957092285156, -20.94439125061035, -20.171825408935547, -19.399259567260742, -18.626693725585938, -17.854127883911133, -17.081562042236328, -16.308996200561523, -15.536431312561035, -14.76386547088623, -13.991300582885742, -13.218734741210938, -12.446168899536133, -11.673604011535645, -10.90103816986084, -10.128473281860352, -9.355907440185547, -8.583341598510742, -7.810776233673096, -7.038210868835449, -6.2656450271606445, -5.493079662322998, -4.720514297485352, -3.947948455810547, -3.1753830909729004, -2.402817487716675, -1.6302518844604492, -0.8576865196228027, -0.08512067794799805, 0.6874446868896484, 1.460010290145874, 2.2325758934020996, 3.005141258239746, 3.7777068614959717, 4.550272464752197, 5.322837829589844, 6.095403671264648, 6.867969036102295, 7.640534400939941, 8.413100242614746, 9.185665130615234, 9.958230972290039, 10.730796813964844, 11.503362655639648, 12.275928497314453, 13.048493385314941, 13.821059226989746, 14.593624114990234, 15.366189956665039, 16.138755798339844, 16.91132164001465, 17.683887481689453, 18.456451416015625, 19.22901725769043, 20.001583099365234, 20.77414894104004, 21.546714782714844, 22.319278717041016, 23.09184455871582, 23.864410400390625, 24.63697624206543, 25.409542083740234]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 10.0, 5.0, 4.0, 7.0, 13.0, 5.0, 12.0, 12.0, 15.0, 16.0, 18.0, 29.0, 29.0, 23.0, 35.0, 29.0, 33.0, 46.0, 31.0, 40.0, 38.0, 34.0, 30.0, 37.0, 56.0, 44.0, 32.0, 38.0, 32.0, 25.0, 25.0, 22.0, 24.0, 17.0, 19.0, 12.0, 18.0, 18.0, 20.0, 8.0, 14.0, 6.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0], "bins": [-2.80078125, -2.711944580078125, -2.62310791015625, -2.534271240234375, -2.4454345703125, -2.356597900390625, -2.26776123046875, -2.178924560546875, -2.090087890625, -2.001251220703125, -1.91241455078125, -1.823577880859375, -1.7347412109375, -1.645904541015625, -1.55706787109375, -1.468231201171875, -1.37939453125, -1.290557861328125, -1.20172119140625, -1.112884521484375, -1.0240478515625, -0.935211181640625, -0.84637451171875, -0.757537841796875, -0.668701171875, -0.579864501953125, -0.49102783203125, -0.402191162109375, -0.3133544921875, -0.224517822265625, -0.13568115234375, -0.046844482421875, 0.0419921875, 0.130828857421875, 0.21966552734375, 0.308502197265625, 0.3973388671875, 0.486175537109375, 0.57501220703125, 0.663848876953125, 0.752685546875, 0.841522216796875, 0.93035888671875, 1.019195556640625, 1.1080322265625, 1.196868896484375, 1.28570556640625, 1.374542236328125, 1.46337890625, 1.552215576171875, 1.64105224609375, 1.729888916015625, 1.8187255859375, 1.907562255859375, 1.99639892578125, 2.085235595703125, 2.174072265625, 2.262908935546875, 2.35174560546875, 2.440582275390625, 2.5294189453125, 2.618255615234375, 2.70709228515625, 2.795928955078125, 2.884765625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 5.0, 10.0, 16.0, 15.0, 32.0, 28.0, 54.0, 99.0, 170.0, 272.0, 481.0, 1012.0, 2274.0, 5187.0, 13666.0, 41609.0, 158472.0, 778974.0, 2113867.0, 841980.0, 168126.0, 43532.0, 14268.0, 5377.0, 2379.0, 1118.0, 489.0, 314.0, 151.0, 94.0, 66.0, 37.0, 31.0, 25.0, 9.0, 13.0, 5.0, 3.0, 8.0, 0.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8125, -5.6220703125, -5.431640625, -5.2412109375, -5.05078125, -4.8603515625, -4.669921875, -4.4794921875, -4.2890625, -4.0986328125, -3.908203125, -3.7177734375, -3.52734375, -3.3369140625, -3.146484375, -2.9560546875, -2.765625, -2.5751953125, -2.384765625, -2.1943359375, -2.00390625, -1.8134765625, -1.623046875, -1.4326171875, -1.2421875, -1.0517578125, -0.861328125, -0.6708984375, -0.48046875, -0.2900390625, -0.099609375, 0.0908203125, 0.28125, 0.4716796875, 0.662109375, 0.8525390625, 1.04296875, 1.2333984375, 1.423828125, 1.6142578125, 1.8046875, 1.9951171875, 2.185546875, 2.3759765625, 2.56640625, 2.7568359375, 2.947265625, 3.1376953125, 3.328125, 3.5185546875, 3.708984375, 3.8994140625, 4.08984375, 4.2802734375, 4.470703125, 4.6611328125, 4.8515625, 5.0419921875, 5.232421875, 5.4228515625, 5.61328125, 5.8037109375, 5.994140625, 6.1845703125, 6.375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 14.0, 9.0, 17.0, 31.0, 39.0, 63.0, 91.0, 115.0, 154.0, 208.0, 291.0, 371.0, 483.0, 491.0, 429.0, 320.0, 277.0, 204.0, 152.0, 93.0, 63.0, 60.0, 40.0, 21.0, 12.0, 5.0, 7.0, 2.0, 6.0, 1.0, 2.0, 2.0], "bins": [-10.5078125, -10.2750244140625, -10.042236328125, -9.8094482421875, -9.57666015625, -9.3438720703125, -9.111083984375, -8.8782958984375, -8.6455078125, -8.4127197265625, -8.179931640625, -7.9471435546875, -7.71435546875, -7.4815673828125, -7.248779296875, -7.0159912109375, -6.783203125, -6.5504150390625, -6.317626953125, -6.0848388671875, -5.85205078125, -5.6192626953125, -5.386474609375, -5.1536865234375, -4.9208984375, -4.6881103515625, -4.455322265625, -4.2225341796875, -3.98974609375, -3.7569580078125, -3.524169921875, -3.2913818359375, -3.05859375, -2.8258056640625, -2.593017578125, -2.3602294921875, -2.12744140625, -1.8946533203125, -1.661865234375, -1.4290771484375, -1.1962890625, -0.9635009765625, -0.730712890625, -0.4979248046875, -0.26513671875, -0.0323486328125, 0.200439453125, 0.4332275390625, 0.666015625, 0.8988037109375, 1.131591796875, 1.3643798828125, 1.59716796875, 1.8299560546875, 2.062744140625, 2.2955322265625, 2.5283203125, 2.7611083984375, 2.993896484375, 3.2266845703125, 3.45947265625, 3.6922607421875, 3.925048828125, 4.1578369140625, 4.390625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 1.0, 6.0, 11.0, 16.0, 37.0, 54.0, 79.0, 109.0, 216.0, 343.0, 642.0, 2403.0, 39486.0, 2832083.0, 1297379.0, 18593.0, 1526.0, 533.0, 291.0, 170.0, 109.0, 87.0, 42.0, 26.0, 11.0, 10.0, 7.0, 4.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6171875, -13.8004150390625, -12.983642578125, -12.1668701171875, -11.35009765625, -10.5333251953125, -9.716552734375, -8.8997802734375, -8.0830078125, -7.2662353515625, -6.449462890625, -5.6326904296875, -4.81591796875, -3.9991455078125, -3.182373046875, -2.3656005859375, -1.548828125, -0.7320556640625, 0.084716796875, 0.9014892578125, 1.71826171875, 2.5350341796875, 3.351806640625, 4.1685791015625, 4.9853515625, 5.8021240234375, 6.618896484375, 7.4356689453125, 8.25244140625, 9.0692138671875, 9.885986328125, 10.7027587890625, 11.51953125, 12.3363037109375, 13.153076171875, 13.9698486328125, 14.78662109375, 15.6033935546875, 16.420166015625, 17.2369384765625, 18.0537109375, 18.8704833984375, 19.687255859375, 20.5040283203125, 21.32080078125, 22.1375732421875, 22.954345703125, 23.7711181640625, 24.587890625, 25.4046630859375, 26.221435546875, 27.0382080078125, 27.85498046875, 28.6717529296875, 29.488525390625, 30.3052978515625, 31.1220703125, 31.9388427734375, 32.755615234375, 33.5723876953125, 34.38916015625, 35.2059326171875, 36.022705078125, 36.8394775390625, 37.65625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 9.0, 11.0, 24.0, 29.0, 49.0, 45.0, 70.0, 72.0, 101.0, 83.0, 95.0, 103.0, 92.0, 63.0, 51.0, 36.0, 24.0, 14.0, 16.0, 10.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.161117553710938, -25.144216537475586, -24.127315521240234, -23.110414505004883, -22.09351348876953, -21.076610565185547, -20.059709548950195, -19.042808532714844, -18.025907516479492, -17.00900650024414, -15.992105484008789, -14.975203514099121, -13.95830249786377, -12.941401481628418, -11.92449951171875, -10.907598495483398, -9.890697479248047, -8.873796463012695, -7.8568949699401855, -6.839993476867676, -5.823092460632324, -4.806191444396973, -3.789289951324463, -2.772388458251953, -1.7554874420166016, -0.7385861873626709, 0.27831506729125977, 1.2952163219451904, 2.312117576599121, 3.3290185928344727, 4.345920085906982, 5.362821578979492, 6.379718780517578, 7.39661979675293, 8.413520812988281, 9.43042278289795, 10.4473237991333, 11.464224815368652, 12.48112678527832, 13.498027801513672, 14.514928817749023, 15.531829833984375, 16.548730850219727, 17.565631866455078, 18.582534790039062, 19.59943389892578, 20.616336822509766, 21.633237838745117, 22.65013885498047, 23.66703987121582, 24.683940887451172, 25.700841903686523, 26.717742919921875, 27.73464584350586, 28.75154685974121, 29.768447875976562, 30.785348892211914, 31.802249908447266, 32.81915283203125, 33.83605194091797, 34.85295486450195, 35.86985397338867, 36.886756896972656, 37.903656005859375, 38.92055892944336]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 4.0, 5.0, 10.0, 4.0, 15.0, 12.0, 21.0, 8.0, 13.0, 20.0, 19.0, 25.0, 35.0, 25.0, 27.0, 22.0, 31.0, 40.0, 45.0, 44.0, 43.0, 38.0, 36.0, 46.0, 37.0, 29.0, 36.0, 27.0, 39.0, 26.0, 19.0, 25.0, 14.0, 24.0, 19.0, 10.0, 11.0, 14.0, 19.0, 8.0, 7.0, 3.0, 13.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0], "bins": [-19.3941650390625, -18.805688858032227, -18.217212677001953, -17.62873649597168, -17.040260314941406, -16.4517822265625, -15.863306045532227, -15.274829864501953, -14.68635368347168, -14.097877502441406, -13.509401321411133, -12.920924186706543, -12.33244800567627, -11.743971824645996, -11.155494689941406, -10.567018508911133, -9.97854232788086, -9.390066146850586, -8.801589965820312, -8.213112831115723, -7.624636650085449, -7.036160469055176, -6.447683811187744, -5.8592071533203125, -5.270730972290039, -4.682254791259766, -4.093778133392334, -3.5053017139434814, -2.916825294494629, -2.3283488750457764, -1.7398724555969238, -1.1513957977294922, -0.5629196166992188, 0.02555680274963379, 0.6140332221984863, 1.2025096416473389, 1.7909860610961914, 2.379462480545044, 2.9679388999938965, 3.556415557861328, 4.144891738891602, 4.733367919921875, 5.321844577789307, 5.910321235656738, 6.498797416687012, 7.087273597717285, 7.675750255584717, 8.264226913452148, 8.852703094482422, 9.441179275512695, 10.029655456542969, 10.618132591247559, 11.206608772277832, 11.795084953308105, 12.383562088012695, 12.972038269042969, 13.560514450073242, 14.148990631103516, 14.737466812133789, 15.325943946838379, 15.914420127868652, 16.502897262573242, 17.091373443603516, 17.67984962463379, 18.268325805664062]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 7.0, 11.0, 6.0, 12.0, 11.0, 10.0, 14.0, 20.0, 22.0, 20.0, 20.0, 29.0, 33.0, 37.0, 43.0, 41.0, 41.0, 34.0, 40.0, 41.0, 46.0, 45.0, 37.0, 39.0, 47.0, 31.0, 29.0, 26.0, 31.0, 17.0, 27.0, 29.0, 16.0, 15.0, 12.0, 14.0, 15.0, 5.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.177734375, -3.08203125, -2.986328125, -2.890625, -2.794921875, -2.69921875, -2.603515625, -2.5078125, -2.412109375, -2.31640625, -2.220703125, -2.125, -2.029296875, -1.93359375, -1.837890625, -1.7421875, -1.646484375, -1.55078125, -1.455078125, -1.359375, -1.263671875, -1.16796875, -1.072265625, -0.9765625, -0.880859375, -0.78515625, -0.689453125, -0.59375, -0.498046875, -0.40234375, -0.306640625, -0.2109375, -0.115234375, -0.01953125, 0.076171875, 0.171875, 0.267578125, 0.36328125, 0.458984375, 0.5546875, 0.650390625, 0.74609375, 0.841796875, 0.9375, 1.033203125, 1.12890625, 1.224609375, 1.3203125, 1.416015625, 1.51171875, 1.607421875, 1.703125, 1.798828125, 1.89453125, 1.990234375, 2.0859375, 2.181640625, 2.27734375, 2.373046875, 2.46875, 2.564453125, 2.66015625, 2.755859375, 2.8515625, 2.947265625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 4.0, 8.0, 8.0, 6.0, 11.0, 20.0, 36.0, 56.0, 84.0, 106.0, 178.0, 279.0, 459.0, 649.0, 1060.0, 1686.0, 2738.0, 4327.0, 7118.0, 11484.0, 19564.0, 33583.0, 60226.0, 121755.0, 323471.0, 239571.0, 97877.0, 50652.0, 28387.0, 16730.0, 9971.0, 6218.0, 3724.0, 2378.0, 1497.0, 914.0, 603.0, 379.0, 243.0, 177.0, 98.0, 79.0, 40.0, 28.0, 30.0, 11.0, 9.0, 11.0, 5.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 4.0], "bins": [-0.1710205078125, -0.1658153533935547, -0.16061019897460938, -0.15540504455566406, -0.15019989013671875, -0.14499473571777344, -0.13978958129882812, -0.1345844268798828, -0.1293792724609375, -0.12417411804199219, -0.11896896362304688, -0.11376380920410156, -0.10855865478515625, -0.10335350036621094, -0.09814834594726562, -0.09294319152832031, -0.087738037109375, -0.08253288269042969, -0.07732772827148438, -0.07212257385253906, -0.06691741943359375, -0.06171226501464844, -0.056507110595703125, -0.05130195617675781, -0.0460968017578125, -0.04089164733886719, -0.035686492919921875, -0.030481338500976562, -0.02527618408203125, -0.020071029663085938, -0.014865875244140625, -0.009660720825195312, -0.00445556640625, 0.0007495880126953125, 0.005954742431640625, 0.011159896850585938, 0.01636505126953125, 0.021570205688476562, 0.026775360107421875, 0.03198051452636719, 0.0371856689453125, 0.04239082336425781, 0.047595977783203125, 0.05280113220214844, 0.05800628662109375, 0.06321144104003906, 0.06841659545898438, 0.07362174987792969, 0.078826904296875, 0.08403205871582031, 0.08923721313476562, 0.09444236755371094, 0.09964752197265625, 0.10485267639160156, 0.11005783081054688, 0.11526298522949219, 0.1204681396484375, 0.1256732940673828, 0.13087844848632812, 0.13608360290527344, 0.14128875732421875, 0.14649391174316406, 0.15169906616210938, 0.1569042205810547, 0.162109375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 2.0, 10.0, 8.0, 14.0, 13.0, 9.0, 20.0, 15.0, 20.0, 30.0, 35.0, 21.0, 53.0, 22.0, 37.0, 47.0, 43.0, 49.0, 1075.0, 48.0, 44.0, 39.0, 26.0, 31.0, 40.0, 38.0, 34.0, 28.0, 30.0, 23.0, 29.0, 17.0, 16.0, 7.0, 6.0, 6.0, 7.0, 6.0, 1.0, 7.0, 7.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.20703125, -2.140106201171875, -2.07318115234375, -2.006256103515625, -1.9393310546875, -1.872406005859375, -1.80548095703125, -1.738555908203125, -1.671630859375, -1.604705810546875, -1.53778076171875, -1.470855712890625, -1.4039306640625, -1.337005615234375, -1.27008056640625, -1.203155517578125, -1.13623046875, -1.069305419921875, -1.00238037109375, -0.935455322265625, -0.8685302734375, -0.801605224609375, -0.73468017578125, -0.667755126953125, -0.600830078125, -0.533905029296875, -0.46697998046875, -0.400054931640625, -0.3331298828125, -0.266204833984375, -0.19927978515625, -0.132354736328125, -0.0654296875, 0.001495361328125, 0.06842041015625, 0.135345458984375, 0.2022705078125, 0.269195556640625, 0.33612060546875, 0.403045654296875, 0.469970703125, 0.536895751953125, 0.60382080078125, 0.670745849609375, 0.7376708984375, 0.804595947265625, 0.87152099609375, 0.938446044921875, 1.00537109375, 1.072296142578125, 1.13922119140625, 1.206146240234375, 1.2730712890625, 1.339996337890625, 1.40692138671875, 1.473846435546875, 1.540771484375, 1.607696533203125, 1.67462158203125, 1.741546630859375, 1.8084716796875, 1.875396728515625, 1.94232177734375, 2.009246826171875, 2.076171875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 3.0, 8.0, 18.0, 27.0, 41.0, 50.0, 78.0, 119.0, 213.0, 288.0, 413.0, 648.0, 1062.0, 1498.0, 2333.0, 3835.0, 5726.0, 9337.0, 15379.0, 25339.0, 43637.0, 78669.0, 154344.0, 1351999.0, 186079.0, 91212.0, 50179.0, 28699.0, 17091.0, 10516.0, 6569.0, 4173.0, 2606.0, 1655.0, 1185.0, 667.0, 468.0, 312.0, 239.0, 131.0, 91.0, 61.0, 47.0, 22.0, 23.0, 13.0, 12.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.062042236328125, -0.060196876525878906, -0.05835151672363281, -0.05650615692138672, -0.054660797119140625, -0.05281543731689453, -0.05097007751464844, -0.049124717712402344, -0.04727935791015625, -0.045433998107910156, -0.04358863830566406, -0.04174327850341797, -0.039897918701171875, -0.03805255889892578, -0.03620719909667969, -0.034361839294433594, -0.0325164794921875, -0.030671119689941406, -0.028825759887695312, -0.02698040008544922, -0.025135040283203125, -0.02328968048095703, -0.021444320678710938, -0.019598960876464844, -0.01775360107421875, -0.015908241271972656, -0.014062881469726562, -0.012217521667480469, -0.010372161865234375, -0.008526802062988281, -0.0066814422607421875, -0.004836082458496094, -0.00299072265625, -0.0011453628540039062, 0.0006999969482421875, 0.0025453567504882812, 0.004390716552734375, 0.006236076354980469, 0.008081436157226562, 0.009926795959472656, 0.01177215576171875, 0.013617515563964844, 0.015462875366210938, 0.01730823516845703, 0.019153594970703125, 0.02099895477294922, 0.022844314575195312, 0.024689674377441406, 0.0265350341796875, 0.028380393981933594, 0.030225753784179688, 0.03207111358642578, 0.033916473388671875, 0.03576183319091797, 0.03760719299316406, 0.039452552795410156, 0.04129791259765625, 0.043143272399902344, 0.04498863220214844, 0.04683399200439453, 0.048679351806640625, 0.05052471160888672, 0.05237007141113281, 0.054215431213378906, 0.056060791015625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 9.0, 9.0, 11.0, 12.0, 16.0, 36.0, 30.0, 32.0, 41.0, 62.0, 98.0, 152.0, 136.0, 97.0, 65.0, 48.0, 41.0, 28.0, 14.0, 14.0, 13.0, 6.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0100345611572266e-05, -2.9058195650577545e-05, -2.8016045689582825e-05, -2.6973895728588104e-05, -2.5931745767593384e-05, -2.4889595806598663e-05, -2.3847445845603943e-05, -2.2805295884609222e-05, -2.1763145923614502e-05, -2.072099596261978e-05, -1.967884600162506e-05, -1.863669604063034e-05, -1.759454607963562e-05, -1.65523961186409e-05, -1.551024615764618e-05, -1.4468096196651459e-05, -1.3425946235656738e-05, -1.2383796274662018e-05, -1.1341646313667297e-05, -1.0299496352672577e-05, -9.257346391677856e-06, -8.215196430683136e-06, -7.1730464696884155e-06, -6.130896508693695e-06, -5.088746547698975e-06, -4.046596586704254e-06, -3.0044466257095337e-06, -1.9622966647148132e-06, -9.201467037200928e-07, 1.2200325727462769e-07, 1.1641532182693481e-06, 2.2063031792640686e-06, 3.248453140258789e-06, 4.2906031012535095e-06, 5.33275306224823e-06, 6.3749030232429504e-06, 7.417052984237671e-06, 8.459202945232391e-06, 9.501352906227112e-06, 1.0543502867221832e-05, 1.1585652828216553e-05, 1.2627802789211273e-05, 1.3669952750205994e-05, 1.4712102711200714e-05, 1.5754252672195435e-05, 1.6796402633190155e-05, 1.7838552594184875e-05, 1.8880702555179596e-05, 1.9922852516174316e-05, 2.0965002477169037e-05, 2.2007152438163757e-05, 2.3049302399158478e-05, 2.4091452360153198e-05, 2.513360232114792e-05, 2.617575228214264e-05, 2.721790224313736e-05, 2.826005220413208e-05, 2.93022021651268e-05, 3.034435212612152e-05, 3.138650208711624e-05, 3.242865204811096e-05, 3.347080200910568e-05, 3.45129519701004e-05, 3.555510193109512e-05, 3.6597251892089844e-05]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 4.0, 5.0, 13.0, 14.0, 21.0, 46.0, 78.0, 160.0, 329.0, 1318.0, 55163.0, 981307.0, 8860.0, 682.0, 236.0, 107.0, 67.0, 45.0, 26.0, 14.0, 10.0, 9.0, 8.0, 10.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000644683837890625, -0.0006258934736251831, -0.0006071031093597412, -0.0005883127450942993, -0.0005695223808288574, -0.0005507320165634155, -0.0005319416522979736, -0.0005131512880325317, -0.0004943609237670898, -0.00047557055950164795, -0.00045678019523620605, -0.00043798983097076416, -0.00041919946670532227, -0.00040040910243988037, -0.0003816187381744385, -0.0003628283739089966, -0.0003440380096435547, -0.0003252476453781128, -0.0003064572811126709, -0.000287666916847229, -0.0002688765525817871, -0.0002500861883163452, -0.00023129582405090332, -0.00021250545978546143, -0.00019371509552001953, -0.00017492473125457764, -0.00015613436698913574, -0.00013734400272369385, -0.00011855363845825195, -9.976327419281006e-05, -8.097290992736816e-05, -6.218254566192627e-05, -4.3392181396484375e-05, -2.460181713104248e-05, -5.811452865600586e-06, 1.2978911399841309e-05, 3.17692756652832e-05, 5.05596399307251e-05, 6.935000419616699e-05, 8.814036846160889e-05, 0.00010693073272705078, 0.00012572109699249268, 0.00014451146125793457, 0.00016330182552337646, 0.00018209218978881836, 0.00020088255405426025, 0.00021967291831970215, 0.00023846328258514404, 0.00025725364685058594, 0.00027604401111602783, 0.0002948343753814697, 0.0003136247396469116, 0.0003324151039123535, 0.0003512054681777954, 0.0003699958324432373, 0.0003887861967086792, 0.0004075765609741211, 0.000426366925239563, 0.0004451572895050049, 0.0004639476537704468, 0.00048273801803588867, 0.0005015283823013306, 0.0005203187465667725, 0.0005391091108322144, 0.0005578994750976562]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 13.0, 643.0, 356.0, 3.0, 1.0], "bins": [-0.0005762206856161356, -0.0005667611258104444, -0.0005573015660047531, -0.0005478420061990619, -0.0005383824463933706, -0.0005289228865876794, -0.0005194633267819881, -0.0005100037669762969, -0.0005005442071706057, -0.0004910846473649144, -0.0004816250875592232, -0.00047216552775353193, -0.0004627059679478407, -0.0004532464372459799, -0.00044378687744028866, -0.0004343273176345974, -0.00042486778693273664, -0.0004154082271270454, -0.00040594866732135415, -0.0003964891075156629, -0.00038702954770997167, -0.0003775700170081109, -0.00036811045720241964, -0.0003586508973967284, -0.00034919133759103715, -0.0003397317777853459, -0.00033027221797965467, -0.00032081265817396343, -0.00031135312747210264, -0.0003018935676664114, -0.00029243400786072016, -0.0002829744480550289, -0.00027351491735316813, -0.0002640553575474769, -0.00025459579774178565, -0.0002451362379360944, -0.0002356766926823184, -0.00022621713287662715, -0.00021675758762285113, -0.0002072980278171599, -0.00019783845345955342, -0.00018837889365386218, -0.00017891934840008616, -0.00016945978859439492, -0.00016000022878870368, -0.00015054066898301244, -0.0001410811091773212, -0.00013162156392354518, -0.00012216200411785394, -0.0001127024443121627, -0.00010324289178242907, -9.378333925269544e-05, -8.43237794470042e-05, -7.486421964131296e-05, -6.540466711157933e-05, -5.59451145818457e-05, -4.648555477615446e-05, -3.7025998608442023e-05, -2.7566442440729588e-05, -1.8106886273017153e-05, -8.647330105304718e-06, 8.122260624077171e-07, 1.0271782230120152e-05, 1.973133475985378e-05, 2.919089274655562e-05]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 8.0, 20.0, 26.0, 23.0, 30.0, 54.0, 52.0, 51.0, 64.0, 67.0, 88.0, 87.0, 60.0, 69.0, 60.0, 56.0, 48.0, 32.0, 28.0, 22.0, 19.0, 14.0, 11.0, 11.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4781951904296875e-05, -1.3964250683784485e-05, -1.3146549463272095e-05, -1.2328848242759705e-05, -1.1511147022247314e-05, -1.0693445801734924e-05, -9.875744581222534e-06, -9.058043360710144e-06, -8.240342140197754e-06, -7.422640919685364e-06, -6.604939699172974e-06, -5.7872384786605835e-06, -4.969537258148193e-06, -4.151836037635803e-06, -3.334134817123413e-06, -2.516433596611023e-06, -1.6987323760986328e-06, -8.810311555862427e-07, -6.332993507385254e-08, 7.543712854385376e-07, 1.5720725059509277e-06, 2.389773726463318e-06, 3.207474946975708e-06, 4.025176167488098e-06, 4.842877388000488e-06, 5.660578608512878e-06, 6.4782798290252686e-06, 7.295981049537659e-06, 8.113682270050049e-06, 8.931383490562439e-06, 9.749084711074829e-06, 1.056678593158722e-05, 1.138448715209961e-05, 1.2202188372612e-05, 1.301988959312439e-05, 1.383759081363678e-05, 1.465529203414917e-05, 1.547299325466156e-05, 1.629069447517395e-05, 1.710839569568634e-05, 1.792609691619873e-05, 1.874379813671112e-05, 1.956149935722351e-05, 2.03792005777359e-05, 2.119690179824829e-05, 2.201460301876068e-05, 2.283230423927307e-05, 2.365000545978546e-05, 2.446770668029785e-05, 2.5285407900810242e-05, 2.6103109121322632e-05, 2.6920810341835022e-05, 2.7738511562347412e-05, 2.8556212782859802e-05, 2.9373914003372192e-05, 3.0191615223884583e-05, 3.100931644439697e-05, 3.182701766490936e-05, 3.264471888542175e-05, 3.346242010593414e-05, 3.428012132644653e-05, 3.509782254695892e-05, 3.5915523767471313e-05, 3.6733224987983704e-05, 3.7550926208496094e-05]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 7.0, 11.0, 6.0, 12.0, 11.0, 10.0, 14.0, 20.0, 22.0, 20.0, 20.0, 29.0, 33.0, 37.0, 43.0, 41.0, 41.0, 34.0, 40.0, 41.0, 46.0, 45.0, 37.0, 39.0, 47.0, 31.0, 29.0, 26.0, 31.0, 17.0, 27.0, 29.0, 16.0, 15.0, 12.0, 14.0, 15.0, 5.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.177734375, -3.08203125, -2.986328125, -2.890625, -2.794921875, -2.69921875, -2.603515625, -2.5078125, -2.412109375, -2.31640625, -2.220703125, -2.125, -2.029296875, -1.93359375, -1.837890625, -1.7421875, -1.646484375, -1.55078125, -1.455078125, -1.359375, -1.263671875, -1.16796875, -1.072265625, -0.9765625, -0.880859375, -0.78515625, -0.689453125, -0.59375, -0.498046875, -0.40234375, -0.306640625, -0.2109375, -0.115234375, -0.01953125, 0.076171875, 0.171875, 0.267578125, 0.36328125, 0.458984375, 0.5546875, 0.650390625, 0.74609375, 0.841796875, 0.9375, 1.033203125, 1.12890625, 1.224609375, 1.3203125, 1.416015625, 1.51171875, 1.607421875, 1.703125, 1.798828125, 1.89453125, 1.990234375, 2.0859375, 2.181640625, 2.27734375, 2.373046875, 2.46875, 2.564453125, 2.66015625, 2.755859375, 2.8515625, 2.947265625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 5.0, 12.0, 12.0, 16.0, 16.0, 37.0, 43.0, 63.0, 104.0, 167.0, 225.0, 292.0, 478.0, 738.0, 1098.0, 1557.0, 2452.0, 3859.0, 6151.0, 10299.0, 18819.0, 37442.0, 84080.0, 211531.0, 371850.0, 161840.0, 65200.0, 30453.0, 15708.0, 8883.0, 5356.0, 3292.0, 2104.0, 1435.0, 918.0, 632.0, 472.0, 269.0, 213.0, 133.0, 107.0, 57.0, 44.0, 26.0, 20.0, 14.0, 20.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.12890625, -3.0404052734375, -2.951904296875, -2.8634033203125, -2.77490234375, -2.6864013671875, -2.597900390625, -2.5093994140625, -2.4208984375, -2.3323974609375, -2.243896484375, -2.1553955078125, -2.06689453125, -1.9783935546875, -1.889892578125, -1.8013916015625, -1.712890625, -1.6243896484375, -1.535888671875, -1.4473876953125, -1.35888671875, -1.2703857421875, -1.181884765625, -1.0933837890625, -1.0048828125, -0.9163818359375, -0.827880859375, -0.7393798828125, -0.65087890625, -0.5623779296875, -0.473876953125, -0.3853759765625, -0.296875, -0.2083740234375, -0.119873046875, -0.0313720703125, 0.05712890625, 0.1456298828125, 0.234130859375, 0.3226318359375, 0.4111328125, 0.4996337890625, 0.588134765625, 0.6766357421875, 0.76513671875, 0.8536376953125, 0.942138671875, 1.0306396484375, 1.119140625, 1.2076416015625, 1.296142578125, 1.3846435546875, 1.47314453125, 1.5616455078125, 1.650146484375, 1.7386474609375, 1.8271484375, 1.9156494140625, 2.004150390625, 2.0926513671875, 2.18115234375, 2.2696533203125, 2.358154296875, 2.4466552734375, 2.53515625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 7.0, 6.0, 10.0, 9.0, 8.0, 16.0, 21.0, 30.0, 26.0, 35.0, 30.0, 27.0, 41.0, 39.0, 36.0, 73.0, 92.0, 152.0, 1490.0, 326.0, 137.0, 55.0, 47.0, 35.0, 41.0, 26.0, 24.0, 21.0, 29.0, 30.0, 27.0, 22.0, 8.0, 12.0, 15.0, 6.0, 8.0, 6.0, 5.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-10.9296875, -10.6158447265625, -10.302001953125, -9.9881591796875, -9.67431640625, -9.3604736328125, -9.046630859375, -8.7327880859375, -8.4189453125, -8.1051025390625, -7.791259765625, -7.4774169921875, -7.16357421875, -6.8497314453125, -6.535888671875, -6.2220458984375, -5.908203125, -5.5943603515625, -5.280517578125, -4.9666748046875, -4.65283203125, -4.3389892578125, -4.025146484375, -3.7113037109375, -3.3974609375, -3.0836181640625, -2.769775390625, -2.4559326171875, -2.14208984375, -1.8282470703125, -1.514404296875, -1.2005615234375, -0.88671875, -0.5728759765625, -0.259033203125, 0.0548095703125, 0.36865234375, 0.6824951171875, 0.996337890625, 1.3101806640625, 1.6240234375, 1.9378662109375, 2.251708984375, 2.5655517578125, 2.87939453125, 3.1932373046875, 3.507080078125, 3.8209228515625, 4.134765625, 4.4486083984375, 4.762451171875, 5.0762939453125, 5.39013671875, 5.7039794921875, 6.017822265625, 6.3316650390625, 6.6455078125, 6.9593505859375, 7.273193359375, 7.5870361328125, 7.90087890625, 8.2147216796875, 8.528564453125, 8.8424072265625, 9.15625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 7.0, 2.0, 1.0, 7.0, 4.0, 7.0, 9.0, 12.0, 15.0, 12.0, 25.0, 30.0, 46.0, 54.0, 59.0, 60.0, 108.0, 131.0, 195.0, 314.0, 697.0, 2942.0, 26522.0, 2598568.0, 500987.0, 11717.0, 1680.0, 514.0, 262.0, 202.0, 122.0, 85.0, 70.0, 60.0, 35.0, 34.0, 24.0, 25.0, 17.0, 9.0, 10.0, 5.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6953125, -15.1314697265625, -14.567626953125, -14.0037841796875, -13.43994140625, -12.8760986328125, -12.312255859375, -11.7484130859375, -11.1845703125, -10.6207275390625, -10.056884765625, -9.4930419921875, -8.92919921875, -8.3653564453125, -7.801513671875, -7.2376708984375, -6.673828125, -6.1099853515625, -5.546142578125, -4.9822998046875, -4.41845703125, -3.8546142578125, -3.290771484375, -2.7269287109375, -2.1630859375, -1.5992431640625, -1.035400390625, -0.4715576171875, 0.09228515625, 0.6561279296875, 1.219970703125, 1.7838134765625, 2.34765625, 2.9114990234375, 3.475341796875, 4.0391845703125, 4.60302734375, 5.1668701171875, 5.730712890625, 6.2945556640625, 6.8583984375, 7.4222412109375, 7.986083984375, 8.5499267578125, 9.11376953125, 9.6776123046875, 10.241455078125, 10.8052978515625, 11.369140625, 11.9329833984375, 12.496826171875, 13.0606689453125, 13.62451171875, 14.1883544921875, 14.752197265625, 15.3160400390625, 15.8798828125, 16.4437255859375, 17.007568359375, 17.5714111328125, 18.13525390625, 18.6990966796875, 19.262939453125, 19.8267822265625, 20.390625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 78.0, 502.0, 374.0, 57.0, 4.0, 0.0, 2.0], "bins": [-159.2655792236328, -156.56248474121094, -153.859375, -151.15628051757812, -148.45318603515625, -145.7500762939453, -143.04698181152344, -140.34388732910156, -137.64077758789062, -134.93768310546875, -132.2345733642578, -129.53147888183594, -126.82837677001953, -124.12527465820312, -121.42218017578125, -118.71907806396484, -116.01598358154297, -113.31288146972656, -110.60978698730469, -107.90668487548828, -105.20358276367188, -102.50048828125, -99.7973861694336, -97.09428405761719, -94.39118957519531, -91.6880874633789, -88.98499298095703, -86.28189086914062, -83.57878875732422, -80.87568664550781, -78.17259216308594, -75.46949005126953, -72.76639556884766, -70.06329345703125, -67.36019897460938, -64.65709686279297, -61.95399475097656, -59.25089645385742, -56.54779815673828, -53.844696044921875, -51.14159393310547, -48.43849563598633, -45.73539352416992, -43.03229522705078, -40.329193115234375, -37.626094818115234, -34.922996520996094, -32.21989440917969, -29.51679801940918, -26.813697814941406, -24.110599517822266, -21.407499313354492, -18.70439910888672, -16.001298904418945, -13.298200607299805, -10.595100402832031, -7.892000198364258, -5.188900470733643, -2.4858007431030273, 0.2172985076904297, 2.920398712158203, 5.623498916625977, 8.326597213745117, 11.02969741821289, 13.732797622680664]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 9.0, 9.0, 13.0, 15.0, 11.0, 12.0, 18.0, 22.0, 29.0, 23.0, 22.0, 26.0, 30.0, 33.0, 35.0, 40.0, 33.0, 42.0, 34.0, 42.0, 39.0, 31.0, 41.0, 40.0, 41.0, 40.0, 35.0, 41.0, 37.0, 25.0, 20.0, 13.0, 16.0, 20.0, 13.0, 10.0, 6.0, 12.0, 3.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-25.493305206298828, -24.70520782470703, -23.917110443115234, -23.12901496887207, -22.340917587280273, -21.552820205688477, -20.76472282409668, -19.976627349853516, -19.18852996826172, -18.400432586669922, -17.612335205078125, -16.82423973083496, -16.036142349243164, -15.248044967651367, -14.45994758605957, -13.67185115814209, -12.883753776550293, -12.095656394958496, -11.307559967041016, -10.519462585449219, -9.731366157531738, -8.943268775939941, -8.155172348022461, -7.367074966430664, -6.578978061676025, -5.790881156921387, -5.002784252166748, -4.214687347412109, -3.4265902042388916, -2.638493299484253, -1.8503961563110352, -1.0622992515563965, -0.2742023468017578, 0.5138946175575256, 1.301991581916809, 2.0900886058807373, 2.878185510635376, 3.6662824153900146, 4.454379558563232, 5.242476463317871, 6.03057336807251, 6.818670272827148, 7.606767177581787, 8.394864082336426, 9.182961463928223, 9.971057891845703, 10.7591552734375, 11.547252655029297, 12.335349082946777, 13.123446464538574, 13.911542892456055, 14.699640274047852, 15.487736701965332, 16.275833129882812, 17.06393051147461, 17.852027893066406, 18.640125274658203, 19.42822265625, 20.216320037841797, 21.00441551208496, 21.792512893676758, 22.580610275268555, 23.36870765686035, 24.156803131103516, 24.944900512695312]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 7.0, 10.0, 14.0, 21.0, 9.0, 22.0, 16.0, 28.0, 29.0, 27.0, 37.0, 37.0, 41.0, 28.0, 33.0, 41.0, 51.0, 47.0, 41.0, 38.0, 42.0, 42.0, 45.0, 33.0, 35.0, 31.0, 23.0, 15.0, 30.0, 16.0, 18.0, 16.0, 14.0, 13.0, 10.0, 5.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.345703125, -3.243682861328125, -3.14166259765625, -3.039642333984375, -2.9376220703125, -2.835601806640625, -2.73358154296875, -2.631561279296875, -2.529541015625, -2.427520751953125, -2.32550048828125, -2.223480224609375, -2.1214599609375, -2.019439697265625, -1.91741943359375, -1.815399169921875, -1.71337890625, -1.611358642578125, -1.50933837890625, -1.407318115234375, -1.3052978515625, -1.203277587890625, -1.10125732421875, -0.999237060546875, -0.897216796875, -0.795196533203125, -0.69317626953125, -0.591156005859375, -0.4891357421875, -0.387115478515625, -0.28509521484375, -0.183074951171875, -0.0810546875, 0.020965576171875, 0.12298583984375, 0.225006103515625, 0.3270263671875, 0.429046630859375, 0.53106689453125, 0.633087158203125, 0.735107421875, 0.837127685546875, 0.93914794921875, 1.041168212890625, 1.1431884765625, 1.245208740234375, 1.34722900390625, 1.449249267578125, 1.55126953125, 1.653289794921875, 1.75531005859375, 1.857330322265625, 1.9593505859375, 2.061370849609375, 2.16339111328125, 2.265411376953125, 2.367431640625, 2.469451904296875, 2.57147216796875, 2.673492431640625, 2.7755126953125, 2.877532958984375, 2.97955322265625, 3.081573486328125, 3.18359375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 6.0, 4.0, 5.0, 7.0, 13.0, 18.0, 28.0, 41.0, 31.0, 53.0, 77.0, 119.0, 202.0, 349.0, 611.0, 1321.0, 2809.0, 6381.0, 16218.0, 45982.0, 150698.0, 582464.0, 1714523.0, 1214342.0, 319651.0, 88998.0, 29535.0, 10906.0, 4480.0, 2034.0, 1006.0, 515.0, 294.0, 153.0, 117.0, 86.0, 46.0, 32.0, 35.0, 21.0, 11.0, 18.0, 6.0, 8.0, 8.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-5.53125, -5.362548828125, -5.19384765625, -5.025146484375, -4.8564453125, -4.687744140625, -4.51904296875, -4.350341796875, -4.181640625, -4.012939453125, -3.84423828125, -3.675537109375, -3.5068359375, -3.338134765625, -3.16943359375, -3.000732421875, -2.83203125, -2.663330078125, -2.49462890625, -2.325927734375, -2.1572265625, -1.988525390625, -1.81982421875, -1.651123046875, -1.482421875, -1.313720703125, -1.14501953125, -0.976318359375, -0.8076171875, -0.638916015625, -0.47021484375, -0.301513671875, -0.1328125, 0.035888671875, 0.20458984375, 0.373291015625, 0.5419921875, 0.710693359375, 0.87939453125, 1.048095703125, 1.216796875, 1.385498046875, 1.55419921875, 1.722900390625, 1.8916015625, 2.060302734375, 2.22900390625, 2.397705078125, 2.56640625, 2.735107421875, 2.90380859375, 3.072509765625, 3.2412109375, 3.409912109375, 3.57861328125, 3.747314453125, 3.916015625, 4.084716796875, 4.25341796875, 4.422119140625, 4.5908203125, 4.759521484375, 4.92822265625, 5.096923828125, 5.265625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 9.0, 3.0, 8.0, 6.0, 8.0, 5.0, 14.0, 16.0, 26.0, 37.0, 50.0, 63.0, 101.0, 134.0, 132.0, 188.0, 212.0, 296.0, 359.0, 378.0, 383.0, 348.0, 288.0, 248.0, 201.0, 145.0, 102.0, 76.0, 65.0, 42.0, 35.0, 27.0, 14.0, 20.0, 9.0, 7.0, 8.0, 4.0, 1.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-7.12890625, -6.9361572265625, -6.743408203125, -6.5506591796875, -6.35791015625, -6.1651611328125, -5.972412109375, -5.7796630859375, -5.5869140625, -5.3941650390625, -5.201416015625, -5.0086669921875, -4.81591796875, -4.6231689453125, -4.430419921875, -4.2376708984375, -4.044921875, -3.8521728515625, -3.659423828125, -3.4666748046875, -3.27392578125, -3.0811767578125, -2.888427734375, -2.6956787109375, -2.5029296875, -2.3101806640625, -2.117431640625, -1.9246826171875, -1.73193359375, -1.5391845703125, -1.346435546875, -1.1536865234375, -0.9609375, -0.7681884765625, -0.575439453125, -0.3826904296875, -0.18994140625, 0.0028076171875, 0.195556640625, 0.3883056640625, 0.5810546875, 0.7738037109375, 0.966552734375, 1.1593017578125, 1.35205078125, 1.5447998046875, 1.737548828125, 1.9302978515625, 2.123046875, 2.3157958984375, 2.508544921875, 2.7012939453125, 2.89404296875, 3.0867919921875, 3.279541015625, 3.4722900390625, 3.6650390625, 3.8577880859375, 4.050537109375, 4.2432861328125, 4.43603515625, 4.6287841796875, 4.821533203125, 5.0142822265625, 5.20703125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 9.0, 9.0, 16.0, 19.0, 31.0, 36.0, 53.0, 72.0, 113.0, 154.0, 255.0, 462.0, 1270.0, 13989.0, 1627481.0, 2527289.0, 20186.0, 1442.0, 511.0, 285.0, 190.0, 133.0, 84.0, 49.0, 48.0, 30.0, 12.0, 8.0, 8.0, 10.0, 6.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.15625, -23.19189453125, -22.2275390625, -21.26318359375, -20.298828125, -19.33447265625, -18.3701171875, -17.40576171875, -16.44140625, -15.47705078125, -14.5126953125, -13.54833984375, -12.583984375, -11.61962890625, -10.6552734375, -9.69091796875, -8.7265625, -7.76220703125, -6.7978515625, -5.83349609375, -4.869140625, -3.90478515625, -2.9404296875, -1.97607421875, -1.01171875, -0.04736328125, 0.9169921875, 1.88134765625, 2.845703125, 3.81005859375, 4.7744140625, 5.73876953125, 6.703125, 7.66748046875, 8.6318359375, 9.59619140625, 10.560546875, 11.52490234375, 12.4892578125, 13.45361328125, 14.41796875, 15.38232421875, 16.3466796875, 17.31103515625, 18.275390625, 19.23974609375, 20.2041015625, 21.16845703125, 22.1328125, 23.09716796875, 24.0615234375, 25.02587890625, 25.990234375, 26.95458984375, 27.9189453125, 28.88330078125, 29.84765625, 30.81201171875, 31.7763671875, 32.74072265625, 33.705078125, 34.66943359375, 35.6337890625, 36.59814453125, 37.5625]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 20.0, 49.0, 74.0, 111.0, 177.0, 146.0, 154.0, 107.0, 81.0, 43.0, 20.0, 16.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.49700927734375, -76.73894500732422, -74.98087310791016, -73.22280883789062, -71.46473693847656, -69.70667266845703, -67.94860076904297, -66.19053649902344, -64.43246459960938, -62.67439651489258, -60.91632843017578, -59.158260345458984, -57.40019226074219, -55.642127990722656, -53.88405990600586, -52.12599182128906, -50.36792755126953, -48.609859466552734, -46.85179138183594, -45.09372329711914, -43.335655212402344, -41.57759094238281, -39.819522857666016, -38.06145477294922, -36.30338668823242, -34.545318603515625, -32.78725051879883, -31.029184341430664, -29.271116256713867, -27.51304817199707, -25.754981994628906, -23.99691390991211, -22.238849639892578, -20.48078155517578, -18.722713470458984, -16.96464729309082, -15.206579208374023, -13.448511123657227, -11.690443992614746, -9.932376861572266, -8.174308776855469, -6.41624116897583, -4.658173561096191, -2.9001059532165527, -1.142038345336914, 0.6160297393798828, 2.3740968704223633, 4.132164001464844, 5.890232086181641, 7.648299694061279, 9.406367301940918, 11.164434432983398, 12.922502517700195, 14.680570602416992, 16.438636779785156, 18.196704864501953, 19.95477294921875, 21.712841033935547, 23.470909118652344, 25.228975296020508, 26.987043380737305, 28.7451114654541, 30.503177642822266, 32.26124572753906, 34.01931381225586]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 3.0, 2.0, 9.0, 8.0, 3.0, 11.0, 11.0, 11.0, 18.0, 13.0, 18.0, 22.0, 24.0, 26.0, 25.0, 29.0, 33.0, 28.0, 35.0, 28.0, 38.0, 33.0, 37.0, 49.0, 46.0, 36.0, 33.0, 32.0, 39.0, 27.0, 32.0, 17.0, 28.0, 29.0, 24.0, 27.0, 22.0, 14.0, 13.0, 15.0, 8.0, 9.0, 9.0, 5.0, 7.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.873092651367188, -20.21981430053711, -19.56653594970703, -18.913259506225586, -18.259981155395508, -17.60670280456543, -16.953426361083984, -16.300148010253906, -15.646869659423828, -14.99359130859375, -14.340313911437988, -13.687036514282227, -13.033758163452148, -12.38047981262207, -11.727202415466309, -11.073925018310547, -10.420646667480469, -9.76736831665039, -9.114090919494629, -8.460813522338867, -7.807535171508789, -7.154257297515869, -6.500979423522949, -5.847701549530029, -5.194423675537109, -4.5411458015441895, -3.8878679275512695, -3.2345900535583496, -2.5813121795654297, -1.9280343055725098, -1.2747564315795898, -0.6214785575866699, 0.03179931640625, 0.6850771903991699, 1.3383550643920898, 1.9916329383850098, 2.6449108123779297, 3.2981886863708496, 3.9514665603637695, 4.6047444343566895, 5.258022308349609, 5.911300182342529, 6.564578056335449, 7.217855930328369, 7.871133804321289, 8.524412155151367, 9.177689552307129, 9.83096694946289, 10.484245300292969, 11.137523651123047, 11.790801048278809, 12.44407844543457, 13.097356796264648, 13.750635147094727, 14.403912544250488, 15.05718994140625, 15.710468292236328, 16.363746643066406, 17.017024993896484, 17.67030143737793, 18.323579788208008, 18.976858139038086, 19.63013458251953, 20.28341293334961, 20.936691284179688]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 2.0, 5.0, 11.0, 7.0, 5.0, 14.0, 19.0, 16.0, 17.0, 17.0, 35.0, 27.0, 49.0, 32.0, 42.0, 48.0, 47.0, 36.0, 27.0, 47.0, 43.0, 40.0, 40.0, 36.0, 49.0, 34.0, 28.0, 51.0, 31.0, 17.0, 16.0, 18.0, 18.0, 22.0, 15.0, 9.0, 7.0, 2.0, 2.0, 6.0, 5.0, 0.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.36328125, -3.257537841796875, -3.15179443359375, -3.046051025390625, -2.9403076171875, -2.834564208984375, -2.72882080078125, -2.623077392578125, -2.517333984375, -2.411590576171875, -2.30584716796875, -2.200103759765625, -2.0943603515625, -1.988616943359375, -1.88287353515625, -1.777130126953125, -1.67138671875, -1.565643310546875, -1.45989990234375, -1.354156494140625, -1.2484130859375, -1.142669677734375, -1.03692626953125, -0.931182861328125, -0.825439453125, -0.719696044921875, -0.61395263671875, -0.508209228515625, -0.4024658203125, -0.296722412109375, -0.19097900390625, -0.085235595703125, 0.0205078125, 0.126251220703125, 0.23199462890625, 0.337738037109375, 0.4434814453125, 0.549224853515625, 0.65496826171875, 0.760711669921875, 0.866455078125, 0.972198486328125, 1.07794189453125, 1.183685302734375, 1.2894287109375, 1.395172119140625, 1.50091552734375, 1.606658935546875, 1.71240234375, 1.818145751953125, 1.92388916015625, 2.029632568359375, 2.1353759765625, 2.241119384765625, 2.34686279296875, 2.452606201171875, 2.558349609375, 2.664093017578125, 2.76983642578125, 2.875579833984375, 2.9813232421875, 3.087066650390625, 3.19281005859375, 3.298553466796875, 3.404296875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 9.0, 9.0, 14.0, 13.0, 29.0, 25.0, 32.0, 59.0, 99.0, 115.0, 212.0, 276.0, 402.0, 679.0, 1006.0, 1646.0, 2406.0, 3858.0, 6179.0, 9537.0, 15778.0, 25725.0, 44568.0, 80681.0, 178488.0, 360774.0, 145231.0, 70225.0, 38958.0, 23074.0, 14049.0, 8831.0, 5492.0, 3544.0, 2275.0, 1478.0, 917.0, 648.0, 394.0, 298.0, 164.0, 119.0, 82.0, 41.0, 41.0, 25.0, 18.0, 6.0, 11.0, 12.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.16064453125, -0.15552711486816406, -0.15040969848632812, -0.1452922821044922, -0.14017486572265625, -0.1350574493408203, -0.12994003295898438, -0.12482261657714844, -0.1197052001953125, -0.11458778381347656, -0.10947036743164062, -0.10435295104980469, -0.09923553466796875, -0.09411811828613281, -0.08900070190429688, -0.08388328552246094, -0.078765869140625, -0.07364845275878906, -0.06853103637695312, -0.06341361999511719, -0.05829620361328125, -0.05317878723144531, -0.048061370849609375, -0.04294395446777344, -0.0378265380859375, -0.03270912170410156, -0.027591705322265625, -0.022474288940429688, -0.01735687255859375, -0.012239456176757812, -0.007122039794921875, -0.0020046234130859375, 0.00311279296875, 0.008230209350585938, 0.013347625732421875, 0.018465042114257812, 0.02358245849609375, 0.028699874877929688, 0.033817291259765625, 0.03893470764160156, 0.0440521240234375, 0.04916954040527344, 0.054286956787109375, 0.05940437316894531, 0.06452178955078125, 0.06963920593261719, 0.07475662231445312, 0.07987403869628906, 0.084991455078125, 0.09010887145996094, 0.09522628784179688, 0.10034370422363281, 0.10546112060546875, 0.11057853698730469, 0.11569595336914062, 0.12081336975097656, 0.1259307861328125, 0.13104820251464844, 0.13616561889648438, 0.1412830352783203, 0.14640045166015625, 0.1515178680419922, 0.15663528442382812, 0.16175270080566406, 0.1668701171875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 10.0, 6.0, 14.0, 13.0, 15.0, 20.0, 17.0, 14.0, 24.0, 25.0, 33.0, 30.0, 24.0, 40.0, 53.0, 43.0, 50.0, 46.0, 43.0, 1057.0, 49.0, 29.0, 26.0, 30.0, 35.0, 26.0, 26.0, 23.0, 22.0, 21.0, 30.0, 27.0, 11.0, 10.0, 13.0, 9.0, 15.0, 6.0, 5.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.015625, -1.949462890625, -1.88330078125, -1.817138671875, -1.7509765625, -1.684814453125, -1.61865234375, -1.552490234375, -1.486328125, -1.420166015625, -1.35400390625, -1.287841796875, -1.2216796875, -1.155517578125, -1.08935546875, -1.023193359375, -0.95703125, -0.890869140625, -0.82470703125, -0.758544921875, -0.6923828125, -0.626220703125, -0.56005859375, -0.493896484375, -0.427734375, -0.361572265625, -0.29541015625, -0.229248046875, -0.1630859375, -0.096923828125, -0.03076171875, 0.035400390625, 0.1015625, 0.167724609375, 0.23388671875, 0.300048828125, 0.3662109375, 0.432373046875, 0.49853515625, 0.564697265625, 0.630859375, 0.697021484375, 0.76318359375, 0.829345703125, 0.8955078125, 0.961669921875, 1.02783203125, 1.093994140625, 1.16015625, 1.226318359375, 1.29248046875, 1.358642578125, 1.4248046875, 1.490966796875, 1.55712890625, 1.623291015625, 1.689453125, 1.755615234375, 1.82177734375, 1.887939453125, 1.9541015625, 2.020263671875, 2.08642578125, 2.152587890625, 2.21875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 9.0, 5.0, 16.0, 28.0, 39.0, 72.0, 103.0, 146.0, 224.0, 398.0, 640.0, 958.0, 1667.0, 2706.0, 4371.0, 7229.0, 12624.0, 21922.0, 39683.0, 75590.0, 160932.0, 1375956.0, 196142.0, 89100.0, 45860.0, 25186.0, 14513.0, 8371.0, 4890.0, 2947.0, 1783.0, 1162.0, 677.0, 435.0, 251.0, 183.0, 106.0, 70.0, 41.0, 26.0, 30.0, 13.0, 10.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063720703125, -0.0615692138671875, -0.059417724609375, -0.0572662353515625, -0.05511474609375, -0.0529632568359375, -0.050811767578125, -0.0486602783203125, -0.0465087890625, -0.0443572998046875, -0.042205810546875, -0.0400543212890625, -0.03790283203125, -0.0357513427734375, -0.033599853515625, -0.0314483642578125, -0.029296875, -0.0271453857421875, -0.024993896484375, -0.0228424072265625, -0.02069091796875, -0.0185394287109375, -0.016387939453125, -0.0142364501953125, -0.0120849609375, -0.0099334716796875, -0.007781982421875, -0.0056304931640625, -0.00347900390625, -0.0013275146484375, 0.000823974609375, 0.0029754638671875, 0.005126953125, 0.0072784423828125, 0.009429931640625, 0.0115814208984375, 0.01373291015625, 0.0158843994140625, 0.018035888671875, 0.0201873779296875, 0.0223388671875, 0.0244903564453125, 0.026641845703125, 0.0287933349609375, 0.03094482421875, 0.0330963134765625, 0.035247802734375, 0.0373992919921875, 0.03955078125, 0.0417022705078125, 0.043853759765625, 0.0460052490234375, 0.04815673828125, 0.0503082275390625, 0.052459716796875, 0.0546112060546875, 0.0567626953125, 0.0589141845703125, 0.061065673828125, 0.0632171630859375, 0.06536865234375, 0.0675201416015625, 0.069671630859375, 0.0718231201171875, 0.073974609375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 7.0, 10.0, 10.0, 3.0, 13.0, 13.0, 14.0, 19.0, 24.0, 43.0, 28.0, 38.0, 45.0, 45.0, 55.0, 65.0, 58.0, 70.0, 64.0, 55.0, 44.0, 38.0, 32.0, 44.0, 27.0, 29.0, 19.0, 13.0, 19.0, 9.0, 11.0, 5.0, 6.0, 7.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.7835369110107422e-05, -2.6827678084373474e-05, -2.5819987058639526e-05, -2.481229603290558e-05, -2.380460500717163e-05, -2.2796913981437683e-05, -2.1789222955703735e-05, -2.0781531929969788e-05, -1.977384090423584e-05, -1.8766149878501892e-05, -1.7758458852767944e-05, -1.6750767827033997e-05, -1.574307680130005e-05, -1.4735385775566101e-05, -1.3727694749832153e-05, -1.2720003724098206e-05, -1.1712312698364258e-05, -1.070462167263031e-05, -9.696930646896362e-06, -8.689239621162415e-06, -7.681548595428467e-06, -6.673857569694519e-06, -5.666166543960571e-06, -4.6584755182266235e-06, -3.6507844924926758e-06, -2.643093466758728e-06, -1.6354024410247803e-06, -6.277114152908325e-07, 3.7997961044311523e-07, 1.387670636177063e-06, 2.3953616619110107e-06, 3.4030526876449585e-06, 4.410743713378906e-06, 5.418434739112854e-06, 6.426125764846802e-06, 7.4338167905807495e-06, 8.441507816314697e-06, 9.449198842048645e-06, 1.0456889867782593e-05, 1.146458089351654e-05, 1.2472271919250488e-05, 1.3479962944984436e-05, 1.4487653970718384e-05, 1.549534499645233e-05, 1.650303602218628e-05, 1.7510727047920227e-05, 1.8518418073654175e-05, 1.9526109099388123e-05, 2.053380012512207e-05, 2.1541491150856018e-05, 2.2549182176589966e-05, 2.3556873202323914e-05, 2.456456422805786e-05, 2.557225525379181e-05, 2.6579946279525757e-05, 2.7587637305259705e-05, 2.8595328330993652e-05, 2.96030193567276e-05, 3.061071038246155e-05, 3.1618401408195496e-05, 3.262609243392944e-05, 3.363378345966339e-05, 3.464147448539734e-05, 3.564916551113129e-05, 3.6656856536865234e-05]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 8.0, 6.0, 11.0, 8.0, 17.0, 16.0, 22.0, 27.0, 45.0, 54.0, 79.0, 131.0, 177.0, 353.0, 1013.0, 11759.0, 980031.0, 52018.0, 1612.0, 492.0, 235.0, 132.0, 70.0, 63.0, 39.0, 25.0, 18.0, 20.0, 10.0, 9.0, 7.0, 10.0, 11.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0006995201110839844, -0.0006809458136558533, -0.0006623715162277222, -0.0006437972187995911, -0.00062522292137146, -0.0006066486239433289, -0.0005880743265151978, -0.0005695000290870667, -0.0005509257316589355, -0.0005323514342308044, -0.0005137771368026733, -0.0004952028393745422, -0.00047662854194641113, -0.00045805424451828003, -0.0004394799470901489, -0.0004209056496620178, -0.0004023313522338867, -0.0003837570548057556, -0.0003651827573776245, -0.0003466084599494934, -0.0003280341625213623, -0.0003094598650932312, -0.0002908855676651001, -0.000272311270236969, -0.0002537369728088379, -0.0002351626753807068, -0.00021658837795257568, -0.00019801408052444458, -0.00017943978309631348, -0.00016086548566818237, -0.00014229118824005127, -0.00012371689081192017, -0.00010514259338378906, -8.656829595565796e-05, -6.799399852752686e-05, -4.941970109939575e-05, -3.084540367126465e-05, -1.2271106243133545e-05, 6.303191184997559e-06, 2.4877488613128662e-05, 4.3451786041259766e-05, 6.202608346939087e-05, 8.060038089752197e-05, 9.917467832565308e-05, 0.00011774897575378418, 0.00013632327318191528, 0.0001548975706100464, 0.0001734718680381775, 0.0001920461654663086, 0.0002106204628944397, 0.0002291947603225708, 0.0002477690577507019, 0.000266343355178833, 0.0002849176526069641, 0.0003034919500350952, 0.0003220662474632263, 0.0003406405448913574, 0.0003592148423194885, 0.00037778913974761963, 0.00039636343717575073, 0.00041493773460388184, 0.00043351203203201294, 0.00045208632946014404, 0.00047066062688827515, 0.0004892349243164062]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 127.0, 882.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.0008219456649385393, -0.0008080642437562346, -0.0007941828807815909, -0.0007803014595992863, -0.0007664200384169817, -0.000752538675442338, -0.0007386572542600334, -0.0007247758330777287, -0.000710894470103085, -0.0006970130489207804, -0.0006831316859461367, -0.0006692502647638321, -0.0006553688435815275, -0.0006414874806068838, -0.0006276060594245791, -0.0006137246964499354, -0.0005998432752676308, -0.0005859618540853262, -0.0005720804911106825, -0.0005581990699283779, -0.0005443176487460732, -0.0005304362857714295, -0.0005165548645891249, -0.0005026734434068203, -0.0004887920804321766, -0.0004749106883537024, -0.0004610292671713978, -0.00044714787509292364, -0.0004332664830144495, -0.0004193850909359753, -0.0004055036697536707, -0.00039162227767519653, -0.00037774088559672236, -0.0003638594935182482, -0.0003499780723359436, -0.0003360966802574694, -0.00032221528817899525, -0.0003083338961005211, -0.00029445247491821647, -0.0002805710828397423, -0.00026668969076126814, -0.000252808298682794, -0.00023892689205240458, -0.0002250454854220152, -0.00021116409334354103, -0.00019728268671315163, -0.00018340128008276224, -0.00016951988800428808, -0.00015563846682198346, -0.00014175706019159406, -0.0001278756681131199, -0.00011399426148273051, -0.00010011286940425634, -8.623146277386695e-05, -7.235006341943517e-05, -5.8468664065003395e-05, -4.458727198652923e-05, -3.070587263209745e-05, -1.682447145867627e-05, -2.9430702852550894e-06, 1.0938329069176689e-05, 2.4819732061587274e-05, 3.870113141601905e-05, 5.258253077045083e-05, 6.646393012488261e-05]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 12.0, 9.0, 19.0, 27.0, 30.0, 43.0, 35.0, 53.0, 57.0, 67.0, 69.0, 79.0, 70.0, 73.0, 62.0, 57.0, 39.0, 41.0, 46.0, 26.0, 17.0, 20.0, 14.0, 9.0, 11.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4139881134033203e-05, -2.3050233721733093e-05, -2.1960586309432983e-05, -2.0870938897132874e-05, -1.9781291484832764e-05, -1.8691644072532654e-05, -1.7601996660232544e-05, -1.6512349247932434e-05, -1.5422701835632324e-05, -1.4333054423332214e-05, -1.3243407011032104e-05, -1.2153759598731995e-05, -1.1064112186431885e-05, -9.974464774131775e-06, -8.884817361831665e-06, -7.795169949531555e-06, -6.705522537231445e-06, -5.6158751249313354e-06, -4.526227712631226e-06, -3.4365803003311157e-06, -2.346932888031006e-06, -1.257285475730896e-06, -1.6763806343078613e-07, 9.220093488693237e-07, 2.0116567611694336e-06, 3.1013041734695435e-06, 4.190951585769653e-06, 5.280598998069763e-06, 6.370246410369873e-06, 7.459893822669983e-06, 8.549541234970093e-06, 9.639188647270203e-06, 1.0728836059570312e-05, 1.1818483471870422e-05, 1.2908130884170532e-05, 1.3997778296470642e-05, 1.5087425708770752e-05, 1.6177073121070862e-05, 1.726672053337097e-05, 1.835636794567108e-05, 1.944601535797119e-05, 2.05356627702713e-05, 2.162531018257141e-05, 2.271495759487152e-05, 2.380460500717163e-05, 2.489425241947174e-05, 2.598389983177185e-05, 2.707354724407196e-05, 2.816319465637207e-05, 2.925284206867218e-05, 3.034248948097229e-05, 3.14321368932724e-05, 3.252178430557251e-05, 3.361143171787262e-05, 3.470107913017273e-05, 3.579072654247284e-05, 3.688037395477295e-05, 3.797002136707306e-05, 3.905966877937317e-05, 4.014931619167328e-05, 4.123896360397339e-05, 4.23286110162735e-05, 4.341825842857361e-05, 4.450790584087372e-05, 4.559755325317383e-05]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 2.0, 5.0, 11.0, 7.0, 5.0, 14.0, 19.0, 16.0, 17.0, 17.0, 35.0, 27.0, 49.0, 32.0, 42.0, 48.0, 47.0, 36.0, 27.0, 47.0, 43.0, 40.0, 40.0, 36.0, 49.0, 34.0, 28.0, 51.0, 31.0, 17.0, 16.0, 18.0, 18.0, 22.0, 15.0, 9.0, 7.0, 2.0, 2.0, 6.0, 5.0, 0.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.36328125, -3.257537841796875, -3.15179443359375, -3.046051025390625, -2.9403076171875, -2.834564208984375, -2.72882080078125, -2.623077392578125, -2.517333984375, -2.411590576171875, -2.30584716796875, -2.200103759765625, -2.0943603515625, -1.988616943359375, -1.88287353515625, -1.777130126953125, -1.67138671875, -1.565643310546875, -1.45989990234375, -1.354156494140625, -1.2484130859375, -1.142669677734375, -1.03692626953125, -0.931182861328125, -0.825439453125, -0.719696044921875, -0.61395263671875, -0.508209228515625, -0.4024658203125, -0.296722412109375, -0.19097900390625, -0.085235595703125, 0.0205078125, 0.126251220703125, 0.23199462890625, 0.337738037109375, 0.4434814453125, 0.549224853515625, 0.65496826171875, 0.760711669921875, 0.866455078125, 0.972198486328125, 1.07794189453125, 1.183685302734375, 1.2894287109375, 1.395172119140625, 1.50091552734375, 1.606658935546875, 1.71240234375, 1.818145751953125, 1.92388916015625, 2.029632568359375, 2.1353759765625, 2.241119384765625, 2.34686279296875, 2.452606201171875, 2.558349609375, 2.664093017578125, 2.76983642578125, 2.875579833984375, 2.9813232421875, 3.087066650390625, 3.19281005859375, 3.298553466796875, 3.404296875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 8.0, 5.0, 15.0, 20.0, 38.0, 38.0, 74.0, 89.0, 135.0, 219.0, 383.0, 613.0, 1072.0, 1642.0, 2810.0, 4791.0, 8209.0, 14485.0, 25669.0, 50237.0, 119295.0, 376134.0, 261641.0, 89453.0, 40555.0, 21564.0, 12031.0, 7081.0, 4070.0, 2433.0, 1440.0, 843.0, 502.0, 318.0, 210.0, 143.0, 91.0, 52.0, 42.0, 34.0, 19.0, 11.0, 16.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 5.0], "bins": [-3.462890625, -3.363525390625, -3.26416015625, -3.164794921875, -3.0654296875, -2.966064453125, -2.86669921875, -2.767333984375, -2.66796875, -2.568603515625, -2.46923828125, -2.369873046875, -2.2705078125, -2.171142578125, -2.07177734375, -1.972412109375, -1.873046875, -1.773681640625, -1.67431640625, -1.574951171875, -1.4755859375, -1.376220703125, -1.27685546875, -1.177490234375, -1.078125, -0.978759765625, -0.87939453125, -0.780029296875, -0.6806640625, -0.581298828125, -0.48193359375, -0.382568359375, -0.283203125, -0.183837890625, -0.08447265625, 0.014892578125, 0.1142578125, 0.213623046875, 0.31298828125, 0.412353515625, 0.51171875, 0.611083984375, 0.71044921875, 0.809814453125, 0.9091796875, 1.008544921875, 1.10791015625, 1.207275390625, 1.306640625, 1.406005859375, 1.50537109375, 1.604736328125, 1.7041015625, 1.803466796875, 1.90283203125, 2.002197265625, 2.1015625, 2.200927734375, 2.30029296875, 2.399658203125, 2.4990234375, 2.598388671875, 2.69775390625, 2.797119140625, 2.896484375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 10.0, 8.0, 8.0, 6.0, 11.0, 11.0, 12.0, 16.0, 19.0, 21.0, 25.0, 28.0, 24.0, 25.0, 26.0, 37.0, 27.0, 34.0, 77.0, 107.0, 182.0, 1468.0, 279.0, 120.0, 61.0, 47.0, 38.0, 39.0, 26.0, 25.0, 39.0, 31.0, 26.0, 26.0, 14.0, 18.0, 9.0, 12.0, 5.0, 11.0, 4.0, 7.0, 9.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0], "bins": [-9.484375, -9.194091796875, -8.90380859375, -8.613525390625, -8.3232421875, -8.032958984375, -7.74267578125, -7.452392578125, -7.162109375, -6.871826171875, -6.58154296875, -6.291259765625, -6.0009765625, -5.710693359375, -5.42041015625, -5.130126953125, -4.83984375, -4.549560546875, -4.25927734375, -3.968994140625, -3.6787109375, -3.388427734375, -3.09814453125, -2.807861328125, -2.517578125, -2.227294921875, -1.93701171875, -1.646728515625, -1.3564453125, -1.066162109375, -0.77587890625, -0.485595703125, -0.1953125, 0.094970703125, 0.38525390625, 0.675537109375, 0.9658203125, 1.256103515625, 1.54638671875, 1.836669921875, 2.126953125, 2.417236328125, 2.70751953125, 2.997802734375, 3.2880859375, 3.578369140625, 3.86865234375, 4.158935546875, 4.44921875, 4.739501953125, 5.02978515625, 5.320068359375, 5.6103515625, 5.900634765625, 6.19091796875, 6.481201171875, 6.771484375, 7.061767578125, 7.35205078125, 7.642333984375, 7.9326171875, 8.222900390625, 8.51318359375, 8.803466796875, 9.09375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 10.0, 4.0, 11.0, 4.0, 6.0, 9.0, 13.0, 14.0, 16.0, 20.0, 34.0, 40.0, 59.0, 68.0, 60.0, 111.0, 129.0, 185.0, 273.0, 495.0, 2892.0, 79195.0, 2982953.0, 74912.0, 2637.0, 527.0, 244.0, 164.0, 141.0, 97.0, 69.0, 63.0, 52.0, 45.0, 29.0, 28.0, 16.0, 17.0, 16.0, 11.0, 3.0, 13.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-20.859375, -20.197021484375, -19.53466796875, -18.872314453125, -18.2099609375, -17.547607421875, -16.88525390625, -16.222900390625, -15.560546875, -14.898193359375, -14.23583984375, -13.573486328125, -12.9111328125, -12.248779296875, -11.58642578125, -10.924072265625, -10.26171875, -9.599365234375, -8.93701171875, -8.274658203125, -7.6123046875, -6.949951171875, -6.28759765625, -5.625244140625, -4.962890625, -4.300537109375, -3.63818359375, -2.975830078125, -2.3134765625, -1.651123046875, -0.98876953125, -0.326416015625, 0.3359375, 0.998291015625, 1.66064453125, 2.322998046875, 2.9853515625, 3.647705078125, 4.31005859375, 4.972412109375, 5.634765625, 6.297119140625, 6.95947265625, 7.621826171875, 8.2841796875, 8.946533203125, 9.60888671875, 10.271240234375, 10.93359375, 11.595947265625, 12.25830078125, 12.920654296875, 13.5830078125, 14.245361328125, 14.90771484375, 15.570068359375, 16.232421875, 16.894775390625, 17.55712890625, 18.219482421875, 18.8818359375, 19.544189453125, 20.20654296875, 20.868896484375, 21.53125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 14.0, 35.0, 84.0, 160.0, 198.0, 213.0, 147.0, 101.0, 38.0, 14.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.40932083129883, -40.51087951660156, -39.6124382019043, -38.71399688720703, -37.81555938720703, -36.917118072509766, -36.0186767578125, -35.120235443115234, -34.22179412841797, -33.3233528137207, -32.42491149902344, -31.526472091674805, -30.62803077697754, -29.729591369628906, -28.83115005493164, -27.932708740234375, -27.03426742553711, -26.135826110839844, -25.23738670349121, -24.338945388793945, -23.44050407409668, -22.542064666748047, -21.64362335205078, -20.745182037353516, -19.846742630004883, -18.948301315307617, -18.049861907958984, -17.15142059326172, -16.252979278564453, -15.354538917541504, -14.456098556518555, -13.557657241821289, -12.659215927124023, -11.760775566101074, -10.862334251403809, -9.96389389038086, -9.065452575683594, -8.167012214660645, -7.268571376800537, -6.37013053894043, -5.471689701080322, -4.573248863220215, -3.6748080253601074, -2.776367425918579, -1.8779265880584717, -0.9794859886169434, -0.08104515075683594, 0.8173956871032715, 1.715836524963379, 2.6142773628234863, 3.5127182006835938, 4.411158561706543, 5.309599876403809, 6.208040237426758, 7.106481075286865, 8.004921913146973, 8.903362274169922, 9.801802635192871, 10.700243949890137, 11.598684310913086, 12.497125625610352, 13.3955659866333, 14.29400634765625, 15.192447662353516, 16.09088897705078]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 0.0, 3.0, 4.0, 8.0, 8.0, 16.0, 18.0, 14.0, 9.0, 24.0, 19.0, 24.0, 31.0, 22.0, 38.0, 26.0, 36.0, 35.0, 39.0, 40.0, 46.0, 46.0, 44.0, 38.0, 47.0, 40.0, 28.0, 41.0, 29.0, 31.0, 26.0, 30.0, 19.0, 20.0, 25.0, 14.0, 11.0, 10.0, 13.0, 6.0, 4.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.766494750976562, -24.909870147705078, -24.053247451782227, -23.196622848510742, -22.34000015258789, -21.483375549316406, -20.626750946044922, -19.77012825012207, -18.913503646850586, -18.0568790435791, -17.20025634765625, -16.343631744384766, -15.487008094787598, -14.63038444519043, -13.773760795593262, -12.917137145996094, -12.060513496398926, -11.203889846801758, -10.34726619720459, -9.490642547607422, -8.634017944335938, -7.7773942947387695, -6.920770645141602, -6.064146518707275, -5.207522869110107, -4.3508992195129395, -3.4942750930786133, -2.6376514434814453, -1.7810275554656982, -0.9244036674499512, -0.0677800178527832, 0.788844108581543, 1.645467758178711, 2.502091646194458, 3.358715534210205, 4.215339183807373, 5.071963310241699, 5.928586959838867, 6.785210609436035, 7.641834735870361, 8.498458862304688, 9.355082511901855, 10.211706161499023, 11.068330764770508, 11.924954414367676, 12.781578063964844, 13.638201713562012, 14.49482536315918, 15.351449012756348, 16.208072662353516, 17.064697265625, 17.92131996154785, 18.777944564819336, 19.634567260742188, 20.491191864013672, 21.347816467285156, 22.204439163208008, 23.061063766479492, 23.917686462402344, 24.774311065673828, 25.63093376159668, 26.487558364868164, 27.344181060791016, 28.2008056640625, 29.057430267333984]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 3.0, 6.0, 6.0, 7.0, 8.0, 10.0, 13.0, 10.0, 21.0, 18.0, 25.0, 29.0, 38.0, 47.0, 36.0, 48.0, 30.0, 44.0, 47.0, 37.0, 36.0, 43.0, 50.0, 37.0, 43.0, 37.0, 32.0, 34.0, 24.0, 31.0, 33.0, 23.0, 19.0, 17.0, 16.0, 17.0, 6.0, 3.0, 4.0, 5.0, 1.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.466796875, -3.35321044921875, -3.2396240234375, -3.12603759765625, -3.012451171875, -2.89886474609375, -2.7852783203125, -2.67169189453125, -2.55810546875, -2.44451904296875, -2.3309326171875, -2.21734619140625, -2.103759765625, -1.99017333984375, -1.8765869140625, -1.76300048828125, -1.6494140625, -1.53582763671875, -1.4222412109375, -1.30865478515625, -1.195068359375, -1.08148193359375, -0.9678955078125, -0.85430908203125, -0.74072265625, -0.62713623046875, -0.5135498046875, -0.39996337890625, -0.286376953125, -0.17279052734375, -0.0592041015625, 0.05438232421875, 0.16796875, 0.28155517578125, 0.3951416015625, 0.50872802734375, 0.622314453125, 0.73590087890625, 0.8494873046875, 0.96307373046875, 1.07666015625, 1.19024658203125, 1.3038330078125, 1.41741943359375, 1.531005859375, 1.64459228515625, 1.7581787109375, 1.87176513671875, 1.9853515625, 2.09893798828125, 2.2125244140625, 2.32611083984375, 2.439697265625, 2.55328369140625, 2.6668701171875, 2.78045654296875, 2.89404296875, 3.00762939453125, 3.1212158203125, 3.23480224609375, 3.348388671875, 3.46197509765625, 3.5755615234375, 3.68914794921875, 3.802734375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 10.0, 11.0, 14.0, 18.0, 29.0, 31.0, 49.0, 93.0, 117.0, 247.0, 623.0, 1837.0, 7414.0, 42850.0, 437644.0, 2998801.0, 634168.0, 57005.0, 9586.0, 2279.0, 717.0, 291.0, 164.0, 83.0, 54.0, 39.0, 18.0, 27.0, 15.0, 7.0, 5.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.28125, -8.944580078125, -8.60791015625, -8.271240234375, -7.9345703125, -7.597900390625, -7.26123046875, -6.924560546875, -6.587890625, -6.251220703125, -5.91455078125, -5.577880859375, -5.2412109375, -4.904541015625, -4.56787109375, -4.231201171875, -3.89453125, -3.557861328125, -3.22119140625, -2.884521484375, -2.5478515625, -2.211181640625, -1.87451171875, -1.537841796875, -1.201171875, -0.864501953125, -0.52783203125, -0.191162109375, 0.1455078125, 0.482177734375, 0.81884765625, 1.155517578125, 1.4921875, 1.828857421875, 2.16552734375, 2.502197265625, 2.8388671875, 3.175537109375, 3.51220703125, 3.848876953125, 4.185546875, 4.522216796875, 4.85888671875, 5.195556640625, 5.5322265625, 5.868896484375, 6.20556640625, 6.542236328125, 6.87890625, 7.215576171875, 7.55224609375, 7.888916015625, 8.2255859375, 8.562255859375, 8.89892578125, 9.235595703125, 9.572265625, 9.908935546875, 10.24560546875, 10.582275390625, 10.9189453125, 11.255615234375, 11.59228515625, 11.928955078125, 12.265625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 10.0, 6.0, 9.0, 19.0, 20.0, 19.0, 30.0, 35.0, 51.0, 82.0, 102.0, 132.0, 151.0, 215.0, 309.0, 366.0, 450.0, 433.0, 374.0, 299.0, 248.0, 195.0, 140.0, 98.0, 70.0, 67.0, 31.0, 30.0, 24.0, 15.0, 19.0, 9.0, 7.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.59039306640625, -5.3917236328125, -5.19305419921875, -4.994384765625, -4.79571533203125, -4.5970458984375, -4.39837646484375, -4.19970703125, -4.00103759765625, -3.8023681640625, -3.60369873046875, -3.405029296875, -3.20635986328125, -3.0076904296875, -2.80902099609375, -2.6103515625, -2.41168212890625, -2.2130126953125, -2.01434326171875, -1.815673828125, -1.61700439453125, -1.4183349609375, -1.21966552734375, -1.02099609375, -0.82232666015625, -0.6236572265625, -0.42498779296875, -0.226318359375, -0.02764892578125, 0.1710205078125, 0.36968994140625, 0.568359375, 0.76702880859375, 0.9656982421875, 1.16436767578125, 1.363037109375, 1.56170654296875, 1.7603759765625, 1.95904541015625, 2.15771484375, 2.35638427734375, 2.5550537109375, 2.75372314453125, 2.952392578125, 3.15106201171875, 3.3497314453125, 3.54840087890625, 3.7470703125, 3.94573974609375, 4.1444091796875, 4.34307861328125, 4.541748046875, 4.74041748046875, 4.9390869140625, 5.13775634765625, 5.33642578125, 5.53509521484375, 5.7337646484375, 5.93243408203125, 6.131103515625, 6.32977294921875, 6.5284423828125, 6.72711181640625, 6.92578125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 3.0, 3.0, 6.0, 17.0, 15.0, 13.0, 25.0, 27.0, 43.0, 54.0, 79.0, 139.0, 178.0, 254.0, 407.0, 1513.0, 30370.0, 3002073.0, 1144291.0, 12602.0, 971.0, 357.0, 241.0, 159.0, 117.0, 89.0, 73.0, 48.0, 28.0, 17.0, 25.0, 14.0, 9.0, 16.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.82470703125, -29.9150390625, -29.00537109375, -28.095703125, -27.18603515625, -26.2763671875, -25.36669921875, -24.45703125, -23.54736328125, -22.6376953125, -21.72802734375, -20.818359375, -19.90869140625, -18.9990234375, -18.08935546875, -17.1796875, -16.27001953125, -15.3603515625, -14.45068359375, -13.541015625, -12.63134765625, -11.7216796875, -10.81201171875, -9.90234375, -8.99267578125, -8.0830078125, -7.17333984375, -6.263671875, -5.35400390625, -4.4443359375, -3.53466796875, -2.625, -1.71533203125, -0.8056640625, 0.10400390625, 1.013671875, 1.92333984375, 2.8330078125, 3.74267578125, 4.65234375, 5.56201171875, 6.4716796875, 7.38134765625, 8.291015625, 9.20068359375, 10.1103515625, 11.02001953125, 11.9296875, 12.83935546875, 13.7490234375, 14.65869140625, 15.568359375, 16.47802734375, 17.3876953125, 18.29736328125, 19.20703125, 20.11669921875, 21.0263671875, 21.93603515625, 22.845703125, 23.75537109375, 24.6650390625, 25.57470703125, 26.484375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 39.0, 80.0, 199.0, 195.0, 225.0, 158.0, 74.0, 24.0, 10.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.960176467895508, -20.628643035888672, -18.297107696533203, -15.96557331085205, -13.634038925170898, -11.302504539489746, -8.970970153808594, -6.639436721801758, -4.307901382446289, -1.9763669967651367, 0.3551673889160156, 2.686701774597168, 5.01823616027832, 7.349770545959473, 9.681304931640625, 12.012838363647461, 14.34437370300293, 16.675907135009766, 19.007442474365234, 21.338977813720703, 23.67051124572754, 26.002044677734375, 28.333580017089844, 30.66511344909668, 32.99665069580078, 35.32818603515625, 37.65972137451172, 39.99125289916992, 42.32278823852539, 44.65432357788086, 46.98585510253906, 49.31739044189453, 51.64892578125, 53.98046112060547, 56.31199645996094, 58.64352798461914, 60.97506332397461, 63.30659866333008, 65.63813018798828, 67.96966552734375, 70.30120086669922, 72.63273620605469, 74.96427154541016, 77.29580688476562, 79.62733459472656, 81.95886993408203, 84.2904052734375, 86.62194061279297, 88.95347595214844, 91.2850112915039, 93.61654663085938, 95.94808197021484, 98.27961730957031, 100.61114501953125, 102.94268035888672, 105.27421569824219, 107.60575103759766, 109.93728637695312, 112.2688217163086, 114.60035705566406, 116.931884765625, 119.26342010498047, 121.59495544433594, 123.9264907836914, 126.25802612304688]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 2.0, 6.0, 4.0, 9.0, 9.0, 11.0, 7.0, 11.0, 20.0, 17.0, 17.0, 34.0, 29.0, 25.0, 34.0, 36.0, 35.0, 44.0, 38.0, 36.0, 43.0, 37.0, 49.0, 30.0, 39.0, 38.0, 31.0, 30.0, 31.0, 23.0, 30.0, 29.0, 21.0, 20.0, 13.0, 18.0, 18.0, 22.0, 13.0, 13.0, 5.0, 10.0, 1.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.737152099609375, -20.08965301513672, -19.44215202331543, -18.794652938842773, -18.147151947021484, -17.499652862548828, -16.852153778076172, -16.204654693603516, -15.557153701782227, -14.909653663635254, -14.262153625488281, -13.614654541015625, -12.967154502868652, -12.31965446472168, -11.672155380249023, -11.02465534210205, -10.377155303955078, -9.729655265808105, -9.082155227661133, -8.434656143188477, -7.787156105041504, -7.139656066894531, -6.492156505584717, -5.844656944274902, -5.19715690612793, -4.549656867980957, -3.9021573066711426, -3.254657506942749, -2.6071577072143555, -1.959657907485962, -1.3121581077575684, -0.6646585464477539, -0.01715850830078125, 0.6303412914276123, 1.2778410911560059, 1.9253408908843994, 2.572840690612793, 3.2203404903411865, 3.86784029006958, 4.5153398513793945, 5.162839889526367, 5.81033992767334, 6.457839488983154, 7.105339050292969, 7.752839088439941, 8.400339126586914, 9.04783821105957, 9.695338249206543, 10.342838287353516, 10.990338325500488, 11.637838363647461, 12.285337448120117, 12.93283748626709, 13.580337524414062, 14.227836608886719, 14.875336647033691, 15.522836685180664, 16.17033576965332, 16.81783676147461, 17.465335845947266, 18.112834930419922, 18.76033592224121, 19.407835006713867, 20.055335998535156, 20.702835083007812]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 11.0, 10.0, 8.0, 13.0, 29.0, 14.0, 19.0, 27.0, 32.0, 32.0, 45.0, 36.0, 36.0, 46.0, 43.0, 46.0, 41.0, 43.0, 46.0, 40.0, 31.0, 30.0, 34.0, 33.0, 26.0, 34.0, 30.0, 24.0, 19.0, 22.0, 19.0, 17.0, 16.0, 8.0, 3.0, 3.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17578125, -3.066375732421875, -2.95697021484375, -2.847564697265625, -2.7381591796875, -2.628753662109375, -2.51934814453125, -2.409942626953125, -2.300537109375, -2.191131591796875, -2.08172607421875, -1.972320556640625, -1.8629150390625, -1.753509521484375, -1.64410400390625, -1.534698486328125, -1.42529296875, -1.315887451171875, -1.20648193359375, -1.097076416015625, -0.9876708984375, -0.878265380859375, -0.76885986328125, -0.659454345703125, -0.550048828125, -0.440643310546875, -0.33123779296875, -0.221832275390625, -0.1124267578125, -0.003021240234375, 0.10638427734375, 0.215789794921875, 0.3251953125, 0.434600830078125, 0.54400634765625, 0.653411865234375, 0.7628173828125, 0.872222900390625, 0.98162841796875, 1.091033935546875, 1.200439453125, 1.309844970703125, 1.41925048828125, 1.528656005859375, 1.6380615234375, 1.747467041015625, 1.85687255859375, 1.966278076171875, 2.07568359375, 2.185089111328125, 2.29449462890625, 2.403900146484375, 2.5133056640625, 2.622711181640625, 2.73211669921875, 2.841522216796875, 2.950927734375, 3.060333251953125, 3.16973876953125, 3.279144287109375, 3.3885498046875, 3.497955322265625, 3.60736083984375, 3.716766357421875, 3.826171875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 5.0, 12.0, 13.0, 16.0, 24.0, 29.0, 37.0, 52.0, 70.0, 111.0, 172.0, 248.0, 396.0, 621.0, 903.0, 1368.0, 1998.0, 3117.0, 5063.0, 8100.0, 12507.0, 20403.0, 33610.0, 56308.0, 108191.0, 275870.0, 269230.0, 106311.0, 56188.0, 33098.0, 19921.0, 12642.0, 7779.0, 4968.0, 3179.0, 2004.0, 1336.0, 862.0, 597.0, 414.0, 266.0, 169.0, 91.0, 72.0, 55.0, 30.0, 23.0, 13.0, 15.0, 12.0, 10.0, 9.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.1519775390625, -0.1469097137451172, -0.14184188842773438, -0.13677406311035156, -0.13170623779296875, -0.12663841247558594, -0.12157058715820312, -0.11650276184082031, -0.1114349365234375, -0.10636711120605469, -0.10129928588867188, -0.09623146057128906, -0.09116363525390625, -0.08609580993652344, -0.08102798461914062, -0.07596015930175781, -0.070892333984375, -0.06582450866699219, -0.060756683349609375, -0.05568885803222656, -0.05062103271484375, -0.04555320739746094, -0.040485382080078125, -0.03541755676269531, -0.0303497314453125, -0.025281906127929688, -0.020214080810546875, -0.015146255493164062, -0.01007843017578125, -0.0050106048583984375, 5.7220458984375e-05, 0.0051250457763671875, 0.01019287109375, 0.015260696411132812, 0.020328521728515625, 0.025396347045898438, 0.03046417236328125, 0.03553199768066406, 0.040599822998046875, 0.04566764831542969, 0.0507354736328125, 0.05580329895019531, 0.060871124267578125, 0.06593894958496094, 0.07100677490234375, 0.07607460021972656, 0.08114242553710938, 0.08621025085449219, 0.091278076171875, 0.09634590148925781, 0.10141372680664062, 0.10648155212402344, 0.11154937744140625, 0.11661720275878906, 0.12168502807617188, 0.1267528533935547, 0.1318206787109375, 0.1368885040283203, 0.14195632934570312, 0.14702415466308594, 0.15209197998046875, 0.15715980529785156, 0.16222763061523438, 0.1672954559326172, 0.17236328125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 13.0, 8.0, 10.0, 19.0, 17.0, 14.0, 21.0, 27.0, 25.0, 26.0, 30.0, 31.0, 43.0, 47.0, 31.0, 44.0, 25.0, 46.0, 1061.0, 43.0, 33.0, 46.0, 29.0, 40.0, 41.0, 26.0, 23.0, 23.0, 29.0, 21.0, 25.0, 20.0, 17.0, 10.0, 15.0, 8.0, 6.0, 5.0, 10.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2265625, -2.153228759765625, -2.07989501953125, -2.006561279296875, -1.9332275390625, -1.859893798828125, -1.78656005859375, -1.713226318359375, -1.639892578125, -1.566558837890625, -1.49322509765625, -1.419891357421875, -1.3465576171875, -1.273223876953125, -1.19989013671875, -1.126556396484375, -1.05322265625, -0.979888916015625, -0.90655517578125, -0.833221435546875, -0.7598876953125, -0.686553955078125, -0.61322021484375, -0.539886474609375, -0.466552734375, -0.393218994140625, -0.31988525390625, -0.246551513671875, -0.1732177734375, -0.099884033203125, -0.02655029296875, 0.046783447265625, 0.1201171875, 0.193450927734375, 0.26678466796875, 0.340118408203125, 0.4134521484375, 0.486785888671875, 0.56011962890625, 0.633453369140625, 0.706787109375, 0.780120849609375, 0.85345458984375, 0.926788330078125, 1.0001220703125, 1.073455810546875, 1.14678955078125, 1.220123291015625, 1.29345703125, 1.366790771484375, 1.44012451171875, 1.513458251953125, 1.5867919921875, 1.660125732421875, 1.73345947265625, 1.806793212890625, 1.880126953125, 1.953460693359375, 2.02679443359375, 2.100128173828125, 2.1734619140625, 2.246795654296875, 2.32012939453125, 2.393463134765625, 2.466796875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 7.0, 11.0, 25.0, 34.0, 44.0, 72.0, 103.0, 136.0, 233.0, 296.0, 549.0, 775.0, 1122.0, 1813.0, 2868.0, 4401.0, 7153.0, 11669.0, 19181.0, 32231.0, 56292.0, 104245.0, 210180.0, 1322467.0, 142785.0, 73927.0, 41201.0, 24366.0, 14504.0, 9053.0, 5487.0, 3522.0, 2314.0, 1371.0, 889.0, 600.0, 415.0, 268.0, 155.0, 136.0, 74.0, 48.0, 36.0, 22.0, 17.0, 9.0, 10.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06060791015625, -0.05866718292236328, -0.05672645568847656, -0.054785728454589844, -0.052845001220703125, -0.050904273986816406, -0.04896354675292969, -0.04702281951904297, -0.04508209228515625, -0.04314136505126953, -0.04120063781738281, -0.039259910583496094, -0.037319183349609375, -0.035378456115722656, -0.03343772888183594, -0.03149700164794922, -0.0295562744140625, -0.02761554718017578, -0.025674819946289062, -0.023734092712402344, -0.021793365478515625, -0.019852638244628906, -0.017911911010742188, -0.01597118377685547, -0.01403045654296875, -0.012089729309082031, -0.010149002075195312, -0.008208274841308594, -0.006267547607421875, -0.004326820373535156, -0.0023860931396484375, -0.00044536590576171875, 0.001495361328125, 0.0034360885620117188, 0.0053768157958984375, 0.007317543029785156, 0.009258270263671875, 0.011198997497558594, 0.013139724731445312, 0.015080451965332031, 0.01702117919921875, 0.01896190643310547, 0.020902633666992188, 0.022843360900878906, 0.024784088134765625, 0.026724815368652344, 0.028665542602539062, 0.03060626983642578, 0.0325469970703125, 0.03448772430419922, 0.03642845153808594, 0.038369178771972656, 0.040309906005859375, 0.042250633239746094, 0.04419136047363281, 0.04613208770751953, 0.04807281494140625, 0.05001354217529297, 0.05195426940917969, 0.053894996643066406, 0.055835723876953125, 0.057776451110839844, 0.05971717834472656, 0.06165790557861328, 0.0635986328125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 3.0, 8.0, 7.0, 7.0, 7.0, 11.0, 4.0, 21.0, 30.0, 31.0, 43.0, 80.0, 83.0, 105.0, 84.0, 99.0, 107.0, 63.0, 43.0, 36.0, 29.0, 26.0, 15.0, 14.0, 8.0, 6.0, 2.0, 10.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.424022674560547e-05, -5.271565169095993e-05, -5.119107663631439e-05, -4.9666501581668854e-05, -4.8141926527023315e-05, -4.661735147237778e-05, -4.509277641773224e-05, -4.35682013630867e-05, -4.204362630844116e-05, -4.0519051253795624e-05, -3.8994476199150085e-05, -3.746990114450455e-05, -3.594532608985901e-05, -3.442075103521347e-05, -3.289617598056793e-05, -3.1371600925922394e-05, -2.9847025871276855e-05, -2.8322450816631317e-05, -2.679787576198578e-05, -2.527330070734024e-05, -2.3748725652694702e-05, -2.2224150598049164e-05, -2.0699575543403625e-05, -1.9175000488758087e-05, -1.765042543411255e-05, -1.612585037946701e-05, -1.4601275324821472e-05, -1.3076700270175934e-05, -1.1552125215530396e-05, -1.0027550160884857e-05, -8.502975106239319e-06, -6.9784000515937805e-06, -5.453824996948242e-06, -3.929249942302704e-06, -2.4046748876571655e-06, -8.800998330116272e-07, 6.444752216339111e-07, 2.1690502762794495e-06, 3.693625330924988e-06, 5.218200385570526e-06, 6.7427754402160645e-06, 8.267350494861603e-06, 9.791925549507141e-06, 1.131650060415268e-05, 1.2841075658798218e-05, 1.4365650713443756e-05, 1.5890225768089294e-05, 1.7414800822734833e-05, 1.893937587738037e-05, 2.046395093202591e-05, 2.1988525986671448e-05, 2.3513101041316986e-05, 2.5037676095962524e-05, 2.6562251150608063e-05, 2.80868262052536e-05, 2.961140125989914e-05, 3.113597631454468e-05, 3.2660551369190216e-05, 3.4185126423835754e-05, 3.570970147848129e-05, 3.723427653312683e-05, 3.875885158777237e-05, 4.028342664241791e-05, 4.1808001697063446e-05, 4.3332576751708984e-05]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 6.0, 5.0, 6.0, 14.0, 15.0, 19.0, 38.0, 42.0, 72.0, 107.0, 229.0, 600.0, 11605.0, 1029875.0, 4897.0, 494.0, 192.0, 108.0, 75.0, 32.0, 30.0, 22.0, 12.0, 8.0, 4.0, 10.0, 3.0, 9.0, 1.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008530616760253906, -0.0008230432868003845, -0.0007930248975753784, -0.0007630065083503723, -0.0007329881191253662, -0.0007029697299003601, -0.000672951340675354, -0.0006429329514503479, -0.0006129145622253418, -0.0005828961730003357, -0.0005528777837753296, -0.0005228593945503235, -0.0004928410053253174, -0.0004628226161003113, -0.0004328042268753052, -0.00040278583765029907, -0.00037276744842529297, -0.00034274905920028687, -0.00031273066997528076, -0.00028271228075027466, -0.00025269389152526855, -0.00022267550230026245, -0.00019265711307525635, -0.00016263872385025024, -0.00013262033462524414, -0.00010260194540023804, -7.258355617523193e-05, -4.256516695022583e-05, -1.2546777725219727e-05, 1.7471611499786377e-05, 4.749000072479248e-05, 7.750838994979858e-05, 0.00010752677917480469, 0.0001375451683998108, 0.0001675635576248169, 0.000197581946849823, 0.0002276003360748291, 0.0002576187252998352, 0.0002876371145248413, 0.0003176555037498474, 0.0003476738929748535, 0.0003776922821998596, 0.0004077106714248657, 0.0004377290606498718, 0.00046774744987487793, 0.000497765839099884, 0.0005277842283248901, 0.0005578026175498962, 0.0005878210067749023, 0.0006178393959999084, 0.0006478577852249146, 0.0006778761744499207, 0.0007078945636749268, 0.0007379129528999329, 0.000767931342124939, 0.0007979497313499451, 0.0008279681205749512, 0.0008579865097999573, 0.0008880048990249634, 0.0009180232882499695, 0.0009480416774749756, 0.0009780600666999817, 0.0010080784559249878, 0.001038096845149994, 0.001068115234375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 976.0, 35.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009671393781900406, -0.000950653338804841, -0.0009341673576273024, -0.0009176813764497638, -0.0009011953370645642, -0.0008847092976793647, -0.000868223316501826, -0.0008517373353242874, -0.0008352512959390879, -0.0008187652565538883, -0.0008022792753763497, -0.0007857932941988111, -0.0007693072548136115, -0.000752821215428412, -0.0007363352342508733, -0.0007198492530733347, -0.0007033632136881351, -0.0006868771743029356, -0.000670391193125397, -0.0006539052119478583, -0.0006374191725626588, -0.0006209331331774592, -0.0006044471519999206, -0.000587961170822382, -0.0005714751314371824, -0.0005549890920519829, -0.0005385031108744442, -0.0005220171296969056, -0.0005055310903117061, -0.0004890450509265065, -0.0004725590697489679, -0.0004560730594675988, -0.0004395869909785688, -0.0004231009806971997, -0.0004066149704158306, -0.0003901289601344615, -0.00037364294985309243, -0.00035715693957172334, -0.00034067092929035425, -0.00032418491900898516, -0.00030769890872761607, -0.000291212898446247, -0.0002747268881648779, -0.0002582408778835088, -0.0002417548676021397, -0.00022526885732077062, -0.00020878284703940153, -0.00019229683675803244, -0.00017581082647666335, -0.00015932481619529426, -0.00014283880591392517, -0.00012635279563255608, -0.00010986678535118699, -9.33807750698179e-05, -7.689476478844881e-05, -6.040875450707972e-05, -4.3922751501668245e-05, -2.7436741220299155e-05, -1.0950730938930064e-05, 5.535279342439026e-06, 2.2021289623808116e-05, 3.8507299905177206e-05, 5.4993310186546296e-05, 7.147932046791539e-05, 8.796533074928448e-05]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 16.0, 8.0, 17.0, 19.0, 17.0, 23.0, 26.0, 40.0, 50.0, 42.0, 61.0, 61.0, 70.0, 63.0, 54.0, 56.0, 75.0, 45.0, 53.0, 37.0, 33.0, 22.0, 24.0, 29.0, 22.0, 12.0, 6.0, 11.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3186206817626953e-05, -2.2067688405513763e-05, -2.0949169993400574e-05, -1.9830651581287384e-05, -1.8712133169174194e-05, -1.7593614757061005e-05, -1.6475096344947815e-05, -1.5356577932834625e-05, -1.4238059520721436e-05, -1.3119541108608246e-05, -1.2001022696495056e-05, -1.0882504284381866e-05, -9.763985872268677e-06, -8.645467460155487e-06, -7.526949048042297e-06, -6.408430635929108e-06, -5.289912223815918e-06, -4.171393811702728e-06, -3.0528753995895386e-06, -1.934356987476349e-06, -8.158385753631592e-07, 3.026798367500305e-07, 1.4211982488632202e-06, 2.53971666097641e-06, 3.6582350730895996e-06, 4.776753485202789e-06, 5.895271897315979e-06, 7.013790309429169e-06, 8.132308721542358e-06, 9.250827133655548e-06, 1.0369345545768738e-05, 1.1487863957881927e-05, 1.2606382369995117e-05, 1.3724900782108307e-05, 1.4843419194221497e-05, 1.5961937606334686e-05, 1.7080456018447876e-05, 1.8198974430561066e-05, 1.9317492842674255e-05, 2.0436011254787445e-05, 2.1554529666900635e-05, 2.2673048079013824e-05, 2.3791566491127014e-05, 2.4910084903240204e-05, 2.6028603315353394e-05, 2.7147121727466583e-05, 2.8265640139579773e-05, 2.9384158551692963e-05, 3.0502676963806152e-05, 3.162119537591934e-05, 3.273971378803253e-05, 3.385823220014572e-05, 3.497675061225891e-05, 3.60952690243721e-05, 3.721378743648529e-05, 3.833230584859848e-05, 3.945082426071167e-05, 4.056934267282486e-05, 4.168786108493805e-05, 4.280637949705124e-05, 4.392489790916443e-05, 4.504341632127762e-05, 4.616193473339081e-05, 4.7280453145504e-05, 4.839897155761719e-05]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 11.0, 10.0, 8.0, 13.0, 29.0, 14.0, 19.0, 27.0, 32.0, 32.0, 45.0, 36.0, 36.0, 46.0, 43.0, 46.0, 41.0, 43.0, 46.0, 40.0, 31.0, 30.0, 34.0, 33.0, 26.0, 34.0, 30.0, 24.0, 19.0, 22.0, 19.0, 17.0, 16.0, 8.0, 3.0, 3.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17578125, -3.066375732421875, -2.95697021484375, -2.847564697265625, -2.7381591796875, -2.628753662109375, -2.51934814453125, -2.409942626953125, -2.300537109375, -2.191131591796875, -2.08172607421875, -1.972320556640625, -1.8629150390625, -1.753509521484375, -1.64410400390625, -1.534698486328125, -1.42529296875, -1.315887451171875, -1.20648193359375, -1.097076416015625, -0.9876708984375, -0.878265380859375, -0.76885986328125, -0.659454345703125, -0.550048828125, -0.440643310546875, -0.33123779296875, -0.221832275390625, -0.1124267578125, -0.003021240234375, 0.10638427734375, 0.215789794921875, 0.3251953125, 0.434600830078125, 0.54400634765625, 0.653411865234375, 0.7628173828125, 0.872222900390625, 0.98162841796875, 1.091033935546875, 1.200439453125, 1.309844970703125, 1.41925048828125, 1.528656005859375, 1.6380615234375, 1.747467041015625, 1.85687255859375, 1.966278076171875, 2.07568359375, 2.185089111328125, 2.29449462890625, 2.403900146484375, 2.5133056640625, 2.622711181640625, 2.73211669921875, 2.841522216796875, 2.950927734375, 3.060333251953125, 3.16973876953125, 3.279144287109375, 3.3885498046875, 3.497955322265625, 3.60736083984375, 3.716766357421875, 3.826171875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 8.0, 15.0, 15.0, 21.0, 28.0, 60.0, 89.0, 152.0, 236.0, 346.0, 660.0, 1045.0, 1735.0, 3013.0, 5364.0, 9482.0, 17111.0, 31553.0, 63893.0, 155784.0, 425746.0, 182628.0, 71749.0, 34933.0, 18635.0, 10351.0, 5860.0, 3307.0, 1895.0, 1095.0, 656.0, 386.0, 244.0, 145.0, 103.0, 73.0, 40.0, 30.0, 18.0, 11.0, 10.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.283203125, -3.168304443359375, -3.05340576171875, -2.938507080078125, -2.8236083984375, -2.708709716796875, -2.59381103515625, -2.478912353515625, -2.364013671875, -2.249114990234375, -2.13421630859375, -2.019317626953125, -1.9044189453125, -1.789520263671875, -1.67462158203125, -1.559722900390625, -1.44482421875, -1.329925537109375, -1.21502685546875, -1.100128173828125, -0.9852294921875, -0.870330810546875, -0.75543212890625, -0.640533447265625, -0.525634765625, -0.410736083984375, -0.29583740234375, -0.180938720703125, -0.0660400390625, 0.048858642578125, 0.16375732421875, 0.278656005859375, 0.3935546875, 0.508453369140625, 0.62335205078125, 0.738250732421875, 0.8531494140625, 0.968048095703125, 1.08294677734375, 1.197845458984375, 1.312744140625, 1.427642822265625, 1.54254150390625, 1.657440185546875, 1.7723388671875, 1.887237548828125, 2.00213623046875, 2.117034912109375, 2.23193359375, 2.346832275390625, 2.46173095703125, 2.576629638671875, 2.6915283203125, 2.806427001953125, 2.92132568359375, 3.036224365234375, 3.151123046875, 3.266021728515625, 3.38092041015625, 3.495819091796875, 3.6107177734375, 3.725616455078125, 3.84051513671875, 3.955413818359375, 4.0703125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 11.0, 5.0, 11.0, 10.0, 12.0, 18.0, 18.0, 22.0, 18.0, 21.0, 31.0, 21.0, 33.0, 37.0, 46.0, 41.0, 67.0, 156.0, 1404.0, 452.0, 155.0, 68.0, 50.0, 50.0, 39.0, 39.0, 29.0, 28.0, 21.0, 18.0, 26.0, 16.0, 16.0, 14.0, 9.0, 8.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.9921875, -10.6590576171875, -10.325927734375, -9.9927978515625, -9.65966796875, -9.3265380859375, -8.993408203125, -8.6602783203125, -8.3271484375, -7.9940185546875, -7.660888671875, -7.3277587890625, -6.99462890625, -6.6614990234375, -6.328369140625, -5.9952392578125, -5.662109375, -5.3289794921875, -4.995849609375, -4.6627197265625, -4.32958984375, -3.9964599609375, -3.663330078125, -3.3302001953125, -2.9970703125, -2.6639404296875, -2.330810546875, -1.9976806640625, -1.66455078125, -1.3314208984375, -0.998291015625, -0.6651611328125, -0.33203125, 0.0010986328125, 0.334228515625, 0.6673583984375, 1.00048828125, 1.3336181640625, 1.666748046875, 1.9998779296875, 2.3330078125, 2.6661376953125, 2.999267578125, 3.3323974609375, 3.66552734375, 3.9986572265625, 4.331787109375, 4.6649169921875, 4.998046875, 5.3311767578125, 5.664306640625, 5.9974365234375, 6.33056640625, 6.6636962890625, 6.996826171875, 7.3299560546875, 7.6630859375, 7.9962158203125, 8.329345703125, 8.6624755859375, 8.99560546875, 9.3287353515625, 9.661865234375, 9.9949951171875, 10.328125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 7.0, 7.0, 6.0, 8.0, 21.0, 18.0, 27.0, 30.0, 39.0, 32.0, 51.0, 84.0, 99.0, 161.0, 199.0, 355.0, 814.0, 3200.0, 34810.0, 2513429.0, 572705.0, 16071.0, 1931.0, 582.0, 274.0, 179.0, 104.0, 101.0, 76.0, 59.0, 47.0, 29.0, 39.0, 29.0, 10.0, 19.0, 12.0, 12.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.1748046875, -16.599609375, -16.0244140625, -15.44921875, -14.8740234375, -14.298828125, -13.7236328125, -13.1484375, -12.5732421875, -11.998046875, -11.4228515625, -10.84765625, -10.2724609375, -9.697265625, -9.1220703125, -8.546875, -7.9716796875, -7.396484375, -6.8212890625, -6.24609375, -5.6708984375, -5.095703125, -4.5205078125, -3.9453125, -3.3701171875, -2.794921875, -2.2197265625, -1.64453125, -1.0693359375, -0.494140625, 0.0810546875, 0.65625, 1.2314453125, 1.806640625, 2.3818359375, 2.95703125, 3.5322265625, 4.107421875, 4.6826171875, 5.2578125, 5.8330078125, 6.408203125, 6.9833984375, 7.55859375, 8.1337890625, 8.708984375, 9.2841796875, 9.859375, 10.4345703125, 11.009765625, 11.5849609375, 12.16015625, 12.7353515625, 13.310546875, 13.8857421875, 14.4609375, 15.0361328125, 15.611328125, 16.1865234375, 16.76171875, 17.3369140625, 17.912109375, 18.4873046875, 19.0625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 11.0, 316.0, 634.0, 58.0], "bins": [-232.66358947753906, -228.9227294921875, -225.18186950683594, -221.44100952148438, -217.7001495361328, -213.95928955078125, -210.2184295654297, -206.47756958007812, -202.73670959472656, -198.995849609375, -195.25498962402344, -191.51412963867188, -187.7732696533203, -184.03240966796875, -180.2915496826172, -176.55068969726562, -172.809814453125, -169.06895446777344, -165.32809448242188, -161.5872344970703, -157.84637451171875, -154.1055145263672, -150.36465454101562, -146.62379455566406, -142.8829345703125, -139.14207458496094, -135.40121459960938, -131.6603546142578, -127.91949462890625, -124.17863464355469, -120.43777465820312, -116.69691467285156, -112.9560546875, -109.21519470214844, -105.47433471679688, -101.73347473144531, -97.99261474609375, -94.25175476074219, -90.51089477539062, -86.77003479003906, -83.02916717529297, -79.2883071899414, -75.54744720458984, -71.80658721923828, -68.06572723388672, -64.32486724853516, -60.58400344848633, -56.843143463134766, -53.1022834777832, -49.36142349243164, -45.62056350708008, -41.87969970703125, -38.13883972167969, -34.397979736328125, -30.657119750976562, -26.916259765625, -23.175399780273438, -19.434539794921875, -15.693678855895996, -11.952817916870117, -8.211957931518555, -4.471097946166992, -0.7302360534667969, 3.0106239318847656, 6.751483917236328]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 5.0, 5.0, 12.0, 10.0, 12.0, 15.0, 16.0, 18.0, 21.0, 16.0, 29.0, 31.0, 19.0, 35.0, 37.0, 27.0, 46.0, 49.0, 54.0, 40.0, 44.0, 54.0, 46.0, 35.0, 44.0, 38.0, 31.0, 29.0, 23.0, 31.0, 32.0, 13.0, 19.0, 13.0, 10.0, 8.0, 9.0, 5.0, 10.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.15752410888672, -24.285110473632812, -23.412694931030273, -22.540281295776367, -21.667865753173828, -20.795452117919922, -19.923038482666016, -19.050622940063477, -18.178207397460938, -17.30579376220703, -16.433378219604492, -15.560964584350586, -14.688549041748047, -13.81613540649414, -12.943720817565918, -12.071306228637695, -11.198892593383789, -10.326478004455566, -9.454063415527344, -8.581649780273438, -7.709234714508057, -6.836820125579834, -5.9644060134887695, -5.091991424560547, -4.219576835632324, -3.3471622467041016, -2.474747896194458, -1.6023335456848145, -0.7299189567565918, 0.14249563217163086, 1.0149097442626953, 1.887324333190918, 2.7597389221191406, 3.6321535110473633, 4.504568099975586, 5.37698221206665, 6.249396800994873, 7.121811389923096, 7.99422550201416, 8.866640090942383, 9.739054679870605, 10.611469268798828, 11.48388385772705, 12.356298446655273, 13.22871208190918, 14.101127624511719, 14.973541259765625, 15.845955848693848, 16.71837043762207, 17.590784072875977, 18.463199615478516, 19.335613250732422, 20.20802879333496, 21.080442428588867, 21.952857971191406, 22.825271606445312, 23.69768524169922, 24.570098876953125, 25.442514419555664, 26.31492805480957, 27.18734359741211, 28.059757232666016, 28.932170867919922, 29.80458641052246, 30.677001953125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 6.0, 5.0, 12.0, 9.0, 13.0, 13.0, 23.0, 19.0, 25.0, 26.0, 26.0, 32.0, 34.0, 36.0, 45.0, 39.0, 46.0, 47.0, 45.0, 49.0, 35.0, 49.0, 38.0, 36.0, 34.0, 25.0, 31.0, 26.0, 34.0, 24.0, 17.0, 23.0, 24.0, 11.0, 8.0, 4.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5234375, -3.405517578125, -3.28759765625, -3.169677734375, -3.0517578125, -2.933837890625, -2.81591796875, -2.697998046875, -2.580078125, -2.462158203125, -2.34423828125, -2.226318359375, -2.1083984375, -1.990478515625, -1.87255859375, -1.754638671875, -1.63671875, -1.518798828125, -1.40087890625, -1.282958984375, -1.1650390625, -1.047119140625, -0.92919921875, -0.811279296875, -0.693359375, -0.575439453125, -0.45751953125, -0.339599609375, -0.2216796875, -0.103759765625, 0.01416015625, 0.132080078125, 0.25, 0.367919921875, 0.48583984375, 0.603759765625, 0.7216796875, 0.839599609375, 0.95751953125, 1.075439453125, 1.193359375, 1.311279296875, 1.42919921875, 1.547119140625, 1.6650390625, 1.782958984375, 1.90087890625, 2.018798828125, 2.13671875, 2.254638671875, 2.37255859375, 2.490478515625, 2.6083984375, 2.726318359375, 2.84423828125, 2.962158203125, 3.080078125, 3.197998046875, 3.31591796875, 3.433837890625, 3.5517578125, 3.669677734375, 3.78759765625, 3.905517578125, 4.0234375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 10.0, 9.0, 10.0, 12.0, 8.0, 12.0, 14.0, 23.0, 23.0, 29.0, 39.0, 55.0, 92.0, 233.0, 618.0, 2164.0, 9347.0, 55386.0, 632081.0, 3000071.0, 439932.0, 43535.0, 7638.0, 1838.0, 574.0, 198.0, 88.0, 44.0, 27.0, 23.0, 24.0, 19.0, 18.0, 14.0, 15.0, 13.0, 10.0, 2.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.4296875, -10.097900390625, -9.76611328125, -9.434326171875, -9.1025390625, -8.770751953125, -8.43896484375, -8.107177734375, -7.775390625, -7.443603515625, -7.11181640625, -6.780029296875, -6.4482421875, -6.116455078125, -5.78466796875, -5.452880859375, -5.12109375, -4.789306640625, -4.45751953125, -4.125732421875, -3.7939453125, -3.462158203125, -3.13037109375, -2.798583984375, -2.466796875, -2.135009765625, -1.80322265625, -1.471435546875, -1.1396484375, -0.807861328125, -0.47607421875, -0.144287109375, 0.1875, 0.519287109375, 0.85107421875, 1.182861328125, 1.5146484375, 1.846435546875, 2.17822265625, 2.510009765625, 2.841796875, 3.173583984375, 3.50537109375, 3.837158203125, 4.1689453125, 4.500732421875, 4.83251953125, 5.164306640625, 5.49609375, 5.827880859375, 6.15966796875, 6.491455078125, 6.8232421875, 7.155029296875, 7.48681640625, 7.818603515625, 8.150390625, 8.482177734375, 8.81396484375, 9.145751953125, 9.4775390625, 9.809326171875, 10.14111328125, 10.472900390625, 10.8046875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 4.0, 10.0, 14.0, 17.0, 28.0, 48.0, 37.0, 78.0, 118.0, 168.0, 216.0, 298.0, 421.0, 528.0, 548.0, 438.0, 308.0, 253.0, 165.0, 112.0, 94.0, 58.0, 39.0, 25.0, 18.0, 14.0, 7.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4453125, -7.1976318359375, -6.949951171875, -6.7022705078125, -6.45458984375, -6.2069091796875, -5.959228515625, -5.7115478515625, -5.4638671875, -5.2161865234375, -4.968505859375, -4.7208251953125, -4.47314453125, -4.2254638671875, -3.977783203125, -3.7301025390625, -3.482421875, -3.2347412109375, -2.987060546875, -2.7393798828125, -2.49169921875, -2.2440185546875, -1.996337890625, -1.7486572265625, -1.5009765625, -1.2532958984375, -1.005615234375, -0.7579345703125, -0.51025390625, -0.2625732421875, -0.014892578125, 0.2327880859375, 0.48046875, 0.7281494140625, 0.975830078125, 1.2235107421875, 1.47119140625, 1.7188720703125, 1.966552734375, 2.2142333984375, 2.4619140625, 2.7095947265625, 2.957275390625, 3.2049560546875, 3.45263671875, 3.7003173828125, 3.947998046875, 4.1956787109375, 4.443359375, 4.6910400390625, 4.938720703125, 5.1864013671875, 5.43408203125, 5.6817626953125, 5.929443359375, 6.1771240234375, 6.4248046875, 6.6724853515625, 6.920166015625, 7.1678466796875, 7.41552734375, 7.6632080078125, 7.910888671875, 8.1585693359375, 8.40625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 10.0, 9.0, 10.0, 28.0, 34.0, 62.0, 80.0, 116.0, 193.0, 293.0, 562.0, 4087.0, 2364182.0, 1819531.0, 3667.0, 545.0, 309.0, 186.0, 135.0, 82.0, 59.0, 37.0, 23.0, 20.0, 11.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.75, -47.3154296875, -45.880859375, -44.4462890625, -43.01171875, -41.5771484375, -40.142578125, -38.7080078125, -37.2734375, -35.8388671875, -34.404296875, -32.9697265625, -31.53515625, -30.1005859375, -28.666015625, -27.2314453125, -25.796875, -24.3623046875, -22.927734375, -21.4931640625, -20.05859375, -18.6240234375, -17.189453125, -15.7548828125, -14.3203125, -12.8857421875, -11.451171875, -10.0166015625, -8.58203125, -7.1474609375, -5.712890625, -4.2783203125, -2.84375, -1.4091796875, 0.025390625, 1.4599609375, 2.89453125, 4.3291015625, 5.763671875, 7.1982421875, 8.6328125, 10.0673828125, 11.501953125, 12.9365234375, 14.37109375, 15.8056640625, 17.240234375, 18.6748046875, 20.109375, 21.5439453125, 22.978515625, 24.4130859375, 25.84765625, 27.2822265625, 28.716796875, 30.1513671875, 31.5859375, 33.0205078125, 34.455078125, 35.8896484375, 37.32421875, 38.7587890625, 40.193359375, 41.6279296875, 43.0625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 9.0, 15.0, 25.0, 41.0, 33.0, 74.0, 80.0, 100.0, 127.0, 124.0, 101.0, 89.0, 71.0, 38.0, 32.0, 22.0, 12.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.389074325561523, -20.30548667907715, -19.221900939941406, -18.13831329345703, -17.054725646972656, -15.971138954162598, -14.887552261352539, -13.803964614868164, -12.720377922058105, -11.636791229248047, -10.553203582763672, -9.469616889953613, -8.386030197143555, -7.30244255065918, -6.218855857849121, -5.135268688201904, -4.0516815185546875, -2.9680943489074707, -1.884507417678833, -0.8009204864501953, 0.2826666831970215, 1.3662538528442383, 2.449840545654297, 3.5334277153015137, 4.6170148849487305, 5.700602054595947, 6.784189224243164, 7.867775917053223, 8.951362609863281, 10.034950256347656, 11.118536949157715, 12.202123641967773, 13.285709381103516, 14.369296073913574, 15.45288372039795, 16.536470413208008, 17.620058059692383, 18.703643798828125, 19.7872314453125, 20.870819091796875, 21.95440673828125, 23.037994384765625, 24.121580123901367, 25.205167770385742, 26.288755416870117, 27.37234115600586, 28.455928802490234, 29.53951644897461, 30.62310218811035, 31.706689834594727, 32.79027557373047, 33.873863220214844, 34.95745086669922, 36.041038513183594, 37.12462615966797, 38.20820999145508, 39.29179763793945, 40.37538528442383, 41.4589729309082, 42.54255676269531, 43.62614440917969, 44.70973205566406, 45.79331970214844, 46.87690734863281, 47.96049499511719]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 8.0, 5.0, 7.0, 6.0, 10.0, 13.0, 12.0, 9.0, 14.0, 20.0, 13.0, 26.0, 35.0, 28.0, 36.0, 37.0, 35.0, 45.0, 43.0, 39.0, 39.0, 37.0, 42.0, 35.0, 35.0, 30.0, 35.0, 38.0, 30.0, 25.0, 24.0, 24.0, 18.0, 27.0, 25.0, 14.0, 17.0, 10.0, 17.0, 9.0, 2.0, 4.0, 5.0, 7.0, 6.0, 2.0, 1.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.401016235351562, -20.75477409362793, -20.10853385925293, -19.462291717529297, -18.816051483154297, -18.169809341430664, -17.52356719970703, -16.87732696533203, -16.2310848236084, -15.584843635559082, -14.938602447509766, -14.292360305786133, -13.646119117736816, -12.9998779296875, -12.353635787963867, -11.70739459991455, -11.061153411865234, -10.414912223815918, -9.768671035766602, -9.122428894042969, -8.476187705993652, -7.829946517944336, -7.183704853057861, -6.537463188171387, -5.89122200012207, -5.244980812072754, -4.598739147186279, -3.952497720718384, -3.3062562942504883, -2.6600148677825928, -2.0137734413146973, -1.3675317764282227, -0.7212905883789062, -0.07504916191101074, 0.5711922645568848, 1.2174336910247803, 1.8636751174926758, 2.5099165439605713, 3.156157970428467, 3.8023996353149414, 4.448640823364258, 5.094882011413574, 5.741123676300049, 6.387365341186523, 7.03360652923584, 7.679847717285156, 8.326089859008789, 8.972331047058105, 9.618572235107422, 10.264813423156738, 10.911054611206055, 11.557296752929688, 12.203537940979004, 12.84977912902832, 13.496021270751953, 14.14226245880127, 14.788503646850586, 15.434744834899902, 16.08098602294922, 16.72722816467285, 17.373470306396484, 18.019710540771484, 18.665952682495117, 19.31219482421875, 19.95843505859375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 8.0, 13.0, 10.0, 13.0, 16.0, 15.0, 21.0, 34.0, 28.0, 27.0, 33.0, 38.0, 42.0, 47.0, 29.0, 43.0, 43.0, 44.0, 35.0, 29.0, 35.0, 38.0, 42.0, 31.0, 36.0, 22.0, 30.0, 25.0, 21.0, 20.0, 18.0, 23.0, 15.0, 15.0, 10.0, 5.0, 6.0, 8.0, 3.0, 7.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.673828125, -3.561614990234375, -3.44940185546875, -3.337188720703125, -3.2249755859375, -3.112762451171875, -3.00054931640625, -2.888336181640625, -2.776123046875, -2.663909912109375, -2.55169677734375, -2.439483642578125, -2.3272705078125, -2.215057373046875, -2.10284423828125, -1.990631103515625, -1.87841796875, -1.766204833984375, -1.65399169921875, -1.541778564453125, -1.4295654296875, -1.317352294921875, -1.20513916015625, -1.092926025390625, -0.980712890625, -0.868499755859375, -0.75628662109375, -0.644073486328125, -0.5318603515625, -0.419647216796875, -0.30743408203125, -0.195220947265625, -0.0830078125, 0.029205322265625, 0.14141845703125, 0.253631591796875, 0.3658447265625, 0.478057861328125, 0.59027099609375, 0.702484130859375, 0.814697265625, 0.926910400390625, 1.03912353515625, 1.151336669921875, 1.2635498046875, 1.375762939453125, 1.48797607421875, 1.600189208984375, 1.71240234375, 1.824615478515625, 1.93682861328125, 2.049041748046875, 2.1612548828125, 2.273468017578125, 2.38568115234375, 2.497894287109375, 2.610107421875, 2.722320556640625, 2.83453369140625, 2.946746826171875, 3.0589599609375, 3.171173095703125, 3.28338623046875, 3.395599365234375, 3.5078125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 6.0, 12.0, 19.0, 33.0, 29.0, 50.0, 69.0, 102.0, 159.0, 262.0, 358.0, 527.0, 852.0, 1234.0, 1769.0, 2858.0, 4367.0, 6853.0, 10767.0, 17369.0, 28929.0, 49109.0, 89777.0, 192659.0, 322295.0, 141611.0, 71352.0, 40655.0, 23934.0, 14494.0, 9212.0, 5934.0, 3707.0, 2423.0, 1523.0, 1078.0, 735.0, 472.0, 313.0, 214.0, 148.0, 81.0, 52.0, 55.0, 29.0, 20.0, 17.0, 11.0, 7.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1510009765625, -0.14602088928222656, -0.14104080200195312, -0.1360607147216797, -0.13108062744140625, -0.1261005401611328, -0.12112045288085938, -0.11614036560058594, -0.1111602783203125, -0.10618019104003906, -0.10120010375976562, -0.09622001647949219, -0.09123992919921875, -0.08625984191894531, -0.08127975463867188, -0.07629966735839844, -0.071319580078125, -0.06633949279785156, -0.061359405517578125, -0.05637931823730469, -0.05139923095703125, -0.04641914367675781, -0.041439056396484375, -0.03645896911621094, -0.0314788818359375, -0.026498794555664062, -0.021518707275390625, -0.016538619995117188, -0.01155853271484375, -0.0065784454345703125, -0.001598358154296875, 0.0033817291259765625, 0.00836181640625, 0.013341903686523438, 0.018321990966796875, 0.023302078247070312, 0.02828216552734375, 0.03326225280761719, 0.038242340087890625, 0.04322242736816406, 0.0482025146484375, 0.05318260192871094, 0.058162689208984375, 0.06314277648925781, 0.06812286376953125, 0.07310295104980469, 0.07808303833007812, 0.08306312561035156, 0.088043212890625, 0.09302330017089844, 0.09800338745117188, 0.10298347473144531, 0.10796356201171875, 0.11294364929199219, 0.11792373657226562, 0.12290382385253906, 0.1278839111328125, 0.13286399841308594, 0.13784408569335938, 0.1428241729736328, 0.14780426025390625, 0.1527843475341797, 0.15776443481445312, 0.16274452209472656, 0.167724609375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 5.0, 8.0, 7.0, 19.0, 12.0, 29.0, 16.0, 20.0, 36.0, 26.0, 29.0, 39.0, 33.0, 45.0, 42.0, 53.0, 49.0, 1079.0, 41.0, 50.0, 49.0, 32.0, 38.0, 33.0, 33.0, 27.0, 25.0, 26.0, 21.0, 13.0, 12.0, 19.0, 15.0, 12.0, 8.0, 9.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.44140625, -2.356781005859375, -2.27215576171875, -2.187530517578125, -2.1029052734375, -2.018280029296875, -1.93365478515625, -1.849029541015625, -1.764404296875, -1.679779052734375, -1.59515380859375, -1.510528564453125, -1.4259033203125, -1.341278076171875, -1.25665283203125, -1.172027587890625, -1.08740234375, -1.002777099609375, -0.91815185546875, -0.833526611328125, -0.7489013671875, -0.664276123046875, -0.57965087890625, -0.495025634765625, -0.410400390625, -0.325775146484375, -0.24114990234375, -0.156524658203125, -0.0718994140625, 0.012725830078125, 0.09735107421875, 0.181976318359375, 0.2666015625, 0.351226806640625, 0.43585205078125, 0.520477294921875, 0.6051025390625, 0.689727783203125, 0.77435302734375, 0.858978271484375, 0.943603515625, 1.028228759765625, 1.11285400390625, 1.197479248046875, 1.2821044921875, 1.366729736328125, 1.45135498046875, 1.535980224609375, 1.62060546875, 1.705230712890625, 1.78985595703125, 1.874481201171875, 1.9591064453125, 2.043731689453125, 2.12835693359375, 2.212982177734375, 2.297607421875, 2.382232666015625, 2.46685791015625, 2.551483154296875, 2.6361083984375, 2.720733642578125, 2.80535888671875, 2.889984130859375, 2.974609375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 3.0, 5.0, 12.0, 16.0, 20.0, 28.0, 33.0, 63.0, 100.0, 155.0, 172.0, 301.0, 410.0, 645.0, 953.0, 1323.0, 2046.0, 3162.0, 5017.0, 7710.0, 12351.0, 20777.0, 34882.0, 61306.0, 111940.0, 221819.0, 1306857.0, 131979.0, 70751.0, 39957.0, 23428.0, 14128.0, 8775.0, 5598.0, 3510.0, 2226.0, 1550.0, 1004.0, 662.0, 467.0, 340.0, 208.0, 143.0, 96.0, 63.0, 42.0, 36.0, 21.0, 19.0, 9.0, 5.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0587158203125, -0.05669975280761719, -0.054683685302734375, -0.05266761779785156, -0.05065155029296875, -0.04863548278808594, -0.046619415283203125, -0.04460334777832031, -0.0425872802734375, -0.04057121276855469, -0.038555145263671875, -0.03653907775878906, -0.03452301025390625, -0.03250694274902344, -0.030490875244140625, -0.028474807739257812, -0.026458740234375, -0.024442672729492188, -0.022426605224609375, -0.020410537719726562, -0.01839447021484375, -0.016378402709960938, -0.014362335205078125, -0.012346267700195312, -0.0103302001953125, -0.008314132690429688, -0.006298065185546875, -0.0042819976806640625, -0.00226593017578125, -0.0002498626708984375, 0.001766204833984375, 0.0037822723388671875, 0.00579833984375, 0.007814407348632812, 0.009830474853515625, 0.011846542358398438, 0.01386260986328125, 0.015878677368164062, 0.017894744873046875, 0.019910812377929688, 0.0219268798828125, 0.023942947387695312, 0.025959014892578125, 0.027975082397460938, 0.02999114990234375, 0.03200721740722656, 0.034023284912109375, 0.03603935241699219, 0.038055419921875, 0.04007148742675781, 0.042087554931640625, 0.04410362243652344, 0.04611968994140625, 0.04813575744628906, 0.050151824951171875, 0.05216789245605469, 0.0541839599609375, 0.05620002746582031, 0.058216094970703125, 0.06023216247558594, 0.06224822998046875, 0.06426429748535156, 0.06628036499023438, 0.06829643249511719, 0.0703125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 9.0, 5.0, 10.0, 5.0, 10.0, 19.0, 46.0, 47.0, 81.0, 118.0, 152.0, 152.0, 122.0, 71.0, 48.0, 31.0, 16.0, 14.0, 7.0, 6.0, 6.0, 7.0, 2.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.233287811279297e-05, -5.0446949899196625e-05, -4.856102168560028e-05, -4.667509347200394e-05, -4.478916525840759e-05, -4.290323704481125e-05, -4.1017308831214905e-05, -3.913138061761856e-05, -3.724545240402222e-05, -3.535952419042587e-05, -3.347359597682953e-05, -3.1587667763233185e-05, -2.970173954963684e-05, -2.7815811336040497e-05, -2.5929883122444153e-05, -2.404395490884781e-05, -2.2158026695251465e-05, -2.027209848165512e-05, -1.8386170268058777e-05, -1.6500242054462433e-05, -1.4614313840866089e-05, -1.2728385627269745e-05, -1.0842457413673401e-05, -8.956529200077057e-06, -7.070600986480713e-06, -5.184672772884369e-06, -3.298744559288025e-06, -1.412816345691681e-06, 4.731118679046631e-07, 2.359040081501007e-06, 4.244968295097351e-06, 6.130896508693695e-06, 8.016824722290039e-06, 9.902752935886383e-06, 1.1788681149482727e-05, 1.3674609363079071e-05, 1.5560537576675415e-05, 1.744646579027176e-05, 1.9332394003868103e-05, 2.1218322217464447e-05, 2.310425043106079e-05, 2.4990178644657135e-05, 2.687610685825348e-05, 2.8762035071849823e-05, 3.064796328544617e-05, 3.253389149904251e-05, 3.4419819712638855e-05, 3.63057479262352e-05, 3.819167613983154e-05, 4.007760435342789e-05, 4.196353256702423e-05, 4.3849460780620575e-05, 4.573538899421692e-05, 4.762131720781326e-05, 4.950724542140961e-05, 5.139317363500595e-05, 5.3279101848602295e-05, 5.516503006219864e-05, 5.705095827579498e-05, 5.893688648939133e-05, 6.082281470298767e-05, 6.270874291658401e-05, 6.459467113018036e-05, 6.64805993437767e-05, 6.836652755737305e-05]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 7.0, 14.0, 24.0, 42.0, 66.0, 146.0, 402.0, 11892.0, 1034649.0, 856.0, 198.0, 94.0, 65.0, 19.0, 12.0, 10.0, 9.0, 8.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0015573501586914062, -0.0015143752098083496, -0.001471400260925293, -0.0014284253120422363, -0.0013854503631591797, -0.001342475414276123, -0.0012995004653930664, -0.0012565255165100098, -0.0012135505676269531, -0.0011705756187438965, -0.0011276006698608398, -0.0010846257209777832, -0.0010416507720947266, -0.00099867582321167, -0.0009557008743286133, -0.0009127259254455566, -0.0008697509765625, -0.0008267760276794434, -0.0007838010787963867, -0.0007408261299133301, -0.0006978511810302734, -0.0006548762321472168, -0.0006119012832641602, -0.0005689263343811035, -0.0005259513854980469, -0.00048297643661499023, -0.0004400014877319336, -0.00039702653884887695, -0.0003540515899658203, -0.00031107664108276367, -0.00026810169219970703, -0.0002251267433166504, -0.00018215179443359375, -0.0001391768455505371, -9.620189666748047e-05, -5.322694778442383e-05, -1.0251998901367188e-05, 3.272294998168945e-05, 7.56978988647461e-05, 0.00011867284774780273, 0.00016164779663085938, 0.00020462274551391602, 0.00024759769439697266, 0.0002905726432800293, 0.00033354759216308594, 0.0003765225410461426, 0.0004194974899291992, 0.00046247243881225586, 0.0005054473876953125, 0.0005484223365783691, 0.0005913972854614258, 0.0006343722343444824, 0.0006773471832275391, 0.0007203221321105957, 0.0007632970809936523, 0.000806272029876709, 0.0008492469787597656, 0.0008922219276428223, 0.0009351968765258789, 0.0009781718254089355, 0.0010211467742919922, 0.0010641217231750488, 0.0011070966720581055, 0.0011500716209411621, 0.0011930465698242188]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 1005.0, 2.0, 1.0], "bins": [-0.001066856668330729, -0.001049501239322126, -0.0010321459267288446, -0.0010147904977202415, -0.0009974350687116385, -0.0009800797561183572, -0.0009627243271097541, -0.0009453689563088119, -0.0009280135855078697, -0.0009106582147069275, -0.0008933027856983244, -0.0008759474148973823, -0.0008585920440964401, -0.0008412366732954979, -0.0008238812442868948, -0.0008065258734859526, -0.0007891704444773495, -0.0007718150736764073, -0.0007544596446678042, -0.0007371042738668621, -0.0007197489030659199, -0.0007023934740573168, -0.0006850381032563746, -0.0006676827324554324, -0.0006503273034468293, -0.0006329719326458871, -0.000615616503637284, -0.0005982611328363419, -0.0005809057620353997, -0.0005635503912344575, -0.0005461949622258544, -0.0005288395914249122, -0.0005114842788316309, -0.0004941289080306888, -0.0004767735081259161, -0.0004594181082211435, -0.0004420627374202013, -0.00042470733751542866, -0.000407351937610656, -0.00038999656680971384, -0.00037264113780111074, -0.0003552857378963381, -0.0003379303670953959, -0.0003205749671906233, -0.0003032195963896811, -0.00028586419648490846, -0.0002685087965801358, -0.00025115342577919364, -0.000233798025874421, -0.0002164426405215636, -0.00019908725516870618, -0.00018173185526393354, -0.00016437646991107613, -0.00014702108455821872, -0.00012966568465344608, -0.00011231029930058867, -9.495491394773126e-05, -7.759952859487385e-05, -6.024413596605882e-05, -4.28887469752226e-05, -2.5533357984386384e-05, -8.177972631528974e-06, 9.177419997286052e-06, 2.6532812626101077e-05, 4.388819434097968e-05]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 4.0, 6.0, 2.0, 13.0, 10.0, 13.0, 21.0, 35.0, 27.0, 38.0, 60.0, 55.0, 44.0, 52.0, 69.0, 74.0, 61.0, 65.0, 69.0, 59.0, 31.0, 49.0, 43.0, 26.0, 27.0, 22.0, 8.0, 8.0, 11.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0563602447509766e-05, -1.9476749002933502e-05, -1.838989555835724e-05, -1.7303042113780975e-05, -1.6216188669204712e-05, -1.5129335224628448e-05, -1.4042481780052185e-05, -1.2955628335475922e-05, -1.1868774890899658e-05, -1.0781921446323395e-05, -9.695068001747131e-06, -8.608214557170868e-06, -7.5213611125946045e-06, -6.434507668018341e-06, -5.347654223442078e-06, -4.260800778865814e-06, -3.1739473342895508e-06, -2.0870938897132874e-06, -1.000240445137024e-06, 8.66129994392395e-08, 1.173466444015503e-06, 2.2603198885917664e-06, 3.3471733331680298e-06, 4.434026777744293e-06, 5.520880222320557e-06, 6.60773366689682e-06, 7.694587111473083e-06, 8.781440556049347e-06, 9.86829400062561e-06, 1.0955147445201874e-05, 1.2042000889778137e-05, 1.31288543343544e-05, 1.4215707778930664e-05, 1.5302561223506927e-05, 1.638941466808319e-05, 1.7476268112659454e-05, 1.8563121557235718e-05, 1.964997500181198e-05, 2.0736828446388245e-05, 2.1823681890964508e-05, 2.291053533554077e-05, 2.3997388780117035e-05, 2.50842422246933e-05, 2.6171095669269562e-05, 2.7257949113845825e-05, 2.834480255842209e-05, 2.9431656002998352e-05, 3.0518509447574615e-05, 3.160536289215088e-05, 3.269221633672714e-05, 3.3779069781303406e-05, 3.486592322587967e-05, 3.595277667045593e-05, 3.7039630115032196e-05, 3.812648355960846e-05, 3.921333700418472e-05, 4.0300190448760986e-05, 4.138704389333725e-05, 4.247389733791351e-05, 4.3560750782489777e-05, 4.464760422706604e-05, 4.5734457671642303e-05, 4.682131111621857e-05, 4.790816456079483e-05, 4.8995018005371094e-05]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 8.0, 13.0, 10.0, 13.0, 16.0, 15.0, 21.0, 34.0, 28.0, 27.0, 33.0, 38.0, 42.0, 47.0, 29.0, 43.0, 43.0, 44.0, 35.0, 29.0, 35.0, 38.0, 42.0, 31.0, 36.0, 22.0, 30.0, 25.0, 21.0, 20.0, 18.0, 23.0, 15.0, 15.0, 10.0, 5.0, 6.0, 8.0, 3.0, 7.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.673828125, -3.561614990234375, -3.44940185546875, -3.337188720703125, -3.2249755859375, -3.112762451171875, -3.00054931640625, -2.888336181640625, -2.776123046875, -2.663909912109375, -2.55169677734375, -2.439483642578125, -2.3272705078125, -2.215057373046875, -2.10284423828125, -1.990631103515625, -1.87841796875, -1.766204833984375, -1.65399169921875, -1.541778564453125, -1.4295654296875, -1.317352294921875, -1.20513916015625, -1.092926025390625, -0.980712890625, -0.868499755859375, -0.75628662109375, -0.644073486328125, -0.5318603515625, -0.419647216796875, -0.30743408203125, -0.195220947265625, -0.0830078125, 0.029205322265625, 0.14141845703125, 0.253631591796875, 0.3658447265625, 0.478057861328125, 0.59027099609375, 0.702484130859375, 0.814697265625, 0.926910400390625, 1.03912353515625, 1.151336669921875, 1.2635498046875, 1.375762939453125, 1.48797607421875, 1.600189208984375, 1.71240234375, 1.824615478515625, 1.93682861328125, 2.049041748046875, 2.1612548828125, 2.273468017578125, 2.38568115234375, 2.497894287109375, 2.610107421875, 2.722320556640625, 2.83453369140625, 2.946746826171875, 3.0589599609375, 3.171173095703125, 3.28338623046875, 3.395599365234375, 3.5078125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 3.0, 10.0, 11.0, 12.0, 14.0, 16.0, 29.0, 44.0, 60.0, 71.0, 143.0, 227.0, 404.0, 741.0, 1362.0, 2535.0, 5119.0, 10613.0, 22560.0, 49887.0, 144079.0, 565094.0, 149776.0, 50996.0, 23274.0, 10660.0, 5219.0, 2534.0, 1287.0, 714.0, 387.0, 221.0, 119.0, 100.0, 64.0, 44.0, 37.0, 23.0, 14.0, 13.0, 9.0, 6.0, 6.0, 5.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.71484375, -4.56982421875, -4.4248046875, -4.27978515625, -4.134765625, -3.98974609375, -3.8447265625, -3.69970703125, -3.5546875, -3.40966796875, -3.2646484375, -3.11962890625, -2.974609375, -2.82958984375, -2.6845703125, -2.53955078125, -2.39453125, -2.24951171875, -2.1044921875, -1.95947265625, -1.814453125, -1.66943359375, -1.5244140625, -1.37939453125, -1.234375, -1.08935546875, -0.9443359375, -0.79931640625, -0.654296875, -0.50927734375, -0.3642578125, -0.21923828125, -0.07421875, 0.07080078125, 0.2158203125, 0.36083984375, 0.505859375, 0.65087890625, 0.7958984375, 0.94091796875, 1.0859375, 1.23095703125, 1.3759765625, 1.52099609375, 1.666015625, 1.81103515625, 1.9560546875, 2.10107421875, 2.24609375, 2.39111328125, 2.5361328125, 2.68115234375, 2.826171875, 2.97119140625, 3.1162109375, 3.26123046875, 3.40625, 3.55126953125, 3.6962890625, 3.84130859375, 3.986328125, 4.13134765625, 4.2763671875, 4.42138671875, 4.56640625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 10.0, 4.0, 6.0, 5.0, 5.0, 10.0, 11.0, 8.0, 13.0, 16.0, 14.0, 17.0, 14.0, 18.0, 30.0, 38.0, 38.0, 37.0, 29.0, 40.0, 55.0, 81.0, 162.0, 1556.0, 246.0, 114.0, 64.0, 48.0, 26.0, 42.0, 37.0, 30.0, 18.0, 25.0, 28.0, 24.0, 24.0, 13.0, 19.0, 8.0, 6.0, 13.0, 7.0, 10.0, 10.0, 6.0, 2.0, 3.0, 5.0, 4.0, 3.0, 4.0, 5.0, 1.0], "bins": [-10.9453125, -10.62109375, -10.296875, -9.97265625, -9.6484375, -9.32421875, -9.0, -8.67578125, -8.3515625, -8.02734375, -7.703125, -7.37890625, -7.0546875, -6.73046875, -6.40625, -6.08203125, -5.7578125, -5.43359375, -5.109375, -4.78515625, -4.4609375, -4.13671875, -3.8125, -3.48828125, -3.1640625, -2.83984375, -2.515625, -2.19140625, -1.8671875, -1.54296875, -1.21875, -0.89453125, -0.5703125, -0.24609375, 0.078125, 0.40234375, 0.7265625, 1.05078125, 1.375, 1.69921875, 2.0234375, 2.34765625, 2.671875, 2.99609375, 3.3203125, 3.64453125, 3.96875, 4.29296875, 4.6171875, 4.94140625, 5.265625, 5.58984375, 5.9140625, 6.23828125, 6.5625, 6.88671875, 7.2109375, 7.53515625, 7.859375, 8.18359375, 8.5078125, 8.83203125, 9.15625, 9.48046875, 9.8046875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 8.0, 1.0, 1.0, 7.0, 4.0, 3.0, 10.0, 9.0, 8.0, 13.0, 7.0, 8.0, 15.0, 15.0, 25.0, 23.0, 25.0, 33.0, 37.0, 42.0, 77.0, 101.0, 146.0, 249.0, 484.0, 2333.0, 39758.0, 2960029.0, 136281.0, 4329.0, 721.0, 305.0, 157.0, 102.0, 79.0, 56.0, 37.0, 27.0, 22.0, 18.0, 14.0, 17.0, 14.0, 10.0, 13.0, 11.0, 4.0, 4.0, 6.0, 4.0, 10.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-22.671875, -21.931884765625, -21.19189453125, -20.451904296875, -19.7119140625, -18.971923828125, -18.23193359375, -17.491943359375, -16.751953125, -16.011962890625, -15.27197265625, -14.531982421875, -13.7919921875, -13.052001953125, -12.31201171875, -11.572021484375, -10.83203125, -10.092041015625, -9.35205078125, -8.612060546875, -7.8720703125, -7.132080078125, -6.39208984375, -5.652099609375, -4.912109375, -4.172119140625, -3.43212890625, -2.692138671875, -1.9521484375, -1.212158203125, -0.47216796875, 0.267822265625, 1.0078125, 1.747802734375, 2.48779296875, 3.227783203125, 3.9677734375, 4.707763671875, 5.44775390625, 6.187744140625, 6.927734375, 7.667724609375, 8.40771484375, 9.147705078125, 9.8876953125, 10.627685546875, 11.36767578125, 12.107666015625, 12.84765625, 13.587646484375, 14.32763671875, 15.067626953125, 15.8076171875, 16.547607421875, 17.28759765625, 18.027587890625, 18.767578125, 19.507568359375, 20.24755859375, 20.987548828125, 21.7275390625, 22.467529296875, 23.20751953125, 23.947509765625, 24.6875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 44.0, 177.0, 337.0, 294.0, 129.0, 25.0, 3.0], "bins": [-90.25357818603516, -88.74502563476562, -87.2364730834961, -85.72792053222656, -84.2193603515625, -82.71080780029297, -81.20225524902344, -79.6937026977539, -78.18515014648438, -76.67659759521484, -75.16804504394531, -73.65948486328125, -72.15093231201172, -70.64237976074219, -69.13382720947266, -67.62527465820312, -66.11671447753906, -64.60816192626953, -63.099605560302734, -61.5910530090332, -60.08250045776367, -58.573944091796875, -57.065391540527344, -55.55683898925781, -54.04828643798828, -52.53973388671875, -51.03117752075195, -49.52262496948242, -48.01407241821289, -46.505516052246094, -44.99696350097656, -43.48841094970703, -41.979854583740234, -40.4713020324707, -38.962745666503906, -37.454193115234375, -35.945640563964844, -34.43708801269531, -32.928531646728516, -31.419979095458984, -29.91142463684082, -28.402870178222656, -26.894317626953125, -25.38576316833496, -23.877208709716797, -22.368656158447266, -20.8601016998291, -19.351547241210938, -17.842994689941406, -16.334440231323242, -14.825887680053711, -13.317333221435547, -11.8087797164917, -10.300226211547852, -8.791671752929688, -7.28311824798584, -5.774564743041992, -4.2660112380981445, -2.7574572563171387, -1.2489032745361328, 0.25965023040771484, 1.7682037353515625, 3.2767581939697266, 4.785311698913574, 6.293865203857422]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 2.0, 4.0, 9.0, 16.0, 9.0, 14.0, 15.0, 37.0, 28.0, 26.0, 38.0, 40.0, 57.0, 59.0, 37.0, 52.0, 58.0, 44.0, 47.0, 54.0, 48.0, 33.0, 42.0, 33.0, 38.0, 22.0, 26.0, 23.0, 17.0, 22.0, 8.0, 5.0, 8.0, 12.0, 6.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.20233154296875, -38.94664764404297, -37.69096755981445, -36.43528366088867, -35.17959976196289, -33.92391586303711, -32.668235778808594, -31.412551879882812, -30.15686798095703, -28.901185989379883, -27.6455020904541, -26.389820098876953, -25.134136199951172, -23.878454208374023, -22.622772216796875, -21.367088317871094, -20.111406326293945, -18.855724334716797, -17.600040435791016, -16.344358444213867, -15.088674545288086, -13.832992553710938, -12.577309608459473, -11.321626663208008, -10.065943717956543, -8.810260772705078, -7.554577827453613, -6.298895359039307, -5.043212413787842, -3.787529468536377, -2.5318470001220703, -1.2761640548706055, -0.020481109619140625, 1.2352017164230347, 2.49088454246521, 3.7465672492980957, 5.0022501945495605, 6.257933139801025, 7.513615608215332, 8.769298553466797, 10.024981498718262, 11.280664443969727, 12.536347389221191, 13.792030334472656, 15.047712326049805, 16.303396224975586, 17.559078216552734, 18.814762115478516, 20.070444107055664, 21.326126098632812, 22.581809997558594, 23.837491989135742, 25.093175888061523, 26.348857879638672, 27.604541778564453, 28.8602237701416, 30.11590576171875, 31.3715877532959, 32.62726974487305, 33.88295364379883, 35.13863754272461, 36.39432144165039, 37.650001525878906, 38.90568542480469, 40.16136932373047]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 6.0, 10.0, 3.0, 8.0, 9.0, 17.0, 19.0, 23.0, 14.0, 23.0, 25.0, 23.0, 31.0, 39.0, 28.0, 32.0, 45.0, 43.0, 36.0, 38.0, 40.0, 28.0, 40.0, 36.0, 33.0, 25.0, 41.0, 31.0, 31.0, 32.0, 30.0, 23.0, 17.0, 15.0, 17.0, 19.0, 14.0, 7.0, 10.0, 5.0, 3.0, 8.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.78125, -3.66827392578125, -3.5552978515625, -3.44232177734375, -3.329345703125, -3.21636962890625, -3.1033935546875, -2.99041748046875, -2.87744140625, -2.76446533203125, -2.6514892578125, -2.53851318359375, -2.425537109375, -2.31256103515625, -2.1995849609375, -2.08660888671875, -1.9736328125, -1.86065673828125, -1.7476806640625, -1.63470458984375, -1.521728515625, -1.40875244140625, -1.2957763671875, -1.18280029296875, -1.06982421875, -0.95684814453125, -0.8438720703125, -0.73089599609375, -0.617919921875, -0.50494384765625, -0.3919677734375, -0.27899169921875, -0.166015625, -0.05303955078125, 0.0599365234375, 0.17291259765625, 0.285888671875, 0.39886474609375, 0.5118408203125, 0.62481689453125, 0.73779296875, 0.85076904296875, 0.9637451171875, 1.07672119140625, 1.189697265625, 1.30267333984375, 1.4156494140625, 1.52862548828125, 1.6416015625, 1.75457763671875, 1.8675537109375, 1.98052978515625, 2.093505859375, 2.20648193359375, 2.3194580078125, 2.43243408203125, 2.54541015625, 2.65838623046875, 2.7713623046875, 2.88433837890625, 2.997314453125, 3.11029052734375, 3.2232666015625, 3.33624267578125, 3.44921875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 9.0, 8.0, 17.0, 20.0, 27.0, 51.0, 69.0, 102.0, 170.0, 251.0, 430.0, 816.0, 1479.0, 2738.0, 5435.0, 11564.0, 25990.0, 65627.0, 189198.0, 583880.0, 1374810.0, 1218239.0, 463955.0, 152426.0, 54339.0, 22442.0, 10026.0, 4698.0, 2427.0, 1243.0, 735.0, 413.0, 239.0, 136.0, 95.0, 47.0, 46.0, 33.0, 18.0, 13.0, 8.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.859375, -4.711669921875, -4.56396484375, -4.416259765625, -4.2685546875, -4.120849609375, -3.97314453125, -3.825439453125, -3.677734375, -3.530029296875, -3.38232421875, -3.234619140625, -3.0869140625, -2.939208984375, -2.79150390625, -2.643798828125, -2.49609375, -2.348388671875, -2.20068359375, -2.052978515625, -1.9052734375, -1.757568359375, -1.60986328125, -1.462158203125, -1.314453125, -1.166748046875, -1.01904296875, -0.871337890625, -0.7236328125, -0.575927734375, -0.42822265625, -0.280517578125, -0.1328125, 0.014892578125, 0.16259765625, 0.310302734375, 0.4580078125, 0.605712890625, 0.75341796875, 0.901123046875, 1.048828125, 1.196533203125, 1.34423828125, 1.491943359375, 1.6396484375, 1.787353515625, 1.93505859375, 2.082763671875, 2.23046875, 2.378173828125, 2.52587890625, 2.673583984375, 2.8212890625, 2.968994140625, 3.11669921875, 3.264404296875, 3.412109375, 3.559814453125, 3.70751953125, 3.855224609375, 4.0029296875, 4.150634765625, 4.29833984375, 4.446044921875, 4.59375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 6.0, 12.0, 6.0, 7.0, 8.0, 17.0, 18.0, 29.0, 21.0, 39.0, 48.0, 72.0, 92.0, 119.0, 144.0, 208.0, 232.0, 334.0, 402.0, 439.0, 398.0, 303.0, 260.0, 194.0, 150.0, 134.0, 77.0, 80.0, 65.0, 43.0, 29.0, 22.0, 23.0, 16.0, 10.0, 5.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0, -5.79693603515625, -5.5938720703125, -5.39080810546875, -5.187744140625, -4.98468017578125, -4.7816162109375, -4.57855224609375, -4.37548828125, -4.17242431640625, -3.9693603515625, -3.76629638671875, -3.563232421875, -3.36016845703125, -3.1571044921875, -2.95404052734375, -2.7509765625, -2.54791259765625, -2.3448486328125, -2.14178466796875, -1.938720703125, -1.73565673828125, -1.5325927734375, -1.32952880859375, -1.12646484375, -0.92340087890625, -0.7203369140625, -0.51727294921875, -0.314208984375, -0.11114501953125, 0.0919189453125, 0.29498291015625, 0.498046875, 0.70111083984375, 0.9041748046875, 1.10723876953125, 1.310302734375, 1.51336669921875, 1.7164306640625, 1.91949462890625, 2.12255859375, 2.32562255859375, 2.5286865234375, 2.73175048828125, 2.934814453125, 3.13787841796875, 3.3409423828125, 3.54400634765625, 3.7470703125, 3.95013427734375, 4.1531982421875, 4.35626220703125, 4.559326171875, 4.76239013671875, 4.9654541015625, 5.16851806640625, 5.37158203125, 5.57464599609375, 5.7777099609375, 5.98077392578125, 6.183837890625, 6.38690185546875, 6.5899658203125, 6.79302978515625, 6.99609375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 8.0, 7.0, 13.0, 19.0, 19.0, 23.0, 39.0, 65.0, 74.0, 80.0, 141.0, 174.0, 273.0, 480.0, 1209.0, 11343.0, 403197.0, 3629613.0, 139750.0, 5587.0, 881.0, 429.0, 252.0, 169.0, 112.0, 82.0, 60.0, 43.0, 30.0, 29.0, 24.0, 14.0, 9.0, 9.0, 5.0, 4.0, 10.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.640625, -26.859130859375, -26.07763671875, -25.296142578125, -24.5146484375, -23.733154296875, -22.95166015625, -22.170166015625, -21.388671875, -20.607177734375, -19.82568359375, -19.044189453125, -18.2626953125, -17.481201171875, -16.69970703125, -15.918212890625, -15.13671875, -14.355224609375, -13.57373046875, -12.792236328125, -12.0107421875, -11.229248046875, -10.44775390625, -9.666259765625, -8.884765625, -8.103271484375, -7.32177734375, -6.540283203125, -5.7587890625, -4.977294921875, -4.19580078125, -3.414306640625, -2.6328125, -1.851318359375, -1.06982421875, -0.288330078125, 0.4931640625, 1.274658203125, 2.05615234375, 2.837646484375, 3.619140625, 4.400634765625, 5.18212890625, 5.963623046875, 6.7451171875, 7.526611328125, 8.30810546875, 9.089599609375, 9.87109375, 10.652587890625, 11.43408203125, 12.215576171875, 12.9970703125, 13.778564453125, 14.56005859375, 15.341552734375, 16.123046875, 16.904541015625, 17.68603515625, 18.467529296875, 19.2490234375, 20.030517578125, 20.81201171875, 21.593505859375, 22.375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 24.0, 136.0, 391.0, 330.0, 114.0, 20.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.8264923095703, -175.53370666503906, -171.24093627929688, -166.94815063476562, -162.65536499023438, -158.3625946044922, -154.06980895996094, -149.77703857421875, -145.4842529296875, -141.19146728515625, -136.89869689941406, -132.6059112548828, -128.31314086914062, -124.02035522460938, -119.72756958007812, -115.4347915649414, -111.14201354980469, -106.84923553466797, -102.55645751953125, -98.263671875, -93.97089385986328, -89.67811584472656, -85.38533020019531, -81.0925521850586, -76.79977416992188, -72.50699615478516, -68.21421813964844, -63.92143249511719, -59.62865447998047, -55.33587646484375, -51.043094635009766, -46.75031280517578, -42.457550048828125, -38.164772033691406, -33.87199020385742, -29.57921028137207, -25.28643035888672, -20.993650436401367, -16.700870513916016, -12.408090591430664, -8.115310668945312, -3.822530746459961, 0.4702491760253906, 4.763029098510742, 9.055809020996094, 13.348588943481445, 17.641368865966797, 21.93414878845215, 26.2269287109375, 30.51970863342285, 34.8124885559082, 39.10527038574219, 43.398048400878906, 47.690826416015625, 51.98360824584961, 56.276390075683594, 60.56916809082031, 64.86194610595703, 69.15472412109375, 73.447509765625, 77.74028778076172, 82.03306579589844, 86.32585144042969, 90.6186294555664, 94.91140747070312]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 9.0, 6.0, 11.0, 10.0, 12.0, 22.0, 19.0, 31.0, 22.0, 29.0, 27.0, 20.0, 28.0, 39.0, 34.0, 42.0, 34.0, 59.0, 31.0, 46.0, 49.0, 49.0, 41.0, 37.0, 20.0, 29.0, 21.0, 20.0, 30.0, 23.0, 26.0, 22.0, 16.0, 9.0, 10.0, 6.0, 9.0, 13.0, 5.0, 5.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 2.0, 3.0], "bins": [-24.526206970214844, -23.780555725097656, -23.03490447998047, -22.28925323486328, -21.543601989746094, -20.797950744628906, -20.05229949951172, -19.30664825439453, -18.560997009277344, -17.815345764160156, -17.06969451904297, -16.32404327392578, -15.578392028808594, -14.832740783691406, -14.087088584899902, -13.341437339782715, -12.595785140991211, -11.850133895874023, -11.104482650756836, -10.358831405639648, -9.613180160522461, -8.867528915405273, -8.12187671661377, -7.376225471496582, -6.6305742263793945, -5.884922981262207, -5.1392717361450195, -4.393620014190674, -3.6479687690734863, -2.902317523956299, -2.156665802001953, -1.4110145568847656, -0.6653633117675781, 0.08028805255889893, 0.825939416885376, 1.5715909004211426, 2.31724214553833, 3.0628933906555176, 3.8085451126098633, 4.554196357727051, 5.299847602844238, 6.045498847961426, 6.791150093078613, 7.536801815032959, 8.282453536987305, 9.028104782104492, 9.77375602722168, 10.519407272338867, 11.265058517456055, 12.010709762573242, 12.75636100769043, 13.502012252807617, 14.247663497924805, 14.993314743041992, 15.738966941833496, 16.484619140625, 17.230270385742188, 17.975921630859375, 18.721572875976562, 19.46722412109375, 20.212875366210938, 20.958526611328125, 21.704177856445312, 22.4498291015625, 23.195480346679688]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 3.0, 6.0, 8.0, 4.0, 8.0, 5.0, 14.0, 14.0, 12.0, 19.0, 17.0, 18.0, 29.0, 23.0, 35.0, 29.0, 37.0, 30.0, 40.0, 36.0, 41.0, 44.0, 40.0, 41.0, 44.0, 35.0, 39.0, 41.0, 37.0, 34.0, 32.0, 24.0, 25.0, 29.0, 19.0, 14.0, 14.0, 15.0, 9.0, 7.0, 8.0, 7.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0], "bins": [-4.0703125, -3.955535888671875, -3.84075927734375, -3.725982666015625, -3.6112060546875, -3.496429443359375, -3.38165283203125, -3.266876220703125, -3.152099609375, -3.037322998046875, -2.92254638671875, -2.807769775390625, -2.6929931640625, -2.578216552734375, -2.46343994140625, -2.348663330078125, -2.23388671875, -2.119110107421875, -2.00433349609375, -1.889556884765625, -1.7747802734375, -1.660003662109375, -1.54522705078125, -1.430450439453125, -1.315673828125, -1.200897216796875, -1.08612060546875, -0.971343994140625, -0.8565673828125, -0.741790771484375, -0.62701416015625, -0.512237548828125, -0.3974609375, -0.282684326171875, -0.16790771484375, -0.053131103515625, 0.0616455078125, 0.176422119140625, 0.29119873046875, 0.405975341796875, 0.520751953125, 0.635528564453125, 0.75030517578125, 0.865081787109375, 0.9798583984375, 1.094635009765625, 1.20941162109375, 1.324188232421875, 1.43896484375, 1.553741455078125, 1.66851806640625, 1.783294677734375, 1.8980712890625, 2.012847900390625, 2.12762451171875, 2.242401123046875, 2.357177734375, 2.471954345703125, 2.58673095703125, 2.701507568359375, 2.8162841796875, 2.931060791015625, 3.04583740234375, 3.160614013671875, 3.275390625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 8.0, 6.0, 7.0, 23.0, 30.0, 46.0, 63.0, 116.0, 176.0, 270.0, 489.0, 708.0, 1169.0, 1886.0, 3170.0, 5230.0, 8645.0, 14714.0, 26069.0, 48908.0, 101984.0, 261694.0, 324668.0, 120890.0, 57017.0, 29669.0, 16425.0, 9807.0, 5671.0, 3457.0, 2106.0, 1279.0, 774.0, 488.0, 329.0, 187.0, 140.0, 85.0, 58.0, 38.0, 13.0, 22.0, 10.0, 9.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2095947265625, -0.20344924926757812, -0.19730377197265625, -0.19115829467773438, -0.1850128173828125, -0.17886734008789062, -0.17272186279296875, -0.16657638549804688, -0.160430908203125, -0.15428543090820312, -0.14813995361328125, -0.14199447631835938, -0.1358489990234375, -0.12970352172851562, -0.12355804443359375, -0.11741256713867188, -0.11126708984375, -0.10512161254882812, -0.09897613525390625, -0.09283065795898438, -0.0866851806640625, -0.08053970336914062, -0.07439422607421875, -0.06824874877929688, -0.062103271484375, -0.055957794189453125, -0.04981231689453125, -0.043666839599609375, -0.0375213623046875, -0.031375885009765625, -0.02523040771484375, -0.019084930419921875, -0.012939453125, -0.006793975830078125, -0.00064849853515625, 0.005496978759765625, 0.0116424560546875, 0.017787933349609375, 0.02393341064453125, 0.030078887939453125, 0.036224365234375, 0.042369842529296875, 0.04851531982421875, 0.054660797119140625, 0.0608062744140625, 0.06695175170898438, 0.07309722900390625, 0.07924270629882812, 0.08538818359375, 0.09153366088867188, 0.09767913818359375, 0.10382461547851562, 0.1099700927734375, 0.11611557006835938, 0.12226104736328125, 0.12840652465820312, 0.134552001953125, 0.14069747924804688, 0.14684295654296875, 0.15298843383789062, 0.1591339111328125, 0.16527938842773438, 0.17142486572265625, 0.17757034301757812, 0.1837158203125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 11.0, 4.0, 3.0, 7.0, 12.0, 16.0, 20.0, 21.0, 14.0, 21.0, 28.0, 31.0, 21.0, 29.0, 37.0, 33.0, 37.0, 39.0, 39.0, 1062.0, 47.0, 46.0, 35.0, 47.0, 46.0, 32.0, 37.0, 32.0, 30.0, 31.0, 30.0, 22.0, 19.0, 20.0, 11.0, 12.0, 10.0, 5.0, 11.0, 3.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.9453125, -2.8631591796875, -2.781005859375, -2.6988525390625, -2.61669921875, -2.5345458984375, -2.452392578125, -2.3702392578125, -2.2880859375, -2.2059326171875, -2.123779296875, -2.0416259765625, -1.95947265625, -1.8773193359375, -1.795166015625, -1.7130126953125, -1.630859375, -1.5487060546875, -1.466552734375, -1.3843994140625, -1.30224609375, -1.2200927734375, -1.137939453125, -1.0557861328125, -0.9736328125, -0.8914794921875, -0.809326171875, -0.7271728515625, -0.64501953125, -0.5628662109375, -0.480712890625, -0.3985595703125, -0.31640625, -0.2342529296875, -0.152099609375, -0.0699462890625, 0.01220703125, 0.0943603515625, 0.176513671875, 0.2586669921875, 0.3408203125, 0.4229736328125, 0.505126953125, 0.5872802734375, 0.66943359375, 0.7515869140625, 0.833740234375, 0.9158935546875, 0.998046875, 1.0802001953125, 1.162353515625, 1.2445068359375, 1.32666015625, 1.4088134765625, 1.490966796875, 1.5731201171875, 1.6552734375, 1.7374267578125, 1.819580078125, 1.9017333984375, 1.98388671875, 2.0660400390625, 2.148193359375, 2.2303466796875, 2.3125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 8.0, 26.0, 27.0, 29.0, 53.0, 67.0, 94.0, 167.0, 194.0, 345.0, 499.0, 813.0, 1252.0, 2001.0, 3050.0, 4961.0, 7872.0, 13284.0, 22506.0, 39579.0, 72809.0, 146023.0, 1344528.0, 211082.0, 100063.0, 52453.0, 29358.0, 16911.0, 10155.0, 6144.0, 3837.0, 2457.0, 1550.0, 1008.0, 684.0, 424.0, 264.0, 183.0, 113.0, 100.0, 45.0, 29.0, 23.0, 17.0, 17.0, 10.0, 4.0, 4.0, 3.0, 2.0, 2.0], "bins": [-0.083740234375, -0.08139705657958984, -0.07905387878417969, -0.07671070098876953, -0.07436752319335938, -0.07202434539794922, -0.06968116760253906, -0.0673379898071289, -0.06499481201171875, -0.0626516342163086, -0.06030845642089844, -0.05796527862548828, -0.055622100830078125, -0.05327892303466797, -0.05093574523925781, -0.048592567443847656, -0.0462493896484375, -0.043906211853027344, -0.04156303405761719, -0.03921985626220703, -0.036876678466796875, -0.03453350067138672, -0.03219032287597656, -0.029847145080566406, -0.02750396728515625, -0.025160789489746094, -0.022817611694335938, -0.02047443389892578, -0.018131256103515625, -0.01578807830810547, -0.013444900512695312, -0.011101722717285156, -0.008758544921875, -0.006415367126464844, -0.0040721893310546875, -0.0017290115356445312, 0.000614166259765625, 0.0029573440551757812, 0.0053005218505859375, 0.007643699645996094, 0.00998687744140625, 0.012330055236816406, 0.014673233032226562, 0.01701641082763672, 0.019359588623046875, 0.02170276641845703, 0.024045944213867188, 0.026389122009277344, 0.0287322998046875, 0.031075477600097656, 0.03341865539550781, 0.03576183319091797, 0.038105010986328125, 0.04044818878173828, 0.04279136657714844, 0.045134544372558594, 0.04747772216796875, 0.049820899963378906, 0.05216407775878906, 0.05450725555419922, 0.056850433349609375, 0.05919361114501953, 0.06153678894042969, 0.06387996673583984, 0.06622314453125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 6.0, 7.0, 19.0, 17.0, 17.0, 16.0, 22.0, 43.0, 28.0, 32.0, 59.0, 62.0, 81.0, 82.0, 86.0, 72.0, 59.0, 42.0, 52.0, 31.0, 29.0, 25.0, 17.0, 18.0, 19.0, 9.0, 9.0, 4.0, 4.0, 9.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.719329833984375e-05, -3.590434789657593e-05, -3.4615397453308105e-05, -3.332644701004028e-05, -3.203749656677246e-05, -3.074854612350464e-05, -2.9459595680236816e-05, -2.8170645236968994e-05, -2.6881694793701172e-05, -2.559274435043335e-05, -2.4303793907165527e-05, -2.3014843463897705e-05, -2.1725893020629883e-05, -2.043694257736206e-05, -1.9147992134094238e-05, -1.7859041690826416e-05, -1.6570091247558594e-05, -1.528114080429077e-05, -1.399219036102295e-05, -1.2703239917755127e-05, -1.1414289474487305e-05, -1.0125339031219482e-05, -8.83638858795166e-06, -7.547438144683838e-06, -6.258487701416016e-06, -4.969537258148193e-06, -3.680586814880371e-06, -2.391636371612549e-06, -1.1026859283447266e-06, 1.862645149230957e-07, 1.475214958190918e-06, 2.7641654014587402e-06, 4.0531158447265625e-06, 5.342066287994385e-06, 6.631016731262207e-06, 7.91996717453003e-06, 9.208917617797852e-06, 1.0497868061065674e-05, 1.1786818504333496e-05, 1.3075768947601318e-05, 1.436471939086914e-05, 1.5653669834136963e-05, 1.6942620277404785e-05, 1.8231570720672607e-05, 1.952052116394043e-05, 2.0809471607208252e-05, 2.2098422050476074e-05, 2.3387372493743896e-05, 2.467632293701172e-05, 2.596527338027954e-05, 2.7254223823547363e-05, 2.8543174266815186e-05, 2.9832124710083008e-05, 3.112107515335083e-05, 3.241002559661865e-05, 3.3698976039886475e-05, 3.49879264831543e-05, 3.627687692642212e-05, 3.756582736968994e-05, 3.8854777812957764e-05, 4.0143728256225586e-05, 4.143267869949341e-05, 4.272162914276123e-05, 4.401057958602905e-05, 4.5299530029296875e-05]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 6.0, 6.0, 6.0, 4.0, 8.0, 18.0, 15.0, 21.0, 25.0, 29.0, 47.0, 68.0, 116.0, 221.0, 560.0, 6778.0, 1036749.0, 2868.0, 488.0, 180.0, 97.0, 54.0, 51.0, 28.0, 18.0, 19.0, 23.0, 15.0, 5.0, 6.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00104522705078125, -0.0010157153010368347, -0.0009862035512924194, -0.0009566918015480042, -0.0009271800518035889, -0.0008976683020591736, -0.0008681565523147583, -0.000838644802570343, -0.0008091330528259277, -0.0007796213030815125, -0.0007501095533370972, -0.0007205978035926819, -0.0006910860538482666, -0.0006615743041038513, -0.000632062554359436, -0.0006025508046150208, -0.0005730390548706055, -0.0005435273051261902, -0.0005140155553817749, -0.0004845038056373596, -0.00045499205589294434, -0.00042548030614852905, -0.00039596855640411377, -0.0003664568066596985, -0.0003369450569152832, -0.0003074333071708679, -0.00027792155742645264, -0.00024840980768203735, -0.00021889805793762207, -0.0001893863081932068, -0.0001598745584487915, -0.00013036280870437622, -0.00010085105895996094, -7.133930921554565e-05, -4.182755947113037e-05, -1.2315809726715088e-05, 1.7195940017700195e-05, 4.670768976211548e-05, 7.621943950653076e-05, 0.00010573118925094604, 0.00013524293899536133, 0.0001647546887397766, 0.0001942664384841919, 0.00022377818822860718, 0.00025328993797302246, 0.00028280168771743774, 0.00031231343746185303, 0.0003418251872062683, 0.0003713369369506836, 0.0004008486866950989, 0.00043036043643951416, 0.00045987218618392944, 0.0004893839359283447, 0.00051889568567276, 0.0005484074354171753, 0.0005779191851615906, 0.0006074309349060059, 0.0006369426846504211, 0.0006664544343948364, 0.0006959661841392517, 0.000725477933883667, 0.0007549896836280823, 0.0007845014333724976, 0.0008140131831169128, 0.0008435249328613281]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 506.0, 507.0], "bins": [-0.0010290639474987984, -0.0010127297136932611, -0.000996395363472402, -0.0009800611296668649, -0.0009637268958613276, -0.0009473926038481295, -0.0009310583700425923, -0.0009147240780293941, -0.0008983898442238569, -0.0008820555522106588, -0.0008657213184051216, -0.0008493870263919234, -0.0008330527925863862, -0.0008167185005731881, -0.0008003842667676508, -0.0007840499747544527, -0.0007677157409489155, -0.0007513814489357173, -0.0007350472151301801, -0.000718712923116982, -0.0007023786893114448, -0.0006860443972982466, -0.0006697101634927094, -0.0006533758714795113, -0.0006370415794663131, -0.000620707287453115, -0.0006043730536475778, -0.0005880387616343796, -0.0005717045278288424, -0.0005553702358156443, -0.000539036002010107, -0.0005227017099969089, -0.0005063674761913717, -0.0004900331841781735, -0.0004736989503726363, -0.00045736468746326864, -0.00044103042455390096, -0.0004246961616445333, -0.0004083618987351656, -0.00039202760672196746, -0.00037569337291643023, -0.00035935911000706255, -0.0003430248470976949, -0.0003266905841883272, -0.0003103563212789595, -0.00029402205836959183, -0.00027768779546022415, -0.000261353503447026, -0.0002450192696414888, -0.0002286850067321211, -0.00021235074382275343, -0.00019601648091338575, -0.00017968221800401807, -0.0001633479550946504, -0.00014701367763336748, -0.0001306794147239998, -0.0001143451445386745, -9.801088162930682e-05, -8.167661144398153e-05, -6.534234853461385e-05, -4.900808562524617e-05, -3.267382271587849e-05, -1.6339552530553192e-05, -5.289621185511351e-09, 1.6328971469192766e-05]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 8.0, 13.0, 13.0, 21.0, 16.0, 22.0, 34.0, 30.0, 34.0, 50.0, 54.0, 50.0, 63.0, 70.0, 54.0, 73.0, 60.0, 63.0, 55.0, 39.0, 48.0, 32.0, 28.0, 24.0, 12.0, 3.0, 14.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.187490463256836e-05, -2.0818784832954407e-05, -1.9762665033340454e-05, -1.87065452337265e-05, -1.765042543411255e-05, -1.6594305634498596e-05, -1.5538185834884644e-05, -1.4482066035270691e-05, -1.3425946235656738e-05, -1.2369826436042786e-05, -1.1313706636428833e-05, -1.025758683681488e-05, -9.201467037200928e-06, -8.145347237586975e-06, -7.0892274379730225e-06, -6.03310763835907e-06, -4.976987838745117e-06, -3.9208680391311646e-06, -2.864748239517212e-06, -1.8086284399032593e-06, -7.525086402893066e-07, 3.03611159324646e-07, 1.3597309589385986e-06, 2.4158507585525513e-06, 3.471970558166504e-06, 4.5280903577804565e-06, 5.584210157394409e-06, 6.640329957008362e-06, 7.696449756622314e-06, 8.752569556236267e-06, 9.80868935585022e-06, 1.0864809155464172e-05, 1.1920928955078125e-05, 1.2977048754692078e-05, 1.403316855430603e-05, 1.5089288353919983e-05, 1.6145408153533936e-05, 1.7201527953147888e-05, 1.825764775276184e-05, 1.9313767552375793e-05, 2.0369887351989746e-05, 2.14260071516037e-05, 2.248212695121765e-05, 2.3538246750831604e-05, 2.4594366550445557e-05, 2.565048635005951e-05, 2.6706606149673462e-05, 2.7762725949287415e-05, 2.8818845748901367e-05, 2.987496554851532e-05, 3.093108534812927e-05, 3.1987205147743225e-05, 3.304332494735718e-05, 3.409944474697113e-05, 3.515556454658508e-05, 3.6211684346199036e-05, 3.726780414581299e-05, 3.832392394542694e-05, 3.9380043745040894e-05, 4.0436163544654846e-05, 4.14922833442688e-05, 4.254840314388275e-05, 4.3604522943496704e-05, 4.466064274311066e-05, 4.571676254272461e-05]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 3.0, 6.0, 8.0, 4.0, 8.0, 5.0, 14.0, 14.0, 12.0, 19.0, 17.0, 18.0, 29.0, 23.0, 35.0, 29.0, 37.0, 30.0, 40.0, 36.0, 41.0, 44.0, 40.0, 41.0, 44.0, 35.0, 39.0, 41.0, 37.0, 34.0, 32.0, 24.0, 25.0, 29.0, 19.0, 14.0, 14.0, 15.0, 9.0, 7.0, 8.0, 7.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0], "bins": [-4.0703125, -3.955535888671875, -3.84075927734375, -3.725982666015625, -3.6112060546875, -3.496429443359375, -3.38165283203125, -3.266876220703125, -3.152099609375, -3.037322998046875, -2.92254638671875, -2.807769775390625, -2.6929931640625, -2.578216552734375, -2.46343994140625, -2.348663330078125, -2.23388671875, -2.119110107421875, -2.00433349609375, -1.889556884765625, -1.7747802734375, -1.660003662109375, -1.54522705078125, -1.430450439453125, -1.315673828125, -1.200897216796875, -1.08612060546875, -0.971343994140625, -0.8565673828125, -0.741790771484375, -0.62701416015625, -0.512237548828125, -0.3974609375, -0.282684326171875, -0.16790771484375, -0.053131103515625, 0.0616455078125, 0.176422119140625, 0.29119873046875, 0.405975341796875, 0.520751953125, 0.635528564453125, 0.75030517578125, 0.865081787109375, 0.9798583984375, 1.094635009765625, 1.20941162109375, 1.324188232421875, 1.43896484375, 1.553741455078125, 1.66851806640625, 1.783294677734375, 1.8980712890625, 2.012847900390625, 2.12762451171875, 2.242401123046875, 2.357177734375, 2.471954345703125, 2.58673095703125, 2.701507568359375, 2.8162841796875, 2.931060791015625, 3.04583740234375, 3.160614013671875, 3.275390625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 12.0, 18.0, 29.0, 56.0, 70.0, 114.0, 148.0, 245.0, 332.0, 569.0, 821.0, 1301.0, 1793.0, 2967.0, 4382.0, 6718.0, 10216.0, 16099.0, 26445.0, 44631.0, 84865.0, 168617.0, 268930.0, 186723.0, 95148.0, 49535.0, 28439.0, 17451.0, 10946.0, 7185.0, 4643.0, 3129.0, 2037.0, 1313.0, 918.0, 587.0, 397.0, 251.0, 162.0, 90.0, 66.0, 54.0, 25.0, 19.0, 21.0, 11.0, 9.0, 2.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.8671875, -2.776397705078125, -2.68560791015625, -2.594818115234375, -2.5040283203125, -2.413238525390625, -2.32244873046875, -2.231658935546875, -2.140869140625, -2.050079345703125, -1.95928955078125, -1.868499755859375, -1.7777099609375, -1.686920166015625, -1.59613037109375, -1.505340576171875, -1.41455078125, -1.323760986328125, -1.23297119140625, -1.142181396484375, -1.0513916015625, -0.960601806640625, -0.86981201171875, -0.779022216796875, -0.688232421875, -0.597442626953125, -0.50665283203125, -0.415863037109375, -0.3250732421875, -0.234283447265625, -0.14349365234375, -0.052703857421875, 0.0380859375, 0.128875732421875, 0.21966552734375, 0.310455322265625, 0.4012451171875, 0.492034912109375, 0.58282470703125, 0.673614501953125, 0.764404296875, 0.855194091796875, 0.94598388671875, 1.036773681640625, 1.1275634765625, 1.218353271484375, 1.30914306640625, 1.399932861328125, 1.49072265625, 1.581512451171875, 1.67230224609375, 1.763092041015625, 1.8538818359375, 1.944671630859375, 2.03546142578125, 2.126251220703125, 2.217041015625, 2.307830810546875, 2.39862060546875, 2.489410400390625, 2.5802001953125, 2.670989990234375, 2.76177978515625, 2.852569580078125, 2.943359375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 7.0, 9.0, 5.0, 13.0, 8.0, 8.0, 9.0, 12.0, 17.0, 17.0, 23.0, 18.0, 12.0, 25.0, 31.0, 22.0, 32.0, 37.0, 36.0, 43.0, 57.0, 90.0, 191.0, 1405.0, 330.0, 133.0, 75.0, 46.0, 28.0, 30.0, 22.0, 44.0, 16.0, 17.0, 19.0, 18.0, 22.0, 18.0, 21.0, 14.0, 13.0, 14.0, 8.0, 5.0, 3.0, 7.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-9.5625, -9.2418212890625, -8.921142578125, -8.6004638671875, -8.27978515625, -7.9591064453125, -7.638427734375, -7.3177490234375, -6.9970703125, -6.6763916015625, -6.355712890625, -6.0350341796875, -5.71435546875, -5.3936767578125, -5.072998046875, -4.7523193359375, -4.431640625, -4.1109619140625, -3.790283203125, -3.4696044921875, -3.14892578125, -2.8282470703125, -2.507568359375, -2.1868896484375, -1.8662109375, -1.5455322265625, -1.224853515625, -0.9041748046875, -0.58349609375, -0.2628173828125, 0.057861328125, 0.3785400390625, 0.69921875, 1.0198974609375, 1.340576171875, 1.6612548828125, 1.98193359375, 2.3026123046875, 2.623291015625, 2.9439697265625, 3.2646484375, 3.5853271484375, 3.906005859375, 4.2266845703125, 4.54736328125, 4.8680419921875, 5.188720703125, 5.5093994140625, 5.830078125, 6.1507568359375, 6.471435546875, 6.7921142578125, 7.11279296875, 7.4334716796875, 7.754150390625, 8.0748291015625, 8.3955078125, 8.7161865234375, 9.036865234375, 9.3575439453125, 9.67822265625, 9.9989013671875, 10.319580078125, 10.6402587890625, 10.9609375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 1.0, 6.0, 10.0, 8.0, 10.0, 19.0, 19.0, 30.0, 25.0, 39.0, 33.0, 48.0, 59.0, 80.0, 97.0, 135.0, 209.0, 314.0, 765.0, 3281.0, 23270.0, 312664.0, 2661184.0, 126515.0, 13077.0, 2102.0, 609.0, 267.0, 170.0, 131.0, 95.0, 81.0, 66.0, 54.0, 40.0, 29.0, 29.0, 28.0, 13.0, 21.0, 6.0, 8.0, 9.0, 11.0, 8.0, 7.0, 3.0, 8.0, 5.0, 2.0, 0.0, 3.0], "bins": [-14.5546875, -14.131103515625, -13.70751953125, -13.283935546875, -12.8603515625, -12.436767578125, -12.01318359375, -11.589599609375, -11.166015625, -10.742431640625, -10.31884765625, -9.895263671875, -9.4716796875, -9.048095703125, -8.62451171875, -8.200927734375, -7.77734375, -7.353759765625, -6.93017578125, -6.506591796875, -6.0830078125, -5.659423828125, -5.23583984375, -4.812255859375, -4.388671875, -3.965087890625, -3.54150390625, -3.117919921875, -2.6943359375, -2.270751953125, -1.84716796875, -1.423583984375, -1.0, -0.576416015625, -0.15283203125, 0.270751953125, 0.6943359375, 1.117919921875, 1.54150390625, 1.965087890625, 2.388671875, 2.812255859375, 3.23583984375, 3.659423828125, 4.0830078125, 4.506591796875, 4.93017578125, 5.353759765625, 5.77734375, 6.200927734375, 6.62451171875, 7.048095703125, 7.4716796875, 7.895263671875, 8.31884765625, 8.742431640625, 9.166015625, 9.589599609375, 10.01318359375, 10.436767578125, 10.8603515625, 11.283935546875, 11.70751953125, 12.131103515625, 12.5546875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 354.0, 637.0, 26.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.737876892089844, -28.1551513671875, -23.572425842285156, -18.98969841003418, -14.406972885131836, -9.824247360229492, -5.241519927978516, -0.6587944030761719, 3.923931121826172, 8.506656646728516, 13.089383125305176, 17.672109603881836, 22.25483512878418, 26.837560653686523, 31.4202880859375, 36.003013610839844, 40.58573913574219, 45.16846466064453, 49.751190185546875, 54.33391571044922, 58.91664123535156, 63.499366760253906, 68.08209228515625, 72.66482543945312, 77.24754333496094, 81.83026885986328, 86.41299438476562, 90.99571990966797, 95.57844543457031, 100.16117095947266, 104.743896484375, 109.32662963867188, 113.90934753417969, 118.49207305908203, 123.07479858398438, 127.65752410888672, 132.24024963378906, 136.82298278808594, 141.40570068359375, 145.98843383789062, 150.57115173339844, 155.1538848876953, 159.73660278320312, 164.3193359375, 168.9020538330078, 173.4847869873047, 178.0675048828125, 182.65023803710938, 187.23297119140625, 191.81570434570312, 196.39842224121094, 200.9811553955078, 205.56387329101562, 210.1466064453125, 214.7293243408203, 219.3120574951172, 223.894775390625, 228.47750854492188, 233.0602264404297, 237.64295959472656, 242.22567749023438, 246.80841064453125, 251.39112854003906, 255.97386169433594, 260.55657958984375]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 10.0, 8.0, 11.0, 11.0, 9.0, 15.0, 15.0, 22.0, 17.0, 18.0, 14.0, 28.0, 20.0, 44.0, 34.0, 38.0, 49.0, 30.0, 32.0, 40.0, 44.0, 38.0, 44.0, 37.0, 38.0, 26.0, 39.0, 29.0, 28.0, 22.0, 26.0, 16.0, 29.0, 15.0, 9.0, 13.0, 12.0, 13.0, 8.0, 11.0, 6.0, 5.0, 4.0, 7.0, 4.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-29.559341430664062, -28.652421951293945, -27.745502471923828, -26.838584899902344, -25.931665420532227, -25.02474594116211, -24.117828369140625, -23.210908889770508, -22.30398941040039, -21.397069931030273, -20.490150451660156, -19.583232879638672, -18.676313400268555, -17.769393920898438, -16.862476348876953, -15.955556869506836, -15.048637390136719, -14.141717910766602, -13.2347993850708, -12.327880859375, -11.420961380004883, -10.514041900634766, -9.607123374938965, -8.700204849243164, -7.793285369873047, -6.886366367340088, -5.979447364807129, -5.07252836227417, -4.165609359741211, -3.258690357208252, -2.351771354675293, -1.444852352142334, -0.537933349609375, 0.368985652923584, 1.275904655456543, 2.182823657989502, 3.089742660522461, 3.99666166305542, 4.903580665588379, 5.810499668121338, 6.717418670654297, 7.624337673187256, 8.531256675720215, 9.438175201416016, 10.345094680786133, 11.25201416015625, 12.15893268585205, 13.065851211547852, 13.972770690917969, 14.879690170288086, 15.786608695983887, 16.693527221679688, 17.600446701049805, 18.507366180419922, 19.414283752441406, 20.321203231811523, 21.22812271118164, 22.135042190551758, 23.041961669921875, 23.94887924194336, 24.855798721313477, 25.762718200683594, 26.669635772705078, 27.576555252075195, 28.483474731445312]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 9.0, 6.0, 2.0, 4.0, 11.0, 11.0, 11.0, 17.0, 14.0, 24.0, 21.0, 28.0, 28.0, 28.0, 25.0, 39.0, 40.0, 33.0, 42.0, 49.0, 49.0, 45.0, 41.0, 40.0, 37.0, 33.0, 25.0, 35.0, 39.0, 48.0, 26.0, 21.0, 22.0, 17.0, 19.0, 9.0, 8.0, 10.0, 9.0, 3.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-4.21875, -4.098480224609375, -3.97821044921875, -3.857940673828125, -3.7376708984375, -3.617401123046875, -3.49713134765625, -3.376861572265625, -3.256591796875, -3.136322021484375, -3.01605224609375, -2.895782470703125, -2.7755126953125, -2.655242919921875, -2.53497314453125, -2.414703369140625, -2.29443359375, -2.174163818359375, -2.05389404296875, -1.933624267578125, -1.8133544921875, -1.693084716796875, -1.57281494140625, -1.452545166015625, -1.332275390625, -1.212005615234375, -1.09173583984375, -0.971466064453125, -0.8511962890625, -0.730926513671875, -0.61065673828125, -0.490386962890625, -0.3701171875, -0.249847412109375, -0.12957763671875, -0.009307861328125, 0.1109619140625, 0.231231689453125, 0.35150146484375, 0.471771240234375, 0.592041015625, 0.712310791015625, 0.83258056640625, 0.952850341796875, 1.0731201171875, 1.193389892578125, 1.31365966796875, 1.433929443359375, 1.55419921875, 1.674468994140625, 1.79473876953125, 1.915008544921875, 2.0352783203125, 2.155548095703125, 2.27581787109375, 2.396087646484375, 2.516357421875, 2.636627197265625, 2.75689697265625, 2.877166748046875, 2.9974365234375, 3.117706298828125, 3.23797607421875, 3.358245849609375, 3.478515625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 6.0, 1.0, 10.0, 9.0, 10.0, 12.0, 13.0, 17.0, 15.0, 28.0, 42.0, 62.0, 118.0, 241.0, 506.0, 1279.0, 3221.0, 10040.0, 38988.0, 208162.0, 1637614.0, 1969591.0, 259344.0, 46873.0, 11657.0, 3723.0, 1458.0, 582.0, 269.0, 138.0, 63.0, 51.0, 23.0, 16.0, 20.0, 12.0, 15.0, 8.0, 12.0, 4.0, 6.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-8.90625, -8.62841796875, -8.3505859375, -8.07275390625, -7.794921875, -7.51708984375, -7.2392578125, -6.96142578125, -6.68359375, -6.40576171875, -6.1279296875, -5.85009765625, -5.572265625, -5.29443359375, -5.0166015625, -4.73876953125, -4.4609375, -4.18310546875, -3.9052734375, -3.62744140625, -3.349609375, -3.07177734375, -2.7939453125, -2.51611328125, -2.23828125, -1.96044921875, -1.6826171875, -1.40478515625, -1.126953125, -0.84912109375, -0.5712890625, -0.29345703125, -0.015625, 0.26220703125, 0.5400390625, 0.81787109375, 1.095703125, 1.37353515625, 1.6513671875, 1.92919921875, 2.20703125, 2.48486328125, 2.7626953125, 3.04052734375, 3.318359375, 3.59619140625, 3.8740234375, 4.15185546875, 4.4296875, 4.70751953125, 4.9853515625, 5.26318359375, 5.541015625, 5.81884765625, 6.0966796875, 6.37451171875, 6.65234375, 6.93017578125, 7.2080078125, 7.48583984375, 7.763671875, 8.04150390625, 8.3193359375, 8.59716796875, 8.875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 5.0, 8.0, 11.0, 11.0, 21.0, 24.0, 29.0, 44.0, 54.0, 75.0, 91.0, 140.0, 171.0, 201.0, 283.0, 329.0, 409.0, 434.0, 356.0, 303.0, 214.0, 222.0, 130.0, 133.0, 72.0, 73.0, 68.0, 38.0, 25.0, 18.0, 19.0, 18.0, 11.0, 7.0, 2.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.62109375, -6.43890380859375, -6.2567138671875, -6.07452392578125, -5.892333984375, -5.71014404296875, -5.5279541015625, -5.34576416015625, -5.16357421875, -4.98138427734375, -4.7991943359375, -4.61700439453125, -4.434814453125, -4.25262451171875, -4.0704345703125, -3.88824462890625, -3.7060546875, -3.52386474609375, -3.3416748046875, -3.15948486328125, -2.977294921875, -2.79510498046875, -2.6129150390625, -2.43072509765625, -2.24853515625, -2.06634521484375, -1.8841552734375, -1.70196533203125, -1.519775390625, -1.33758544921875, -1.1553955078125, -0.97320556640625, -0.791015625, -0.60882568359375, -0.4266357421875, -0.24444580078125, -0.062255859375, 0.11993408203125, 0.3021240234375, 0.48431396484375, 0.66650390625, 0.84869384765625, 1.0308837890625, 1.21307373046875, 1.395263671875, 1.57745361328125, 1.7596435546875, 1.94183349609375, 2.1240234375, 2.30621337890625, 2.4884033203125, 2.67059326171875, 2.852783203125, 3.03497314453125, 3.2171630859375, 3.39935302734375, 3.58154296875, 3.76373291015625, 3.9459228515625, 4.12811279296875, 4.310302734375, 4.49249267578125, 4.6746826171875, 4.85687255859375, 5.0390625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 9.0, 2.0, 17.0, 14.0, 20.0, 26.0, 37.0, 38.0, 50.0, 69.0, 125.0, 148.0, 207.0, 330.0, 769.0, 3255.0, 29537.0, 628397.0, 3351815.0, 165168.0, 11090.0, 1573.0, 581.0, 306.0, 201.0, 136.0, 87.0, 70.0, 55.0, 49.0, 32.0, 18.0, 16.0, 9.0, 11.0, 1.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.515625, -17.83740234375, -17.1591796875, -16.48095703125, -15.802734375, -15.12451171875, -14.4462890625, -13.76806640625, -13.08984375, -12.41162109375, -11.7333984375, -11.05517578125, -10.376953125, -9.69873046875, -9.0205078125, -8.34228515625, -7.6640625, -6.98583984375, -6.3076171875, -5.62939453125, -4.951171875, -4.27294921875, -3.5947265625, -2.91650390625, -2.23828125, -1.56005859375, -0.8818359375, -0.20361328125, 0.474609375, 1.15283203125, 1.8310546875, 2.50927734375, 3.1875, 3.86572265625, 4.5439453125, 5.22216796875, 5.900390625, 6.57861328125, 7.2568359375, 7.93505859375, 8.61328125, 9.29150390625, 9.9697265625, 10.64794921875, 11.326171875, 12.00439453125, 12.6826171875, 13.36083984375, 14.0390625, 14.71728515625, 15.3955078125, 16.07373046875, 16.751953125, 17.43017578125, 18.1083984375, 18.78662109375, 19.46484375, 20.14306640625, 20.8212890625, 21.49951171875, 22.177734375, 22.85595703125, 23.5341796875, 24.21240234375, 24.890625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 15.0, 22.0, 34.0, 72.0, 104.0, 131.0, 153.0, 151.0, 114.0, 95.0, 53.0, 30.0, 18.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.29335021972656, -38.93925857543945, -37.585166931152344, -36.23107147216797, -34.87697982788086, -33.52288818359375, -32.16879653930664, -30.81470489501953, -29.46061134338379, -28.10651969909668, -26.752426147460938, -25.398334503173828, -24.04424285888672, -22.690149307250977, -21.336057662963867, -19.981964111328125, -18.627872467041016, -17.273780822753906, -15.919687271118164, -14.565595626831055, -13.211503028869629, -11.857410430908203, -10.503318786621094, -9.149226188659668, -7.795133590698242, -6.441040992736816, -5.086948871612549, -3.7328567504882812, -2.3787641525268555, -1.0246715545654297, 0.3294200897216797, 1.6835126876831055, 3.037609100341797, 4.391701698303223, 5.74579381942749, 7.099885940551758, 8.453978538513184, 9.80807113647461, 11.162162780761719, 12.516255378723145, 13.87034797668457, 15.224440574645996, 16.578533172607422, 17.93262481689453, 19.28671646118164, 20.640810012817383, 21.994901657104492, 23.348995208740234, 24.703086853027344, 26.057178497314453, 27.411272048950195, 28.765363693237305, 30.119457244873047, 31.473548889160156, 32.827640533447266, 34.181732177734375, 35.53582763671875, 36.88991928100586, 38.24401092529297, 39.598106384277344, 40.95219802856445, 42.30628967285156, 43.66038131713867, 45.01447296142578, 46.36856460571289]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 8.0, 4.0, 13.0, 9.0, 14.0, 13.0, 20.0, 19.0, 26.0, 24.0, 31.0, 37.0, 32.0, 43.0, 41.0, 46.0, 42.0, 32.0, 45.0, 39.0, 48.0, 46.0, 46.0, 45.0, 33.0, 22.0, 31.0, 40.0, 25.0, 26.0, 30.0, 11.0, 6.0, 17.0, 10.0, 10.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.848724365234375, -25.073223114013672, -24.29772186279297, -23.522220611572266, -22.746719360351562, -21.971216201782227, -21.195714950561523, -20.42021369934082, -19.644712448120117, -18.869211196899414, -18.09370994567871, -17.318208694458008, -16.542705535888672, -15.767205238342285, -14.991703033447266, -14.216201782226562, -13.44070053100586, -12.665199279785156, -11.889698028564453, -11.114195823669434, -10.33869457244873, -9.563193321228027, -8.787691116333008, -8.012189865112305, -7.236688613891602, -6.461187362670898, -5.685685634613037, -4.910183906555176, -4.134682655334473, -3.3591811656951904, -2.583679676055908, -1.8081779479980469, -1.0326766967773438, -0.2571752071380615, 0.5183262825012207, 1.293827772140503, 2.069329261779785, 2.8448307514190674, 3.6203322410583496, 4.395833969116211, 5.171335220336914, 5.946836471557617, 6.7223381996154785, 7.49783992767334, 8.273341178894043, 9.048842430114746, 9.824344635009766, 10.599845886230469, 11.375347137451172, 12.150848388671875, 12.926349639892578, 13.701851844787598, 14.4773530960083, 15.252854347229004, 16.028356552124023, 16.803857803344727, 17.57935905456543, 18.354860305786133, 19.130361557006836, 19.90586280822754, 20.681365966796875, 21.456867218017578, 22.23236846923828, 23.007869720458984, 23.783370971679688]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 4.0, 4.0, 3.0, 4.0, 7.0, 8.0, 14.0, 10.0, 15.0, 17.0, 22.0, 17.0, 28.0, 25.0, 31.0, 31.0, 26.0, 31.0, 31.0, 35.0, 35.0, 47.0, 48.0, 43.0, 48.0, 29.0, 43.0, 36.0, 30.0, 35.0, 33.0, 29.0, 32.0, 23.0, 21.0, 25.0, 16.0, 13.0, 9.0, 9.0, 4.0, 6.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.552734375, -3.4373779296875, -3.322021484375, -3.2066650390625, -3.09130859375, -2.9759521484375, -2.860595703125, -2.7452392578125, -2.6298828125, -2.5145263671875, -2.399169921875, -2.2838134765625, -2.16845703125, -2.0531005859375, -1.937744140625, -1.8223876953125, -1.70703125, -1.5916748046875, -1.476318359375, -1.3609619140625, -1.24560546875, -1.1302490234375, -1.014892578125, -0.8995361328125, -0.7841796875, -0.6688232421875, -0.553466796875, -0.4381103515625, -0.32275390625, -0.2073974609375, -0.092041015625, 0.0233154296875, 0.138671875, 0.2540283203125, 0.369384765625, 0.4847412109375, 0.60009765625, 0.7154541015625, 0.830810546875, 0.9461669921875, 1.0615234375, 1.1768798828125, 1.292236328125, 1.4075927734375, 1.52294921875, 1.6383056640625, 1.753662109375, 1.8690185546875, 1.984375, 2.0997314453125, 2.215087890625, 2.3304443359375, 2.44580078125, 2.5611572265625, 2.676513671875, 2.7918701171875, 2.9072265625, 3.0225830078125, 3.137939453125, 3.2532958984375, 3.36865234375, 3.4840087890625, 3.599365234375, 3.7147216796875, 3.830078125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 11.0, 11.0, 16.0, 22.0, 24.0, 54.0, 70.0, 107.0, 152.0, 278.0, 391.0, 685.0, 1030.0, 1724.0, 2898.0, 4707.0, 7875.0, 13196.0, 22077.0, 38875.0, 72921.0, 166591.0, 367711.0, 174487.0, 76061.0, 39543.0, 22976.0, 13300.0, 8119.0, 5068.0, 2892.0, 1807.0, 1040.0, 638.0, 429.0, 292.0, 159.0, 107.0, 72.0, 48.0, 41.0, 21.0, 11.0, 10.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1943359375, -0.18817138671875, -0.1820068359375, -0.17584228515625, -0.169677734375, -0.16351318359375, -0.1573486328125, -0.15118408203125, -0.14501953125, -0.13885498046875, -0.1326904296875, -0.12652587890625, -0.120361328125, -0.11419677734375, -0.1080322265625, -0.10186767578125, -0.095703125, -0.08953857421875, -0.0833740234375, -0.07720947265625, -0.071044921875, -0.06488037109375, -0.0587158203125, -0.05255126953125, -0.04638671875, -0.04022216796875, -0.0340576171875, -0.02789306640625, -0.021728515625, -0.01556396484375, -0.0093994140625, -0.00323486328125, 0.0029296875, 0.00909423828125, 0.0152587890625, 0.02142333984375, 0.027587890625, 0.03375244140625, 0.0399169921875, 0.04608154296875, 0.05224609375, 0.05841064453125, 0.0645751953125, 0.07073974609375, 0.076904296875, 0.08306884765625, 0.0892333984375, 0.09539794921875, 0.1015625, 0.10772705078125, 0.1138916015625, 0.12005615234375, 0.126220703125, 0.13238525390625, 0.1385498046875, 0.14471435546875, 0.15087890625, 0.15704345703125, 0.1632080078125, 0.16937255859375, 0.175537109375, 0.18170166015625, 0.1878662109375, 0.19403076171875, 0.2001953125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 9.0, 2.0, 11.0, 7.0, 9.0, 10.0, 20.0, 27.0, 20.0, 25.0, 38.0, 38.0, 20.0, 34.0, 36.0, 49.0, 45.0, 49.0, 1073.0, 46.0, 58.0, 45.0, 40.0, 33.0, 39.0, 30.0, 30.0, 36.0, 26.0, 27.0, 14.0, 23.0, 17.0, 12.0, 11.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.396484375, -2.303375244140625, -2.21026611328125, -2.117156982421875, -2.0240478515625, -1.930938720703125, -1.83782958984375, -1.744720458984375, -1.651611328125, -1.558502197265625, -1.46539306640625, -1.372283935546875, -1.2791748046875, -1.186065673828125, -1.09295654296875, -0.999847412109375, -0.90673828125, -0.813629150390625, -0.72052001953125, -0.627410888671875, -0.5343017578125, -0.441192626953125, -0.34808349609375, -0.254974365234375, -0.161865234375, -0.068756103515625, 0.02435302734375, 0.117462158203125, 0.2105712890625, 0.303680419921875, 0.39678955078125, 0.489898681640625, 0.5830078125, 0.676116943359375, 0.76922607421875, 0.862335205078125, 0.9554443359375, 1.048553466796875, 1.14166259765625, 1.234771728515625, 1.327880859375, 1.420989990234375, 1.51409912109375, 1.607208251953125, 1.7003173828125, 1.793426513671875, 1.88653564453125, 1.979644775390625, 2.07275390625, 2.165863037109375, 2.25897216796875, 2.352081298828125, 2.4451904296875, 2.538299560546875, 2.63140869140625, 2.724517822265625, 2.817626953125, 2.910736083984375, 3.00384521484375, 3.096954345703125, 3.1900634765625, 3.283172607421875, 3.37628173828125, 3.469390869140625, 3.5625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 14.0, 10.0, 28.0, 38.0, 46.0, 86.0, 126.0, 167.0, 253.0, 408.0, 603.0, 889.0, 1463.0, 2223.0, 3583.0, 5766.0, 9316.0, 15342.0, 25993.0, 45375.0, 82551.0, 162818.0, 1350447.0, 179503.0, 90228.0, 48637.0, 28100.0, 16526.0, 9986.0, 6063.0, 3848.0, 2348.0, 1517.0, 916.0, 662.0, 406.0, 284.0, 173.0, 129.0, 88.0, 47.0, 44.0, 27.0, 19.0, 6.0, 10.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0709228515625, -0.06867599487304688, -0.06642913818359375, -0.06418228149414062, -0.0619354248046875, -0.059688568115234375, -0.05744171142578125, -0.055194854736328125, -0.052947998046875, -0.050701141357421875, -0.04845428466796875, -0.046207427978515625, -0.0439605712890625, -0.041713714599609375, -0.03946685791015625, -0.037220001220703125, -0.03497314453125, -0.032726287841796875, -0.03047943115234375, -0.028232574462890625, -0.0259857177734375, -0.023738861083984375, -0.02149200439453125, -0.019245147705078125, -0.016998291015625, -0.014751434326171875, -0.01250457763671875, -0.010257720947265625, -0.0080108642578125, -0.005764007568359375, -0.00351715087890625, -0.001270294189453125, 0.0009765625, 0.003223419189453125, 0.00547027587890625, 0.007717132568359375, 0.0099639892578125, 0.012210845947265625, 0.01445770263671875, 0.016704559326171875, 0.018951416015625, 0.021198272705078125, 0.02344512939453125, 0.025691986083984375, 0.0279388427734375, 0.030185699462890625, 0.03243255615234375, 0.034679412841796875, 0.03692626953125, 0.039173126220703125, 0.04141998291015625, 0.043666839599609375, 0.0459136962890625, 0.048160552978515625, 0.05040740966796875, 0.052654266357421875, 0.054901123046875, 0.057147979736328125, 0.05939483642578125, 0.061641693115234375, 0.0638885498046875, 0.06613540649414062, 0.06838226318359375, 0.07062911987304688, 0.0728759765625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 3.0, 4.0, 9.0, 13.0, 12.0, 20.0, 26.0, 19.0, 50.0, 53.0, 85.0, 110.0, 124.0, 114.0, 104.0, 69.0, 46.0, 45.0, 18.0, 18.0, 12.0, 16.0, 3.0, 4.0, 8.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.589557647705078e-05, -4.4704414904117584e-05, -4.351325333118439e-05, -4.232209175825119e-05, -4.113093018531799e-05, -3.9939768612384796e-05, -3.87486070394516e-05, -3.75574454665184e-05, -3.6366283893585205e-05, -3.517512232065201e-05, -3.398396074771881e-05, -3.2792799174785614e-05, -3.160163760185242e-05, -3.041047602891922e-05, -2.9219314455986023e-05, -2.8028152883052826e-05, -2.683699131011963e-05, -2.5645829737186432e-05, -2.4454668164253235e-05, -2.3263506591320038e-05, -2.207234501838684e-05, -2.0881183445453644e-05, -1.9690021872520447e-05, -1.849886029958725e-05, -1.7307698726654053e-05, -1.6116537153720856e-05, -1.4925375580787659e-05, -1.3734214007854462e-05, -1.2543052434921265e-05, -1.1351890861988068e-05, -1.016072928905487e-05, -8.969567716121674e-06, -7.778406143188477e-06, -6.5872445702552795e-06, -5.3960829973220825e-06, -4.2049214243888855e-06, -3.0137598514556885e-06, -1.8225982785224915e-06, -6.314367055892944e-07, 5.597248673439026e-07, 1.7508864402770996e-06, 2.9420480132102966e-06, 4.133209586143494e-06, 5.324371159076691e-06, 6.515532732009888e-06, 7.706694304943085e-06, 8.897855877876282e-06, 1.0089017450809479e-05, 1.1280179023742676e-05, 1.2471340596675873e-05, 1.366250216960907e-05, 1.4853663742542267e-05, 1.6044825315475464e-05, 1.723598688840866e-05, 1.8427148461341858e-05, 1.9618310034275055e-05, 2.0809471607208252e-05, 2.200063318014145e-05, 2.3191794753074646e-05, 2.4382956326007843e-05, 2.557411789894104e-05, 2.6765279471874237e-05, 2.7956441044807434e-05, 2.914760261774063e-05, 3.0338764190673828e-05]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 2.0, 8.0, 9.0, 19.0, 15.0, 31.0, 47.0, 81.0, 158.0, 422.0, 6129.0, 1038379.0, 2558.0, 302.0, 142.0, 78.0, 49.0, 32.0, 23.0, 14.0, 14.0, 7.0, 4.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007185935974121094, -0.0006903335452079773, -0.0006620734930038452, -0.0006338134407997131, -0.0006055533885955811, -0.000577293336391449, -0.0005490332841873169, -0.0005207732319831848, -0.0004925131797790527, -0.00046425312757492065, -0.0004359930753707886, -0.0004077330231666565, -0.0003794729709625244, -0.00035121291875839233, -0.00032295286655426025, -0.0002946928143501282, -0.0002664327621459961, -0.00023817270994186401, -0.00020991265773773193, -0.00018165260553359985, -0.00015339255332946777, -0.0001251325011253357, -9.687244892120361e-05, -6.861239671707153e-05, -4.035234451293945e-05, -1.2092292308807373e-05, 1.6167759895324707e-05, 4.442781209945679e-05, 7.268786430358887e-05, 0.00010094791650772095, 0.00012920796871185303, 0.0001574680209159851, 0.0001857280731201172, 0.00021398812532424927, 0.00024224817752838135, 0.00027050822973251343, 0.0002987682819366455, 0.0003270283341407776, 0.00035528838634490967, 0.00038354843854904175, 0.00041180849075317383, 0.0004400685429573059, 0.000468328595161438, 0.0004965886473655701, 0.0005248486995697021, 0.0005531087517738342, 0.0005813688039779663, 0.0006096288561820984, 0.0006378889083862305, 0.0006661489605903625, 0.0006944090127944946, 0.0007226690649986267, 0.0007509291172027588, 0.0007791891694068909, 0.000807449221611023, 0.000835709273815155, 0.0008639693260192871, 0.0008922293782234192, 0.0009204894304275513, 0.0009487494826316833, 0.0009770095348358154, 0.0010052695870399475, 0.0010335296392440796, 0.0010617896914482117, 0.0010900497436523438]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 99.0, 918.0], "bins": [-0.000828880409244448, -0.000815770763438195, -0.000802661117631942, -0.0007895514718256891, -0.0007764418260194361, -0.0007633321802131832, -0.0007502225344069302, -0.0007371128303930163, -0.0007240031845867634, -0.0007108935387805104, -0.0006977838929742575, -0.0006846742471680045, -0.0006715646013617516, -0.0006584549555554986, -0.0006453453097492456, -0.0006322356639429927, -0.0006191260181367397, -0.0006060163723304868, -0.0005929067265242338, -0.0005797970807179809, -0.0005666874349117279, -0.000553577789105475, -0.000540468143299222, -0.000527358497492969, -0.0005142488516867161, -0.0005011392058804631, -0.00048802956007421017, -0.0004749199142679572, -0.00046181026846170425, -0.0004487006226554513, -0.0004355909477453679, -0.00042248130193911493, -0.00040937159792520106, -0.0003962619521189481, -0.00038315230631269515, -0.0003700426605064422, -0.0003569329855963588, -0.0003438233397901058, -0.00033071369398385286, -0.0003176040481775999, -0.00030449440237134695, -0.000291384756565094, -0.00027827511075884104, -0.0002651654649525881, -0.0002520558191463351, -0.00023894615878816694, -0.00022583649842999876, -0.0002127268526237458, -0.00019961722136940807, -0.00018650757556315511, -0.00017339791520498693, -0.00016028826939873397, -0.00014717862359248102, -0.00013406897778622806, -0.00012095932470401749, -0.00010784967162180692, -9.474001853959635e-05, -8.163036545738578e-05, -6.852071965113282e-05, -5.541107020690106e-05, -4.2301420762669295e-05, -2.919177495641634e-05, -1.6082121874205768e-05, -2.9724687919951975e-06, 1.0137176104763057e-05]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 8.0, 13.0, 15.0, 21.0, 35.0, 38.0, 42.0, 48.0, 68.0, 69.0, 72.0, 70.0, 71.0, 71.0, 62.0, 60.0, 48.0, 54.0, 30.0, 25.0, 24.0, 15.0, 13.0, 14.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.817941665649414e-05, -1.7355196177959442e-05, -1.6530975699424744e-05, -1.5706755220890045e-05, -1.4882534742355347e-05, -1.4058314263820648e-05, -1.323409378528595e-05, -1.2409873306751251e-05, -1.1585652828216553e-05, -1.0761432349681854e-05, -9.937211871147156e-06, -9.112991392612457e-06, -8.288770914077759e-06, -7.46455043554306e-06, -6.640329957008362e-06, -5.816109478473663e-06, -4.991888999938965e-06, -4.167668521404266e-06, -3.343448042869568e-06, -2.5192275643348694e-06, -1.695007085800171e-06, -8.707866072654724e-07, -4.6566128730773926e-08, 7.776543498039246e-07, 1.601874828338623e-06, 2.4260953068733215e-06, 3.25031578540802e-06, 4.0745362639427185e-06, 4.898756742477417e-06, 5.7229772210121155e-06, 6.547197699546814e-06, 7.3714181780815125e-06, 8.195638656616211e-06, 9.01985913515091e-06, 9.844079613685608e-06, 1.0668300092220306e-05, 1.1492520570755005e-05, 1.2316741049289703e-05, 1.3140961527824402e-05, 1.39651820063591e-05, 1.4789402484893799e-05, 1.5613622963428497e-05, 1.6437843441963196e-05, 1.7262063920497894e-05, 1.8086284399032593e-05, 1.891050487756729e-05, 1.973472535610199e-05, 2.0558945834636688e-05, 2.1383166313171387e-05, 2.2207386791706085e-05, 2.3031607270240784e-05, 2.3855827748775482e-05, 2.468004822731018e-05, 2.550426870584488e-05, 2.6328489184379578e-05, 2.7152709662914276e-05, 2.7976930141448975e-05, 2.8801150619983673e-05, 2.962537109851837e-05, 3.044959157705307e-05, 3.127381205558777e-05, 3.209803253412247e-05, 3.2922253012657166e-05, 3.3746473491191864e-05, 3.457069396972656e-05]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 4.0, 4.0, 3.0, 4.0, 7.0, 8.0, 14.0, 10.0, 15.0, 17.0, 22.0, 17.0, 28.0, 25.0, 31.0, 31.0, 26.0, 31.0, 31.0, 35.0, 35.0, 47.0, 48.0, 43.0, 48.0, 29.0, 43.0, 36.0, 30.0, 35.0, 33.0, 29.0, 32.0, 23.0, 21.0, 25.0, 16.0, 13.0, 9.0, 9.0, 4.0, 6.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.552734375, -3.4373779296875, -3.322021484375, -3.2066650390625, -3.09130859375, -2.9759521484375, -2.860595703125, -2.7452392578125, -2.6298828125, -2.5145263671875, -2.399169921875, -2.2838134765625, -2.16845703125, -2.0531005859375, -1.937744140625, -1.8223876953125, -1.70703125, -1.5916748046875, -1.476318359375, -1.3609619140625, -1.24560546875, -1.1302490234375, -1.014892578125, -0.8995361328125, -0.7841796875, -0.6688232421875, -0.553466796875, -0.4381103515625, -0.32275390625, -0.2073974609375, -0.092041015625, 0.0233154296875, 0.138671875, 0.2540283203125, 0.369384765625, 0.4847412109375, 0.60009765625, 0.7154541015625, 0.830810546875, 0.9461669921875, 1.0615234375, 1.1768798828125, 1.292236328125, 1.4075927734375, 1.52294921875, 1.6383056640625, 1.753662109375, 1.8690185546875, 1.984375, 2.0997314453125, 2.215087890625, 2.3304443359375, 2.44580078125, 2.5611572265625, 2.676513671875, 2.7918701171875, 2.9072265625, 3.0225830078125, 3.137939453125, 3.2532958984375, 3.36865234375, 3.4840087890625, 3.599365234375, 3.7147216796875, 3.830078125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 8.0, 6.0, 6.0, 10.0, 10.0, 20.0, 24.0, 19.0, 23.0, 40.0, 47.0, 72.0, 85.0, 143.0, 223.0, 432.0, 762.0, 1437.0, 2848.0, 6036.0, 14188.0, 40515.0, 167345.0, 605707.0, 146800.0, 37119.0, 13069.0, 5627.0, 2718.0, 1362.0, 699.0, 413.0, 253.0, 128.0, 80.0, 60.0, 53.0, 41.0, 28.0, 27.0, 18.0, 14.0, 9.0, 8.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.94921875, -5.75390625, -5.55859375, -5.36328125, -5.16796875, -4.97265625, -4.77734375, -4.58203125, -4.38671875, -4.19140625, -3.99609375, -3.80078125, -3.60546875, -3.41015625, -3.21484375, -3.01953125, -2.82421875, -2.62890625, -2.43359375, -2.23828125, -2.04296875, -1.84765625, -1.65234375, -1.45703125, -1.26171875, -1.06640625, -0.87109375, -0.67578125, -0.48046875, -0.28515625, -0.08984375, 0.10546875, 0.30078125, 0.49609375, 0.69140625, 0.88671875, 1.08203125, 1.27734375, 1.47265625, 1.66796875, 1.86328125, 2.05859375, 2.25390625, 2.44921875, 2.64453125, 2.83984375, 3.03515625, 3.23046875, 3.42578125, 3.62109375, 3.81640625, 4.01171875, 4.20703125, 4.40234375, 4.59765625, 4.79296875, 4.98828125, 5.18359375, 5.37890625, 5.57421875, 5.76953125, 5.96484375, 6.16015625, 6.35546875, 6.55078125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 7.0, 9.0, 9.0, 9.0, 3.0, 12.0, 14.0, 13.0, 18.0, 13.0, 22.0, 16.0, 37.0, 23.0, 32.0, 34.0, 39.0, 54.0, 55.0, 101.0, 167.0, 1558.0, 268.0, 108.0, 53.0, 37.0, 38.0, 28.0, 40.0, 31.0, 32.0, 24.0, 18.0, 24.0, 13.0, 22.0, 12.0, 12.0, 6.0, 8.0, 5.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-11.328125, -10.991943359375, -10.65576171875, -10.319580078125, -9.9833984375, -9.647216796875, -9.31103515625, -8.974853515625, -8.638671875, -8.302490234375, -7.96630859375, -7.630126953125, -7.2939453125, -6.957763671875, -6.62158203125, -6.285400390625, -5.94921875, -5.613037109375, -5.27685546875, -4.940673828125, -4.6044921875, -4.268310546875, -3.93212890625, -3.595947265625, -3.259765625, -2.923583984375, -2.58740234375, -2.251220703125, -1.9150390625, -1.578857421875, -1.24267578125, -0.906494140625, -0.5703125, -0.234130859375, 0.10205078125, 0.438232421875, 0.7744140625, 1.110595703125, 1.44677734375, 1.782958984375, 2.119140625, 2.455322265625, 2.79150390625, 3.127685546875, 3.4638671875, 3.800048828125, 4.13623046875, 4.472412109375, 4.80859375, 5.144775390625, 5.48095703125, 5.817138671875, 6.1533203125, 6.489501953125, 6.82568359375, 7.161865234375, 7.498046875, 7.834228515625, 8.17041015625, 8.506591796875, 8.8427734375, 9.178955078125, 9.51513671875, 9.851318359375, 10.1875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 9.0, 8.0, 7.0, 17.0, 21.0, 22.0, 21.0, 27.0, 32.0, 44.0, 57.0, 87.0, 116.0, 198.0, 417.0, 1470.0, 7875.0, 114075.0, 2941721.0, 70924.0, 6193.0, 1206.0, 445.0, 210.0, 115.0, 78.0, 46.0, 64.0, 38.0, 17.0, 17.0, 22.0, 18.0, 11.0, 14.0, 5.0, 10.0, 8.0, 7.0, 6.0, 10.0, 5.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.63525390625, -17.0361328125, -16.43701171875, -15.837890625, -15.23876953125, -14.6396484375, -14.04052734375, -13.44140625, -12.84228515625, -12.2431640625, -11.64404296875, -11.044921875, -10.44580078125, -9.8466796875, -9.24755859375, -8.6484375, -8.04931640625, -7.4501953125, -6.85107421875, -6.251953125, -5.65283203125, -5.0537109375, -4.45458984375, -3.85546875, -3.25634765625, -2.6572265625, -2.05810546875, -1.458984375, -0.85986328125, -0.2607421875, 0.33837890625, 0.9375, 1.53662109375, 2.1357421875, 2.73486328125, 3.333984375, 3.93310546875, 4.5322265625, 5.13134765625, 5.73046875, 6.32958984375, 6.9287109375, 7.52783203125, 8.126953125, 8.72607421875, 9.3251953125, 9.92431640625, 10.5234375, 11.12255859375, 11.7216796875, 12.32080078125, 12.919921875, 13.51904296875, 14.1181640625, 14.71728515625, 15.31640625, 15.91552734375, 16.5146484375, 17.11376953125, 17.712890625, 18.31201171875, 18.9111328125, 19.51025390625, 20.109375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 10.0, 37.0, 126.0, 294.0, 300.0, 172.0, 51.0, 21.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.56342315673828, -35.1634635925293, -33.76350402832031, -32.363548278808594, -30.96358871459961, -29.563629150390625, -28.16366958618164, -26.76371192932129, -25.363754272460938, -23.963794708251953, -22.5638370513916, -21.163877487182617, -19.763919830322266, -18.36396026611328, -16.964000701904297, -15.564043045043945, -14.164083480834961, -12.764124870300293, -11.364166259765625, -9.96420669555664, -8.564249038696289, -7.164289951324463, -5.764330863952637, -4.364372253417969, -2.964413642883301, -1.5644549131393433, -0.16449618339538574, 1.2354626655578613, 2.6354212760925293, 4.035379886627197, 5.435338973999023, 6.835297584533691, 8.23525619506836, 9.635214805603027, 11.035173416137695, 12.43513298034668, 13.835090637207031, 15.235050201416016, 16.635009765625, 18.03496742248535, 19.434925079345703, 20.834884643554688, 22.23484230041504, 23.634801864624023, 25.034759521484375, 26.43471908569336, 27.834678649902344, 29.234636306762695, 30.63459587097168, 32.03455352783203, 33.434513092041016, 34.83447265625, 36.234432220458984, 37.6343879699707, 39.03434753417969, 40.43430709838867, 41.834266662597656, 43.23422622680664, 44.634185791015625, 46.034141540527344, 47.43410110473633, 48.83406066894531, 50.2340202331543, 51.63397979736328, 53.033935546875]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 9.0, 5.0, 8.0, 4.0, 7.0, 14.0, 15.0, 20.0, 19.0, 16.0, 21.0, 23.0, 19.0, 24.0, 24.0, 35.0, 30.0, 51.0, 29.0, 40.0, 31.0, 29.0, 42.0, 34.0, 35.0, 37.0, 39.0, 51.0, 29.0, 33.0, 35.0, 13.0, 36.0, 28.0, 15.0, 18.0, 8.0, 16.0, 17.0, 6.0, 7.0, 5.0, 5.0, 5.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-28.14946746826172, -27.307607650756836, -26.465747833251953, -25.62388801574707, -24.782028198242188, -23.940166473388672, -23.09830665588379, -22.256446838378906, -21.414587020874023, -20.57272720336914, -19.730867385864258, -18.889007568359375, -18.04714584350586, -17.20528793334961, -16.363426208496094, -15.521566390991211, -14.679706573486328, -13.837846755981445, -12.995986938476562, -12.154126167297363, -11.31226634979248, -10.470406532287598, -9.628545761108398, -8.786685943603516, -7.944826126098633, -7.10296630859375, -6.261106014251709, -5.419245719909668, -4.577385902404785, -3.7355260848999023, -2.8936657905578613, -2.0518054962158203, -1.2099475860595703, -0.3680875301361084, 0.4737725257873535, 1.3156325817108154, 2.1574926376342773, 2.99935245513916, 3.841212749481201, 4.683073043823242, 5.524932861328125, 6.366792678833008, 7.208652973175049, 8.05051326751709, 8.892373085021973, 9.734232902526855, 10.576093673706055, 11.417953491210938, 12.25981330871582, 13.101673126220703, 13.943532943725586, 14.785393714904785, 15.627253532409668, 16.469112396240234, 17.31097412109375, 18.152833938598633, 18.994693756103516, 19.8365535736084, 20.67841339111328, 21.520273208618164, 22.362133026123047, 23.203994750976562, 24.045854568481445, 24.887714385986328, 25.72957420349121]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 11.0, 6.0, 9.0, 10.0, 19.0, 20.0, 26.0, 11.0, 20.0, 22.0, 34.0, 20.0, 36.0, 28.0, 32.0, 36.0, 34.0, 43.0, 46.0, 36.0, 43.0, 33.0, 37.0, 31.0, 31.0, 32.0, 30.0, 27.0, 24.0, 38.0, 27.0, 20.0, 13.0, 20.0, 14.0, 12.0, 10.0, 8.0, 6.0, 7.0, 6.0, 1.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.474609375, -3.36383056640625, -3.2530517578125, -3.14227294921875, -3.031494140625, -2.92071533203125, -2.8099365234375, -2.69915771484375, -2.58837890625, -2.47760009765625, -2.3668212890625, -2.25604248046875, -2.145263671875, -2.03448486328125, -1.9237060546875, -1.81292724609375, -1.7021484375, -1.59136962890625, -1.4805908203125, -1.36981201171875, -1.259033203125, -1.14825439453125, -1.0374755859375, -0.92669677734375, -0.81591796875, -0.70513916015625, -0.5943603515625, -0.48358154296875, -0.372802734375, -0.26202392578125, -0.1512451171875, -0.04046630859375, 0.0703125, 0.18109130859375, 0.2918701171875, 0.40264892578125, 0.513427734375, 0.62420654296875, 0.7349853515625, 0.84576416015625, 0.95654296875, 1.06732177734375, 1.1781005859375, 1.28887939453125, 1.399658203125, 1.51043701171875, 1.6212158203125, 1.73199462890625, 1.8427734375, 1.95355224609375, 2.0643310546875, 2.17510986328125, 2.285888671875, 2.39666748046875, 2.5074462890625, 2.61822509765625, 2.72900390625, 2.83978271484375, 2.9505615234375, 3.06134033203125, 3.172119140625, 3.28289794921875, 3.3936767578125, 3.50445556640625, 3.615234375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 4.0, 7.0, 3.0, 7.0, 9.0, 13.0, 10.0, 11.0, 13.0, 28.0, 40.0, 47.0, 110.0, 197.0, 375.0, 802.0, 1723.0, 4233.0, 11222.0, 32693.0, 116094.0, 560199.0, 2236477.0, 974848.0, 182583.0, 47048.0, 15356.0, 5714.0, 2251.0, 1015.0, 486.0, 245.0, 137.0, 84.0, 49.0, 33.0, 26.0, 28.0, 12.0, 8.0, 5.0, 6.0, 3.0, 12.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44140625, -7.19866943359375, -6.9559326171875, -6.71319580078125, -6.470458984375, -6.22772216796875, -5.9849853515625, -5.74224853515625, -5.49951171875, -5.25677490234375, -5.0140380859375, -4.77130126953125, -4.528564453125, -4.28582763671875, -4.0430908203125, -3.80035400390625, -3.5576171875, -3.31488037109375, -3.0721435546875, -2.82940673828125, -2.586669921875, -2.34393310546875, -2.1011962890625, -1.85845947265625, -1.61572265625, -1.37298583984375, -1.1302490234375, -0.88751220703125, -0.644775390625, -0.40203857421875, -0.1593017578125, 0.08343505859375, 0.326171875, 0.56890869140625, 0.8116455078125, 1.05438232421875, 1.297119140625, 1.53985595703125, 1.7825927734375, 2.02532958984375, 2.26806640625, 2.51080322265625, 2.7535400390625, 2.99627685546875, 3.239013671875, 3.48175048828125, 3.7244873046875, 3.96722412109375, 4.2099609375, 4.45269775390625, 4.6954345703125, 4.93817138671875, 5.180908203125, 5.42364501953125, 5.6663818359375, 5.90911865234375, 6.15185546875, 6.39459228515625, 6.6373291015625, 6.88006591796875, 7.122802734375, 7.36553955078125, 7.6082763671875, 7.85101318359375, 8.09375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 5.0, 9.0, 21.0, 19.0, 31.0, 38.0, 30.0, 66.0, 65.0, 90.0, 126.0, 183.0, 247.0, 285.0, 390.0, 479.0, 462.0, 377.0, 294.0, 227.0, 156.0, 104.0, 88.0, 72.0, 44.0, 51.0, 28.0, 21.0, 15.0, 12.0, 16.0, 9.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.359375, -6.15380859375, -5.9482421875, -5.74267578125, -5.537109375, -5.33154296875, -5.1259765625, -4.92041015625, -4.71484375, -4.50927734375, -4.3037109375, -4.09814453125, -3.892578125, -3.68701171875, -3.4814453125, -3.27587890625, -3.0703125, -2.86474609375, -2.6591796875, -2.45361328125, -2.248046875, -2.04248046875, -1.8369140625, -1.63134765625, -1.42578125, -1.22021484375, -1.0146484375, -0.80908203125, -0.603515625, -0.39794921875, -0.1923828125, 0.01318359375, 0.21875, 0.42431640625, 0.6298828125, 0.83544921875, 1.041015625, 1.24658203125, 1.4521484375, 1.65771484375, 1.86328125, 2.06884765625, 2.2744140625, 2.47998046875, 2.685546875, 2.89111328125, 3.0966796875, 3.30224609375, 3.5078125, 3.71337890625, 3.9189453125, 4.12451171875, 4.330078125, 4.53564453125, 4.7412109375, 4.94677734375, 5.15234375, 5.35791015625, 5.5634765625, 5.76904296875, 5.974609375, 6.18017578125, 6.3857421875, 6.59130859375, 6.796875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 11.0, 13.0, 18.0, 18.0, 21.0, 38.0, 48.0, 63.0, 98.0, 129.0, 234.0, 345.0, 789.0, 2403.0, 11445.0, 94206.0, 1531943.0, 2392225.0, 139423.0, 15691.0, 2987.0, 952.0, 425.0, 230.0, 137.0, 99.0, 83.0, 57.0, 41.0, 37.0, 27.0, 14.0, 7.0, 4.0, 6.0, 6.0, 0.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.53125, -15.981689453125, -15.43212890625, -14.882568359375, -14.3330078125, -13.783447265625, -13.23388671875, -12.684326171875, -12.134765625, -11.585205078125, -11.03564453125, -10.486083984375, -9.9365234375, -9.386962890625, -8.83740234375, -8.287841796875, -7.73828125, -7.188720703125, -6.63916015625, -6.089599609375, -5.5400390625, -4.990478515625, -4.44091796875, -3.891357421875, -3.341796875, -2.792236328125, -2.24267578125, -1.693115234375, -1.1435546875, -0.593994140625, -0.04443359375, 0.505126953125, 1.0546875, 1.604248046875, 2.15380859375, 2.703369140625, 3.2529296875, 3.802490234375, 4.35205078125, 4.901611328125, 5.451171875, 6.000732421875, 6.55029296875, 7.099853515625, 7.6494140625, 8.198974609375, 8.74853515625, 9.298095703125, 9.84765625, 10.397216796875, 10.94677734375, 11.496337890625, 12.0458984375, 12.595458984375, 13.14501953125, 13.694580078125, 14.244140625, 14.793701171875, 15.34326171875, 15.892822265625, 16.4423828125, 16.991943359375, 17.54150390625, 18.091064453125, 18.640625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 6.0, 15.0, 59.0, 157.0, 269.0, 251.0, 154.0, 67.0, 29.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.54264450073242, -51.95706558227539, -49.371482849121094, -46.78590393066406, -44.200321197509766, -41.614742279052734, -39.02915954589844, -36.443580627441406, -33.858001708984375, -31.27242088317871, -28.686840057373047, -26.101261138916016, -23.51567840576172, -20.930099487304688, -18.344518661499023, -15.75893783569336, -13.173355102539062, -10.587774276733398, -8.002193450927734, -5.416613578796387, -2.8310327529907227, -0.2454519271850586, 2.340127944946289, 4.925708770751953, 7.511289596557617, 10.096870422363281, 12.682451248168945, 15.268031120300293, 17.85361099243164, 20.439193725585938, 23.02477264404297, 25.610353469848633, 28.195938110351562, 30.781518936157227, 33.36709976196289, 35.95267868041992, 38.53826141357422, 41.12384033203125, 43.70941925048828, 46.29500198364258, 48.880584716796875, 51.466163635253906, 54.0517463684082, 56.637325286865234, 59.22290802001953, 61.80848693847656, 64.3940658569336, 66.97964477539062, 69.56523132324219, 72.15081024169922, 74.73638916015625, 77.32197570800781, 79.90755462646484, 82.49313354492188, 85.0787124633789, 87.66429138183594, 90.24987030029297, 92.83544921875, 95.42102813720703, 98.0066146850586, 100.59219360351562, 103.17777252197266, 105.76335144042969, 108.34893798828125, 110.93451690673828]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 6.0, 10.0, 7.0, 9.0, 11.0, 11.0, 18.0, 16.0, 15.0, 23.0, 38.0, 29.0, 22.0, 36.0, 40.0, 37.0, 41.0, 44.0, 44.0, 40.0, 46.0, 39.0, 39.0, 31.0, 43.0, 39.0, 39.0, 25.0, 35.0, 28.0, 24.0, 15.0, 15.0, 15.0, 17.0, 12.0, 8.0, 11.0, 5.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.403060913085938, -22.648710250854492, -21.894359588623047, -21.14000701904297, -20.385656356811523, -19.631305694580078, -18.876953125, -18.122602462768555, -17.36825180053711, -16.613901138305664, -15.859549522399902, -15.10519790649414, -14.350847244262695, -13.59649658203125, -12.842144966125488, -12.087793350219727, -11.333442687988281, -10.579092025756836, -9.824740409851074, -9.070388793945312, -8.316038131713867, -7.561686992645264, -6.80733585357666, -6.052984714508057, -5.298633575439453, -4.54428243637085, -3.789931297302246, -3.0355801582336426, -2.281229019165039, -1.5268778800964355, -0.772526741027832, -0.018175601959228516, 0.736175537109375, 1.4905266761779785, 2.244877815246582, 2.9992289543151855, 3.753580093383789, 4.507931232452393, 5.262282371520996, 6.0166335105896, 6.770984649658203, 7.525335788726807, 8.27968692779541, 9.034038543701172, 9.788389205932617, 10.542739868164062, 11.297091484069824, 12.051443099975586, 12.805793762207031, 13.560144424438477, 14.314496040344238, 15.06884765625, 15.823198318481445, 16.57754898071289, 17.33190155029297, 18.086252212524414, 18.84060287475586, 19.594953536987305, 20.34930419921875, 21.103656768798828, 21.858007431030273, 22.61235809326172, 23.366710662841797, 24.121061325073242, 24.875411987304688]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 3.0, 6.0, 9.0, 9.0, 13.0, 10.0, 7.0, 11.0, 11.0, 22.0, 22.0, 18.0, 23.0, 22.0, 34.0, 17.0, 33.0, 17.0, 41.0, 43.0, 28.0, 37.0, 33.0, 42.0, 45.0, 46.0, 30.0, 37.0, 33.0, 43.0, 27.0, 26.0, 28.0, 25.0, 15.0, 17.0, 18.0, 17.0, 19.0, 13.0, 11.0, 8.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.916015625, -3.801055908203125, -3.68609619140625, -3.571136474609375, -3.4561767578125, -3.341217041015625, -3.22625732421875, -3.111297607421875, -2.996337890625, -2.881378173828125, -2.76641845703125, -2.651458740234375, -2.5364990234375, -2.421539306640625, -2.30657958984375, -2.191619873046875, -2.07666015625, -1.961700439453125, -1.84674072265625, -1.731781005859375, -1.6168212890625, -1.501861572265625, -1.38690185546875, -1.271942138671875, -1.156982421875, -1.042022705078125, -0.92706298828125, -0.812103271484375, -0.6971435546875, -0.582183837890625, -0.46722412109375, -0.352264404296875, -0.2373046875, -0.122344970703125, -0.00738525390625, 0.107574462890625, 0.2225341796875, 0.337493896484375, 0.45245361328125, 0.567413330078125, 0.682373046875, 0.797332763671875, 0.91229248046875, 1.027252197265625, 1.1422119140625, 1.257171630859375, 1.37213134765625, 1.487091064453125, 1.60205078125, 1.717010498046875, 1.83197021484375, 1.946929931640625, 2.0618896484375, 2.176849365234375, 2.29180908203125, 2.406768798828125, 2.521728515625, 2.636688232421875, 2.75164794921875, 2.866607666015625, 2.9815673828125, 3.096527099609375, 3.21148681640625, 3.326446533203125, 3.44140625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 12.0, 19.0, 22.0, 27.0, 50.0, 78.0, 110.0, 128.0, 233.0, 384.0, 553.0, 891.0, 1465.0, 2250.0, 3711.0, 6053.0, 10042.0, 16675.0, 28642.0, 50543.0, 100480.0, 254908.0, 312444.0, 120506.0, 58408.0, 32126.0, 18888.0, 11180.0, 6749.0, 4072.0, 2555.0, 1555.0, 960.0, 627.0, 421.0, 266.0, 190.0, 120.0, 67.0, 45.0, 41.0, 18.0, 10.0, 7.0, 9.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.191162109375, -0.18538856506347656, -0.17961502075195312, -0.1738414764404297, -0.16806793212890625, -0.1622943878173828, -0.15652084350585938, -0.15074729919433594, -0.1449737548828125, -0.13920021057128906, -0.13342666625976562, -0.1276531219482422, -0.12187957763671875, -0.11610603332519531, -0.11033248901367188, -0.10455894470214844, -0.098785400390625, -0.09301185607910156, -0.08723831176757812, -0.08146476745605469, -0.07569122314453125, -0.06991767883300781, -0.06414413452148438, -0.05837059020996094, -0.0525970458984375, -0.04682350158691406, -0.041049957275390625, -0.03527641296386719, -0.02950286865234375, -0.023729324340820312, -0.017955780029296875, -0.012182235717773438, -0.00640869140625, -0.0006351470947265625, 0.005138397216796875, 0.010911941528320312, 0.01668548583984375, 0.022459030151367188, 0.028232574462890625, 0.03400611877441406, 0.0397796630859375, 0.04555320739746094, 0.051326751708984375, 0.05710029602050781, 0.06287384033203125, 0.06864738464355469, 0.07442092895507812, 0.08019447326660156, 0.085968017578125, 0.09174156188964844, 0.09751510620117188, 0.10328865051269531, 0.10906219482421875, 0.11483573913574219, 0.12060928344726562, 0.12638282775878906, 0.1321563720703125, 0.13792991638183594, 0.14370346069335938, 0.1494770050048828, 0.15525054931640625, 0.1610240936279297, 0.16679763793945312, 0.17257118225097656, 0.1783447265625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 11.0, 5.0, 6.0, 7.0, 8.0, 8.0, 19.0, 17.0, 21.0, 21.0, 21.0, 27.0, 24.0, 26.0, 47.0, 36.0, 30.0, 33.0, 36.0, 47.0, 35.0, 1063.0, 44.0, 33.0, 31.0, 40.0, 34.0, 33.0, 18.0, 30.0, 26.0, 24.0, 26.0, 16.0, 18.0, 10.0, 16.0, 8.0, 9.0, 12.0, 6.0, 4.0, 8.0, 5.0, 2.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.24609375, -2.169097900390625, -2.09210205078125, -2.015106201171875, -1.9381103515625, -1.861114501953125, -1.78411865234375, -1.707122802734375, -1.630126953125, -1.553131103515625, -1.47613525390625, -1.399139404296875, -1.3221435546875, -1.245147705078125, -1.16815185546875, -1.091156005859375, -1.01416015625, -0.937164306640625, -0.86016845703125, -0.783172607421875, -0.7061767578125, -0.629180908203125, -0.55218505859375, -0.475189208984375, -0.398193359375, -0.321197509765625, -0.24420166015625, -0.167205810546875, -0.0902099609375, -0.013214111328125, 0.06378173828125, 0.140777587890625, 0.2177734375, 0.294769287109375, 0.37176513671875, 0.448760986328125, 0.5257568359375, 0.602752685546875, 0.67974853515625, 0.756744384765625, 0.833740234375, 0.910736083984375, 0.98773193359375, 1.064727783203125, 1.1417236328125, 1.218719482421875, 1.29571533203125, 1.372711181640625, 1.44970703125, 1.526702880859375, 1.60369873046875, 1.680694580078125, 1.7576904296875, 1.834686279296875, 1.91168212890625, 1.988677978515625, 2.065673828125, 2.142669677734375, 2.21966552734375, 2.296661376953125, 2.3736572265625, 2.450653076171875, 2.52764892578125, 2.604644775390625, 2.681640625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 8.0, 4.0, 10.0, 25.0, 33.0, 30.0, 90.0, 103.0, 152.0, 261.0, 370.0, 593.0, 888.0, 1427.0, 2242.0, 3432.0, 5551.0, 9061.0, 14900.0, 24954.0, 43014.0, 77463.0, 149303.0, 1335984.0, 197014.0, 98480.0, 54061.0, 30428.0, 18156.0, 10774.0, 6794.0, 4184.0, 2617.0, 1706.0, 1067.0, 690.0, 448.0, 298.0, 170.0, 129.0, 71.0, 47.0, 43.0, 15.0, 13.0, 15.0, 9.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07847118377685547, -0.07607078552246094, -0.0736703872680664, -0.07126998901367188, -0.06886959075927734, -0.06646919250488281, -0.06406879425048828, -0.06166839599609375, -0.05926799774169922, -0.05686759948730469, -0.054467201232910156, -0.052066802978515625, -0.049666404724121094, -0.04726600646972656, -0.04486560821533203, -0.0424652099609375, -0.04006481170654297, -0.03766441345214844, -0.035264015197753906, -0.032863616943359375, -0.030463218688964844, -0.028062820434570312, -0.02566242218017578, -0.02326202392578125, -0.02086162567138672, -0.018461227416992188, -0.016060829162597656, -0.013660430908203125, -0.011260032653808594, -0.008859634399414062, -0.006459236145019531, -0.004058837890625, -0.0016584396362304688, 0.0007419586181640625, 0.0031423568725585938, 0.005542755126953125, 0.007943153381347656, 0.010343551635742188, 0.012743949890136719, 0.01514434814453125, 0.01754474639892578, 0.019945144653320312, 0.022345542907714844, 0.024745941162109375, 0.027146339416503906, 0.029546737670898438, 0.03194713592529297, 0.0343475341796875, 0.03674793243408203, 0.03914833068847656, 0.041548728942871094, 0.043949127197265625, 0.046349525451660156, 0.04874992370605469, 0.05115032196044922, 0.05355072021484375, 0.05595111846923828, 0.05835151672363281, 0.060751914978027344, 0.06315231323242188, 0.0655527114868164, 0.06795310974121094, 0.07035350799560547, 0.07275390625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 12.0, 13.0, 13.0, 23.0, 27.0, 33.0, 45.0, 60.0, 65.0, 77.0, 84.0, 103.0, 88.0, 76.0, 63.0, 41.0, 45.0, 26.0, 13.0, 15.0, 16.0, 17.0, 2.0, 10.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8252601623535156e-05, -2.7257949113845825e-05, -2.6263296604156494e-05, -2.5268644094467163e-05, -2.4273991584777832e-05, -2.32793390750885e-05, -2.228468656539917e-05, -2.129003405570984e-05, -2.0295381546020508e-05, -1.9300729036331177e-05, -1.8306076526641846e-05, -1.7311424016952515e-05, -1.6316771507263184e-05, -1.5322118997573853e-05, -1.4327466487884521e-05, -1.333281397819519e-05, -1.233816146850586e-05, -1.1343508958816528e-05, -1.0348856449127197e-05, -9.354203939437866e-06, -8.359551429748535e-06, -7.364898920059204e-06, -6.370246410369873e-06, -5.375593900680542e-06, -4.380941390991211e-06, -3.38628888130188e-06, -2.391636371612549e-06, -1.3969838619232178e-06, -4.023313522338867e-07, 5.923211574554443e-07, 1.5869736671447754e-06, 2.5816261768341064e-06, 3.5762786865234375e-06, 4.5709311962127686e-06, 5.5655837059021e-06, 6.560236215591431e-06, 7.554888725280762e-06, 8.549541234970093e-06, 9.544193744659424e-06, 1.0538846254348755e-05, 1.1533498764038086e-05, 1.2528151273727417e-05, 1.3522803783416748e-05, 1.4517456293106079e-05, 1.551210880279541e-05, 1.650676131248474e-05, 1.7501413822174072e-05, 1.8496066331863403e-05, 1.9490718841552734e-05, 2.0485371351242065e-05, 2.1480023860931396e-05, 2.2474676370620728e-05, 2.346932888031006e-05, 2.446398138999939e-05, 2.545863389968872e-05, 2.6453286409378052e-05, 2.7447938919067383e-05, 2.8442591428756714e-05, 2.9437243938446045e-05, 3.0431896448135376e-05, 3.142654895782471e-05, 3.242120146751404e-05, 3.341585397720337e-05, 3.44105064868927e-05, 3.540515899658203e-05]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 4.0, 5.0, 6.0, 12.0, 18.0, 17.0, 15.0, 22.0, 55.0, 60.0, 93.0, 187.0, 472.0, 4766.0, 1035222.0, 6490.0, 509.0, 206.0, 123.0, 79.0, 32.0, 45.0, 29.0, 17.0, 17.0, 15.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0007753372192382812, -0.0007535144686698914, -0.0007316917181015015, -0.0007098689675331116, -0.0006880462169647217, -0.0006662234663963318, -0.0006444007158279419, -0.000622577965259552, -0.0006007552146911621, -0.0005789324641227722, -0.0005571097135543823, -0.0005352869629859924, -0.0005134642124176025, -0.0004916414618492126, -0.00046981871128082275, -0.00044799596071243286, -0.00042617321014404297, -0.0004043504595756531, -0.0003825277090072632, -0.0003607049584388733, -0.0003388822078704834, -0.0003170594573020935, -0.0002952367067337036, -0.0002734139561653137, -0.00025159120559692383, -0.00022976845502853394, -0.00020794570446014404, -0.00018612295389175415, -0.00016430020332336426, -0.00014247745275497437, -0.00012065470218658447, -9.883195161819458e-05, -7.700920104980469e-05, -5.5186450481414795e-05, -3.33636999130249e-05, -1.154094934463501e-05, 1.0281801223754883e-05, 3.2104551792144775e-05, 5.392730236053467e-05, 7.575005292892456e-05, 9.757280349731445e-05, 0.00011939555406570435, 0.00014121830463409424, 0.00016304105520248413, 0.00018486380577087402, 0.00020668655633926392, 0.0002285093069076538, 0.0002503320574760437, 0.0002721548080444336, 0.0002939775586128235, 0.0003158003091812134, 0.00033762305974960327, 0.00035944581031799316, 0.00038126856088638306, 0.00040309131145477295, 0.00042491406202316284, 0.00044673681259155273, 0.0004685595631599426, 0.0004903823137283325, 0.0005122050642967224, 0.0005340278148651123, 0.0005558505654335022, 0.0005776733160018921, 0.000599496066570282, 0.0006213188171386719]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 409.0, 604.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00047305430052801967, -0.00046476468560285866, -0.0004564750415738672, -0.0004481854266487062, -0.00043989578261971474, -0.00043160616769455373, -0.00042331652366556227, -0.00041502690874040127, -0.0004067372647114098, -0.0003984476497862488, -0.00039015800575725734, -0.00038186839083209634, -0.0003735787468031049, -0.0003652891318779439, -0.0003569994878489524, -0.0003487098729237914, -0.00034042022889479995, -0.00033213061396963894, -0.0003238409699406475, -0.0003155513550154865, -0.000307261710986495, -0.000298972096061334, -0.00029068245203234255, -0.00028239283710718155, -0.00027410322218202055, -0.00026581360725685954, -0.0002575239632278681, -0.0002492343483027071, -0.00024094470427371562, -0.00023265507479663938, -0.00022436544531956315, -0.00021607583039440215, -0.00020778618636541069, -0.00019949655688833445, -0.00019120692741125822, -0.000182917297934182, -0.00017462766845710576, -0.00016633803898002952, -0.0001580484095029533, -0.0001497587945777923, -0.00014146916510071605, -0.00013317953562363982, -0.0001248899061465636, -0.00011660027666948736, -0.00010831064719241112, -0.00010002101771533489, -9.173139551421627e-05, -8.344176603714004e-05, -7.515213656006381e-05, -6.686250708298758e-05, -5.8572877605911344e-05, -5.028325176681392e-05, -4.1993622289737687e-05, -3.3703992812661454e-05, -2.541436697356403e-05, -1.7124737496487796e-05, -8.835108019411564e-06, -5.454794518300332e-07, 7.744149115751497e-06, 1.6033776773838326e-05, 2.432340625091456e-05, 3.261303572799079e-05, 4.0902661567088217e-05, 4.919229104416445e-05, 5.748192052124068e-05]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 15.0, 6.0, 7.0, 25.0, 42.0, 48.0, 49.0, 47.0, 58.0, 64.0, 70.0, 62.0, 60.0, 55.0, 61.0, 67.0, 46.0, 67.0, 31.0, 34.0, 22.0, 24.0, 14.0, 11.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3484230041503906e-05, -2.2681429982185364e-05, -2.187862992286682e-05, -2.107582986354828e-05, -2.0273029804229736e-05, -1.9470229744911194e-05, -1.866742968559265e-05, -1.786462962627411e-05, -1.7061829566955566e-05, -1.6259029507637024e-05, -1.545622944831848e-05, -1.4653429388999939e-05, -1.3850629329681396e-05, -1.3047829270362854e-05, -1.2245029211044312e-05, -1.1442229151725769e-05, -1.0639429092407227e-05, -9.836629033088684e-06, -9.033828973770142e-06, -8.231028914451599e-06, -7.428228855133057e-06, -6.625428795814514e-06, -5.822628736495972e-06, -5.019828677177429e-06, -4.217028617858887e-06, -3.4142285585403442e-06, -2.6114284992218018e-06, -1.8086284399032593e-06, -1.0058283805847168e-06, -2.0302832126617432e-07, 5.997717380523682e-07, 1.4025717973709106e-06, 2.205371856689453e-06, 3.0081719160079956e-06, 3.810971975326538e-06, 4.6137720346450806e-06, 5.416572093963623e-06, 6.2193721532821655e-06, 7.022172212600708e-06, 7.82497227191925e-06, 8.627772331237793e-06, 9.430572390556335e-06, 1.0233372449874878e-05, 1.103617250919342e-05, 1.1838972568511963e-05, 1.2641772627830505e-05, 1.3444572687149048e-05, 1.424737274646759e-05, 1.5050172805786133e-05, 1.5852972865104675e-05, 1.6655772924423218e-05, 1.745857298374176e-05, 1.8261373043060303e-05, 1.9064173102378845e-05, 1.9866973161697388e-05, 2.066977322101593e-05, 2.1472573280334473e-05, 2.2275373339653015e-05, 2.3078173398971558e-05, 2.38809734582901e-05, 2.4683773517608643e-05, 2.5486573576927185e-05, 2.6289373636245728e-05, 2.709217369556427e-05, 2.7894973754882812e-05]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 3.0, 6.0, 9.0, 9.0, 13.0, 10.0, 7.0, 11.0, 11.0, 22.0, 22.0, 18.0, 23.0, 22.0, 34.0, 17.0, 33.0, 17.0, 41.0, 43.0, 28.0, 37.0, 33.0, 42.0, 45.0, 46.0, 30.0, 37.0, 33.0, 43.0, 27.0, 26.0, 28.0, 25.0, 15.0, 17.0, 18.0, 17.0, 19.0, 13.0, 11.0, 8.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.916015625, -3.801055908203125, -3.68609619140625, -3.571136474609375, -3.4561767578125, -3.341217041015625, -3.22625732421875, -3.111297607421875, -2.996337890625, -2.881378173828125, -2.76641845703125, -2.651458740234375, -2.5364990234375, -2.421539306640625, -2.30657958984375, -2.191619873046875, -2.07666015625, -1.961700439453125, -1.84674072265625, -1.731781005859375, -1.6168212890625, -1.501861572265625, -1.38690185546875, -1.271942138671875, -1.156982421875, -1.042022705078125, -0.92706298828125, -0.812103271484375, -0.6971435546875, -0.582183837890625, -0.46722412109375, -0.352264404296875, -0.2373046875, -0.122344970703125, -0.00738525390625, 0.107574462890625, 0.2225341796875, 0.337493896484375, 0.45245361328125, 0.567413330078125, 0.682373046875, 0.797332763671875, 0.91229248046875, 1.027252197265625, 1.1422119140625, 1.257171630859375, 1.37213134765625, 1.487091064453125, 1.60205078125, 1.717010498046875, 1.83197021484375, 1.946929931640625, 2.0618896484375, 2.176849365234375, 2.29180908203125, 2.406768798828125, 2.521728515625, 2.636688232421875, 2.75164794921875, 2.866607666015625, 2.9815673828125, 3.096527099609375, 3.21148681640625, 3.326446533203125, 3.44140625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 6.0, 7.0, 14.0, 17.0, 22.0, 32.0, 33.0, 33.0, 39.0, 51.0, 65.0, 102.0, 132.0, 187.0, 331.0, 544.0, 990.0, 1740.0, 3293.0, 5855.0, 10828.0, 20664.0, 39151.0, 93361.0, 585841.0, 175693.0, 52090.0, 26194.0, 14089.0, 7534.0, 4198.0, 2261.0, 1193.0, 659.0, 418.0, 246.0, 145.0, 119.0, 82.0, 62.0, 50.0, 45.0, 35.0, 26.0, 19.0, 15.0, 12.0, 9.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-7.02734375, -6.81878662109375, -6.6102294921875, -6.40167236328125, -6.193115234375, -5.98455810546875, -5.7760009765625, -5.56744384765625, -5.35888671875, -5.15032958984375, -4.9417724609375, -4.73321533203125, -4.524658203125, -4.31610107421875, -4.1075439453125, -3.89898681640625, -3.6904296875, -3.48187255859375, -3.2733154296875, -3.06475830078125, -2.856201171875, -2.64764404296875, -2.4390869140625, -2.23052978515625, -2.02197265625, -1.81341552734375, -1.6048583984375, -1.39630126953125, -1.187744140625, -0.97918701171875, -0.7706298828125, -0.56207275390625, -0.353515625, -0.14495849609375, 0.0635986328125, 0.27215576171875, 0.480712890625, 0.68927001953125, 0.8978271484375, 1.10638427734375, 1.31494140625, 1.52349853515625, 1.7320556640625, 1.94061279296875, 2.149169921875, 2.35772705078125, 2.5662841796875, 2.77484130859375, 2.9833984375, 3.19195556640625, 3.4005126953125, 3.60906982421875, 3.817626953125, 4.02618408203125, 4.2347412109375, 4.44329833984375, 4.65185546875, 4.86041259765625, 5.0689697265625, 5.27752685546875, 5.486083984375, 5.69464111328125, 5.9031982421875, 6.11175537109375, 6.3203125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 4.0, 9.0, 8.0, 12.0, 8.0, 13.0, 16.0, 14.0, 22.0, 28.0, 32.0, 28.0, 31.0, 44.0, 43.0, 48.0, 57.0, 76.0, 96.0, 1518.0, 346.0, 71.0, 87.0, 67.0, 53.0, 49.0, 46.0, 37.0, 29.0, 22.0, 23.0, 16.0, 20.0, 14.0, 11.0, 6.0, 10.0, 9.0, 9.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.6640625, -12.301513671875, -11.93896484375, -11.576416015625, -11.2138671875, -10.851318359375, -10.48876953125, -10.126220703125, -9.763671875, -9.401123046875, -9.03857421875, -8.676025390625, -8.3134765625, -7.950927734375, -7.58837890625, -7.225830078125, -6.86328125, -6.500732421875, -6.13818359375, -5.775634765625, -5.4130859375, -5.050537109375, -4.68798828125, -4.325439453125, -3.962890625, -3.600341796875, -3.23779296875, -2.875244140625, -2.5126953125, -2.150146484375, -1.78759765625, -1.425048828125, -1.0625, -0.699951171875, -0.33740234375, 0.025146484375, 0.3876953125, 0.750244140625, 1.11279296875, 1.475341796875, 1.837890625, 2.200439453125, 2.56298828125, 2.925537109375, 3.2880859375, 3.650634765625, 4.01318359375, 4.375732421875, 4.73828125, 5.100830078125, 5.46337890625, 5.825927734375, 6.1884765625, 6.551025390625, 6.91357421875, 7.276123046875, 7.638671875, 8.001220703125, 8.36376953125, 8.726318359375, 9.0888671875, 9.451416015625, 9.81396484375, 10.176513671875, 10.5390625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 7.0, 8.0, 9.0, 12.0, 11.0, 17.0, 22.0, 32.0, 32.0, 38.0, 58.0, 91.0, 131.0, 182.0, 300.0, 681.0, 2527.0, 15621.0, 151596.0, 2805451.0, 149781.0, 14996.0, 2435.0, 676.0, 306.0, 188.0, 107.0, 78.0, 74.0, 46.0, 40.0, 28.0, 22.0, 19.0, 21.0, 15.0, 8.0, 6.0, 8.0, 4.0, 7.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.473876953125, -16.83837890625, -16.202880859375, -15.5673828125, -14.931884765625, -14.29638671875, -13.660888671875, -13.025390625, -12.389892578125, -11.75439453125, -11.118896484375, -10.4833984375, -9.847900390625, -9.21240234375, -8.576904296875, -7.94140625, -7.305908203125, -6.67041015625, -6.034912109375, -5.3994140625, -4.763916015625, -4.12841796875, -3.492919921875, -2.857421875, -2.221923828125, -1.58642578125, -0.950927734375, -0.3154296875, 0.320068359375, 0.95556640625, 1.591064453125, 2.2265625, 2.862060546875, 3.49755859375, 4.133056640625, 4.7685546875, 5.404052734375, 6.03955078125, 6.675048828125, 7.310546875, 7.946044921875, 8.58154296875, 9.217041015625, 9.8525390625, 10.488037109375, 11.12353515625, 11.759033203125, 12.39453125, 13.030029296875, 13.66552734375, 14.301025390625, 14.9365234375, 15.572021484375, 16.20751953125, 16.843017578125, 17.478515625, 18.114013671875, 18.74951171875, 19.385009765625, 20.0205078125, 20.656005859375, 21.29150390625, 21.927001953125, 22.5625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 10.0, 85.0, 218.0, 374.0, 240.0, 73.0, 14.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.12257766723633, -30.991851806640625, -28.861127853393555, -26.730403900146484, -24.59967803955078, -22.468952178955078, -20.338228225708008, -18.207504272460938, -16.076778411865234, -13.946053504943848, -11.815328598022461, -9.684603691101074, -7.5538787841796875, -5.423153877258301, -3.292428970336914, -1.1617040634155273, 0.9690208435058594, 3.099745750427246, 5.230470657348633, 7.3611955642700195, 9.491920471191406, 11.622645378112793, 13.75337028503418, 15.884095191955566, 18.014820098876953, 20.145545959472656, 22.276269912719727, 24.406993865966797, 26.5377197265625, 28.668445587158203, 30.799169540405273, 32.929893493652344, 35.06061553955078, 37.191341400146484, 39.32206726074219, 41.452789306640625, 43.58351516723633, 45.71424102783203, 47.84496307373047, 49.97568893432617, 52.106414794921875, 54.23714065551758, 56.36786651611328, 58.49858856201172, 60.62931442260742, 62.760040283203125, 64.89076232910156, 67.02149200439453, 69.15221405029297, 71.2829360961914, 73.41366577148438, 75.54438781738281, 77.67510986328125, 79.80583953857422, 81.93656158447266, 84.06729125976562, 86.19801330566406, 88.3287353515625, 90.45946502685547, 92.5901870727539, 94.72091674804688, 96.85163879394531, 98.98236083984375, 101.11309051513672, 103.24381256103516]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 2.0, 0.0, 4.0, 8.0, 8.0, 11.0, 11.0, 17.0, 24.0, 17.0, 17.0, 30.0, 25.0, 28.0, 32.0, 31.0, 48.0, 38.0, 34.0, 51.0, 47.0, 49.0, 37.0, 41.0, 44.0, 39.0, 36.0, 38.0, 27.0, 26.0, 43.0, 26.0, 24.0, 14.0, 13.0, 11.0, 13.0, 12.0, 9.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.36260986328125, -30.351551055908203, -29.34049415588379, -28.329437255859375, -27.318378448486328, -26.30731964111328, -25.296262741088867, -24.285205841064453, -23.274147033691406, -22.26308822631836, -21.252031326293945, -20.24097442626953, -19.229915618896484, -18.218856811523438, -17.207799911499023, -16.19674301147461, -15.185684204101562, -14.174626350402832, -13.163568496704102, -12.152510643005371, -11.14145278930664, -10.13039493560791, -9.11933708190918, -8.10827922821045, -7.097221374511719, -6.086163520812988, -5.075105667114258, -4.064047813415527, -3.052989959716797, -2.0419321060180664, -1.030874252319336, -0.01981639862060547, 0.991241455078125, 2.0022993087768555, 3.013357162475586, 4.024415016174316, 5.035472869873047, 6.046530723571777, 7.057588577270508, 8.068646430969238, 9.079704284667969, 10.0907621383667, 11.10181999206543, 12.11287784576416, 13.12393569946289, 14.134993553161621, 15.146051406860352, 16.157108306884766, 17.168167114257812, 18.17922592163086, 19.190282821655273, 20.201339721679688, 21.212398529052734, 22.22345733642578, 23.234514236450195, 24.24557113647461, 25.256629943847656, 26.267688751220703, 27.278745651245117, 28.28980255126953, 29.300861358642578, 30.311920166015625, 31.32297706604004, 32.33403396606445, 33.3450927734375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 8.0, 7.0, 3.0, 4.0, 10.0, 10.0, 13.0, 10.0, 17.0, 23.0, 21.0, 17.0, 35.0, 29.0, 24.0, 27.0, 31.0, 28.0, 39.0, 45.0, 32.0, 41.0, 50.0, 51.0, 35.0, 41.0, 40.0, 52.0, 26.0, 37.0, 35.0, 17.0, 27.0, 16.0, 21.0, 19.0, 15.0, 12.0, 15.0, 5.0, 5.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.6953125, -4.561920166015625, -4.42852783203125, -4.295135498046875, -4.1617431640625, -4.028350830078125, -3.89495849609375, -3.761566162109375, -3.628173828125, -3.494781494140625, -3.36138916015625, -3.227996826171875, -3.0946044921875, -2.961212158203125, -2.82781982421875, -2.694427490234375, -2.56103515625, -2.427642822265625, -2.29425048828125, -2.160858154296875, -2.0274658203125, -1.894073486328125, -1.76068115234375, -1.627288818359375, -1.493896484375, -1.360504150390625, -1.22711181640625, -1.093719482421875, -0.9603271484375, -0.826934814453125, -0.69354248046875, -0.560150146484375, -0.4267578125, -0.293365478515625, -0.15997314453125, -0.026580810546875, 0.1068115234375, 0.240203857421875, 0.37359619140625, 0.506988525390625, 0.640380859375, 0.773773193359375, 0.90716552734375, 1.040557861328125, 1.1739501953125, 1.307342529296875, 1.44073486328125, 1.574127197265625, 1.70751953125, 1.840911865234375, 1.97430419921875, 2.107696533203125, 2.2410888671875, 2.374481201171875, 2.50787353515625, 2.641265869140625, 2.774658203125, 2.908050537109375, 3.04144287109375, 3.174835205078125, 3.3082275390625, 3.441619873046875, 3.57501220703125, 3.708404541015625, 3.841796875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 3.0, 7.0, 8.0, 5.0, 12.0, 22.0, 23.0, 49.0, 53.0, 94.0, 115.0, 193.0, 288.0, 492.0, 761.0, 1318.0, 2283.0, 4228.0, 8324.0, 17859.0, 42287.0, 115570.0, 403454.0, 1514316.0, 1490133.0, 399517.0, 114794.0, 41848.0, 17800.0, 8394.0, 4257.0, 2259.0, 1329.0, 784.0, 487.0, 315.0, 189.0, 145.0, 70.0, 55.0, 43.0, 26.0, 10.0, 19.0, 13.0, 12.0, 7.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.93359375, -5.73577880859375, -5.5379638671875, -5.34014892578125, -5.142333984375, -4.94451904296875, -4.7467041015625, -4.54888916015625, -4.35107421875, -4.15325927734375, -3.9554443359375, -3.75762939453125, -3.559814453125, -3.36199951171875, -3.1641845703125, -2.96636962890625, -2.7685546875, -2.57073974609375, -2.3729248046875, -2.17510986328125, -1.977294921875, -1.77947998046875, -1.5816650390625, -1.38385009765625, -1.18603515625, -0.98822021484375, -0.7904052734375, -0.59259033203125, -0.394775390625, -0.19696044921875, 0.0008544921875, 0.19866943359375, 0.396484375, 0.59429931640625, 0.7921142578125, 0.98992919921875, 1.187744140625, 1.38555908203125, 1.5833740234375, 1.78118896484375, 1.97900390625, 2.17681884765625, 2.3746337890625, 2.57244873046875, 2.770263671875, 2.96807861328125, 3.1658935546875, 3.36370849609375, 3.5615234375, 3.75933837890625, 3.9571533203125, 4.15496826171875, 4.352783203125, 4.55059814453125, 4.7484130859375, 4.94622802734375, 5.14404296875, 5.34185791015625, 5.5396728515625, 5.73748779296875, 5.935302734375, 6.13311767578125, 6.3309326171875, 6.52874755859375, 6.7265625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 9.0, 5.0, 6.0, 24.0, 26.0, 42.0, 57.0, 78.0, 100.0, 123.0, 200.0, 274.0, 341.0, 483.0, 520.0, 460.0, 356.0, 251.0, 204.0, 118.0, 110.0, 84.0, 64.0, 39.0, 28.0, 20.0, 16.0, 6.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.421875, -6.180419921875, -5.93896484375, -5.697509765625, -5.4560546875, -5.214599609375, -4.97314453125, -4.731689453125, -4.490234375, -4.248779296875, -4.00732421875, -3.765869140625, -3.5244140625, -3.282958984375, -3.04150390625, -2.800048828125, -2.55859375, -2.317138671875, -2.07568359375, -1.834228515625, -1.5927734375, -1.351318359375, -1.10986328125, -0.868408203125, -0.626953125, -0.385498046875, -0.14404296875, 0.097412109375, 0.3388671875, 0.580322265625, 0.82177734375, 1.063232421875, 1.3046875, 1.546142578125, 1.78759765625, 2.029052734375, 2.2705078125, 2.511962890625, 2.75341796875, 2.994873046875, 3.236328125, 3.477783203125, 3.71923828125, 3.960693359375, 4.2021484375, 4.443603515625, 4.68505859375, 4.926513671875, 5.16796875, 5.409423828125, 5.65087890625, 5.892333984375, 6.1337890625, 6.375244140625, 6.61669921875, 6.858154296875, 7.099609375, 7.341064453125, 7.58251953125, 7.823974609375, 8.0654296875, 8.306884765625, 8.54833984375, 8.789794921875, 9.03125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 2.0, 11.0, 8.0, 34.0, 30.0, 57.0, 94.0, 124.0, 193.0, 367.0, 964.0, 4019.0, 32410.0, 646672.0, 3337664.0, 155816.0, 12293.0, 2099.0, 669.0, 268.0, 148.0, 115.0, 83.0, 42.0, 27.0, 20.0, 12.0, 6.0, 11.0, 9.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.828125, -26.108642578125, -25.38916015625, -24.669677734375, -23.9501953125, -23.230712890625, -22.51123046875, -21.791748046875, -21.072265625, -20.352783203125, -19.63330078125, -18.913818359375, -18.1943359375, -17.474853515625, -16.75537109375, -16.035888671875, -15.31640625, -14.596923828125, -13.87744140625, -13.157958984375, -12.4384765625, -11.718994140625, -10.99951171875, -10.280029296875, -9.560546875, -8.841064453125, -8.12158203125, -7.402099609375, -6.6826171875, -5.963134765625, -5.24365234375, -4.524169921875, -3.8046875, -3.085205078125, -2.36572265625, -1.646240234375, -0.9267578125, -0.207275390625, 0.51220703125, 1.231689453125, 1.951171875, 2.670654296875, 3.39013671875, 4.109619140625, 4.8291015625, 5.548583984375, 6.26806640625, 6.987548828125, 7.70703125, 8.426513671875, 9.14599609375, 9.865478515625, 10.5849609375, 11.304443359375, 12.02392578125, 12.743408203125, 13.462890625, 14.182373046875, 14.90185546875, 15.621337890625, 16.3408203125, 17.060302734375, 17.77978515625, 18.499267578125, 19.21875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 14.0, 35.0, 72.0, 167.0, 230.0, 197.0, 157.0, 90.0, 23.0, 15.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.9752311706543, -59.826393127441406, -57.67755889892578, -55.52872085571289, -53.3798828125, -51.231048583984375, -49.082210540771484, -46.933372497558594, -44.78453826904297, -42.63570022583008, -40.48686599731445, -38.33802795410156, -36.18919372558594, -34.04035568237305, -31.891517639160156, -29.7426815032959, -27.59384536743164, -25.445009231567383, -23.296173095703125, -21.147335052490234, -18.998498916625977, -16.84966278076172, -14.700825691223145, -12.55198860168457, -10.403152465820312, -8.254316329956055, -6.1054792404174805, -3.9566426277160645, -1.8078060150146484, 0.3410301208496094, 2.4898672103881836, 4.638704299926758, 6.787544250488281, 8.936380386352539, 11.085217475891113, 13.234054565429688, 15.382890701293945, 17.531726837158203, 19.680564880371094, 21.82940101623535, 23.97823715209961, 26.127073287963867, 28.275909423828125, 30.424747467041016, 32.573585510253906, 34.72241973876953, 36.87125778198242, 39.02009582519531, 41.16893005371094, 43.31776809692383, 45.46660232543945, 47.615440368652344, 49.76427459716797, 51.91311264038086, 54.06195068359375, 56.210784912109375, 58.359622955322266, 60.508460998535156, 62.65729522705078, 64.8061294555664, 66.95497131347656, 69.10380554199219, 71.25263977050781, 73.40148162841797, 75.5503158569336]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 4.0, 5.0, 5.0, 4.0, 7.0, 4.0, 11.0, 6.0, 18.0, 15.0, 19.0, 34.0, 27.0, 24.0, 28.0, 39.0, 28.0, 33.0, 26.0, 48.0, 43.0, 31.0, 40.0, 48.0, 45.0, 54.0, 42.0, 34.0, 33.0, 43.0, 25.0, 33.0, 28.0, 23.0, 20.0, 14.0, 7.0, 18.0, 10.0, 8.0, 8.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.988861083984375, -23.199922561645508, -22.410982131958008, -21.62204360961914, -20.83310317993164, -20.044164657592773, -19.255226135253906, -18.466285705566406, -17.67734718322754, -16.888408660888672, -16.099468231201172, -15.310529708862305, -14.521590232849121, -13.732650756835938, -12.943711280822754, -12.15477180480957, -11.365832328796387, -10.576892852783203, -9.78795337677002, -8.999013900756836, -8.210075378417969, -7.421135902404785, -6.632196426391602, -5.843257427215576, -5.054317951202393, -4.265378475189209, -3.4764394760131836, -2.6875, -1.8985607624053955, -1.109621524810791, -0.3206820487976074, 0.46825695037841797, 1.2571964263916016, 2.046135663986206, 2.8350749015808105, 3.624014377593994, 4.4129533767700195, 5.201892852783203, 5.990832328796387, 6.779771327972412, 7.568710803985596, 8.357649803161621, 9.146589279174805, 9.935528755187988, 10.724468231201172, 11.513406753540039, 12.302347183227539, 13.091285705566406, 13.88022518157959, 14.669164657592773, 15.458104133605957, 16.24704360961914, 17.035982131958008, 17.824920654296875, 18.613861083984375, 19.402799606323242, 20.191740036010742, 20.98067855834961, 21.76961898803711, 22.558557510375977, 23.347497940063477, 24.136436462402344, 24.925376892089844, 25.71431541442871, 26.503253936767578]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 2.0, 9.0, 8.0, 5.0, 17.0, 19.0, 16.0, 21.0, 24.0, 23.0, 25.0, 20.0, 31.0, 32.0, 28.0, 33.0, 38.0, 34.0, 48.0, 35.0, 35.0, 50.0, 44.0, 40.0, 27.0, 38.0, 30.0, 41.0, 27.0, 36.0, 26.0, 25.0, 16.0, 21.0, 16.0, 12.0, 8.0, 5.0, 4.0, 4.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.296875, -4.1630859375, -4.029296875, -3.8955078125, -3.76171875, -3.6279296875, -3.494140625, -3.3603515625, -3.2265625, -3.0927734375, -2.958984375, -2.8251953125, -2.69140625, -2.5576171875, -2.423828125, -2.2900390625, -2.15625, -2.0224609375, -1.888671875, -1.7548828125, -1.62109375, -1.4873046875, -1.353515625, -1.2197265625, -1.0859375, -0.9521484375, -0.818359375, -0.6845703125, -0.55078125, -0.4169921875, -0.283203125, -0.1494140625, -0.015625, 0.1181640625, 0.251953125, 0.3857421875, 0.51953125, 0.6533203125, 0.787109375, 0.9208984375, 1.0546875, 1.1884765625, 1.322265625, 1.4560546875, 1.58984375, 1.7236328125, 1.857421875, 1.9912109375, 2.125, 2.2587890625, 2.392578125, 2.5263671875, 2.66015625, 2.7939453125, 2.927734375, 3.0615234375, 3.1953125, 3.3291015625, 3.462890625, 3.5966796875, 3.73046875, 3.8642578125, 3.998046875, 4.1318359375, 4.265625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 5.0, 9.0, 12.0, 20.0, 32.0, 41.0, 71.0, 89.0, 135.0, 222.0, 334.0, 525.0, 827.0, 1420.0, 2373.0, 4119.0, 6931.0, 12110.0, 22921.0, 45522.0, 99114.0, 283100.0, 345715.0, 114147.0, 51069.0, 25555.0, 13490.0, 7593.0, 4383.0, 2563.0, 1458.0, 960.0, 612.0, 384.0, 231.0, 151.0, 105.0, 66.0, 36.0, 34.0, 16.0, 18.0, 8.0, 6.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21435546875, -0.20745849609375, -0.2005615234375, -0.19366455078125, -0.186767578125, -0.17987060546875, -0.1729736328125, -0.16607666015625, -0.1591796875, -0.15228271484375, -0.1453857421875, -0.13848876953125, -0.131591796875, -0.12469482421875, -0.1177978515625, -0.11090087890625, -0.10400390625, -0.09710693359375, -0.0902099609375, -0.08331298828125, -0.076416015625, -0.06951904296875, -0.0626220703125, -0.05572509765625, -0.048828125, -0.04193115234375, -0.0350341796875, -0.02813720703125, -0.021240234375, -0.01434326171875, -0.0074462890625, -0.00054931640625, 0.00634765625, 0.01324462890625, 0.0201416015625, 0.02703857421875, 0.033935546875, 0.04083251953125, 0.0477294921875, 0.05462646484375, 0.0615234375, 0.06842041015625, 0.0753173828125, 0.08221435546875, 0.089111328125, 0.09600830078125, 0.1029052734375, 0.10980224609375, 0.11669921875, 0.12359619140625, 0.1304931640625, 0.13739013671875, 0.144287109375, 0.15118408203125, 0.1580810546875, 0.16497802734375, 0.171875, 0.17877197265625, 0.1856689453125, 0.19256591796875, 0.199462890625, 0.20635986328125, 0.2132568359375, 0.22015380859375, 0.22705078125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 4.0, 9.0, 11.0, 11.0, 10.0, 17.0, 15.0, 18.0, 23.0, 31.0, 24.0, 33.0, 38.0, 36.0, 39.0, 39.0, 32.0, 38.0, 41.0, 1071.0, 42.0, 56.0, 44.0, 31.0, 42.0, 41.0, 34.0, 24.0, 25.0, 21.0, 18.0, 18.0, 17.0, 16.0, 12.0, 7.0, 6.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.99609375, -2.900146484375, -2.80419921875, -2.708251953125, -2.6123046875, -2.516357421875, -2.42041015625, -2.324462890625, -2.228515625, -2.132568359375, -2.03662109375, -1.940673828125, -1.8447265625, -1.748779296875, -1.65283203125, -1.556884765625, -1.4609375, -1.364990234375, -1.26904296875, -1.173095703125, -1.0771484375, -0.981201171875, -0.88525390625, -0.789306640625, -0.693359375, -0.597412109375, -0.50146484375, -0.405517578125, -0.3095703125, -0.213623046875, -0.11767578125, -0.021728515625, 0.07421875, 0.170166015625, 0.26611328125, 0.362060546875, 0.4580078125, 0.553955078125, 0.64990234375, 0.745849609375, 0.841796875, 0.937744140625, 1.03369140625, 1.129638671875, 1.2255859375, 1.321533203125, 1.41748046875, 1.513427734375, 1.609375, 1.705322265625, 1.80126953125, 1.897216796875, 1.9931640625, 2.089111328125, 2.18505859375, 2.281005859375, 2.376953125, 2.472900390625, 2.56884765625, 2.664794921875, 2.7607421875, 2.856689453125, 2.95263671875, 3.048583984375, 3.14453125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 8.0, 8.0, 12.0, 19.0, 25.0, 48.0, 62.0, 109.0, 168.0, 242.0, 362.0, 605.0, 938.0, 1445.0, 2115.0, 3354.0, 5392.0, 8607.0, 14067.0, 23072.0, 39499.0, 70887.0, 132072.0, 1322932.0, 219788.0, 107312.0, 58615.0, 33291.0, 19837.0, 11929.0, 7361.0, 4694.0, 2899.0, 1885.0, 1216.0, 799.0, 482.0, 351.0, 210.0, 151.0, 88.0, 62.0, 33.0, 36.0, 16.0, 14.0, 10.0, 4.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0771484375, -0.0746469497680664, -0.07214546203613281, -0.06964397430419922, -0.06714248657226562, -0.06464099884033203, -0.06213951110839844, -0.059638023376464844, -0.05713653564453125, -0.054635047912597656, -0.05213356018066406, -0.04963207244873047, -0.047130584716796875, -0.04462909698486328, -0.04212760925292969, -0.039626121520996094, -0.0371246337890625, -0.034623146057128906, -0.03212165832519531, -0.02962017059326172, -0.027118682861328125, -0.02461719512939453, -0.022115707397460938, -0.019614219665527344, -0.01711273193359375, -0.014611244201660156, -0.012109756469726562, -0.009608268737792969, -0.007106781005859375, -0.004605293273925781, -0.0021038055419921875, 0.00039768218994140625, 0.002899169921875, 0.005400657653808594, 0.007902145385742188, 0.010403633117675781, 0.012905120849609375, 0.015406608581542969, 0.017908096313476562, 0.020409584045410156, 0.02291107177734375, 0.025412559509277344, 0.027914047241210938, 0.03041553497314453, 0.032917022705078125, 0.03541851043701172, 0.03791999816894531, 0.040421485900878906, 0.0429229736328125, 0.045424461364746094, 0.04792594909667969, 0.05042743682861328, 0.052928924560546875, 0.05543041229248047, 0.05793190002441406, 0.060433387756347656, 0.06293487548828125, 0.06543636322021484, 0.06793785095214844, 0.07043933868408203, 0.07294082641601562, 0.07544231414794922, 0.07794380187988281, 0.0804452896118164, 0.08294677734375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 6.0, 2.0, 4.0, 4.0, 4.0, 8.0, 10.0, 13.0, 11.0, 15.0, 25.0, 11.0, 24.0, 31.0, 36.0, 49.0, 47.0, 60.0, 78.0, 70.0, 73.0, 95.0, 57.0, 56.0, 44.0, 21.0, 34.0, 20.0, 19.0, 15.0, 17.0, 9.0, 4.0, 8.0, 6.0, 2.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6464462280273438e-05, -2.561137080192566e-05, -2.475827932357788e-05, -2.3905187845230103e-05, -2.3052096366882324e-05, -2.2199004888534546e-05, -2.1345913410186768e-05, -2.049282193183899e-05, -1.963973045349121e-05, -1.8786638975143433e-05, -1.7933547496795654e-05, -1.7080456018447876e-05, -1.6227364540100098e-05, -1.537427306175232e-05, -1.4521181583404541e-05, -1.3668090105056763e-05, -1.2814998626708984e-05, -1.1961907148361206e-05, -1.1108815670013428e-05, -1.025572419166565e-05, -9.402632713317871e-06, -8.549541234970093e-06, -7.696449756622314e-06, -6.843358278274536e-06, -5.990266799926758e-06, -5.1371753215789795e-06, -4.284083843231201e-06, -3.430992364883423e-06, -2.5779008865356445e-06, -1.7248094081878662e-06, -8.717179298400879e-07, -1.862645149230957e-08, 8.344650268554688e-07, 1.687556505203247e-06, 2.5406479835510254e-06, 3.3937394618988037e-06, 4.246830940246582e-06, 5.09992241859436e-06, 5.953013896942139e-06, 6.806105375289917e-06, 7.659196853637695e-06, 8.512288331985474e-06, 9.365379810333252e-06, 1.021847128868103e-05, 1.1071562767028809e-05, 1.1924654245376587e-05, 1.2777745723724365e-05, 1.3630837202072144e-05, 1.4483928680419922e-05, 1.53370201587677e-05, 1.619011163711548e-05, 1.7043203115463257e-05, 1.7896294593811035e-05, 1.8749386072158813e-05, 1.9602477550506592e-05, 2.045556902885437e-05, 2.130866050720215e-05, 2.2161751985549927e-05, 2.3014843463897705e-05, 2.3867934942245483e-05, 2.4721026420593262e-05, 2.557411789894104e-05, 2.642720937728882e-05, 2.7280300855636597e-05, 2.8133392333984375e-05]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 6.0, 1.0, 7.0, 2.0, 9.0, 6.0, 12.0, 13.0, 16.0, 25.0, 28.0, 47.0, 44.0, 87.0, 145.0, 255.0, 651.0, 25831.0, 1017287.0, 2949.0, 442.0, 213.0, 126.0, 88.0, 63.0, 36.0, 28.0, 22.0, 21.0, 23.0, 8.0, 13.0, 8.0, 8.0, 10.0, 2.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.0005717277526855469, -0.0005534738302230835, -0.0005352199077606201, -0.0005169659852981567, -0.0004987120628356934, -0.00048045814037323, -0.0004622042179107666, -0.0004439502954483032, -0.00042569637298583984, -0.00040744245052337646, -0.0003891885280609131, -0.0003709346055984497, -0.00035268068313598633, -0.00033442676067352295, -0.00031617283821105957, -0.0002979189157485962, -0.0002796649932861328, -0.00026141107082366943, -0.00024315714836120605, -0.00022490322589874268, -0.0002066493034362793, -0.00018839538097381592, -0.00017014145851135254, -0.00015188753604888916, -0.00013363361358642578, -0.0001153796911239624, -9.712576866149902e-05, -7.887184619903564e-05, -6.0617923736572266e-05, -4.236400127410889e-05, -2.4110078811645508e-05, -5.856156349182129e-06, 1.239776611328125e-05, 3.065168857574463e-05, 4.890561103820801e-05, 6.715953350067139e-05, 8.541345596313477e-05, 0.00010366737842559814, 0.00012192130088806152, 0.0001401752233505249, 0.00015842914581298828, 0.00017668306827545166, 0.00019493699073791504, 0.00021319091320037842, 0.0002314448356628418, 0.0002496987581253052, 0.00026795268058776855, 0.00028620660305023193, 0.0003044605255126953, 0.0003227144479751587, 0.00034096837043762207, 0.00035922229290008545, 0.00037747621536254883, 0.0003957301378250122, 0.0004139840602874756, 0.00043223798274993896, 0.00045049190521240234, 0.0004687458276748657, 0.0004869997501373291, 0.0005052536725997925, 0.0005235075950622559, 0.0005417615175247192, 0.0005600154399871826, 0.000578269362449646, 0.0005965232849121094]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 21.0, 421.0, 538.0, 26.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.443971844622865e-05, -7.121629460016266e-05, -6.799286347813904e-05, -6.476943963207304e-05, -6.154601578600705e-05, -5.8322584663983434e-05, -5.5099160817917436e-05, -5.187573333387263e-05, -4.8652305849827826e-05, -4.542887836578302e-05, -4.2205450881738216e-05, -3.898202703567222e-05, -3.575859955162741e-05, -3.253517206758261e-05, -2.9311746402527206e-05, -2.6088320737471804e-05, -2.2864893253427e-05, -1.9641465769382194e-05, -1.6418040104326792e-05, -1.3194613529776689e-05, -9.971186955226585e-06, -6.74775947118178e-06, -3.5243338061263785e-06, -3.0090814107097685e-07, 2.9225193429738283e-06, 6.145945917523932e-06, 9.369372492074035e-06, 1.2592799066624139e-05, 1.5816225641174242e-05, 1.9039653125219047e-05, 2.226307879027445e-05, 2.548650445532985e-05, 2.870993921533227e-05, 3.1933366699377075e-05, 3.515679418342188e-05, 3.838021802948788e-05, 4.160364551353268e-05, 4.482707299757749e-05, 4.8050496843643486e-05, 5.127392432768829e-05, 5.44973518117331e-05, 5.77207792957779e-05, 6.094420677982271e-05, 6.41676306258887e-05, 6.73910544719547e-05, 7.061448559397832e-05, 7.383790944004431e-05, 7.706134056206793e-05, 8.028476440813392e-05, 8.350818825419992e-05, 8.673161937622353e-05, 8.995504322228953e-05, 9.317847434431314e-05, 9.640189819037914e-05, 9.962532203644514e-05, 0.00010284874588251114, 0.00010607217700453475, 0.00010929560085060075, 0.00011251903197262436, 0.00011574245581869036, 0.00011896587966475636, 0.00012218931806273758, 0.00012541274190880358, 0.00012863616575486958, 0.00013185958960093558]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 6.0, 2.0, 2.0, 11.0, 13.0, 19.0, 14.0, 30.0, 24.0, 26.0, 37.0, 40.0, 56.0, 50.0, 60.0, 69.0, 68.0, 46.0, 63.0, 55.0, 55.0, 50.0, 46.0, 39.0, 28.0, 28.0, 14.0, 16.0, 14.0, 9.0, 6.0, 3.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2993812561035156e-05, -1.2337230145931244e-05, -1.1680647730827332e-05, -1.102406531572342e-05, -1.0367482900619507e-05, -9.710900485515594e-06, -9.054318070411682e-06, -8.39773565530777e-06, -7.741153240203857e-06, -7.084570825099945e-06, -6.427988409996033e-06, -5.77140599489212e-06, -5.114823579788208e-06, -4.458241164684296e-06, -3.8016587495803833e-06, -3.145076334476471e-06, -2.4884939193725586e-06, -1.8319115042686462e-06, -1.1753290891647339e-06, -5.187466740608215e-07, 1.3783574104309082e-07, 7.944181561470032e-07, 1.4510005712509155e-06, 2.107582986354828e-06, 2.7641654014587402e-06, 3.4207478165626526e-06, 4.077330231666565e-06, 4.733912646770477e-06, 5.39049506187439e-06, 6.047077476978302e-06, 6.703659892082214e-06, 7.360242307186127e-06, 8.016824722290039e-06, 8.673407137393951e-06, 9.329989552497864e-06, 9.986571967601776e-06, 1.0643154382705688e-05, 1.12997367978096e-05, 1.1956319212913513e-05, 1.2612901628017426e-05, 1.3269484043121338e-05, 1.392606645822525e-05, 1.4582648873329163e-05, 1.5239231288433075e-05, 1.5895813703536987e-05, 1.65523961186409e-05, 1.7208978533744812e-05, 1.7865560948848724e-05, 1.8522143363952637e-05, 1.917872577905655e-05, 1.983530819416046e-05, 2.0491890609264374e-05, 2.1148473024368286e-05, 2.18050554394722e-05, 2.246163785457611e-05, 2.3118220269680023e-05, 2.3774802684783936e-05, 2.4431385099887848e-05, 2.508796751499176e-05, 2.5744549930095673e-05, 2.6401132345199585e-05, 2.7057714760303497e-05, 2.771429717540741e-05, 2.8370879590511322e-05, 2.9027462005615234e-05]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 2.0, 9.0, 8.0, 5.0, 17.0, 19.0, 16.0, 21.0, 24.0, 23.0, 25.0, 20.0, 31.0, 32.0, 28.0, 33.0, 38.0, 34.0, 48.0, 35.0, 35.0, 50.0, 44.0, 40.0, 27.0, 38.0, 30.0, 41.0, 27.0, 36.0, 26.0, 25.0, 16.0, 21.0, 16.0, 12.0, 8.0, 5.0, 4.0, 4.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.296875, -4.1630859375, -4.029296875, -3.8955078125, -3.76171875, -3.6279296875, -3.494140625, -3.3603515625, -3.2265625, -3.0927734375, -2.958984375, -2.8251953125, -2.69140625, -2.5576171875, -2.423828125, -2.2900390625, -2.15625, -2.0224609375, -1.888671875, -1.7548828125, -1.62109375, -1.4873046875, -1.353515625, -1.2197265625, -1.0859375, -0.9521484375, -0.818359375, -0.6845703125, -0.55078125, -0.4169921875, -0.283203125, -0.1494140625, -0.015625, 0.1181640625, 0.251953125, 0.3857421875, 0.51953125, 0.6533203125, 0.787109375, 0.9208984375, 1.0546875, 1.1884765625, 1.322265625, 1.4560546875, 1.58984375, 1.7236328125, 1.857421875, 1.9912109375, 2.125, 2.2587890625, 2.392578125, 2.5263671875, 2.66015625, 2.7939453125, 2.927734375, 3.0615234375, 3.1953125, 3.3291015625, 3.462890625, 3.5966796875, 3.73046875, 3.8642578125, 3.998046875, 4.1318359375, 4.265625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 12.0, 11.0, 21.0, 31.0, 55.0, 58.0, 87.0, 156.0, 236.0, 403.0, 593.0, 1008.0, 1644.0, 2702.0, 4561.0, 7986.0, 13875.0, 25145.0, 46305.0, 92344.0, 219447.0, 329128.0, 151831.0, 68331.0, 35987.0, 19633.0, 11033.0, 6412.0, 3734.0, 2282.0, 1376.0, 793.0, 510.0, 321.0, 204.0, 103.0, 56.0, 48.0, 33.0, 18.0, 13.0, 14.0, 4.0, 2.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.56640625, -5.39923095703125, -5.2320556640625, -5.06488037109375, -4.897705078125, -4.73052978515625, -4.5633544921875, -4.39617919921875, -4.22900390625, -4.06182861328125, -3.8946533203125, -3.72747802734375, -3.560302734375, -3.39312744140625, -3.2259521484375, -3.05877685546875, -2.8916015625, -2.72442626953125, -2.5572509765625, -2.39007568359375, -2.222900390625, -2.05572509765625, -1.8885498046875, -1.72137451171875, -1.55419921875, -1.38702392578125, -1.2198486328125, -1.05267333984375, -0.885498046875, -0.71832275390625, -0.5511474609375, -0.38397216796875, -0.216796875, -0.04962158203125, 0.1175537109375, 0.28472900390625, 0.451904296875, 0.61907958984375, 0.7862548828125, 0.95343017578125, 1.12060546875, 1.28778076171875, 1.4549560546875, 1.62213134765625, 1.789306640625, 1.95648193359375, 2.1236572265625, 2.29083251953125, 2.4580078125, 2.62518310546875, 2.7923583984375, 2.95953369140625, 3.126708984375, 3.29388427734375, 3.4610595703125, 3.62823486328125, 3.79541015625, 3.96258544921875, 4.1297607421875, 4.29693603515625, 4.464111328125, 4.63128662109375, 4.7984619140625, 4.96563720703125, 5.1328125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 8.0, 11.0, 8.0, 8.0, 11.0, 11.0, 18.0, 30.0, 22.0, 26.0, 25.0, 26.0, 34.0, 42.0, 46.0, 60.0, 71.0, 120.0, 230.0, 1411.0, 216.0, 114.0, 74.0, 52.0, 50.0, 51.0, 43.0, 29.0, 28.0, 30.0, 21.0, 18.0, 18.0, 24.0, 13.0, 8.0, 8.0, 4.0, 7.0, 7.0, 3.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.4453125, -11.0693359375, -10.693359375, -10.3173828125, -9.94140625, -9.5654296875, -9.189453125, -8.8134765625, -8.4375, -8.0615234375, -7.685546875, -7.3095703125, -6.93359375, -6.5576171875, -6.181640625, -5.8056640625, -5.4296875, -5.0537109375, -4.677734375, -4.3017578125, -3.92578125, -3.5498046875, -3.173828125, -2.7978515625, -2.421875, -2.0458984375, -1.669921875, -1.2939453125, -0.91796875, -0.5419921875, -0.166015625, 0.2099609375, 0.5859375, 0.9619140625, 1.337890625, 1.7138671875, 2.08984375, 2.4658203125, 2.841796875, 3.2177734375, 3.59375, 3.9697265625, 4.345703125, 4.7216796875, 5.09765625, 5.4736328125, 5.849609375, 6.2255859375, 6.6015625, 6.9775390625, 7.353515625, 7.7294921875, 8.10546875, 8.4814453125, 8.857421875, 9.2333984375, 9.609375, 9.9853515625, 10.361328125, 10.7373046875, 11.11328125, 11.4892578125, 11.865234375, 12.2412109375, 12.6171875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 7.0, 3.0, 10.0, 16.0, 12.0, 21.0, 31.0, 49.0, 72.0, 65.0, 129.0, 177.0, 266.0, 590.0, 1305.0, 3942.0, 14529.0, 63973.0, 486261.0, 2307261.0, 215386.0, 37695.0, 9036.0, 2708.0, 987.0, 426.0, 245.0, 144.0, 85.0, 74.0, 43.0, 36.0, 31.0, 19.0, 23.0, 12.0, 15.0, 5.0, 3.0, 2.0, 5.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-13.6953125, -13.29638671875, -12.8974609375, -12.49853515625, -12.099609375, -11.70068359375, -11.3017578125, -10.90283203125, -10.50390625, -10.10498046875, -9.7060546875, -9.30712890625, -8.908203125, -8.50927734375, -8.1103515625, -7.71142578125, -7.3125, -6.91357421875, -6.5146484375, -6.11572265625, -5.716796875, -5.31787109375, -4.9189453125, -4.52001953125, -4.12109375, -3.72216796875, -3.3232421875, -2.92431640625, -2.525390625, -2.12646484375, -1.7275390625, -1.32861328125, -0.9296875, -0.53076171875, -0.1318359375, 0.26708984375, 0.666015625, 1.06494140625, 1.4638671875, 1.86279296875, 2.26171875, 2.66064453125, 3.0595703125, 3.45849609375, 3.857421875, 4.25634765625, 4.6552734375, 5.05419921875, 5.453125, 5.85205078125, 6.2509765625, 6.64990234375, 7.048828125, 7.44775390625, 7.8466796875, 8.24560546875, 8.64453125, 9.04345703125, 9.4423828125, 9.84130859375, 10.240234375, 10.63916015625, 11.0380859375, 11.43701171875, 11.8359375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 37.0, 417.0, 502.0, 53.0, 4.0, 2.0], "bins": [-300.0197448730469, -295.0248107910156, -290.02984619140625, -285.034912109375, -280.0399475097656, -275.0450134277344, -270.0500793457031, -265.05511474609375, -260.0601806640625, -255.0652313232422, -250.07028198242188, -245.07534790039062, -240.0803985595703, -235.08544921875, -230.0904998779297, -225.09555053710938, -220.10061645507812, -215.1056671142578, -210.1107177734375, -205.11578369140625, -200.12083435058594, -195.12588500976562, -190.1309356689453, -185.135986328125, -180.1410369873047, -175.14608764648438, -170.15113830566406, -165.1562042236328, -160.1612548828125, -155.1663055419922, -150.17135620117188, -145.17642211914062, -140.18145751953125, -135.18650817871094, -130.19155883789062, -125.19661712646484, -120.20167541503906, -115.20672607421875, -110.21177673339844, -105.21683502197266, -100.22189331054688, -95.22694396972656, -90.23200225830078, -85.23705291748047, -80.24211120605469, -75.24716186523438, -70.25221252441406, -65.25727081298828, -60.262325286865234, -55.26737976074219, -50.27243423461914, -45.277488708496094, -40.28253936767578, -35.28759765625, -30.292648315429688, -25.29770278930664, -20.302757263183594, -15.307811737060547, -10.312865257263184, -5.31791877746582, -0.32297325134277344, 4.671972274780273, 9.666919708251953, 14.661865234375, 19.656810760498047]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 4.0, 11.0, 8.0, 11.0, 12.0, 16.0, 13.0, 24.0, 29.0, 29.0, 23.0, 42.0, 24.0, 33.0, 41.0, 37.0, 37.0, 50.0, 42.0, 46.0, 45.0, 41.0, 38.0, 36.0, 31.0, 28.0, 29.0, 29.0, 25.0, 25.0, 19.0, 15.0, 19.0, 22.0, 16.0, 11.0, 6.0, 4.0, 5.0, 4.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.530290603637695, -28.6097412109375, -27.689193725585938, -26.768644332885742, -25.848094940185547, -24.927547454833984, -24.00699806213379, -23.086448669433594, -22.16590118408203, -21.245351791381836, -20.324804306030273, -19.404254913330078, -18.483705520629883, -17.563156127929688, -16.642608642578125, -15.72205924987793, -14.801509857177734, -13.880961418151855, -12.96041202545166, -12.039863586425781, -11.119314193725586, -10.198765754699707, -9.278217315673828, -8.357667922973633, -7.437119483947754, -6.516570568084717, -5.59602165222168, -4.675473213195801, -3.7549242973327637, -2.8343753814697266, -1.9138269424438477, -0.9932780265808105, -0.07272720336914062, 0.8478215932846069, 1.7683703899383545, 2.6889190673828125, 3.6094679832458496, 4.530016899108887, 5.450565338134766, 6.371114253997803, 7.29166316986084, 8.212211608886719, 9.132761001586914, 10.053309440612793, 10.973857879638672, 11.894407272338867, 12.814955711364746, 13.735504150390625, 14.65605354309082, 15.5766019821167, 16.497150421142578, 17.417699813842773, 18.33824920654297, 19.25879669189453, 20.179346084594727, 21.099895477294922, 22.020442962646484, 22.94099235534668, 23.861539840698242, 24.782089233398438, 25.702638626098633, 26.623188018798828, 27.54373550415039, 28.464284896850586, 29.38483428955078]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 2.0, 11.0, 7.0, 11.0, 4.0, 7.0, 18.0, 10.0, 16.0, 17.0, 28.0, 27.0, 15.0, 15.0, 30.0, 26.0, 28.0, 39.0, 31.0, 25.0, 40.0, 36.0, 29.0, 44.0, 34.0, 40.0, 36.0, 33.0, 35.0, 27.0, 35.0, 31.0, 26.0, 22.0, 20.0, 28.0, 17.0, 12.0, 21.0, 12.0, 7.0, 10.0, 6.0, 6.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.9244384765625, -3.798095703125, -3.6717529296875, -3.54541015625, -3.4190673828125, -3.292724609375, -3.1663818359375, -3.0400390625, -2.9136962890625, -2.787353515625, -2.6610107421875, -2.53466796875, -2.4083251953125, -2.281982421875, -2.1556396484375, -2.029296875, -1.9029541015625, -1.776611328125, -1.6502685546875, -1.52392578125, -1.3975830078125, -1.271240234375, -1.1448974609375, -1.0185546875, -0.8922119140625, -0.765869140625, -0.6395263671875, -0.51318359375, -0.3868408203125, -0.260498046875, -0.1341552734375, -0.0078125, 0.1185302734375, 0.244873046875, 0.3712158203125, 0.49755859375, 0.6239013671875, 0.750244140625, 0.8765869140625, 1.0029296875, 1.1292724609375, 1.255615234375, 1.3819580078125, 1.50830078125, 1.6346435546875, 1.760986328125, 1.8873291015625, 2.013671875, 2.1400146484375, 2.266357421875, 2.3927001953125, 2.51904296875, 2.6453857421875, 2.771728515625, 2.8980712890625, 3.0244140625, 3.1507568359375, 3.277099609375, 3.4034423828125, 3.52978515625, 3.6561279296875, 3.782470703125, 3.9088134765625, 4.03515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 2.0, 5.0, 8.0, 8.0, 8.0, 13.0, 19.0, 21.0, 36.0, 52.0, 65.0, 116.0, 185.0, 317.0, 568.0, 1118.0, 2232.0, 4938.0, 11639.0, 32779.0, 115512.0, 593407.0, 2276042.0, 916273.0, 167495.0, 44126.0, 15214.0, 6144.0, 2762.0, 1362.0, 718.0, 426.0, 234.0, 129.0, 101.0, 54.0, 48.0, 31.0, 28.0, 14.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9765625, -7.7320556640625, -7.487548828125, -7.2430419921875, -6.99853515625, -6.7540283203125, -6.509521484375, -6.2650146484375, -6.0205078125, -5.7760009765625, -5.531494140625, -5.2869873046875, -5.04248046875, -4.7979736328125, -4.553466796875, -4.3089599609375, -4.064453125, -3.8199462890625, -3.575439453125, -3.3309326171875, -3.08642578125, -2.8419189453125, -2.597412109375, -2.3529052734375, -2.1083984375, -1.8638916015625, -1.619384765625, -1.3748779296875, -1.13037109375, -0.8858642578125, -0.641357421875, -0.3968505859375, -0.15234375, 0.0921630859375, 0.336669921875, 0.5811767578125, 0.82568359375, 1.0701904296875, 1.314697265625, 1.5592041015625, 1.8037109375, 2.0482177734375, 2.292724609375, 2.5372314453125, 2.78173828125, 3.0262451171875, 3.270751953125, 3.5152587890625, 3.759765625, 4.0042724609375, 4.248779296875, 4.4932861328125, 4.73779296875, 4.9822998046875, 5.226806640625, 5.4713134765625, 5.7158203125, 5.9603271484375, 6.204833984375, 6.4493408203125, 6.69384765625, 6.9383544921875, 7.182861328125, 7.4273681640625, 7.671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 7.0, 2.0, 9.0, 12.0, 8.0, 11.0, 15.0, 17.0, 23.0, 34.0, 38.0, 48.0, 64.0, 74.0, 96.0, 115.0, 150.0, 181.0, 221.0, 346.0, 377.0, 416.0, 421.0, 309.0, 251.0, 191.0, 143.0, 140.0, 82.0, 70.0, 54.0, 34.0, 23.0, 20.0, 12.0, 14.0, 13.0, 9.0, 8.0, 9.0, 4.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.09375, -5.91754150390625, -5.7413330078125, -5.56512451171875, -5.388916015625, -5.21270751953125, -5.0364990234375, -4.86029052734375, -4.68408203125, -4.50787353515625, -4.3316650390625, -4.15545654296875, -3.979248046875, -3.80303955078125, -3.6268310546875, -3.45062255859375, -3.2744140625, -3.09820556640625, -2.9219970703125, -2.74578857421875, -2.569580078125, -2.39337158203125, -2.2171630859375, -2.04095458984375, -1.86474609375, -1.68853759765625, -1.5123291015625, -1.33612060546875, -1.159912109375, -0.98370361328125, -0.8074951171875, -0.63128662109375, -0.455078125, -0.27886962890625, -0.1026611328125, 0.07354736328125, 0.249755859375, 0.42596435546875, 0.6021728515625, 0.77838134765625, 0.95458984375, 1.13079833984375, 1.3070068359375, 1.48321533203125, 1.659423828125, 1.83563232421875, 2.0118408203125, 2.18804931640625, 2.3642578125, 2.54046630859375, 2.7166748046875, 2.89288330078125, 3.069091796875, 3.24530029296875, 3.4215087890625, 3.59771728515625, 3.77392578125, 3.95013427734375, 4.1263427734375, 4.30255126953125, 4.478759765625, 4.65496826171875, 4.8311767578125, 5.00738525390625, 5.18359375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 8.0, 10.0, 13.0, 11.0, 18.0, 32.0, 38.0, 63.0, 79.0, 117.0, 164.0, 290.0, 581.0, 1196.0, 2820.0, 6957.0, 19144.0, 60825.0, 221516.0, 1154746.0, 2182988.0, 397376.0, 98037.0, 29544.0, 10222.0, 3843.0, 1664.0, 775.0, 409.0, 255.0, 171.0, 101.0, 71.0, 47.0, 50.0, 29.0, 16.0, 14.0, 16.0, 10.0, 7.0, 5.0, 8.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.9921875, -6.7032470703125, -6.414306640625, -6.1253662109375, -5.83642578125, -5.5474853515625, -5.258544921875, -4.9696044921875, -4.6806640625, -4.3917236328125, -4.102783203125, -3.8138427734375, -3.52490234375, -3.2359619140625, -2.947021484375, -2.6580810546875, -2.369140625, -2.0802001953125, -1.791259765625, -1.5023193359375, -1.21337890625, -0.9244384765625, -0.635498046875, -0.3465576171875, -0.0576171875, 0.2313232421875, 0.520263671875, 0.8092041015625, 1.09814453125, 1.3870849609375, 1.676025390625, 1.9649658203125, 2.25390625, 2.5428466796875, 2.831787109375, 3.1207275390625, 3.40966796875, 3.6986083984375, 3.987548828125, 4.2764892578125, 4.5654296875, 4.8543701171875, 5.143310546875, 5.4322509765625, 5.72119140625, 6.0101318359375, 6.299072265625, 6.5880126953125, 6.876953125, 7.1658935546875, 7.454833984375, 7.7437744140625, 8.03271484375, 8.3216552734375, 8.610595703125, 8.8995361328125, 9.1884765625, 9.4774169921875, 9.766357421875, 10.0552978515625, 10.34423828125, 10.6331787109375, 10.922119140625, 11.2110595703125, 11.5]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 22.0, 79.0, 153.0, 274.0, 272.0, 140.0, 49.0, 19.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.4439640045166, -24.927635192871094, -22.411304473876953, -19.894975662231445, -17.378646850585938, -14.86231803894043, -12.345988273620605, -9.829658508300781, -7.313329696655273, -4.797000408172607, -2.2806711196899414, 0.2356581687927246, 2.7519874572753906, 5.268316268920898, 7.784646034240723, 10.300975799560547, 12.817304611206055, 15.333633422851562, 17.849964141845703, 20.36629295349121, 22.88262176513672, 25.398950576782227, 27.915279388427734, 30.431610107421875, 32.94793701171875, 35.46426773071289, 37.980594635009766, 40.496925354003906, 43.01325225830078, 45.52958297729492, 48.04591369628906, 50.56224060058594, 53.07856750488281, 55.59489822387695, 58.11122512817383, 60.62755584716797, 63.143882751464844, 65.66021728515625, 68.17654418945312, 70.69287109375, 73.20919799804688, 75.72552490234375, 78.24185943603516, 80.75818634033203, 83.2745132446289, 85.79084777832031, 88.30717468261719, 90.82350158691406, 93.33983612060547, 95.85616302490234, 98.37249755859375, 100.88882446289062, 103.4051513671875, 105.92147827148438, 108.43781280517578, 110.95413970947266, 113.47047424316406, 115.98680114746094, 118.50313568115234, 121.01946258544922, 123.5357894897461, 126.0521240234375, 128.56845092773438, 131.08477783203125, 133.60110473632812]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 7.0, 9.0, 7.0, 10.0, 9.0, 16.0, 12.0, 15.0, 19.0, 19.0, 22.0, 23.0, 27.0, 26.0, 28.0, 43.0, 37.0, 31.0, 40.0, 39.0, 33.0, 51.0, 44.0, 44.0, 33.0, 48.0, 29.0, 30.0, 34.0, 30.0, 29.0, 24.0, 18.0, 16.0, 18.0, 14.0, 13.0, 6.0, 5.0, 11.0, 10.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-25.861602783203125, -25.097434997558594, -24.333267211914062, -23.56909942626953, -22.804933547973633, -22.0407657623291, -21.27659797668457, -20.51243019104004, -19.74826431274414, -18.98409652709961, -18.219928741455078, -17.455760955810547, -16.69159507751465, -15.927427291870117, -15.163259506225586, -14.399091720581055, -13.634923934936523, -12.870756149291992, -12.106589317321777, -11.342421531677246, -10.578254699707031, -9.8140869140625, -9.049919128417969, -8.285751342773438, -7.521584510803223, -6.75741720199585, -5.993249893188477, -5.229082107543945, -4.464914798736572, -3.700747489929199, -2.936579704284668, -2.172412395477295, -1.4082450866699219, -0.6440776586532593, 0.12008976936340332, 0.8842573165893555, 1.6484246253967285, 2.4125919342041016, 3.176759719848633, 3.940927028656006, 4.705094337463379, 5.469261646270752, 6.233428955078125, 6.997596740722656, 7.761764049530029, 8.525931358337402, 9.290099143981934, 10.054265975952148, 10.81843376159668, 11.582601547241211, 12.346768379211426, 13.110936164855957, 13.875102996826172, 14.639270782470703, 15.403438568115234, 16.167606353759766, 16.931774139404297, 17.695941925048828, 18.46010971069336, 19.22427749633789, 19.98844337463379, 20.75261116027832, 21.51677894592285, 22.280946731567383, 23.04511260986328]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 7.0, 6.0, 2.0, 10.0, 6.0, 15.0, 13.0, 13.0, 17.0, 14.0, 22.0, 20.0, 23.0, 31.0, 32.0, 24.0, 29.0, 39.0, 43.0, 48.0, 28.0, 38.0, 32.0, 46.0, 49.0, 36.0, 32.0, 32.0, 28.0, 34.0, 31.0, 25.0, 23.0, 28.0, 23.0, 20.0, 10.0, 14.0, 14.0, 8.0, 11.0, 11.0, 3.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.58203125, -4.4442138671875, -4.306396484375, -4.1685791015625, -4.03076171875, -3.8929443359375, -3.755126953125, -3.6173095703125, -3.4794921875, -3.3416748046875, -3.203857421875, -3.0660400390625, -2.92822265625, -2.7904052734375, -2.652587890625, -2.5147705078125, -2.376953125, -2.2391357421875, -2.101318359375, -1.9635009765625, -1.82568359375, -1.6878662109375, -1.550048828125, -1.4122314453125, -1.2744140625, -1.1365966796875, -0.998779296875, -0.8609619140625, -0.72314453125, -0.5853271484375, -0.447509765625, -0.3096923828125, -0.171875, -0.0340576171875, 0.103759765625, 0.2415771484375, 0.37939453125, 0.5172119140625, 0.655029296875, 0.7928466796875, 0.9306640625, 1.0684814453125, 1.206298828125, 1.3441162109375, 1.48193359375, 1.6197509765625, 1.757568359375, 1.8953857421875, 2.033203125, 2.1710205078125, 2.308837890625, 2.4466552734375, 2.58447265625, 2.7222900390625, 2.860107421875, 2.9979248046875, 3.1357421875, 3.2735595703125, 3.411376953125, 3.5491943359375, 3.68701171875, 3.8248291015625, 3.962646484375, 4.1004638671875, 4.23828125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 7.0, 9.0, 4.0, 6.0, 17.0, 21.0, 36.0, 37.0, 73.0, 108.0, 171.0, 287.0, 484.0, 746.0, 1406.0, 2410.0, 4329.0, 7990.0, 14802.0, 27553.0, 53192.0, 116491.0, 361481.0, 266045.0, 93721.0, 45073.0, 23508.0, 12778.0, 6839.0, 3847.0, 2086.0, 1217.0, 702.0, 416.0, 236.0, 143.0, 114.0, 68.0, 33.0, 24.0, 22.0, 12.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.279541015625, -0.27174949645996094, -0.2639579772949219, -0.2561664581298828, -0.24837493896484375, -0.2405834197998047, -0.23279190063476562, -0.22500038146972656, -0.2172088623046875, -0.20941734313964844, -0.20162582397460938, -0.1938343048095703, -0.18604278564453125, -0.1782512664794922, -0.17045974731445312, -0.16266822814941406, -0.154876708984375, -0.14708518981933594, -0.13929367065429688, -0.1315021514892578, -0.12371063232421875, -0.11591911315917969, -0.10812759399414062, -0.10033607482910156, -0.0925445556640625, -0.08475303649902344, -0.07696151733398438, -0.06916999816894531, -0.06137847900390625, -0.05358695983886719, -0.045795440673828125, -0.03800392150878906, -0.03021240234375, -0.022420883178710938, -0.014629364013671875, -0.0068378448486328125, 0.00095367431640625, 0.008745193481445312, 0.016536712646484375, 0.024328231811523438, 0.0321197509765625, 0.03991127014160156, 0.047702789306640625, 0.05549430847167969, 0.06328582763671875, 0.07107734680175781, 0.07886886596679688, 0.08666038513183594, 0.094451904296875, 0.10224342346191406, 0.11003494262695312, 0.11782646179199219, 0.12561798095703125, 0.1334095001220703, 0.14120101928710938, 0.14899253845214844, 0.1567840576171875, 0.16457557678222656, 0.17236709594726562, 0.1801586151123047, 0.18795013427734375, 0.1957416534423828, 0.20353317260742188, 0.21132469177246094, 0.2191162109375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 3.0, 7.0, 6.0, 14.0, 11.0, 13.0, 26.0, 22.0, 36.0, 18.0, 33.0, 36.0, 44.0, 52.0, 38.0, 40.0, 45.0, 1078.0, 44.0, 56.0, 44.0, 47.0, 38.0, 42.0, 33.0, 40.0, 27.0, 28.0, 24.0, 18.0, 14.0, 12.0, 8.0, 4.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7109375, -3.59375, -3.4765625, -3.359375, -3.2421875, -3.125, -3.0078125, -2.890625, -2.7734375, -2.65625, -2.5390625, -2.421875, -2.3046875, -2.1875, -2.0703125, -1.953125, -1.8359375, -1.71875, -1.6015625, -1.484375, -1.3671875, -1.25, -1.1328125, -1.015625, -0.8984375, -0.78125, -0.6640625, -0.546875, -0.4296875, -0.3125, -0.1953125, -0.078125, 0.0390625, 0.15625, 0.2734375, 0.390625, 0.5078125, 0.625, 0.7421875, 0.859375, 0.9765625, 1.09375, 1.2109375, 1.328125, 1.4453125, 1.5625, 1.6796875, 1.796875, 1.9140625, 2.03125, 2.1484375, 2.265625, 2.3828125, 2.5, 2.6171875, 2.734375, 2.8515625, 2.96875, 3.0859375, 3.203125, 3.3203125, 3.4375, 3.5546875, 3.671875, 3.7890625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 15.0, 16.0, 39.0, 43.0, 53.0, 106.0, 135.0, 191.0, 323.0, 492.0, 669.0, 1009.0, 1562.0, 2225.0, 3416.0, 4979.0, 7529.0, 11796.0, 17980.0, 28273.0, 46434.0, 78625.0, 142171.0, 1309643.0, 186078.0, 99469.0, 56943.0, 34368.0, 21763.0, 13810.0, 9009.0, 5823.0, 4020.0, 2644.0, 1787.0, 1183.0, 826.0, 559.0, 380.0, 242.0, 166.0, 106.0, 67.0, 50.0, 32.0, 28.0, 19.0, 11.0, 2.0, 3.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.06866455078125, -0.06635284423828125, -0.0640411376953125, -0.06172943115234375, -0.059417724609375, -0.05710601806640625, -0.0547943115234375, -0.05248260498046875, -0.0501708984375, -0.04785919189453125, -0.0455474853515625, -0.04323577880859375, -0.040924072265625, -0.03861236572265625, -0.0363006591796875, -0.03398895263671875, -0.03167724609375, -0.02936553955078125, -0.0270538330078125, -0.02474212646484375, -0.022430419921875, -0.02011871337890625, -0.0178070068359375, -0.01549530029296875, -0.01318359375, -0.01087188720703125, -0.0085601806640625, -0.00624847412109375, -0.003936767578125, -0.00162506103515625, 0.0006866455078125, 0.00299835205078125, 0.00531005859375, 0.00762176513671875, 0.0099334716796875, 0.01224517822265625, 0.014556884765625, 0.01686859130859375, 0.0191802978515625, 0.02149200439453125, 0.0238037109375, 0.02611541748046875, 0.0284271240234375, 0.03073883056640625, 0.033050537109375, 0.03536224365234375, 0.0376739501953125, 0.03998565673828125, 0.04229736328125, 0.04460906982421875, 0.0469207763671875, 0.04923248291015625, 0.051544189453125, 0.05385589599609375, 0.0561676025390625, 0.05847930908203125, 0.060791015625, 0.06310272216796875, 0.0654144287109375, 0.06772613525390625, 0.070037841796875, 0.07234954833984375, 0.0746612548828125, 0.07697296142578125, 0.07928466796875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 4.0, 3.0, 1.0, 5.0, 4.0, 7.0, 7.0, 12.0, 16.0, 11.0, 18.0, 20.0, 27.0, 33.0, 35.0, 45.0, 47.0, 44.0, 45.0, 68.0, 51.0, 63.0, 57.0, 56.0, 49.0, 32.0, 52.0, 31.0, 22.0, 23.0, 21.0, 19.0, 14.0, 10.0, 16.0, 9.0, 9.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.451108932495117e-05, -3.353040665388107e-05, -3.2549723982810974e-05, -3.1569041311740875e-05, -3.0588358640670776e-05, -2.9607675969600677e-05, -2.862699329853058e-05, -2.764631062746048e-05, -2.666562795639038e-05, -2.5684945285320282e-05, -2.4704262614250183e-05, -2.3723579943180084e-05, -2.2742897272109985e-05, -2.1762214601039886e-05, -2.0781531929969788e-05, -1.980084925889969e-05, -1.882016658782959e-05, -1.783948391675949e-05, -1.6858801245689392e-05, -1.5878118574619293e-05, -1.4897435903549194e-05, -1.3916753232479095e-05, -1.2936070561408997e-05, -1.1955387890338898e-05, -1.0974705219268799e-05, -9.9940225481987e-06, -9.013339877128601e-06, -8.032657206058502e-06, -7.051974534988403e-06, -6.0712918639183044e-06, -5.0906091928482056e-06, -4.109926521778107e-06, -3.129243850708008e-06, -2.148561179637909e-06, -1.16787850856781e-06, -1.8719583749771118e-07, 7.934868335723877e-07, 1.7741695046424866e-06, 2.7548521757125854e-06, 3.7355348467826843e-06, 4.716217517852783e-06, 5.696900188922882e-06, 6.677582859992981e-06, 7.65826553106308e-06, 8.638948202133179e-06, 9.619630873203278e-06, 1.0600313544273376e-05, 1.1580996215343475e-05, 1.2561678886413574e-05, 1.3542361557483673e-05, 1.4523044228553772e-05, 1.550372689962387e-05, 1.648440957069397e-05, 1.746509224176407e-05, 1.8445774912834167e-05, 1.9426457583904266e-05, 2.0407140254974365e-05, 2.1387822926044464e-05, 2.2368505597114563e-05, 2.3349188268184662e-05, 2.432987093925476e-05, 2.531055361032486e-05, 2.629123628139496e-05, 2.7271918952465057e-05, 2.8252601623535156e-05]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 4.0, 8.0, 10.0, 17.0, 12.0, 12.0, 27.0, 21.0, 25.0, 34.0, 59.0, 87.0, 107.0, 191.0, 453.0, 1790.0, 991982.0, 51970.0, 797.0, 329.0, 162.0, 95.0, 84.0, 52.0, 53.0, 26.0, 32.0, 19.0, 19.0, 13.0, 15.0, 7.0, 8.0, 4.0, 4.0, 2.0, 3.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006499290466308594, -0.0006273537874221802, -0.000604778528213501, -0.0005822032690048218, -0.0005596280097961426, -0.0005370527505874634, -0.0005144774913787842, -0.000491902232170105, -0.0004693269729614258, -0.0004467517137527466, -0.0004241764545440674, -0.0004016011953353882, -0.000379025936126709, -0.0003564506769180298, -0.0003338754177093506, -0.0003113001585006714, -0.0002887248992919922, -0.000266149640083313, -0.0002435743808746338, -0.0002209991216659546, -0.0001984238624572754, -0.0001758486032485962, -0.000153273344039917, -0.0001306980848312378, -0.0001081228256225586, -8.55475664138794e-05, -6.29723072052002e-05, -4.0397047996520996e-05, -1.7821788787841797e-05, 4.753470420837402e-06, 2.73287296295166e-05, 4.99039888381958e-05, 7.2479248046875e-05, 9.50545072555542e-05, 0.0001176297664642334, 0.0001402050256729126, 0.0001627802848815918, 0.000185355544090271, 0.0002079308032989502, 0.0002305060625076294, 0.0002530813217163086, 0.0002756565809249878, 0.000298231840133667, 0.0003208070993423462, 0.0003433823585510254, 0.0003659576177597046, 0.0003885328769683838, 0.000411108136177063, 0.0004336833953857422, 0.0004562586545944214, 0.0004788339138031006, 0.0005014091730117798, 0.000523984432220459, 0.0005465596914291382, 0.0005691349506378174, 0.0005917102098464966, 0.0006142854690551758, 0.000636860728263855, 0.0006594359874725342, 0.0006820112466812134, 0.0007045865058898926, 0.0007271617650985718, 0.000749737024307251, 0.0007723122835159302, 0.0007948875427246094]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 42.0, 900.0, 73.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.285699343308806e-05, -8.689121023053303e-05, -8.0925427027978e-05, -7.495964382542297e-05, -6.899386062286794e-05, -6.302807742031291e-05, -5.706229421775788e-05, -5.109651101520285e-05, -4.513072781264782e-05, -3.916494461009279e-05, -3.319916140753776e-05, -2.7233378204982728e-05, -2.1267595002427697e-05, -1.5301811799872667e-05, -9.336028597317636e-06, -3.3702453947626054e-06, 2.595537807792425e-06, 8.561321010347456e-06, 1.4527104212902486e-05, 2.0492887415457517e-05, 2.6458670618012547e-05, 3.242445382056758e-05, 3.839023702312261e-05, 4.435602022567764e-05, 5.032180342823267e-05, 5.62875866307877e-05, 6.225336983334273e-05, 6.821915303589776e-05, 7.418493623845279e-05, 8.015071944100782e-05, 8.611650264356285e-05, 9.208228584611788e-05, 9.804806904867291e-05, 0.00010401385225122795, 0.00010997963545378298, 0.000115945418656338, 0.00012191120185889304, 0.00012787699233740568, 0.0001338427682640031, 0.00013980854419060051, 0.00014577433466911316, 0.0001517401251476258, 0.00015770590107422322, 0.00016367167700082064, 0.00016963746747933328, 0.00017560325795784593, 0.00018156903388444334, 0.00018753480981104076, 0.0001935006002895534, 0.00019946639076806605, 0.00020543216669466347, 0.00021139794262126088, 0.00021736373309977353, 0.00022332952357828617, 0.0002292952995048836, 0.000235261075431481, 0.00024122686590999365, 0.0002471926563885063, 0.00025315844686701894, 0.0002591242082417011, 0.00026508999872021377, 0.0002710557891987264, 0.0002770215505734086, 0.00028298734105192125, 0.0002889531315304339]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 10.0, 11.0, 11.0, 16.0, 21.0, 24.0, 29.0, 45.0, 43.0, 42.0, 62.0, 63.0, 68.0, 67.0, 59.0, 60.0, 54.0, 57.0, 47.0, 44.0, 37.0, 26.0, 22.0, 27.0, 12.0, 15.0, 13.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.710653305053711e-05, -1.624133437871933e-05, -1.537613570690155e-05, -1.451093703508377e-05, -1.3645738363265991e-05, -1.2780539691448212e-05, -1.1915341019630432e-05, -1.1050142347812653e-05, -1.0184943675994873e-05, -9.319745004177094e-06, -8.454546332359314e-06, -7.5893476605415344e-06, -6.724148988723755e-06, -5.858950316905975e-06, -4.993751645088196e-06, -4.128552973270416e-06, -3.2633543014526367e-06, -2.398155629634857e-06, -1.5329569578170776e-06, -6.677582859992981e-07, 1.9744038581848145e-07, 1.062639057636261e-06, 1.9278377294540405e-06, 2.79303640127182e-06, 3.6582350730895996e-06, 4.523433744907379e-06, 5.388632416725159e-06, 6.253831088542938e-06, 7.119029760360718e-06, 7.984228432178497e-06, 8.849427103996277e-06, 9.714625775814056e-06, 1.0579824447631836e-05, 1.1445023119449615e-05, 1.2310221791267395e-05, 1.3175420463085175e-05, 1.4040619134902954e-05, 1.4905817806720734e-05, 1.5771016478538513e-05, 1.6636215150356293e-05, 1.7501413822174072e-05, 1.8366612493991852e-05, 1.923181116580963e-05, 2.009700983762741e-05, 2.096220850944519e-05, 2.182740718126297e-05, 2.269260585308075e-05, 2.355780452489853e-05, 2.442300319671631e-05, 2.5288201868534088e-05, 2.6153400540351868e-05, 2.7018599212169647e-05, 2.7883797883987427e-05, 2.8748996555805206e-05, 2.9614195227622986e-05, 3.0479393899440765e-05, 3.1344592571258545e-05, 3.2209791243076324e-05, 3.3074989914894104e-05, 3.3940188586711884e-05, 3.480538725852966e-05, 3.567058593034744e-05, 3.653578460216522e-05, 3.7400983273983e-05, 3.826618194580078e-05]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 7.0, 6.0, 2.0, 10.0, 6.0, 15.0, 13.0, 13.0, 17.0, 14.0, 22.0, 20.0, 23.0, 31.0, 32.0, 24.0, 29.0, 39.0, 43.0, 48.0, 28.0, 38.0, 32.0, 46.0, 49.0, 36.0, 32.0, 32.0, 28.0, 34.0, 31.0, 25.0, 23.0, 28.0, 23.0, 20.0, 10.0, 14.0, 14.0, 8.0, 11.0, 11.0, 3.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.58203125, -4.4442138671875, -4.306396484375, -4.1685791015625, -4.03076171875, -3.8929443359375, -3.755126953125, -3.6173095703125, -3.4794921875, -3.3416748046875, -3.203857421875, -3.0660400390625, -2.92822265625, -2.7904052734375, -2.652587890625, -2.5147705078125, -2.376953125, -2.2391357421875, -2.101318359375, -1.9635009765625, -1.82568359375, -1.6878662109375, -1.550048828125, -1.4122314453125, -1.2744140625, -1.1365966796875, -0.998779296875, -0.8609619140625, -0.72314453125, -0.5853271484375, -0.447509765625, -0.3096923828125, -0.171875, -0.0340576171875, 0.103759765625, 0.2415771484375, 0.37939453125, 0.5172119140625, 0.655029296875, 0.7928466796875, 0.9306640625, 1.0684814453125, 1.206298828125, 1.3441162109375, 1.48193359375, 1.6197509765625, 1.757568359375, 1.8953857421875, 2.033203125, 2.1710205078125, 2.308837890625, 2.4466552734375, 2.58447265625, 2.7222900390625, 2.860107421875, 2.9979248046875, 3.1357421875, 3.2735595703125, 3.411376953125, 3.5491943359375, 3.68701171875, 3.8248291015625, 3.962646484375, 4.1004638671875, 4.23828125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 5.0, 3.0, 8.0, 3.0, 13.0, 17.0, 19.0, 36.0, 52.0, 82.0, 115.0, 165.0, 261.0, 404.0, 639.0, 976.0, 1566.0, 2521.0, 4038.0, 6332.0, 10098.0, 16497.0, 27458.0, 49450.0, 105589.0, 264464.0, 304876.0, 120403.0, 55503.0, 29957.0, 17536.0, 10909.0, 6896.0, 4268.0, 2722.0, 1665.0, 1075.0, 649.0, 446.0, 291.0, 185.0, 110.0, 76.0, 58.0, 35.0, 28.0, 18.0, 16.0, 12.0, 4.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.4901123046875, -4.335693359375, -4.1812744140625, -4.02685546875, -3.8724365234375, -3.718017578125, -3.5635986328125, -3.4091796875, -3.2547607421875, -3.100341796875, -2.9459228515625, -2.79150390625, -2.6370849609375, -2.482666015625, -2.3282470703125, -2.173828125, -2.0194091796875, -1.864990234375, -1.7105712890625, -1.55615234375, -1.4017333984375, -1.247314453125, -1.0928955078125, -0.9384765625, -0.7840576171875, -0.629638671875, -0.4752197265625, -0.32080078125, -0.1663818359375, -0.011962890625, 0.1424560546875, 0.296875, 0.4512939453125, 0.605712890625, 0.7601318359375, 0.91455078125, 1.0689697265625, 1.223388671875, 1.3778076171875, 1.5322265625, 1.6866455078125, 1.841064453125, 1.9954833984375, 2.14990234375, 2.3043212890625, 2.458740234375, 2.6131591796875, 2.767578125, 2.9219970703125, 3.076416015625, 3.2308349609375, 3.38525390625, 3.5396728515625, 3.694091796875, 3.8485107421875, 4.0029296875, 4.1573486328125, 4.311767578125, 4.4661865234375, 4.62060546875, 4.7750244140625, 4.929443359375, 5.0838623046875, 5.23828125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 4.0, 7.0, 12.0, 10.0, 10.0, 19.0, 24.0, 21.0, 17.0, 23.0, 25.0, 21.0, 28.0, 41.0, 48.0, 60.0, 56.0, 89.0, 130.0, 244.0, 1364.0, 188.0, 126.0, 76.0, 59.0, 42.0, 43.0, 37.0, 31.0, 27.0, 23.0, 24.0, 21.0, 12.0, 16.0, 10.0, 9.0, 10.0, 10.0, 3.0, 4.0, 3.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5, -10.1646728515625, -9.829345703125, -9.4940185546875, -9.15869140625, -8.8233642578125, -8.488037109375, -8.1527099609375, -7.8173828125, -7.4820556640625, -7.146728515625, -6.8114013671875, -6.47607421875, -6.1407470703125, -5.805419921875, -5.4700927734375, -5.134765625, -4.7994384765625, -4.464111328125, -4.1287841796875, -3.79345703125, -3.4581298828125, -3.122802734375, -2.7874755859375, -2.4521484375, -2.1168212890625, -1.781494140625, -1.4461669921875, -1.11083984375, -0.7755126953125, -0.440185546875, -0.1048583984375, 0.23046875, 0.5657958984375, 0.901123046875, 1.2364501953125, 1.57177734375, 1.9071044921875, 2.242431640625, 2.5777587890625, 2.9130859375, 3.2484130859375, 3.583740234375, 3.9190673828125, 4.25439453125, 4.5897216796875, 4.925048828125, 5.2603759765625, 5.595703125, 5.9310302734375, 6.266357421875, 6.6016845703125, 6.93701171875, 7.2723388671875, 7.607666015625, 7.9429931640625, 8.2783203125, 8.6136474609375, 8.948974609375, 9.2843017578125, 9.61962890625, 9.9549560546875, 10.290283203125, 10.6256103515625, 10.9609375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 9.0, 14.0, 13.0, 19.0, 22.0, 32.0, 48.0, 58.0, 96.0, 119.0, 196.0, 349.0, 702.0, 2439.0, 12454.0, 82312.0, 2134602.0, 849687.0, 50847.0, 8398.0, 1788.0, 584.0, 286.0, 166.0, 137.0, 75.0, 64.0, 54.0, 24.0, 30.0, 24.0, 13.0, 13.0, 12.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.609375, -14.1363525390625, -13.663330078125, -13.1903076171875, -12.71728515625, -12.2442626953125, -11.771240234375, -11.2982177734375, -10.8251953125, -10.3521728515625, -9.879150390625, -9.4061279296875, -8.93310546875, -8.4600830078125, -7.987060546875, -7.5140380859375, -7.041015625, -6.5679931640625, -6.094970703125, -5.6219482421875, -5.14892578125, -4.6759033203125, -4.202880859375, -3.7298583984375, -3.2568359375, -2.7838134765625, -2.310791015625, -1.8377685546875, -1.36474609375, -0.8917236328125, -0.418701171875, 0.0543212890625, 0.52734375, 1.0003662109375, 1.473388671875, 1.9464111328125, 2.41943359375, 2.8924560546875, 3.365478515625, 3.8385009765625, 4.3115234375, 4.7845458984375, 5.257568359375, 5.7305908203125, 6.20361328125, 6.6766357421875, 7.149658203125, 7.6226806640625, 8.095703125, 8.5687255859375, 9.041748046875, 9.5147705078125, 9.98779296875, 10.4608154296875, 10.933837890625, 11.4068603515625, 11.8798828125, 12.3529052734375, 12.825927734375, 13.2989501953125, 13.77197265625, 14.2449951171875, 14.718017578125, 15.1910400390625, 15.6640625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 220.0, 663.0, 122.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.57505798339844, -123.70909118652344, -118.84313201904297, -113.9771728515625, -109.1112060546875, -104.2452392578125, -99.37928009033203, -94.51332092285156, -89.64735412597656, -84.78138732910156, -79.9154281616211, -75.04946899414062, -70.18350219726562, -65.31753540039062, -60.451576232910156, -55.58561325073242, -50.71965026855469, -45.85368728637695, -40.98772430419922, -36.121761322021484, -31.25579833984375, -26.389835357666016, -21.52387237548828, -16.657909393310547, -11.791946411132812, -6.925983428955078, -2.0600204467773438, 2.8059425354003906, 7.671905517578125, 12.53786849975586, 17.403831481933594, 22.269794464111328, 27.1357421875, 32.001705169677734, 36.86766815185547, 41.7336311340332, 46.59959411621094, 51.46555709838867, 56.331520080566406, 61.19748306274414, 66.06344604492188, 70.92941284179688, 75.79537200927734, 80.66133117675781, 85.52729797363281, 90.39326477050781, 95.25922393798828, 100.12518310546875, 104.99114990234375, 109.85711669921875, 114.72307586669922, 119.58903503417969, 124.45500183105469, 129.3209686279297, 134.18692016601562, 139.05288696289062, 143.91885375976562, 148.78482055664062, 153.65078735351562, 158.51673889160156, 163.38270568847656, 168.24867248535156, 173.1146240234375, 177.9805908203125, 182.8465576171875]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 6.0, 4.0, 6.0, 13.0, 8.0, 29.0, 17.0, 19.0, 29.0, 37.0, 24.0, 36.0, 43.0, 44.0, 31.0, 43.0, 52.0, 45.0, 50.0, 46.0, 37.0, 41.0, 32.0, 38.0, 33.0, 32.0, 29.0, 31.0, 20.0, 20.0, 15.0, 18.0, 17.0, 9.0, 13.0, 15.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.86894989013672, -23.96401023864746, -23.059070587158203, -22.154132843017578, -21.24919319152832, -20.344253540039062, -19.439313888549805, -18.534374237060547, -17.629436492919922, -16.724496841430664, -15.819558143615723, -14.914618492126465, -14.009679794311523, -13.104740142822266, -12.199800491333008, -11.29486083984375, -10.389921188354492, -9.484981536865234, -8.580042839050293, -7.675103187561035, -6.7701640129089355, -5.865224838256836, -4.960285186767578, -4.0553460121154785, -3.150406837463379, -2.2454676628112793, -1.3405282497406006, -0.4355888366699219, 0.46935033798217773, 1.3742895126342773, 2.279229164123535, 3.1841683387756348, 4.089107513427734, 4.994046688079834, 5.898985862731934, 6.803925514221191, 7.708864688873291, 8.61380386352539, 9.518743515014648, 10.423683166503906, 11.328621864318848, 12.233561515808105, 13.138500213623047, 14.043439865112305, 14.948379516601562, 15.853318214416504, 16.758258819580078, 17.663196563720703, 18.56813621520996, 19.47307586669922, 20.378015518188477, 21.282955169677734, 22.18789291381836, 23.092832565307617, 23.997772216796875, 24.902711868286133, 25.80765151977539, 26.71259117126465, 27.617530822753906, 28.52246856689453, 29.42740821838379, 30.332347869873047, 31.237287521362305, 32.14222717285156, 33.04716491699219]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 5.0, 3.0, 8.0, 5.0, 4.0, 6.0, 8.0, 12.0, 13.0, 19.0, 27.0, 17.0, 11.0, 19.0, 26.0, 29.0, 34.0, 28.0, 41.0, 31.0, 41.0, 32.0, 35.0, 31.0, 40.0, 44.0, 45.0, 36.0, 50.0, 29.0, 27.0, 27.0, 33.0, 16.0, 19.0, 24.0, 23.0, 14.0, 18.0, 18.0, 7.0, 16.0, 10.0, 4.0, 5.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-4.6875, -4.549072265625, -4.41064453125, -4.272216796875, -4.1337890625, -3.995361328125, -3.85693359375, -3.718505859375, -3.580078125, -3.441650390625, -3.30322265625, -3.164794921875, -3.0263671875, -2.887939453125, -2.74951171875, -2.611083984375, -2.47265625, -2.334228515625, -2.19580078125, -2.057373046875, -1.9189453125, -1.780517578125, -1.64208984375, -1.503662109375, -1.365234375, -1.226806640625, -1.08837890625, -0.949951171875, -0.8115234375, -0.673095703125, -0.53466796875, -0.396240234375, -0.2578125, -0.119384765625, 0.01904296875, 0.157470703125, 0.2958984375, 0.434326171875, 0.57275390625, 0.711181640625, 0.849609375, 0.988037109375, 1.12646484375, 1.264892578125, 1.4033203125, 1.541748046875, 1.68017578125, 1.818603515625, 1.95703125, 2.095458984375, 2.23388671875, 2.372314453125, 2.5107421875, 2.649169921875, 2.78759765625, 2.926025390625, 3.064453125, 3.202880859375, 3.34130859375, 3.479736328125, 3.6181640625, 3.756591796875, 3.89501953125, 4.033447265625, 4.171875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 3.0, 6.0, 4.0, 4.0, 15.0, 9.0, 22.0, 22.0, 24.0, 23.0, 33.0, 48.0, 58.0, 80.0, 104.0, 148.0, 181.0, 309.0, 424.0, 2095.0, 878101.0, 3307728.0, 3160.0, 519.0, 288.0, 249.0, 148.0, 93.0, 78.0, 65.0, 49.0, 28.0, 32.0, 29.0, 14.0, 17.0, 20.0, 16.0, 10.0, 2.0, 4.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.78125, -55.0107421875, -53.240234375, -51.4697265625, -49.69921875, -47.9287109375, -46.158203125, -44.3876953125, -42.6171875, -40.8466796875, -39.076171875, -37.3056640625, -35.53515625, -33.7646484375, -31.994140625, -30.2236328125, -28.453125, -26.6826171875, -24.912109375, -23.1416015625, -21.37109375, -19.6005859375, -17.830078125, -16.0595703125, -14.2890625, -12.5185546875, -10.748046875, -8.9775390625, -7.20703125, -5.4365234375, -3.666015625, -1.8955078125, -0.125, 1.6455078125, 3.416015625, 5.1865234375, 6.95703125, 8.7275390625, 10.498046875, 12.2685546875, 14.0390625, 15.8095703125, 17.580078125, 19.3505859375, 21.12109375, 22.8916015625, 24.662109375, 26.4326171875, 28.203125, 29.9736328125, 31.744140625, 33.5146484375, 35.28515625, 37.0556640625, 38.826171875, 40.5966796875, 42.3671875, 44.1376953125, 45.908203125, 47.6787109375, 49.44921875, 51.2197265625, 52.990234375, 54.7607421875, 56.53125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 6.0, 8.0, 9.0, 19.0, 20.0, 28.0, 45.0, 52.0, 65.0, 70.0, 117.0, 166.0, 188.0, 294.0, 454.0, 551.0, 554.0, 407.0, 267.0, 174.0, 145.0, 103.0, 78.0, 54.0, 48.0, 34.0, 24.0, 17.0, 17.0, 14.0, 5.0, 5.0, 6.0, 11.0, 3.0, 1.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.7734375, -6.56097412109375, -6.3485107421875, -6.13604736328125, -5.923583984375, -5.71112060546875, -5.4986572265625, -5.28619384765625, -5.07373046875, -4.86126708984375, -4.6488037109375, -4.43634033203125, -4.223876953125, -4.01141357421875, -3.7989501953125, -3.58648681640625, -3.3740234375, -3.16156005859375, -2.9490966796875, -2.73663330078125, -2.524169921875, -2.31170654296875, -2.0992431640625, -1.88677978515625, -1.67431640625, -1.46185302734375, -1.2493896484375, -1.03692626953125, -0.824462890625, -0.61199951171875, -0.3995361328125, -0.18707275390625, 0.025390625, 0.23785400390625, 0.4503173828125, 0.66278076171875, 0.875244140625, 1.08770751953125, 1.3001708984375, 1.51263427734375, 1.72509765625, 1.93756103515625, 2.1500244140625, 2.36248779296875, 2.574951171875, 2.78741455078125, 2.9998779296875, 3.21234130859375, 3.4248046875, 3.63726806640625, 3.8497314453125, 4.06219482421875, 4.274658203125, 4.48712158203125, 4.6995849609375, 4.91204833984375, 5.12451171875, 5.33697509765625, 5.5494384765625, 5.76190185546875, 5.974365234375, 6.18682861328125, 6.3992919921875, 6.61175537109375, 6.82421875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 6.0, 5.0, 12.0, 8.0, 10.0, 12.0, 18.0, 18.0, 23.0, 34.0, 25.0, 37.0, 52.0, 90.0, 164.0, 388.0, 1291.0, 7491.0, 99391.0, 3373680.0, 677563.0, 29308.0, 3233.0, 761.0, 236.0, 114.0, 64.0, 48.0, 37.0, 35.0, 31.0, 17.0, 25.0, 9.0, 8.0, 7.0, 5.0, 4.0, 1.0, 3.0, 8.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.078125, -21.36083984375, -20.6435546875, -19.92626953125, -19.208984375, -18.49169921875, -17.7744140625, -17.05712890625, -16.33984375, -15.62255859375, -14.9052734375, -14.18798828125, -13.470703125, -12.75341796875, -12.0361328125, -11.31884765625, -10.6015625, -9.88427734375, -9.1669921875, -8.44970703125, -7.732421875, -7.01513671875, -6.2978515625, -5.58056640625, -4.86328125, -4.14599609375, -3.4287109375, -2.71142578125, -1.994140625, -1.27685546875, -0.5595703125, 0.15771484375, 0.875, 1.59228515625, 2.3095703125, 3.02685546875, 3.744140625, 4.46142578125, 5.1787109375, 5.89599609375, 6.61328125, 7.33056640625, 8.0478515625, 8.76513671875, 9.482421875, 10.19970703125, 10.9169921875, 11.63427734375, 12.3515625, 13.06884765625, 13.7861328125, 14.50341796875, 15.220703125, 15.93798828125, 16.6552734375, 17.37255859375, 18.08984375, 18.80712890625, 19.5244140625, 20.24169921875, 20.958984375, 21.67626953125, 22.3935546875, 23.11083984375, 23.828125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 65.0, 338.0, 446.0, 145.0, 15.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-213.1513214111328, -209.1475067138672, -205.14369201660156, -201.139892578125, -197.13607788085938, -193.13226318359375, -189.12844848632812, -185.1246337890625, -181.12081909179688, -177.11700439453125, -173.11318969726562, -169.10939025878906, -165.10557556152344, -161.1017608642578, -157.0979461669922, -153.09413146972656, -149.09033203125, -145.08651733398438, -141.08270263671875, -137.0789031982422, -133.07508850097656, -129.07127380371094, -125.06745910644531, -121.06364440917969, -117.0598373413086, -113.05602264404297, -109.05221557617188, -105.04840087890625, -101.04458618164062, -97.04077911376953, -93.0369644165039, -89.03315734863281, -85.02933502197266, -81.02552032470703, -77.02171325683594, -73.01789855957031, -69.01408386230469, -65.0102767944336, -61.00646209716797, -57.00265121459961, -52.99884033203125, -48.99502944946289, -44.99121856689453, -40.987403869628906, -36.98359298706055, -32.97978210449219, -28.975969314575195, -24.972156524658203, -20.968345642089844, -16.964534759521484, -12.960721969604492, -8.956910133361816, -4.953098297119141, -0.9492874145507812, 3.054525375366211, 7.058338165283203, 11.062149047851562, 15.065960884094238, 19.069772720336914, 23.073585510253906, 27.077396392822266, 31.081207275390625, 35.08502197265625, 39.08883285522461, 43.09264373779297]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 2.0, 4.0, 4.0, 10.0, 6.0, 13.0, 13.0, 8.0, 14.0, 20.0, 20.0, 14.0, 22.0, 27.0, 23.0, 34.0, 26.0, 35.0, 53.0, 38.0, 39.0, 54.0, 29.0, 42.0, 44.0, 37.0, 36.0, 33.0, 37.0, 30.0, 27.0, 35.0, 24.0, 20.0, 16.0, 17.0, 17.0, 14.0, 11.0, 13.0, 9.0, 6.0, 8.0, 5.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.170665740966797, -22.445714950561523, -21.72076416015625, -20.995813369750977, -20.270862579345703, -19.54591178894043, -18.820960998535156, -18.096010208129883, -17.37105941772461, -16.646108627319336, -15.921157836914062, -15.196207046508789, -14.471256256103516, -13.746305465698242, -13.021354675292969, -12.296403884887695, -11.571452140808105, -10.846501350402832, -10.121550559997559, -9.396599769592285, -8.671648979187012, -7.946698188781738, -7.221746921539307, -6.496796131134033, -5.77184534072876, -5.046894550323486, -4.321943759918213, -3.5969927310943604, -2.872041940689087, -2.1470911502838135, -1.422140121459961, -0.6971893310546875, 0.027761459350585938, 0.7527123093605042, 1.4776631593704224, 2.2026140689849854, 2.927564859390259, 3.6525156497955322, 4.377466678619385, 5.102417469024658, 5.827368259429932, 6.552319049835205, 7.2772698402404785, 8.00222110748291, 8.727171897888184, 9.452122688293457, 10.17707347869873, 10.902024269104004, 11.626975059509277, 12.35192584991455, 13.076876640319824, 13.801827430725098, 14.526778221130371, 15.251729011535645, 15.976680755615234, 16.701631546020508, 17.42658233642578, 18.151533126831055, 18.876483917236328, 19.6014347076416, 20.326385498046875, 21.05133628845215, 21.776287078857422, 22.501237869262695, 23.22618865966797]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 1.0, 4.0, 6.0, 7.0, 9.0, 9.0, 13.0, 18.0, 15.0, 10.0, 21.0, 23.0, 26.0, 37.0, 31.0, 30.0, 37.0, 27.0, 35.0, 31.0, 35.0, 46.0, 45.0, 27.0, 34.0, 52.0, 33.0, 34.0, 34.0, 31.0, 23.0, 14.0, 34.0, 20.0, 18.0, 12.0, 19.0, 16.0, 23.0, 15.0, 9.0, 7.0, 8.0, 7.0, 3.0, 1.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.4921875, -4.35870361328125, -4.2252197265625, -4.09173583984375, -3.958251953125, -3.82476806640625, -3.6912841796875, -3.55780029296875, -3.42431640625, -3.29083251953125, -3.1573486328125, -3.02386474609375, -2.890380859375, -2.75689697265625, -2.6234130859375, -2.48992919921875, -2.3564453125, -2.22296142578125, -2.0894775390625, -1.95599365234375, -1.822509765625, -1.68902587890625, -1.5555419921875, -1.42205810546875, -1.28857421875, -1.15509033203125, -1.0216064453125, -0.88812255859375, -0.754638671875, -0.62115478515625, -0.4876708984375, -0.35418701171875, -0.220703125, -0.08721923828125, 0.0462646484375, 0.17974853515625, 0.313232421875, 0.44671630859375, 0.5802001953125, 0.71368408203125, 0.84716796875, 0.98065185546875, 1.1141357421875, 1.24761962890625, 1.381103515625, 1.51458740234375, 1.6480712890625, 1.78155517578125, 1.9150390625, 2.04852294921875, 2.1820068359375, 2.31549072265625, 2.448974609375, 2.58245849609375, 2.7159423828125, 2.84942626953125, 2.98291015625, 3.11639404296875, 3.2498779296875, 3.38336181640625, 3.516845703125, 3.65032958984375, 3.7838134765625, 3.91729736328125, 4.05078125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 9.0, 20.0, 16.0, 51.0, 44.0, 82.0, 118.0, 145.0, 266.0, 383.0, 613.0, 909.0, 1456.0, 2163.0, 3246.0, 5000.0, 8008.0, 12994.0, 21800.0, 37784.0, 69582.0, 145277.0, 331936.0, 200944.0, 89636.0, 46585.0, 26633.0, 16023.0, 9852.0, 6117.0, 3806.0, 2460.0, 1521.0, 996.0, 634.0, 454.0, 304.0, 206.0, 152.0, 98.0, 59.0, 56.0, 26.0, 26.0, 15.0, 15.0, 7.0, 9.0, 4.0, 4.0, 2.0, 1.0], "bins": [-0.211181640625, -0.2050933837890625, -0.199005126953125, -0.1929168701171875, -0.18682861328125, -0.1807403564453125, -0.174652099609375, -0.1685638427734375, -0.1624755859375, -0.1563873291015625, -0.150299072265625, -0.1442108154296875, -0.13812255859375, -0.1320343017578125, -0.125946044921875, -0.1198577880859375, -0.11376953125, -0.1076812744140625, -0.101593017578125, -0.0955047607421875, -0.08941650390625, -0.0833282470703125, -0.077239990234375, -0.0711517333984375, -0.0650634765625, -0.0589752197265625, -0.052886962890625, -0.0467987060546875, -0.04071044921875, -0.0346221923828125, -0.028533935546875, -0.0224456787109375, -0.016357421875, -0.0102691650390625, -0.004180908203125, 0.0019073486328125, 0.00799560546875, 0.0140838623046875, 0.020172119140625, 0.0262603759765625, 0.0323486328125, 0.0384368896484375, 0.044525146484375, 0.0506134033203125, 0.05670166015625, 0.0627899169921875, 0.068878173828125, 0.0749664306640625, 0.0810546875, 0.0871429443359375, 0.093231201171875, 0.0993194580078125, 0.10540771484375, 0.1114959716796875, 0.117584228515625, 0.1236724853515625, 0.1297607421875, 0.1358489990234375, 0.141937255859375, 0.1480255126953125, 0.15411376953125, 0.1602020263671875, 0.166290283203125, 0.1723785400390625, 0.178466796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 5.0, 5.0, 6.0, 7.0, 14.0, 15.0, 12.0, 17.0, 20.0, 11.0, 21.0, 23.0, 33.0, 21.0, 28.0, 31.0, 39.0, 28.0, 32.0, 28.0, 39.0, 41.0, 1059.0, 41.0, 42.0, 35.0, 34.0, 38.0, 25.0, 31.0, 34.0, 20.0, 35.0, 18.0, 13.0, 16.0, 9.0, 18.0, 18.0, 19.0, 9.0, 8.0, 5.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.74609375, -2.66107177734375, -2.5760498046875, -2.49102783203125, -2.406005859375, -2.32098388671875, -2.2359619140625, -2.15093994140625, -2.06591796875, -1.98089599609375, -1.8958740234375, -1.81085205078125, -1.725830078125, -1.64080810546875, -1.5557861328125, -1.47076416015625, -1.3857421875, -1.30072021484375, -1.2156982421875, -1.13067626953125, -1.045654296875, -0.96063232421875, -0.8756103515625, -0.79058837890625, -0.70556640625, -0.62054443359375, -0.5355224609375, -0.45050048828125, -0.365478515625, -0.28045654296875, -0.1954345703125, -0.11041259765625, -0.025390625, 0.05963134765625, 0.1446533203125, 0.22967529296875, 0.314697265625, 0.39971923828125, 0.4847412109375, 0.56976318359375, 0.65478515625, 0.73980712890625, 0.8248291015625, 0.90985107421875, 0.994873046875, 1.07989501953125, 1.1649169921875, 1.24993896484375, 1.3349609375, 1.41998291015625, 1.5050048828125, 1.59002685546875, 1.675048828125, 1.76007080078125, 1.8450927734375, 1.93011474609375, 2.01513671875, 2.10015869140625, 2.1851806640625, 2.27020263671875, 2.355224609375, 2.44024658203125, 2.5252685546875, 2.61029052734375, 2.6953125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 10.0, 14.0, 12.0, 29.0, 52.0, 74.0, 101.0, 188.0, 261.0, 354.0, 596.0, 844.0, 1312.0, 1905.0, 3011.0, 4857.0, 7683.0, 12500.0, 20771.0, 35220.0, 61697.0, 116160.0, 235521.0, 1305961.0, 125769.0, 66413.0, 37854.0, 22138.0, 13231.0, 8197.0, 5207.0, 3126.0, 2077.0, 1351.0, 924.0, 550.0, 373.0, 276.0, 176.0, 120.0, 65.0, 44.0, 44.0, 18.0, 15.0, 12.0, 9.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08148193359375, -0.07877159118652344, -0.07606124877929688, -0.07335090637207031, -0.07064056396484375, -0.06793022155761719, -0.06521987915039062, -0.06250953674316406, -0.0597991943359375, -0.05708885192871094, -0.054378509521484375, -0.05166816711425781, -0.04895782470703125, -0.04624748229980469, -0.043537139892578125, -0.04082679748535156, -0.038116455078125, -0.03540611267089844, -0.032695770263671875, -0.029985427856445312, -0.02727508544921875, -0.024564743041992188, -0.021854400634765625, -0.019144058227539062, -0.0164337158203125, -0.013723373413085938, -0.011013031005859375, -0.008302688598632812, -0.00559234619140625, -0.0028820037841796875, -0.000171661376953125, 0.0025386810302734375, 0.0052490234375, 0.007959365844726562, 0.010669708251953125, 0.013380050659179688, 0.01609039306640625, 0.018800735473632812, 0.021511077880859375, 0.024221420288085938, 0.0269317626953125, 0.029642105102539062, 0.032352447509765625, 0.03506278991699219, 0.03777313232421875, 0.04048347473144531, 0.043193817138671875, 0.04590415954589844, 0.048614501953125, 0.05132484436035156, 0.054035186767578125, 0.05674552917480469, 0.05945587158203125, 0.06216621398925781, 0.06487655639648438, 0.06758689880371094, 0.0702972412109375, 0.07300758361816406, 0.07571792602539062, 0.07842826843261719, 0.08113861083984375, 0.08384895324707031, 0.08655929565429688, 0.08926963806152344, 0.09197998046875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 10.0, 7.0, 10.0, 13.0, 28.0, 17.0, 31.0, 40.0, 41.0, 57.0, 62.0, 81.0, 109.0, 90.0, 80.0, 60.0, 52.0, 53.0, 41.0, 25.0, 19.0, 13.0, 14.0, 11.0, 6.0, 4.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.2782554626464844e-05, -3.19136306643486e-05, -3.104470670223236e-05, -3.017578274011612e-05, -2.9306858777999878e-05, -2.8437934815883636e-05, -2.7569010853767395e-05, -2.6700086891651154e-05, -2.5831162929534912e-05, -2.496223896741867e-05, -2.409331500530243e-05, -2.3224391043186188e-05, -2.2355467081069946e-05, -2.1486543118953705e-05, -2.0617619156837463e-05, -1.9748695194721222e-05, -1.887977123260498e-05, -1.801084727048874e-05, -1.7141923308372498e-05, -1.6272999346256256e-05, -1.5404075384140015e-05, -1.4535151422023773e-05, -1.3666227459907532e-05, -1.279730349779129e-05, -1.1928379535675049e-05, -1.1059455573558807e-05, -1.0190531611442566e-05, -9.321607649326324e-06, -8.452683687210083e-06, -7.5837597250938416e-06, -6.7148357629776e-06, -5.845911800861359e-06, -4.976987838745117e-06, -4.108063876628876e-06, -3.2391399145126343e-06, -2.370215952396393e-06, -1.5012919902801514e-06, -6.323680281639099e-07, 2.3655593395233154e-07, 1.105479896068573e-06, 1.9744038581848145e-06, 2.843327820301056e-06, 3.7122517824172974e-06, 4.581175744533539e-06, 5.45009970664978e-06, 6.319023668766022e-06, 7.187947630882263e-06, 8.056871592998505e-06, 8.925795555114746e-06, 9.794719517230988e-06, 1.0663643479347229e-05, 1.153256744146347e-05, 1.2401491403579712e-05, 1.3270415365695953e-05, 1.4139339327812195e-05, 1.5008263289928436e-05, 1.5877187252044678e-05, 1.674611121416092e-05, 1.761503517627716e-05, 1.8483959138393402e-05, 1.9352883100509644e-05, 2.0221807062625885e-05, 2.1090731024742126e-05, 2.1959654986858368e-05, 2.282857894897461e-05]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 9.0, 3.0, 7.0, 6.0, 14.0, 22.0, 27.0, 26.0, 39.0, 71.0, 111.0, 140.0, 368.0, 2105.0, 1008148.0, 36322.0, 560.0, 203.0, 108.0, 70.0, 63.0, 26.0, 40.0, 15.0, 15.0, 9.0, 8.0, 8.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005388259887695312, -0.0005178898572921753, -0.0004969537258148193, -0.0004760175943374634, -0.0004550814628601074, -0.00043414533138275146, -0.0004132091999053955, -0.00039227306842803955, -0.0003713369369506836, -0.00035040080547332764, -0.0003294646739959717, -0.0003085285425186157, -0.00028759241104125977, -0.0002666562795639038, -0.00024572014808654785, -0.0002247840166091919, -0.00020384788513183594, -0.00018291175365447998, -0.00016197562217712402, -0.00014103949069976807, -0.00012010335922241211, -9.916722774505615e-05, -7.82310962677002e-05, -5.729496479034424e-05, -3.635883331298828e-05, -1.5422701835632324e-05, 5.513429641723633e-06, 2.644956111907959e-05, 4.738569259643555e-05, 6.83218240737915e-05, 8.925795555114746e-05, 0.00011019408702850342, 0.00013113021850585938, 0.00015206634998321533, 0.0001730024814605713, 0.00019393861293792725, 0.0002148747444152832, 0.00023581087589263916, 0.0002567470073699951, 0.0002776831388473511, 0.00029861927032470703, 0.000319555401802063, 0.00034049153327941895, 0.0003614276647567749, 0.00038236379623413086, 0.0004032999277114868, 0.0004242360591888428, 0.00044517219066619873, 0.0004661083221435547, 0.00048704445362091064, 0.0005079805850982666, 0.0005289167165756226, 0.0005498528480529785, 0.0005707889795303345, 0.0005917251110076904, 0.0006126612424850464, 0.0006335973739624023, 0.0006545335054397583, 0.0006754696369171143, 0.0006964057683944702, 0.0007173418998718262, 0.0007382780313491821, 0.0007592141628265381, 0.000780150294303894, 0.00080108642578125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 16.0, 984.0, 17.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.345514051034115e-05, -2.3860206056269817e-05, -1.4265271602198482e-05, -4.670337148127146e-06, 4.9245973059441894e-06, 1.4519533579004928e-05, 2.411446621408686e-05, 3.370939884916879e-05, 4.330433512222953e-05, 5.289926775731146e-05, 6.24942040303722e-05, 7.208914030343294e-05, 8.168407657649368e-05, 9.127901284955442e-05, 0.00010087394184665754, 0.00011046887084376067, 0.00012006380711682141, 0.00012965874338988215, 0.00013925367966294289, 0.00014884861593600363, 0.00015844355220906436, 0.00016803847393020988, 0.00017763341020327061, 0.00018722834647633135, 0.0001968232827493921, 0.00020641821902245283, 0.00021601315529551357, 0.0002256080915685743, 0.00023520301328971982, 0.0002447979641146958, 0.0002543928858358413, 0.0002639878075569868, 0.0002735827583819628, 0.0002831776801031083, 0.00029277263092808425, 0.00030236755264922976, 0.00031196250347420573, 0.00032155742519535124, 0.0003311523760203272, 0.0003407472977414727, 0.0003503422485664487, 0.0003599371702875942, 0.00036953212111257017, 0.0003791270428337157, 0.00038872199365869164, 0.00039831691537983716, 0.0004079118662048131, 0.00041750678792595863, 0.00042710170964710414, 0.00043669663136824965, 0.0004462915821932256, 0.00045588650391437113, 0.0004654814547393471, 0.0004750763764604926, 0.0004846713272854686, 0.0004942662781104445, 0.0005038611707277596, 0.0005134561215527356, 0.0005230510141700506, 0.0005326459649950266, 0.0005422409158200026, 0.0005518358666449785, 0.0005614307592622936, 0.0005710257100872695, 0.0005806206609122455]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 5.0, 10.0, 14.0, 17.0, 23.0, 32.0, 38.0, 37.0, 51.0, 56.0, 64.0, 71.0, 66.0, 68.0, 75.0, 62.0, 52.0, 50.0, 68.0, 30.0, 31.0, 26.0, 18.0, 12.0, 10.0, 8.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.288818359375e-05, -2.2220425307750702e-05, -2.1552667021751404e-05, -2.0884908735752106e-05, -2.0217150449752808e-05, -1.954939216375351e-05, -1.888163387775421e-05, -1.8213875591754913e-05, -1.7546117305755615e-05, -1.6878359019756317e-05, -1.621060073375702e-05, -1.554284244775772e-05, -1.4875084161758423e-05, -1.4207325875759125e-05, -1.3539567589759827e-05, -1.2871809303760529e-05, -1.220405101776123e-05, -1.1536292731761932e-05, -1.0868534445762634e-05, -1.0200776159763336e-05, -9.533017873764038e-06, -8.86525958776474e-06, -8.197501301765442e-06, -7.529743015766144e-06, -6.861984729766846e-06, -6.194226443767548e-06, -5.5264681577682495e-06, -4.858709871768951e-06, -4.190951585769653e-06, -3.5231932997703552e-06, -2.855435013771057e-06, -2.187676727771759e-06, -1.519918441772461e-06, -8.521601557731628e-07, -1.8440186977386475e-07, 4.833564162254333e-07, 1.1511147022247314e-06, 1.8188729882240295e-06, 2.4866312742233276e-06, 3.1543895602226257e-06, 3.822147846221924e-06, 4.489906132221222e-06, 5.15766441822052e-06, 5.825422704219818e-06, 6.493180990219116e-06, 7.160939276218414e-06, 7.828697562217712e-06, 8.49645584821701e-06, 9.164214134216309e-06, 9.831972420215607e-06, 1.0499730706214905e-05, 1.1167488992214203e-05, 1.1835247278213501e-05, 1.2503005564212799e-05, 1.3170763850212097e-05, 1.3838522136211395e-05, 1.4506280422210693e-05, 1.5174038708209991e-05, 1.584179699420929e-05, 1.6509555280208588e-05, 1.7177313566207886e-05, 1.7845071852207184e-05, 1.8512830138206482e-05, 1.918058842420578e-05, 1.9848346710205078e-05]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 1.0, 4.0, 6.0, 7.0, 9.0, 9.0, 13.0, 18.0, 15.0, 10.0, 21.0, 23.0, 26.0, 37.0, 31.0, 30.0, 37.0, 27.0, 35.0, 31.0, 35.0, 46.0, 45.0, 27.0, 34.0, 52.0, 33.0, 34.0, 34.0, 31.0, 23.0, 14.0, 34.0, 20.0, 18.0, 12.0, 19.0, 16.0, 23.0, 15.0, 9.0, 7.0, 8.0, 7.0, 3.0, 1.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.4921875, -4.35870361328125, -4.2252197265625, -4.09173583984375, -3.958251953125, -3.82476806640625, -3.6912841796875, -3.55780029296875, -3.42431640625, -3.29083251953125, -3.1573486328125, -3.02386474609375, -2.890380859375, -2.75689697265625, -2.6234130859375, -2.48992919921875, -2.3564453125, -2.22296142578125, -2.0894775390625, -1.95599365234375, -1.822509765625, -1.68902587890625, -1.5555419921875, -1.42205810546875, -1.28857421875, -1.15509033203125, -1.0216064453125, -0.88812255859375, -0.754638671875, -0.62115478515625, -0.4876708984375, -0.35418701171875, -0.220703125, -0.08721923828125, 0.0462646484375, 0.17974853515625, 0.313232421875, 0.44671630859375, 0.5802001953125, 0.71368408203125, 0.84716796875, 0.98065185546875, 1.1141357421875, 1.24761962890625, 1.381103515625, 1.51458740234375, 1.6480712890625, 1.78155517578125, 1.9150390625, 2.04852294921875, 2.1820068359375, 2.31549072265625, 2.448974609375, 2.58245849609375, 2.7159423828125, 2.84942626953125, 2.98291015625, 3.11639404296875, 3.2498779296875, 3.38336181640625, 3.516845703125, 3.65032958984375, 3.7838134765625, 3.91729736328125, 4.05078125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 9.0, 7.0, 4.0, 15.0, 15.0, 19.0, 32.0, 45.0, 55.0, 86.0, 120.0, 171.0, 248.0, 319.0, 498.0, 680.0, 1162.0, 1905.0, 3377.0, 6435.0, 12598.0, 25507.0, 53126.0, 112402.0, 232094.0, 291830.0, 157916.0, 74948.0, 35750.0, 17377.0, 8602.0, 4453.0, 2491.0, 1386.0, 924.0, 580.0, 395.0, 261.0, 196.0, 140.0, 104.0, 73.0, 57.0, 34.0, 34.0, 21.0, 20.0, 13.0, 13.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.703125, -5.531494140625, -5.35986328125, -5.188232421875, -5.0166015625, -4.844970703125, -4.67333984375, -4.501708984375, -4.330078125, -4.158447265625, -3.98681640625, -3.815185546875, -3.6435546875, -3.471923828125, -3.30029296875, -3.128662109375, -2.95703125, -2.785400390625, -2.61376953125, -2.442138671875, -2.2705078125, -2.098876953125, -1.92724609375, -1.755615234375, -1.583984375, -1.412353515625, -1.24072265625, -1.069091796875, -0.8974609375, -0.725830078125, -0.55419921875, -0.382568359375, -0.2109375, -0.039306640625, 0.13232421875, 0.303955078125, 0.4755859375, 0.647216796875, 0.81884765625, 0.990478515625, 1.162109375, 1.333740234375, 1.50537109375, 1.677001953125, 1.8486328125, 2.020263671875, 2.19189453125, 2.363525390625, 2.53515625, 2.706787109375, 2.87841796875, 3.050048828125, 3.2216796875, 3.393310546875, 3.56494140625, 3.736572265625, 3.908203125, 4.079833984375, 4.25146484375, 4.423095703125, 4.5947265625, 4.766357421875, 4.93798828125, 5.109619140625, 5.28125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 6.0, 4.0, 9.0, 9.0, 18.0, 13.0, 14.0, 26.0, 29.0, 32.0, 30.0, 39.0, 55.0, 48.0, 86.0, 136.0, 243.0, 1429.0, 245.0, 142.0, 69.0, 51.0, 60.0, 36.0, 36.0, 30.0, 30.0, 31.0, 20.0, 22.0, 20.0, 5.0, 8.0, 3.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6640625, -13.243896484375, -12.82373046875, -12.403564453125, -11.9833984375, -11.563232421875, -11.14306640625, -10.722900390625, -10.302734375, -9.882568359375, -9.46240234375, -9.042236328125, -8.6220703125, -8.201904296875, -7.78173828125, -7.361572265625, -6.94140625, -6.521240234375, -6.10107421875, -5.680908203125, -5.2607421875, -4.840576171875, -4.42041015625, -4.000244140625, -3.580078125, -3.159912109375, -2.73974609375, -2.319580078125, -1.8994140625, -1.479248046875, -1.05908203125, -0.638916015625, -0.21875, 0.201416015625, 0.62158203125, 1.041748046875, 1.4619140625, 1.882080078125, 2.30224609375, 2.722412109375, 3.142578125, 3.562744140625, 3.98291015625, 4.403076171875, 4.8232421875, 5.243408203125, 5.66357421875, 6.083740234375, 6.50390625, 6.924072265625, 7.34423828125, 7.764404296875, 8.1845703125, 8.604736328125, 9.02490234375, 9.445068359375, 9.865234375, 10.285400390625, 10.70556640625, 11.125732421875, 11.5458984375, 11.966064453125, 12.38623046875, 12.806396484375, 13.2265625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 5.0, 9.0, 13.0, 9.0, 12.0, 17.0, 33.0, 42.0, 52.0, 56.0, 101.0, 155.0, 244.0, 440.0, 893.0, 3025.0, 484398.0, 2647453.0, 6338.0, 1072.0, 531.0, 303.0, 163.0, 94.0, 63.0, 40.0, 34.0, 30.0, 24.0, 12.0, 13.0, 4.0, 5.0, 7.0, 8.0, 2.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.921875, -26.852783203125, -25.78369140625, -24.714599609375, -23.6455078125, -22.576416015625, -21.50732421875, -20.438232421875, -19.369140625, -18.300048828125, -17.23095703125, -16.161865234375, -15.0927734375, -14.023681640625, -12.95458984375, -11.885498046875, -10.81640625, -9.747314453125, -8.67822265625, -7.609130859375, -6.5400390625, -5.470947265625, -4.40185546875, -3.332763671875, -2.263671875, -1.194580078125, -0.12548828125, 0.943603515625, 2.0126953125, 3.081787109375, 4.15087890625, 5.219970703125, 6.2890625, 7.358154296875, 8.42724609375, 9.496337890625, 10.5654296875, 11.634521484375, 12.70361328125, 13.772705078125, 14.841796875, 15.910888671875, 16.97998046875, 18.049072265625, 19.1181640625, 20.187255859375, 21.25634765625, 22.325439453125, 23.39453125, 24.463623046875, 25.53271484375, 26.601806640625, 27.6708984375, 28.739990234375, 29.80908203125, 30.878173828125, 31.947265625, 33.016357421875, 34.08544921875, 35.154541015625, 36.2236328125, 37.292724609375, 38.36181640625, 39.430908203125, 40.5]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 22.0, 43.0, 71.0, 131.0, 175.0, 184.0, 172.0, 108.0, 60.0, 24.0, 10.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.24229431152344, -70.68155670166016, -69.12081146240234, -67.56007385253906, -65.99932861328125, -64.43859100341797, -62.877845764160156, -61.31710433959961, -59.75636291503906, -58.195621490478516, -56.63488006591797, -55.07413864135742, -53.513397216796875, -51.95265579223633, -50.39191436767578, -48.831172943115234, -47.27043151855469, -45.70969009399414, -44.148948669433594, -42.58820724487305, -41.0274658203125, -39.46672439575195, -37.905982971191406, -36.34524154663086, -34.78450393676758, -33.22376251220703, -31.663021087646484, -30.102279663085938, -28.54153823852539, -26.980796813964844, -25.420055389404297, -23.85931396484375, -22.298572540283203, -20.737831115722656, -19.17708969116211, -17.616348266601562, -16.055606842041016, -14.494865417480469, -12.934124946594238, -11.373383522033691, -9.812642097473145, -8.251900672912598, -6.691159248352051, -5.130418300628662, -3.5696768760681152, -2.0089354515075684, -0.4481945037841797, 1.1125469207763672, 2.673288345336914, 4.234029769897461, 5.794771194458008, 7.3555121421813965, 8.916254043579102, 10.476995468139648, 12.037735939025879, 13.598477363586426, 15.159218788146973, 16.719959259033203, 18.28070068359375, 19.841442108154297, 21.402183532714844, 22.96292495727539, 24.523666381835938, 26.084407806396484, 27.64514923095703]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 9.0, 8.0, 6.0, 8.0, 17.0, 7.0, 11.0, 18.0, 16.0, 20.0, 18.0, 24.0, 31.0, 30.0, 29.0, 43.0, 38.0, 37.0, 48.0, 47.0, 34.0, 39.0, 45.0, 47.0, 46.0, 35.0, 34.0, 25.0, 26.0, 37.0, 17.0, 17.0, 17.0, 20.0, 14.0, 9.0, 16.0, 8.0, 14.0, 7.0, 7.0, 4.0, 5.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-36.54753875732422, -35.44721603393555, -34.34689712524414, -33.24657440185547, -32.1462516784668, -31.045930862426758, -29.94561004638672, -28.845287322998047, -27.744966506958008, -26.64464569091797, -25.544322967529297, -24.444002151489258, -23.34368133544922, -22.243358612060547, -21.143037796020508, -20.04271697998047, -18.942394256591797, -17.842073440551758, -16.741750717163086, -15.641429901123047, -14.541108131408691, -13.440786361694336, -12.340465545654297, -11.240143775939941, -10.139822006225586, -9.03950023651123, -7.939178943634033, -6.838857650756836, -5.7385358810424805, -4.638214111328125, -3.5378928184509277, -2.4375715255737305, -1.337249755859375, -0.23692822456359863, 0.8633933067321777, 1.963714838027954, 3.0640363693237305, 4.164358139038086, 5.264679431915283, 6.3650007247924805, 7.465322494506836, 8.565644264221191, 9.665966033935547, 10.766286849975586, 11.866608619689941, 12.966930389404297, 14.067251205444336, 15.167572975158691, 16.267894744873047, 17.368215560913086, 18.468538284301758, 19.568859100341797, 20.66918182373047, 21.769502639770508, 22.869823455810547, 23.97014617919922, 25.070466995239258, 26.170787811279297, 27.27111053466797, 28.371431350708008, 29.471752166748047, 30.57207489013672, 31.672395706176758, 32.7727165222168, 33.87303924560547]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 8.0, 4.0, 10.0, 6.0, 13.0, 19.0, 22.0, 21.0, 25.0, 24.0, 27.0, 29.0, 31.0, 40.0, 38.0, 49.0, 43.0, 29.0, 44.0, 44.0, 45.0, 38.0, 44.0, 41.0, 29.0, 44.0, 25.0, 28.0, 27.0, 16.0, 21.0, 11.0, 13.0, 28.0, 17.0, 9.0, 13.0, 7.0, 4.0, 6.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.94122314453125, -4.7886962890625, -4.63616943359375, -4.483642578125, -4.33111572265625, -4.1785888671875, -4.02606201171875, -3.87353515625, -3.72100830078125, -3.5684814453125, -3.41595458984375, -3.263427734375, -3.11090087890625, -2.9583740234375, -2.80584716796875, -2.6533203125, -2.50079345703125, -2.3482666015625, -2.19573974609375, -2.043212890625, -1.89068603515625, -1.7381591796875, -1.58563232421875, -1.43310546875, -1.28057861328125, -1.1280517578125, -0.97552490234375, -0.822998046875, -0.67047119140625, -0.5179443359375, -0.36541748046875, -0.212890625, -0.06036376953125, 0.0921630859375, 0.24468994140625, 0.397216796875, 0.54974365234375, 0.7022705078125, 0.85479736328125, 1.00732421875, 1.15985107421875, 1.3123779296875, 1.46490478515625, 1.617431640625, 1.76995849609375, 1.9224853515625, 2.07501220703125, 2.2275390625, 2.38006591796875, 2.5325927734375, 2.68511962890625, 2.837646484375, 2.99017333984375, 3.1427001953125, 3.29522705078125, 3.44775390625, 3.60028076171875, 3.7528076171875, 3.90533447265625, 4.057861328125, 4.21038818359375, 4.3629150390625, 4.51544189453125, 4.66796875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 1.0, 11.0, 5.0, 10.0, 15.0, 28.0, 22.0, 48.0, 67.0, 83.0, 132.0, 181.0, 318.0, 434.0, 635.0, 981.0, 1553.0, 2576.0, 4599.0, 8495.0, 18672.0, 56504.0, 264990.0, 1179047.0, 1901380.0, 583416.0, 112375.0, 30231.0, 12347.0, 6183.0, 3334.0, 1905.0, 1248.0, 828.0, 513.0, 362.0, 233.0, 166.0, 117.0, 76.0, 47.0, 38.0, 24.0, 18.0, 14.0, 5.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.18359375, -6.9608154296875, -6.738037109375, -6.5152587890625, -6.29248046875, -6.0697021484375, -5.846923828125, -5.6241455078125, -5.4013671875, -5.1785888671875, -4.955810546875, -4.7330322265625, -4.51025390625, -4.2874755859375, -4.064697265625, -3.8419189453125, -3.619140625, -3.3963623046875, -3.173583984375, -2.9508056640625, -2.72802734375, -2.5052490234375, -2.282470703125, -2.0596923828125, -1.8369140625, -1.6141357421875, -1.391357421875, -1.1685791015625, -0.94580078125, -0.7230224609375, -0.500244140625, -0.2774658203125, -0.0546875, 0.1680908203125, 0.390869140625, 0.6136474609375, 0.83642578125, 1.0592041015625, 1.281982421875, 1.5047607421875, 1.7275390625, 1.9503173828125, 2.173095703125, 2.3958740234375, 2.61865234375, 2.8414306640625, 3.064208984375, 3.2869873046875, 3.509765625, 3.7325439453125, 3.955322265625, 4.1781005859375, 4.40087890625, 4.6236572265625, 4.846435546875, 5.0692138671875, 5.2919921875, 5.5147705078125, 5.737548828125, 5.9603271484375, 6.18310546875, 6.4058837890625, 6.628662109375, 6.8514404296875, 7.07421875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 7.0, 6.0, 11.0, 11.0, 22.0, 29.0, 34.0, 53.0, 94.0, 111.0, 166.0, 253.0, 332.0, 470.0, 595.0, 532.0, 411.0, 273.0, 195.0, 122.0, 96.0, 73.0, 50.0, 31.0, 20.0, 21.0, 17.0, 5.0, 8.0, 8.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30859375, -6.03070068359375, -5.7528076171875, -5.47491455078125, -5.197021484375, -4.91912841796875, -4.6412353515625, -4.36334228515625, -4.08544921875, -3.80755615234375, -3.5296630859375, -3.25177001953125, -2.973876953125, -2.69598388671875, -2.4180908203125, -2.14019775390625, -1.8623046875, -1.58441162109375, -1.3065185546875, -1.02862548828125, -0.750732421875, -0.47283935546875, -0.1949462890625, 0.08294677734375, 0.36083984375, 0.63873291015625, 0.9166259765625, 1.19451904296875, 1.472412109375, 1.75030517578125, 2.0281982421875, 2.30609130859375, 2.583984375, 2.86187744140625, 3.1397705078125, 3.41766357421875, 3.695556640625, 3.97344970703125, 4.2513427734375, 4.52923583984375, 4.80712890625, 5.08502197265625, 5.3629150390625, 5.64080810546875, 5.918701171875, 6.19659423828125, 6.4744873046875, 6.75238037109375, 7.0302734375, 7.30816650390625, 7.5860595703125, 7.86395263671875, 8.141845703125, 8.41973876953125, 8.6976318359375, 8.97552490234375, 9.25341796875, 9.53131103515625, 9.8092041015625, 10.08709716796875, 10.364990234375, 10.64288330078125, 10.9207763671875, 11.19866943359375, 11.4765625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 8.0, 16.0, 25.0, 51.0, 63.0, 116.0, 190.0, 352.0, 710.0, 1305.0, 3265.0, 10706.0, 55111.0, 482682.0, 3038526.0, 524381.0, 59084.0, 11487.0, 3352.0, 1382.0, 580.0, 362.0, 181.0, 124.0, 87.0, 48.0, 29.0, 20.0, 10.0, 9.0, 6.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.484375, -15.092529296875, -14.70068359375, -14.308837890625, -13.9169921875, -13.525146484375, -13.13330078125, -12.741455078125, -12.349609375, -11.957763671875, -11.56591796875, -11.174072265625, -10.7822265625, -10.390380859375, -9.99853515625, -9.606689453125, -9.21484375, -8.822998046875, -8.43115234375, -8.039306640625, -7.6474609375, -7.255615234375, -6.86376953125, -6.471923828125, -6.080078125, -5.688232421875, -5.29638671875, -4.904541015625, -4.5126953125, -4.120849609375, -3.72900390625, -3.337158203125, -2.9453125, -2.553466796875, -2.16162109375, -1.769775390625, -1.3779296875, -0.986083984375, -0.59423828125, -0.202392578125, 0.189453125, 0.581298828125, 0.97314453125, 1.364990234375, 1.7568359375, 2.148681640625, 2.54052734375, 2.932373046875, 3.32421875, 3.716064453125, 4.10791015625, 4.499755859375, 4.8916015625, 5.283447265625, 5.67529296875, 6.067138671875, 6.458984375, 6.850830078125, 7.24267578125, 7.634521484375, 8.0263671875, 8.418212890625, 8.81005859375, 9.201904296875, 9.59375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 206.0, 764.0, 45.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-447.92669677734375, -438.25347900390625, -428.5802307128906, -418.9070129394531, -409.2337951660156, -399.560546875, -389.8873291015625, -380.214111328125, -370.5408935546875, -360.86767578125, -351.1944274902344, -341.5212097167969, -331.8479919433594, -322.17474365234375, -312.50152587890625, -302.82830810546875, -293.1550598144531, -283.4818420410156, -273.80859375, -264.1353759765625, -254.462158203125, -244.78892517089844, -235.11569213867188, -225.44247436523438, -215.7692413330078, -206.09600830078125, -196.42279052734375, -186.7495574951172, -177.07632446289062, -167.40310668945312, -157.72987365722656, -148.056640625, -138.38343811035156, -128.710205078125, -119.0369873046875, -109.36375427246094, -99.6905288696289, -90.01730346679688, -80.34407043457031, -70.67084503173828, -60.99761962890625, -51.32439422607422, -41.65116500854492, -31.977937698364258, -22.304710388183594, -12.631484985351562, -2.9582557678222656, 6.714973449707031, 16.388198852539062, 26.061426162719727, 35.73465347290039, 45.40788269042969, 55.08110809326172, 64.75433349609375, 74.42756652832031, 84.10079193115234, 93.77401733398438, 103.4472427368164, 113.12046813964844, 122.793701171875, 132.4669189453125, 142.14015197753906, 151.81338500976562, 161.48660278320312, 171.1598358154297]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 10.0, 9.0, 4.0, 5.0, 9.0, 12.0, 13.0, 20.0, 15.0, 16.0, 29.0, 21.0, 15.0, 26.0, 34.0, 29.0, 30.0, 35.0, 39.0, 45.0, 37.0, 43.0, 57.0, 35.0, 43.0, 31.0, 39.0, 45.0, 34.0, 27.0, 29.0, 25.0, 22.0, 14.0, 13.0, 26.0, 12.0, 11.0, 15.0, 10.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.649154663085938, -25.79157257080078, -24.933988571166992, -24.076406478881836, -23.218822479248047, -22.36124038696289, -21.503658294677734, -20.646076202392578, -19.78849220275879, -18.930910110473633, -18.073326110839844, -17.215744018554688, -16.35816192626953, -15.500577926635742, -14.642995834350586, -13.785412788391113, -12.92782974243164, -12.070246696472168, -11.212663650512695, -10.355081558227539, -9.497498512268066, -8.639915466308594, -7.782332897186279, -6.924750328063965, -6.067167282104492, -5.2095842361450195, -4.352001667022705, -3.4944188594818115, -2.636836051940918, -1.7792530059814453, -0.9216704368591309, -0.0640878677368164, 0.7934951782226562, 1.6510779857635498, 2.5086607933044434, 3.366243600845337, 4.2238264083862305, 5.081409454345703, 5.938992023468018, 6.796574592590332, 7.654157638549805, 8.511740684509277, 9.36932373046875, 10.226905822753906, 11.084488868713379, 11.942071914672852, 12.799654006958008, 13.65723705291748, 14.514820098876953, 15.372403144836426, 16.2299861907959, 17.087568283081055, 17.945152282714844, 18.802734375, 19.660316467285156, 20.517898559570312, 21.3754825592041, 22.233064651489258, 23.090648651123047, 23.948230743408203, 24.80581283569336, 25.66339683532715, 26.520978927612305, 27.378562927246094, 28.23614501953125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 9.0, 10.0, 8.0, 12.0, 7.0, 18.0, 22.0, 20.0, 22.0, 31.0, 30.0, 40.0, 36.0, 32.0, 46.0, 38.0, 66.0, 44.0, 42.0, 43.0, 56.0, 50.0, 33.0, 33.0, 36.0, 33.0, 21.0, 27.0, 28.0, 17.0, 14.0, 20.0, 16.0, 9.0, 8.0, 3.0, 6.0, 2.0, 7.0, 2.0, 0.0, 3.0, 1.0, 3.0], "bins": [-5.44921875, -5.306182861328125, -5.16314697265625, -5.020111083984375, -4.8770751953125, -4.734039306640625, -4.59100341796875, -4.447967529296875, -4.304931640625, -4.161895751953125, -4.01885986328125, -3.875823974609375, -3.7327880859375, -3.589752197265625, -3.44671630859375, -3.303680419921875, -3.16064453125, -3.017608642578125, -2.87457275390625, -2.731536865234375, -2.5885009765625, -2.445465087890625, -2.30242919921875, -2.159393310546875, -2.016357421875, -1.873321533203125, -1.73028564453125, -1.587249755859375, -1.4442138671875, -1.301177978515625, -1.15814208984375, -1.015106201171875, -0.8720703125, -0.729034423828125, -0.58599853515625, -0.442962646484375, -0.2999267578125, -0.156890869140625, -0.01385498046875, 0.129180908203125, 0.272216796875, 0.415252685546875, 0.55828857421875, 0.701324462890625, 0.8443603515625, 0.987396240234375, 1.13043212890625, 1.273468017578125, 1.41650390625, 1.559539794921875, 1.70257568359375, 1.845611572265625, 1.9886474609375, 2.131683349609375, 2.27471923828125, 2.417755126953125, 2.560791015625, 2.703826904296875, 2.84686279296875, 2.989898681640625, 3.1329345703125, 3.275970458984375, 3.41900634765625, 3.562042236328125, 3.705078125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 5.0, 9.0, 8.0, 15.0, 21.0, 23.0, 45.0, 55.0, 87.0, 120.0, 181.0, 272.0, 341.0, 591.0, 748.0, 1114.0, 1586.0, 2414.0, 3563.0, 5278.0, 8065.0, 12486.0, 19564.0, 31987.0, 54557.0, 98413.0, 202989.0, 286732.0, 135587.0, 71202.0, 40636.0, 24684.0, 15408.0, 9885.0, 6417.0, 4317.0, 2903.0, 1955.0, 1316.0, 893.0, 613.0, 478.0, 310.0, 212.0, 153.0, 106.0, 70.0, 51.0, 36.0, 19.0, 14.0, 13.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.1273193359375, -0.12324333190917969, -0.11916732788085938, -0.11509132385253906, -0.11101531982421875, -0.10693931579589844, -0.10286331176757812, -0.09878730773925781, -0.0947113037109375, -0.09063529968261719, -0.08655929565429688, -0.08248329162597656, -0.07840728759765625, -0.07433128356933594, -0.07025527954101562, -0.06617927551269531, -0.062103271484375, -0.05802726745605469, -0.053951263427734375, -0.04987525939941406, -0.04579925537109375, -0.04172325134277344, -0.037647247314453125, -0.03357124328613281, -0.0294952392578125, -0.025419235229492188, -0.021343231201171875, -0.017267227172851562, -0.01319122314453125, -0.009115219116210938, -0.005039215087890625, -0.0009632110595703125, 0.00311279296875, 0.0071887969970703125, 0.011264801025390625, 0.015340805053710938, 0.01941680908203125, 0.023492813110351562, 0.027568817138671875, 0.03164482116699219, 0.0357208251953125, 0.03979682922363281, 0.043872833251953125, 0.04794883728027344, 0.05202484130859375, 0.05610084533691406, 0.060176849365234375, 0.06425285339355469, 0.068328857421875, 0.07240486145019531, 0.07648086547851562, 0.08055686950683594, 0.08463287353515625, 0.08870887756347656, 0.09278488159179688, 0.09686088562011719, 0.1009368896484375, 0.10501289367675781, 0.10908889770507812, 0.11316490173339844, 0.11724090576171875, 0.12131690979003906, 0.12539291381835938, 0.1294689178466797, 0.133544921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 0.0, 3.0, 7.0, 3.0, 3.0, 10.0, 10.0, 25.0, 13.0, 27.0, 22.0, 19.0, 24.0, 29.0, 35.0, 39.0, 30.0, 51.0, 33.0, 45.0, 50.0, 34.0, 1069.0, 47.0, 25.0, 48.0, 36.0, 46.0, 32.0, 28.0, 26.0, 24.0, 25.0, 22.0, 20.0, 12.0, 16.0, 9.0, 8.0, 6.0, 5.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.3359375, -3.24365234375, -3.1513671875, -3.05908203125, -2.966796875, -2.87451171875, -2.7822265625, -2.68994140625, -2.59765625, -2.50537109375, -2.4130859375, -2.32080078125, -2.228515625, -2.13623046875, -2.0439453125, -1.95166015625, -1.859375, -1.76708984375, -1.6748046875, -1.58251953125, -1.490234375, -1.39794921875, -1.3056640625, -1.21337890625, -1.12109375, -1.02880859375, -0.9365234375, -0.84423828125, -0.751953125, -0.65966796875, -0.5673828125, -0.47509765625, -0.3828125, -0.29052734375, -0.1982421875, -0.10595703125, -0.013671875, 0.07861328125, 0.1708984375, 0.26318359375, 0.35546875, 0.44775390625, 0.5400390625, 0.63232421875, 0.724609375, 0.81689453125, 0.9091796875, 1.00146484375, 1.09375, 1.18603515625, 1.2783203125, 1.37060546875, 1.462890625, 1.55517578125, 1.6474609375, 1.73974609375, 1.83203125, 1.92431640625, 2.0166015625, 2.10888671875, 2.201171875, 2.29345703125, 2.3857421875, 2.47802734375, 2.5703125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 16.0, 19.0, 31.0, 38.0, 52.0, 98.0, 149.0, 207.0, 337.0, 494.0, 714.0, 1231.0, 1803.0, 2800.0, 4305.0, 6842.0, 11080.0, 17663.0, 29312.0, 50391.0, 90965.0, 176127.0, 1330005.0, 165103.0, 85649.0, 47554.0, 28325.0, 16988.0, 10515.0, 6529.0, 4169.0, 2665.0, 1667.0, 1129.0, 723.0, 502.0, 310.0, 219.0, 135.0, 88.0, 69.0, 29.0, 25.0, 22.0, 13.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.07928466796875, -0.07698345184326172, -0.07468223571777344, -0.07238101959228516, -0.07007980346679688, -0.0677785873413086, -0.06547737121582031, -0.06317615509033203, -0.06087493896484375, -0.05857372283935547, -0.05627250671386719, -0.053971290588378906, -0.051670074462890625, -0.049368858337402344, -0.04706764221191406, -0.04476642608642578, -0.0424652099609375, -0.04016399383544922, -0.03786277770996094, -0.035561561584472656, -0.033260345458984375, -0.030959129333496094, -0.028657913208007812, -0.02635669708251953, -0.02405548095703125, -0.02175426483154297, -0.019453048706054688, -0.017151832580566406, -0.014850616455078125, -0.012549400329589844, -0.010248184204101562, -0.007946968078613281, -0.005645751953125, -0.0033445358276367188, -0.0010433197021484375, 0.0012578964233398438, 0.003559112548828125, 0.005860328674316406, 0.008161544799804688, 0.010462760925292969, 0.01276397705078125, 0.015065193176269531, 0.017366409301757812, 0.019667625427246094, 0.021968841552734375, 0.024270057678222656, 0.026571273803710938, 0.02887248992919922, 0.0311737060546875, 0.03347492218017578, 0.03577613830566406, 0.038077354431152344, 0.040378570556640625, 0.042679786682128906, 0.04498100280761719, 0.04728221893310547, 0.04958343505859375, 0.05188465118408203, 0.05418586730957031, 0.056487083435058594, 0.058788299560546875, 0.061089515686035156, 0.06339073181152344, 0.06569194793701172, 0.0679931640625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 3.0, 3.0, 8.0, 7.0, 11.0, 13.0, 12.0, 18.0, 29.0, 26.0, 39.0, 44.0, 64.0, 74.0, 66.0, 87.0, 104.0, 68.0, 56.0, 49.0, 43.0, 34.0, 28.0, 20.0, 11.0, 15.0, 11.0, 13.0, 7.0, 6.0, 5.0, 2.0, 2.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5212764739990234e-05, -2.4444423615932465e-05, -2.3676082491874695e-05, -2.2907741367816925e-05, -2.2139400243759155e-05, -2.1371059119701385e-05, -2.0602717995643616e-05, -1.9834376871585846e-05, -1.9066035747528076e-05, -1.8297694623470306e-05, -1.7529353499412537e-05, -1.6761012375354767e-05, -1.5992671251296997e-05, -1.5224330127239227e-05, -1.4455989003181458e-05, -1.3687647879123688e-05, -1.2919306755065918e-05, -1.2150965631008148e-05, -1.1382624506950378e-05, -1.0614283382892609e-05, -9.845942258834839e-06, -9.077601134777069e-06, -8.3092600107193e-06, -7.5409188866615295e-06, -6.77257776260376e-06, -6.00423663854599e-06, -5.23589551448822e-06, -4.4675543904304504e-06, -3.6992132663726807e-06, -2.930872142314911e-06, -2.162531018257141e-06, -1.3941898941993713e-06, -6.258487701416016e-07, 1.424923539161682e-07, 9.10833477973938e-07, 1.6791746020317078e-06, 2.4475157260894775e-06, 3.2158568501472473e-06, 3.984197974205017e-06, 4.752539098262787e-06, 5.520880222320557e-06, 6.289221346378326e-06, 7.057562470436096e-06, 7.825903594493866e-06, 8.594244718551636e-06, 9.362585842609406e-06, 1.0130926966667175e-05, 1.0899268090724945e-05, 1.1667609214782715e-05, 1.2435950338840485e-05, 1.3204291462898254e-05, 1.3972632586956024e-05, 1.4740973711013794e-05, 1.5509314835071564e-05, 1.6277655959129333e-05, 1.7045997083187103e-05, 1.7814338207244873e-05, 1.8582679331302643e-05, 1.9351020455360413e-05, 2.0119361579418182e-05, 2.0887702703475952e-05, 2.1656043827533722e-05, 2.2424384951591492e-05, 2.319272607564926e-05, 2.396106719970703e-05]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 3.0, 7.0, 12.0, 20.0, 14.0, 17.0, 22.0, 35.0, 55.0, 77.0, 97.0, 185.0, 336.0, 1186.0, 883476.0, 161273.0, 874.0, 323.0, 156.0, 115.0, 59.0, 53.0, 37.0, 23.0, 20.0, 17.0, 11.0, 6.0, 9.0, 3.0, 7.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005550384521484375, -0.0005370825529098511, -0.0005191266536712646, -0.0005011707544326782, -0.0004832148551940918, -0.00046525895595550537, -0.00044730305671691895, -0.0004293471574783325, -0.0004113912582397461, -0.00039343535900115967, -0.00037547945976257324, -0.0003575235605239868, -0.0003395676612854004, -0.00032161176204681396, -0.00030365586280822754, -0.0002856999635696411, -0.0002677440643310547, -0.00024978816509246826, -0.00023183226585388184, -0.0002138763666152954, -0.00019592046737670898, -0.00017796456813812256, -0.00016000866889953613, -0.0001420527696609497, -0.00012409687042236328, -0.00010614097118377686, -8.818507194519043e-05, -7.0229172706604e-05, -5.227327346801758e-05, -3.431737422943115e-05, -1.6361474990844727e-05, 1.5944242477416992e-06, 1.9550323486328125e-05, 3.750622272491455e-05, 5.5462121963500977e-05, 7.34180212020874e-05, 9.137392044067383e-05, 0.00010932981967926025, 0.00012728571891784668, 0.0001452416181564331, 0.00016319751739501953, 0.00018115341663360596, 0.00019910931587219238, 0.0002170652151107788, 0.00023502111434936523, 0.00025297701358795166, 0.0002709329128265381, 0.0002888888120651245, 0.00030684471130371094, 0.00032480061054229736, 0.0003427565097808838, 0.0003607124090194702, 0.00037866830825805664, 0.00039662420749664307, 0.0004145801067352295, 0.0004325360059738159, 0.00045049190521240234, 0.00046844780445098877, 0.0004864037036895752, 0.0005043596029281616, 0.000522315502166748, 0.0005402714014053345, 0.0005582273006439209, 0.0005761831998825073, 0.0005941390991210938]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 127.0, 889.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.112586637143977e-05, -1.6318066627718508e-05, -1.5102668839972466e-06, 1.3297532859724015e-05, 2.8105332603445277e-05, 4.291312870918773e-05, 5.77209320908878e-05, 7.252873911056668e-05, 8.733653521630913e-05, 0.00010214433132205158, 0.00011695213470375165, 0.00013175993808545172, 0.00014656773419119418, 0.00016137553029693663, 0.00017618332640267909, 0.00019099113706033677, 0.00020579893316607922, 0.00022060672927182168, 0.00023541453992947936, 0.0002502223360352218, 0.00026503013214096427, 0.0002798379282467067, 0.0002946457243524492, 0.00030945352045819163, 0.0003242613165639341, 0.00033906911266967654, 0.000353876908775419, 0.00036868470488116145, 0.0003834925009869039, 0.00039830029709264636, 0.00041310812230221927, 0.0004279159184079617, 0.00044272374361753464, 0.0004575315397232771, 0.00047233933582901955, 0.000487147131934762, 0.0005019549280405045, 0.0005167627241462469, 0.0005315705202519894, 0.0005463783163577318, 0.0005611861124634743, 0.0005759939085692167, 0.0005908017046749592, 0.0006056095007807016, 0.0006204172968864441, 0.0006352250929921865, 0.000650032889097929, 0.0006648406852036715, 0.0006796485395170748, 0.0006944563356228173, 0.0007092641317285597, 0.0007240719278343022, 0.0007388797239400446, 0.0007536875200457871, 0.0007684953161515296, 0.0007833031704649329, 0.0007981109665706754, 0.0008129187626764178, 0.0008277265587821603, 0.0008425343548879027, 0.0008573421509936452, 0.0008721499470993876, 0.0008869577432051301, 0.0009017655393108726, 0.000916573335416615]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 13.0, 16.0, 22.0, 52.0, 74.0, 82.0, 110.0, 111.0, 132.0, 110.0, 92.0, 73.0, 54.0, 28.0, 23.0, 9.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.166364669799805e-05, -4.056748002767563e-05, -3.947131335735321e-05, -3.837514668703079e-05, -3.7278980016708374e-05, -3.6182813346385956e-05, -3.508664667606354e-05, -3.399048000574112e-05, -3.28943133354187e-05, -3.179814666509628e-05, -3.0701979994773865e-05, -2.9605813324451447e-05, -2.850964665412903e-05, -2.741347998380661e-05, -2.6317313313484192e-05, -2.5221146643161774e-05, -2.4124979972839355e-05, -2.3028813302516937e-05, -2.193264663219452e-05, -2.08364799618721e-05, -1.9740313291549683e-05, -1.8644146621227264e-05, -1.7547979950904846e-05, -1.6451813280582428e-05, -1.535564661026001e-05, -1.4259479939937592e-05, -1.3163313269615173e-05, -1.2067146599292755e-05, -1.0970979928970337e-05, -9.874813258647919e-06, -8.7786465883255e-06, -7.682479918003082e-06, -6.586313247680664e-06, -5.490146577358246e-06, -4.393979907035828e-06, -3.2978132367134094e-06, -2.201646566390991e-06, -1.105479896068573e-06, -9.313225746154785e-09, 1.0868534445762634e-06, 2.1830201148986816e-06, 3.2791867852211e-06, 4.375353455543518e-06, 5.471520125865936e-06, 6.5676867961883545e-06, 7.663853466510773e-06, 8.760020136833191e-06, 9.856186807155609e-06, 1.0952353477478027e-05, 1.2048520147800446e-05, 1.3144686818122864e-05, 1.4240853488445282e-05, 1.53370201587677e-05, 1.643318682909012e-05, 1.7529353499412537e-05, 1.8625520169734955e-05, 1.9721686840057373e-05, 2.081785351037979e-05, 2.191402018070221e-05, 2.3010186851024628e-05, 2.4106353521347046e-05, 2.5202520191669464e-05, 2.6298686861991882e-05, 2.73948535323143e-05, 2.849102020263672e-05]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 9.0, 10.0, 8.0, 12.0, 7.0, 18.0, 22.0, 20.0, 22.0, 31.0, 30.0, 40.0, 36.0, 32.0, 46.0, 38.0, 66.0, 44.0, 42.0, 43.0, 56.0, 50.0, 33.0, 33.0, 36.0, 33.0, 21.0, 27.0, 28.0, 17.0, 14.0, 20.0, 16.0, 9.0, 8.0, 3.0, 6.0, 2.0, 7.0, 2.0, 0.0, 3.0, 1.0, 3.0], "bins": [-5.44921875, -5.306182861328125, -5.16314697265625, -5.020111083984375, -4.8770751953125, -4.734039306640625, -4.59100341796875, -4.447967529296875, -4.304931640625, -4.161895751953125, -4.01885986328125, -3.875823974609375, -3.7327880859375, -3.589752197265625, -3.44671630859375, -3.303680419921875, -3.16064453125, -3.017608642578125, -2.87457275390625, -2.731536865234375, -2.5885009765625, -2.445465087890625, -2.30242919921875, -2.159393310546875, -2.016357421875, -1.873321533203125, -1.73028564453125, -1.587249755859375, -1.4442138671875, -1.301177978515625, -1.15814208984375, -1.015106201171875, -0.8720703125, -0.729034423828125, -0.58599853515625, -0.442962646484375, -0.2999267578125, -0.156890869140625, -0.01385498046875, 0.129180908203125, 0.272216796875, 0.415252685546875, 0.55828857421875, 0.701324462890625, 0.8443603515625, 0.987396240234375, 1.13043212890625, 1.273468017578125, 1.41650390625, 1.559539794921875, 1.70257568359375, 1.845611572265625, 1.9886474609375, 2.131683349609375, 2.27471923828125, 2.417755126953125, 2.560791015625, 2.703826904296875, 2.84686279296875, 2.989898681640625, 3.1329345703125, 3.275970458984375, 3.41900634765625, 3.562042236328125, 3.705078125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 8.0, 6.0, 7.0, 14.0, 17.0, 27.0, 29.0, 52.0, 81.0, 99.0, 143.0, 191.0, 325.0, 488.0, 783.0, 1366.0, 2652.0, 6948.0, 24529.0, 130674.0, 617978.0, 209936.0, 35515.0, 9165.0, 3405.0, 1579.0, 880.0, 544.0, 382.0, 222.0, 145.0, 105.0, 66.0, 54.0, 33.0, 26.0, 20.0, 19.0, 17.0, 7.0, 7.0, 2.0, 1.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.2784423828125, -7.978759765625, -7.6790771484375, -7.37939453125, -7.0797119140625, -6.780029296875, -6.4803466796875, -6.1806640625, -5.8809814453125, -5.581298828125, -5.2816162109375, -4.98193359375, -4.6822509765625, -4.382568359375, -4.0828857421875, -3.783203125, -3.4835205078125, -3.183837890625, -2.8841552734375, -2.58447265625, -2.2847900390625, -1.985107421875, -1.6854248046875, -1.3857421875, -1.0860595703125, -0.786376953125, -0.4866943359375, -0.18701171875, 0.1126708984375, 0.412353515625, 0.7120361328125, 1.01171875, 1.3114013671875, 1.611083984375, 1.9107666015625, 2.21044921875, 2.5101318359375, 2.809814453125, 3.1094970703125, 3.4091796875, 3.7088623046875, 4.008544921875, 4.3082275390625, 4.60791015625, 4.9075927734375, 5.207275390625, 5.5069580078125, 5.806640625, 6.1063232421875, 6.406005859375, 6.7056884765625, 7.00537109375, 7.3050537109375, 7.604736328125, 7.9044189453125, 8.2041015625, 8.5037841796875, 8.803466796875, 9.1031494140625, 9.40283203125, 9.7025146484375, 10.002197265625, 10.3018798828125, 10.6015625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 13.0, 8.0, 13.0, 10.0, 13.0, 18.0, 17.0, 25.0, 21.0, 37.0, 26.0, 37.0, 48.0, 64.0, 79.0, 119.0, 179.0, 1358.0, 300.0, 175.0, 93.0, 72.0, 44.0, 48.0, 31.0, 18.0, 37.0, 24.0, 13.0, 21.0, 13.0, 13.0, 17.0, 6.0, 10.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6953125, -9.3603515625, -9.025390625, -8.6904296875, -8.35546875, -8.0205078125, -7.685546875, -7.3505859375, -7.015625, -6.6806640625, -6.345703125, -6.0107421875, -5.67578125, -5.3408203125, -5.005859375, -4.6708984375, -4.3359375, -4.0009765625, -3.666015625, -3.3310546875, -2.99609375, -2.6611328125, -2.326171875, -1.9912109375, -1.65625, -1.3212890625, -0.986328125, -0.6513671875, -0.31640625, 0.0185546875, 0.353515625, 0.6884765625, 1.0234375, 1.3583984375, 1.693359375, 2.0283203125, 2.36328125, 2.6982421875, 3.033203125, 3.3681640625, 3.703125, 4.0380859375, 4.373046875, 4.7080078125, 5.04296875, 5.3779296875, 5.712890625, 6.0478515625, 6.3828125, 6.7177734375, 7.052734375, 7.3876953125, 7.72265625, 8.0576171875, 8.392578125, 8.7275390625, 9.0625, 9.3974609375, 9.732421875, 10.0673828125, 10.40234375, 10.7373046875, 11.072265625, 11.4072265625, 11.7421875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 6.0, 11.0, 7.0, 15.0, 14.0, 17.0, 27.0, 36.0, 55.0, 73.0, 113.0, 153.0, 296.0, 502.0, 1143.0, 6134.0, 2329544.0, 800401.0, 4759.0, 1029.0, 478.0, 287.0, 176.0, 139.0, 93.0, 52.0, 37.0, 27.0, 22.0, 16.0, 11.0, 8.0, 7.0, 3.0, 3.0, 8.0, 1.0, 0.0, 1.0, 1.0, 4.0], "bins": [-35.71875, -34.82470703125, -33.9306640625, -33.03662109375, -32.142578125, -31.24853515625, -30.3544921875, -29.46044921875, -28.56640625, -27.67236328125, -26.7783203125, -25.88427734375, -24.990234375, -24.09619140625, -23.2021484375, -22.30810546875, -21.4140625, -20.52001953125, -19.6259765625, -18.73193359375, -17.837890625, -16.94384765625, -16.0498046875, -15.15576171875, -14.26171875, -13.36767578125, -12.4736328125, -11.57958984375, -10.685546875, -9.79150390625, -8.8974609375, -8.00341796875, -7.109375, -6.21533203125, -5.3212890625, -4.42724609375, -3.533203125, -2.63916015625, -1.7451171875, -0.85107421875, 0.04296875, 0.93701171875, 1.8310546875, 2.72509765625, 3.619140625, 4.51318359375, 5.4072265625, 6.30126953125, 7.1953125, 8.08935546875, 8.9833984375, 9.87744140625, 10.771484375, 11.66552734375, 12.5595703125, 13.45361328125, 14.34765625, 15.24169921875, 16.1357421875, 17.02978515625, 17.923828125, 18.81787109375, 19.7119140625, 20.60595703125, 21.5]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 16.0, 56.0, 173.0, 381.0, 263.0, 90.0, 25.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.12750244140625, -109.86357116699219, -106.5996322631836, -103.33570098876953, -100.07176208496094, -96.80783081054688, -93.54389953613281, -90.27996063232422, -87.01602935791016, -83.7520980834961, -80.4881591796875, -77.22422790527344, -73.96028900146484, -70.69635772705078, -67.43241882324219, -64.16848754882812, -60.9045524597168, -57.64061737060547, -54.37668228149414, -51.11274719238281, -47.84881591796875, -44.58488082885742, -41.320945739746094, -38.05701446533203, -34.79307556152344, -31.52914047241211, -28.265207290649414, -25.001272201538086, -21.73733901977539, -18.473403930664062, -15.209468841552734, -11.945535659790039, -8.681602478027344, -5.417668342590332, -2.153733730316162, 1.1102008819580078, 4.3741350173950195, 7.638069152832031, 10.90200424194336, 14.165937423706055, 17.429872512817383, 20.69380760192871, 23.957740783691406, 27.221675872802734, 30.485610961914062, 33.749542236328125, 37.01348114013672, 40.27741241455078, 43.54134750366211, 46.80528259277344, 50.069217681884766, 53.333152770996094, 56.597084045410156, 59.861019134521484, 63.12495422363281, 66.38888549804688, 69.65282440185547, 72.91675567626953, 76.18069458007812, 79.44462585449219, 82.70856475830078, 85.97249603271484, 89.23643493652344, 92.5003662109375, 95.76429748535156]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 8.0, 7.0, 11.0, 9.0, 9.0, 6.0, 14.0, 18.0, 21.0, 24.0, 29.0, 27.0, 40.0, 32.0, 40.0, 45.0, 39.0, 38.0, 49.0, 53.0, 42.0, 40.0, 40.0, 40.0, 29.0, 48.0, 25.0, 26.0, 27.0, 22.0, 20.0, 23.0, 16.0, 14.0, 11.0, 13.0, 8.0, 1.0, 7.0, 4.0, 7.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.15962028503418, -30.116466522216797, -29.07331085205078, -28.0301570892334, -26.987003326416016, -25.94384765625, -24.900693893432617, -23.857540130615234, -22.81438446044922, -21.771230697631836, -20.72807502746582, -19.684921264648438, -18.641765594482422, -17.59861183166504, -16.555458068847656, -15.512303352355957, -14.469148635864258, -13.425993919372559, -12.38283920288086, -11.339685440063477, -10.296530723571777, -9.253376007080078, -8.210222244262695, -7.167067527770996, -6.123912811279297, -5.080758094787598, -4.037603855133057, -2.9944493770599365, -1.9512948989868164, -0.9081401824951172, 0.13501405715942383, 1.1781682968139648, 2.221324920654297, 3.264479398727417, 4.307633876800537, 5.350788116455078, 6.393942832946777, 7.437097549438477, 8.48025131225586, 9.523406028747559, 10.566560745239258, 11.609715461730957, 12.652870178222656, 13.696023941040039, 14.739178657531738, 15.782333374023438, 16.82548713684082, 17.868640899658203, 18.91179656982422, 19.9549503326416, 20.998106002807617, 22.041259765625, 23.084415435791016, 24.1275691986084, 25.17072296142578, 26.213878631591797, 27.25703239440918, 28.300186157226562, 29.343341827392578, 30.38649559020996, 31.429649353027344, 32.47280502319336, 33.515960693359375, 34.559112548828125, 35.60226821899414]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 13.0, 11.0, 9.0, 11.0, 12.0, 15.0, 26.0, 14.0, 25.0, 37.0, 44.0, 39.0, 48.0, 46.0, 46.0, 53.0, 54.0, 48.0, 37.0, 42.0, 52.0, 45.0, 36.0, 31.0, 29.0, 26.0, 21.0, 23.0, 19.0, 20.0, 14.0, 9.0, 7.0, 8.0, 5.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.578125, -5.423095703125, -5.26806640625, -5.113037109375, -4.9580078125, -4.802978515625, -4.64794921875, -4.492919921875, -4.337890625, -4.182861328125, -4.02783203125, -3.872802734375, -3.7177734375, -3.562744140625, -3.40771484375, -3.252685546875, -3.09765625, -2.942626953125, -2.78759765625, -2.632568359375, -2.4775390625, -2.322509765625, -2.16748046875, -2.012451171875, -1.857421875, -1.702392578125, -1.54736328125, -1.392333984375, -1.2373046875, -1.082275390625, -0.92724609375, -0.772216796875, -0.6171875, -0.462158203125, -0.30712890625, -0.152099609375, 0.0029296875, 0.157958984375, 0.31298828125, 0.468017578125, 0.623046875, 0.778076171875, 0.93310546875, 1.088134765625, 1.2431640625, 1.398193359375, 1.55322265625, 1.708251953125, 1.86328125, 2.018310546875, 2.17333984375, 2.328369140625, 2.4833984375, 2.638427734375, 2.79345703125, 2.948486328125, 3.103515625, 3.258544921875, 3.41357421875, 3.568603515625, 3.7236328125, 3.878662109375, 4.03369140625, 4.188720703125, 4.34375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 13.0, 18.0, 33.0, 44.0, 58.0, 82.0, 110.0, 184.0, 262.0, 456.0, 672.0, 1145.0, 1938.0, 3302.0, 6231.0, 12028.0, 29490.0, 166986.0, 1327875.0, 2212347.0, 349306.0, 47892.0, 15859.0, 7726.0, 3964.0, 2415.0, 1424.0, 851.0, 554.0, 354.0, 215.0, 143.0, 102.0, 55.0, 44.0, 27.0, 20.0, 19.0, 11.0, 2.0, 9.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0], "bins": [-9.7734375, -9.50323486328125, -9.2330322265625, -8.96282958984375, -8.692626953125, -8.42242431640625, -8.1522216796875, -7.88201904296875, -7.61181640625, -7.34161376953125, -7.0714111328125, -6.80120849609375, -6.531005859375, -6.26080322265625, -5.9906005859375, -5.72039794921875, -5.4501953125, -5.17999267578125, -4.9097900390625, -4.63958740234375, -4.369384765625, -4.09918212890625, -3.8289794921875, -3.55877685546875, -3.28857421875, -3.01837158203125, -2.7481689453125, -2.47796630859375, -2.207763671875, -1.93756103515625, -1.6673583984375, -1.39715576171875, -1.126953125, -0.85675048828125, -0.5865478515625, -0.31634521484375, -0.046142578125, 0.22406005859375, 0.4942626953125, 0.76446533203125, 1.03466796875, 1.30487060546875, 1.5750732421875, 1.84527587890625, 2.115478515625, 2.38568115234375, 2.6558837890625, 2.92608642578125, 3.1962890625, 3.46649169921875, 3.7366943359375, 4.00689697265625, 4.277099609375, 4.54730224609375, 4.8175048828125, 5.08770751953125, 5.35791015625, 5.62811279296875, 5.8983154296875, 6.16851806640625, 6.438720703125, 6.70892333984375, 6.9791259765625, 7.24932861328125, 7.51953125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 11.0, 10.0, 15.0, 29.0, 36.0, 59.0, 79.0, 123.0, 189.0, 271.0, 354.0, 456.0, 633.0, 485.0, 367.0, 276.0, 190.0, 166.0, 103.0, 72.0, 40.0, 29.0, 25.0, 10.0, 9.0, 10.0, 5.0, 7.0, 7.0, 4.0, 2.0, 1.0], "bins": [-10.6875, -10.44818115234375, -10.2088623046875, -9.96954345703125, -9.730224609375, -9.49090576171875, -9.2515869140625, -9.01226806640625, -8.77294921875, -8.53363037109375, -8.2943115234375, -8.05499267578125, -7.815673828125, -7.57635498046875, -7.3370361328125, -7.09771728515625, -6.8583984375, -6.61907958984375, -6.3797607421875, -6.14044189453125, -5.901123046875, -5.66180419921875, -5.4224853515625, -5.18316650390625, -4.94384765625, -4.70452880859375, -4.4652099609375, -4.22589111328125, -3.986572265625, -3.74725341796875, -3.5079345703125, -3.26861572265625, -3.029296875, -2.78997802734375, -2.5506591796875, -2.31134033203125, -2.072021484375, -1.83270263671875, -1.5933837890625, -1.35406494140625, -1.11474609375, -0.87542724609375, -0.6361083984375, -0.39678955078125, -0.157470703125, 0.08184814453125, 0.3211669921875, 0.56048583984375, 0.7998046875, 1.03912353515625, 1.2784423828125, 1.51776123046875, 1.757080078125, 1.99639892578125, 2.2357177734375, 2.47503662109375, 2.71435546875, 2.95367431640625, 3.1929931640625, 3.43231201171875, 3.671630859375, 3.91094970703125, 4.1502685546875, 4.38958740234375, 4.62890625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 6.0, 7.0, 12.0, 12.0, 21.0, 22.0, 43.0, 50.0, 99.0, 140.0, 248.0, 454.0, 892.0, 2325.0, 8671.0, 74407.0, 1934769.0, 2080096.0, 78560.0, 9166.0, 2289.0, 929.0, 442.0, 244.0, 137.0, 86.0, 46.0, 38.0, 23.0, 24.0, 10.0, 6.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.035888671875, -7.63427734375, -7.232666015625, -6.8310546875, -6.429443359375, -6.02783203125, -5.626220703125, -5.224609375, -4.822998046875, -4.42138671875, -4.019775390625, -3.6181640625, -3.216552734375, -2.81494140625, -2.413330078125, -2.01171875, -1.610107421875, -1.20849609375, -0.806884765625, -0.4052734375, -0.003662109375, 0.39794921875, 0.799560546875, 1.201171875, 1.602783203125, 2.00439453125, 2.406005859375, 2.8076171875, 3.209228515625, 3.61083984375, 4.012451171875, 4.4140625, 4.815673828125, 5.21728515625, 5.618896484375, 6.0205078125, 6.422119140625, 6.82373046875, 7.225341796875, 7.626953125, 8.028564453125, 8.43017578125, 8.831787109375, 9.2333984375, 9.635009765625, 10.03662109375, 10.438232421875, 10.83984375, 11.241455078125, 11.64306640625, 12.044677734375, 12.4462890625, 12.847900390625, 13.24951171875, 13.651123046875, 14.052734375, 14.454345703125, 14.85595703125, 15.257568359375, 15.6591796875, 16.060791015625, 16.46240234375, 16.864013671875, 17.265625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 11.0, 25.0, 60.0, 154.0, 228.0, 255.0, 177.0, 65.0, 26.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.32100296020508, -57.27447509765625, -55.22795104980469, -53.18142318725586, -51.13489532470703, -49.08837127685547, -47.04184341430664, -44.99531555175781, -42.94879150390625, -40.90226364135742, -38.85573959350586, -36.80921173095703, -34.76268768310547, -32.71615982055664, -30.669631958007812, -28.623106002807617, -26.576580047607422, -24.530054092407227, -22.48352813720703, -20.437000274658203, -18.390474319458008, -16.343948364257812, -14.2974214553833, -12.250894546508789, -10.204368591308594, -8.157842636108398, -6.111315727233887, -4.064789295196533, -2.0182628631591797, 0.028263092041015625, 2.0747900009155273, 4.121316909790039, 6.167839050292969, 8.214365005493164, 10.260891914367676, 12.307418823242188, 14.353944778442383, 16.400470733642578, 18.446998596191406, 20.4935245513916, 22.540050506591797, 24.586576461791992, 26.633102416992188, 28.679630279541016, 30.72615623474121, 32.772682189941406, 34.819210052490234, 36.86573791503906, 38.912261962890625, 40.95878982543945, 43.005313873291016, 45.051841735839844, 47.098365783691406, 49.144893646240234, 51.19142150878906, 53.237945556640625, 55.28447341918945, 57.33100128173828, 59.377525329589844, 61.42405319213867, 63.4705810546875, 65.51710510253906, 67.56362915039062, 69.61016082763672, 71.65668487548828]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 0.0, 6.0, 5.0, 11.0, 11.0, 18.0, 13.0, 16.0, 18.0, 21.0, 21.0, 24.0, 25.0, 41.0, 38.0, 34.0, 38.0, 35.0, 36.0, 52.0, 38.0, 33.0, 51.0, 33.0, 41.0, 34.0, 29.0, 36.0, 29.0, 32.0, 27.0, 24.0, 23.0, 17.0, 16.0, 13.0, 13.0, 13.0, 12.0, 6.0, 4.0, 2.0, 5.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.01355743408203, -19.318288803100586, -18.623018264770508, -17.927749633789062, -17.232479095458984, -16.53721046447754, -15.841940879821777, -15.146671295166016, -14.451401710510254, -13.756132125854492, -13.06086254119873, -12.365592956542969, -11.670324325561523, -10.975053787231445, -10.27978515625, -9.584515571594238, -8.889245986938477, -8.193976402282715, -7.498706817626953, -6.80343770980835, -6.108168125152588, -5.412898540496826, -4.717629432678223, -4.022359848022461, -3.327090263366699, -2.6318206787109375, -1.9365513324737549, -1.2412819862365723, -0.5460124015808105, 0.14925718307495117, 0.8445262908935547, 1.5397958755493164, 2.2350635528564453, 2.930333137512207, 3.6256024837493896, 4.320871829986572, 5.016141414642334, 5.711410999298096, 6.406680107116699, 7.101949691772461, 7.797219276428223, 8.492488861083984, 9.187758445739746, 9.883028030395508, 10.578296661376953, 11.273567199707031, 11.968835830688477, 12.664105415344238, 13.359375, 14.054644584655762, 14.749914169311523, 15.445182800292969, 16.140453338623047, 16.835721969604492, 17.530990600585938, 18.226261138916016, 18.921531677246094, 19.61680030822754, 20.312070846557617, 21.007339477539062, 21.70261001586914, 22.397878646850586, 23.09314727783203, 23.78841781616211, 24.483686447143555]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 11.0, 7.0, 12.0, 14.0, 17.0, 18.0, 21.0, 22.0, 30.0, 29.0, 46.0, 39.0, 37.0, 44.0, 47.0, 47.0, 41.0, 51.0, 49.0, 43.0, 40.0, 42.0, 36.0, 36.0, 41.0, 25.0, 27.0, 24.0, 17.0, 14.0, 12.0, 14.0, 8.0, 10.0, 5.0, 7.0, 1.0, 5.0, 2.0, 0.0, 4.0, 3.0, 1.0], "bins": [-5.04296875, -4.910308837890625, -4.77764892578125, -4.644989013671875, -4.5123291015625, -4.379669189453125, -4.24700927734375, -4.114349365234375, -3.981689453125, -3.849029541015625, -3.71636962890625, -3.583709716796875, -3.4510498046875, -3.318389892578125, -3.18572998046875, -3.053070068359375, -2.92041015625, -2.787750244140625, -2.65509033203125, -2.522430419921875, -2.3897705078125, -2.257110595703125, -2.12445068359375, -1.991790771484375, -1.859130859375, -1.726470947265625, -1.59381103515625, -1.461151123046875, -1.3284912109375, -1.195831298828125, -1.06317138671875, -0.930511474609375, -0.7978515625, -0.665191650390625, -0.53253173828125, -0.399871826171875, -0.2672119140625, -0.134552001953125, -0.00189208984375, 0.130767822265625, 0.263427734375, 0.396087646484375, 0.52874755859375, 0.661407470703125, 0.7940673828125, 0.926727294921875, 1.05938720703125, 1.192047119140625, 1.32470703125, 1.457366943359375, 1.59002685546875, 1.722686767578125, 1.8553466796875, 1.988006591796875, 2.12066650390625, 2.253326416015625, 2.385986328125, 2.518646240234375, 2.65130615234375, 2.783966064453125, 2.9166259765625, 3.049285888671875, 3.18194580078125, 3.314605712890625, 3.447265625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 16.0, 17.0, 29.0, 37.0, 77.0, 92.0, 106.0, 155.0, 263.0, 363.0, 569.0, 829.0, 1220.0, 1857.0, 2664.0, 4303.0, 6663.0, 10687.0, 17318.0, 28955.0, 51365.0, 96684.0, 202182.0, 304709.0, 144129.0, 72047.0, 39557.0, 22728.0, 13949.0, 8726.0, 5609.0, 3470.0, 2394.0, 1574.0, 1045.0, 659.0, 451.0, 341.0, 216.0, 127.0, 117.0, 78.0, 53.0, 32.0, 30.0, 12.0, 15.0, 10.0, 8.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.12255859375, -0.11876201629638672, -0.11496543884277344, -0.11116886138916016, -0.10737228393554688, -0.1035757064819336, -0.09977912902832031, -0.09598255157470703, -0.09218597412109375, -0.08838939666748047, -0.08459281921386719, -0.0807962417602539, -0.07699966430664062, -0.07320308685302734, -0.06940650939941406, -0.06560993194580078, -0.0618133544921875, -0.05801677703857422, -0.05422019958496094, -0.050423622131347656, -0.046627044677734375, -0.042830467224121094, -0.03903388977050781, -0.03523731231689453, -0.03144073486328125, -0.02764415740966797, -0.023847579956054688, -0.020051002502441406, -0.016254425048828125, -0.012457847595214844, -0.008661270141601562, -0.004864692687988281, -0.001068115234375, 0.0027284622192382812, 0.0065250396728515625, 0.010321617126464844, 0.014118194580078125, 0.017914772033691406, 0.021711349487304688, 0.02550792694091797, 0.02930450439453125, 0.03310108184814453, 0.03689765930175781, 0.040694236755371094, 0.044490814208984375, 0.048287391662597656, 0.05208396911621094, 0.05588054656982422, 0.0596771240234375, 0.06347370147705078, 0.06727027893066406, 0.07106685638427734, 0.07486343383789062, 0.0786600112915039, 0.08245658874511719, 0.08625316619873047, 0.09004974365234375, 0.09384632110595703, 0.09764289855957031, 0.1014394760131836, 0.10523605346679688, 0.10903263092041016, 0.11282920837402344, 0.11662578582763672, 0.12042236328125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 0.0, 5.0, 5.0, 8.0, 10.0, 6.0, 5.0, 18.0, 10.0, 12.0, 21.0, 25.0, 28.0, 19.0, 25.0, 32.0, 35.0, 28.0, 37.0, 35.0, 45.0, 53.0, 40.0, 1067.0, 35.0, 33.0, 49.0, 37.0, 35.0, 42.0, 27.0, 38.0, 26.0, 21.0, 21.0, 17.0, 15.0, 7.0, 12.0, 7.0, 10.0, 4.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.79296875, -2.70611572265625, -2.6192626953125, -2.53240966796875, -2.445556640625, -2.35870361328125, -2.2718505859375, -2.18499755859375, -2.09814453125, -2.01129150390625, -1.9244384765625, -1.83758544921875, -1.750732421875, -1.66387939453125, -1.5770263671875, -1.49017333984375, -1.4033203125, -1.31646728515625, -1.2296142578125, -1.14276123046875, -1.055908203125, -0.96905517578125, -0.8822021484375, -0.79534912109375, -0.70849609375, -0.62164306640625, -0.5347900390625, -0.44793701171875, -0.361083984375, -0.27423095703125, -0.1873779296875, -0.10052490234375, -0.013671875, 0.07318115234375, 0.1600341796875, 0.24688720703125, 0.333740234375, 0.42059326171875, 0.5074462890625, 0.59429931640625, 0.68115234375, 0.76800537109375, 0.8548583984375, 0.94171142578125, 1.028564453125, 1.11541748046875, 1.2022705078125, 1.28912353515625, 1.3759765625, 1.46282958984375, 1.5496826171875, 1.63653564453125, 1.723388671875, 1.81024169921875, 1.8970947265625, 1.98394775390625, 2.07080078125, 2.15765380859375, 2.2445068359375, 2.33135986328125, 2.418212890625, 2.50506591796875, 2.5919189453125, 2.67877197265625, 2.765625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 15.0, 24.0, 36.0, 71.0, 117.0, 160.0, 260.0, 421.0, 663.0, 1093.0, 1659.0, 2615.0, 4261.0, 6714.0, 11127.0, 17900.0, 29421.0, 48055.0, 82686.0, 159994.0, 1345616.0, 168742.0, 86185.0, 50158.0, 30251.0, 18677.0, 11358.0, 6970.0, 4488.0, 2785.0, 1634.0, 1116.0, 677.0, 414.0, 247.0, 171.0, 119.0, 66.0, 53.0, 35.0, 15.0, 14.0, 13.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.0843505859375, -0.08197689056396484, -0.07960319519042969, -0.07722949981689453, -0.07485580444335938, -0.07248210906982422, -0.07010841369628906, -0.0677347183227539, -0.06536102294921875, -0.0629873275756836, -0.06061363220214844, -0.05823993682861328, -0.055866241455078125, -0.05349254608154297, -0.05111885070800781, -0.048745155334472656, -0.0463714599609375, -0.043997764587402344, -0.04162406921386719, -0.03925037384033203, -0.036876678466796875, -0.03450298309326172, -0.03212928771972656, -0.029755592346191406, -0.02738189697265625, -0.025008201599121094, -0.022634506225585938, -0.02026081085205078, -0.017887115478515625, -0.015513420104980469, -0.013139724731445312, -0.010766029357910156, -0.008392333984375, -0.006018638610839844, -0.0036449432373046875, -0.0012712478637695312, 0.001102447509765625, 0.0034761428833007812, 0.0058498382568359375, 0.008223533630371094, 0.01059722900390625, 0.012970924377441406, 0.015344619750976562, 0.01771831512451172, 0.020092010498046875, 0.02246570587158203, 0.024839401245117188, 0.027213096618652344, 0.0295867919921875, 0.031960487365722656, 0.03433418273925781, 0.03670787811279297, 0.039081573486328125, 0.04145526885986328, 0.04382896423339844, 0.046202659606933594, 0.04857635498046875, 0.050950050354003906, 0.05332374572753906, 0.05569744110107422, 0.058071136474609375, 0.06044483184814453, 0.06281852722167969, 0.06519222259521484, 0.06756591796875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 5.0, 6.0, 8.0, 8.0, 14.0, 15.0, 21.0, 19.0, 26.0, 24.0, 35.0, 29.0, 29.0, 31.0, 36.0, 41.0, 60.0, 80.0, 81.0, 60.0, 51.0, 47.0, 37.0, 40.0, 28.0, 20.0, 22.0, 17.0, 18.0, 17.0, 11.0, 11.0, 8.0, 6.0, 4.0, 5.0, 3.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.676248550415039e-05, -2.5918707251548767e-05, -2.5074928998947144e-05, -2.423115074634552e-05, -2.3387372493743896e-05, -2.2543594241142273e-05, -2.169981598854065e-05, -2.0856037735939026e-05, -2.0012259483337402e-05, -1.916848123073578e-05, -1.8324702978134155e-05, -1.7480924725532532e-05, -1.6637146472930908e-05, -1.5793368220329285e-05, -1.4949589967727661e-05, -1.4105811715126038e-05, -1.3262033462524414e-05, -1.241825520992279e-05, -1.1574476957321167e-05, -1.0730698704719543e-05, -9.88692045211792e-06, -9.043142199516296e-06, -8.199363946914673e-06, -7.355585694313049e-06, -6.511807441711426e-06, -5.668029189109802e-06, -4.824250936508179e-06, -3.980472683906555e-06, -3.1366944313049316e-06, -2.292916178703308e-06, -1.4491379261016846e-06, -6.05359673500061e-07, 2.384185791015625e-07, 1.082196831703186e-06, 1.9259750843048096e-06, 2.769753336906433e-06, 3.6135315895080566e-06, 4.45730984210968e-06, 5.301088094711304e-06, 6.144866347312927e-06, 6.988644599914551e-06, 7.832422852516174e-06, 8.676201105117798e-06, 9.519979357719421e-06, 1.0363757610321045e-05, 1.1207535862922668e-05, 1.2051314115524292e-05, 1.2895092368125916e-05, 1.3738870620727539e-05, 1.4582648873329163e-05, 1.5426427125930786e-05, 1.627020537853241e-05, 1.7113983631134033e-05, 1.7957761883735657e-05, 1.880154013633728e-05, 1.9645318388938904e-05, 2.0489096641540527e-05, 2.133287489414215e-05, 2.2176653146743774e-05, 2.3020431399345398e-05, 2.386420965194702e-05, 2.4707987904548645e-05, 2.555176615715027e-05, 2.6395544409751892e-05, 2.7239322662353516e-05]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 6.0, 4.0, 3.0, 10.0, 8.0, 11.0, 12.0, 14.0, 24.0, 29.0, 36.0, 34.0, 47.0, 57.0, 86.0, 129.0, 162.0, 283.0, 476.0, 947.0, 51970.0, 990660.0, 1802.0, 573.0, 345.0, 199.0, 147.0, 89.0, 75.0, 62.0, 55.0, 38.0, 29.0, 31.0, 23.0, 13.0, 18.0, 8.0, 3.0, 9.0, 6.0, 7.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0005249977111816406, -0.0005086958408355713, -0.000492393970489502, -0.0004760921001434326, -0.0004597902297973633, -0.00044348835945129395, -0.0004271864891052246, -0.0004108846187591553, -0.00039458274841308594, -0.0003782808780670166, -0.00036197900772094727, -0.00034567713737487793, -0.0003293752670288086, -0.00031307339668273926, -0.0002967715263366699, -0.0002804696559906006, -0.00026416778564453125, -0.0002478659152984619, -0.00023156404495239258, -0.00021526217460632324, -0.0001989603042602539, -0.00018265843391418457, -0.00016635656356811523, -0.0001500546932220459, -0.00013375282287597656, -0.00011745095252990723, -0.00010114908218383789, -8.484721183776855e-05, -6.854534149169922e-05, -5.224347114562988e-05, -3.594160079956055e-05, -1.963973045349121e-05, -3.337860107421875e-06, 1.2964010238647461e-05, 2.9265880584716797e-05, 4.556775093078613e-05, 6.186962127685547e-05, 7.81714916229248e-05, 9.447336196899414e-05, 0.00011077523231506348, 0.0001270771026611328, 0.00014337897300720215, 0.00015968084335327148, 0.00017598271369934082, 0.00019228458404541016, 0.0002085864543914795, 0.00022488832473754883, 0.00024119019508361816, 0.0002574920654296875, 0.00027379393577575684, 0.00029009580612182617, 0.0003063976764678955, 0.00032269954681396484, 0.0003390014171600342, 0.0003553032875061035, 0.00037160515785217285, 0.0003879070281982422, 0.0004042088985443115, 0.00042051076889038086, 0.0004368126392364502, 0.00045311450958251953, 0.00046941637992858887, 0.0004857182502746582, 0.0005020201206207275, 0.0005183219909667969]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 73.0, 943.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232105518691242e-05, -1.6994339603115804e-05, -1.6676240193191916e-06, 1.3659089745488018e-05, 2.8985807148274034e-05, 4.431252455106005e-05, 5.963923467788845e-05, 7.496595208067447e-05, 9.029266948346049e-05, 0.0001056193868862465, 0.00012094610428903252, 0.0001362728071399033, 0.00015159952454268932, 0.00016692624194547534, 0.00018225295934826136, 0.00019757967675104737, 0.0002129063941538334, 0.0002282331115566194, 0.00024355982895940542, 0.00025888654636219144, 0.00027421326376497746, 0.00028953998116776347, 0.0003048666985705495, 0.0003201934159733355, 0.0003355201333761215, 0.00035084685077890754, 0.00036617356818169355, 0.00038150028558447957, 0.0003968270029872656, 0.0004121537203900516, 0.0004274804377928376, 0.00044280715519562364, 0.00045813381439074874, 0.00047346053179353476, 0.0004887872491963208, 0.0005041139665991068, 0.0005194406840018928, 0.0005347674014046788, 0.0005500941188074648, 0.0005654208362102509, 0.0005807475536130369, 0.0005960742710158229, 0.0006114009884186089, 0.0006267277058213949, 0.0006420544232241809, 0.000657381140626967, 0.000672707858029753, 0.000688034575432539, 0.0007033612346276641, 0.0007186879520304501, 0.0007340146694332361, 0.0007493413868360221, 0.0007646681042388082, 0.0007799948216415942, 0.0007953215390443802, 0.0008106482564471662, 0.0008259749738499522, 0.0008413016912527382, 0.0008566284086555243, 0.0008719551260583103, 0.0008872818434610963, 0.0009026085608638823, 0.0009179352782666683, 0.0009332619956694543, 0.0009485887130722404]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 11.0, 26.0, 25.0, 43.0, 60.0, 84.0, 90.0, 101.0, 90.0, 100.0, 106.0, 76.0, 66.0, 43.0, 46.0, 15.0, 13.0, 8.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8995018005371094e-05, -4.765857011079788e-05, -4.632212221622467e-05, -4.498567432165146e-05, -4.364922642707825e-05, -4.2312778532505035e-05, -4.0976330637931824e-05, -3.963988274335861e-05, -3.83034348487854e-05, -3.696698695421219e-05, -3.563053905963898e-05, -3.4294091165065765e-05, -3.2957643270492554e-05, -3.162119537591934e-05, -3.028474748134613e-05, -2.894829958677292e-05, -2.7611851692199707e-05, -2.6275403797626495e-05, -2.4938955903053284e-05, -2.3602508008480072e-05, -2.226606011390686e-05, -2.092961221933365e-05, -1.9593164324760437e-05, -1.8256716430187225e-05, -1.6920268535614014e-05, -1.5583820641040802e-05, -1.424737274646759e-05, -1.2910924851894379e-05, -1.1574476957321167e-05, -1.0238029062747955e-05, -8.901581168174744e-06, -7.565133273601532e-06, -6.22868537902832e-06, -4.892237484455109e-06, -3.555789589881897e-06, -2.2193416953086853e-06, -8.828938007354736e-07, 4.5355409383773804e-07, 1.7900019884109497e-06, 3.1264498829841614e-06, 4.462897777557373e-06, 5.799345672130585e-06, 7.135793566703796e-06, 8.472241461277008e-06, 9.80868935585022e-06, 1.1145137250423431e-05, 1.2481585144996643e-05, 1.3818033039569855e-05, 1.5154480934143066e-05, 1.6490928828716278e-05, 1.782737672328949e-05, 1.91638246178627e-05, 2.0500272512435913e-05, 2.1836720407009125e-05, 2.3173168301582336e-05, 2.4509616196155548e-05, 2.584606409072876e-05, 2.718251198530197e-05, 2.8518959879875183e-05, 2.9855407774448395e-05, 3.1191855669021606e-05, 3.252830356359482e-05, 3.386475145816803e-05, 3.520119935274124e-05, 3.653764724731445e-05]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 11.0, 7.0, 12.0, 14.0, 17.0, 18.0, 21.0, 22.0, 30.0, 29.0, 46.0, 39.0, 37.0, 44.0, 47.0, 47.0, 41.0, 51.0, 49.0, 43.0, 40.0, 42.0, 36.0, 36.0, 41.0, 25.0, 27.0, 24.0, 17.0, 14.0, 12.0, 14.0, 8.0, 10.0, 5.0, 7.0, 1.0, 5.0, 2.0, 0.0, 4.0, 3.0, 1.0], "bins": [-5.04296875, -4.910308837890625, -4.77764892578125, -4.644989013671875, -4.5123291015625, -4.379669189453125, -4.24700927734375, -4.114349365234375, -3.981689453125, -3.849029541015625, -3.71636962890625, -3.583709716796875, -3.4510498046875, -3.318389892578125, -3.18572998046875, -3.053070068359375, -2.92041015625, -2.787750244140625, -2.65509033203125, -2.522430419921875, -2.3897705078125, -2.257110595703125, -2.12445068359375, -1.991790771484375, -1.859130859375, -1.726470947265625, -1.59381103515625, -1.461151123046875, -1.3284912109375, -1.195831298828125, -1.06317138671875, -0.930511474609375, -0.7978515625, -0.665191650390625, -0.53253173828125, -0.399871826171875, -0.2672119140625, -0.134552001953125, -0.00189208984375, 0.130767822265625, 0.263427734375, 0.396087646484375, 0.52874755859375, 0.661407470703125, 0.7940673828125, 0.926727294921875, 1.05938720703125, 1.192047119140625, 1.32470703125, 1.457366943359375, 1.59002685546875, 1.722686767578125, 1.8553466796875, 1.988006591796875, 2.12066650390625, 2.253326416015625, 2.385986328125, 2.518646240234375, 2.65130615234375, 2.783966064453125, 2.9166259765625, 3.049285888671875, 3.18194580078125, 3.314605712890625, 3.447265625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 7.0, 6.0, 6.0, 16.0, 23.0, 26.0, 29.0, 36.0, 68.0, 73.0, 109.0, 170.0, 257.0, 506.0, 943.0, 2120.0, 5845.0, 23653.0, 173162.0, 664811.0, 146087.0, 20986.0, 5418.0, 1963.0, 894.0, 462.0, 290.0, 167.0, 120.0, 76.0, 56.0, 38.0, 33.0, 26.0, 18.0, 12.0, 15.0, 8.0, 2.0, 3.0, 7.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.5703125, -8.33526611328125, -8.1002197265625, -7.86517333984375, -7.630126953125, -7.39508056640625, -7.1600341796875, -6.92498779296875, -6.68994140625, -6.45489501953125, -6.2198486328125, -5.98480224609375, -5.749755859375, -5.51470947265625, -5.2796630859375, -5.04461669921875, -4.8095703125, -4.57452392578125, -4.3394775390625, -4.10443115234375, -3.869384765625, -3.63433837890625, -3.3992919921875, -3.16424560546875, -2.92919921875, -2.69415283203125, -2.4591064453125, -2.22406005859375, -1.989013671875, -1.75396728515625, -1.5189208984375, -1.28387451171875, -1.048828125, -0.81378173828125, -0.5787353515625, -0.34368896484375, -0.108642578125, 0.12640380859375, 0.3614501953125, 0.59649658203125, 0.83154296875, 1.06658935546875, 1.3016357421875, 1.53668212890625, 1.771728515625, 2.00677490234375, 2.2418212890625, 2.47686767578125, 2.7119140625, 2.94696044921875, 3.1820068359375, 3.41705322265625, 3.652099609375, 3.88714599609375, 4.1221923828125, 4.35723876953125, 4.59228515625, 4.82733154296875, 5.0623779296875, 5.29742431640625, 5.532470703125, 5.76751708984375, 6.0025634765625, 6.23760986328125, 6.47265625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 7.0, 3.0, 1.0, 1.0, 10.0, 11.0, 10.0, 14.0, 19.0, 22.0, 22.0, 36.0, 32.0, 58.0, 71.0, 99.0, 176.0, 1554.0, 381.0, 147.0, 96.0, 56.0, 50.0, 37.0, 41.0, 20.0, 26.0, 18.0, 11.0, 9.0, 11.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3515625, -10.943603515625, -10.53564453125, -10.127685546875, -9.7197265625, -9.311767578125, -8.90380859375, -8.495849609375, -8.087890625, -7.679931640625, -7.27197265625, -6.864013671875, -6.4560546875, -6.048095703125, -5.64013671875, -5.232177734375, -4.82421875, -4.416259765625, -4.00830078125, -3.600341796875, -3.1923828125, -2.784423828125, -2.37646484375, -1.968505859375, -1.560546875, -1.152587890625, -0.74462890625, -0.336669921875, 0.0712890625, 0.479248046875, 0.88720703125, 1.295166015625, 1.703125, 2.111083984375, 2.51904296875, 2.927001953125, 3.3349609375, 3.742919921875, 4.15087890625, 4.558837890625, 4.966796875, 5.374755859375, 5.78271484375, 6.190673828125, 6.5986328125, 7.006591796875, 7.41455078125, 7.822509765625, 8.23046875, 8.638427734375, 9.04638671875, 9.454345703125, 9.8623046875, 10.270263671875, 10.67822265625, 11.086181640625, 11.494140625, 11.902099609375, 12.31005859375, 12.718017578125, 13.1259765625, 13.533935546875, 13.94189453125, 14.349853515625, 14.7578125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 2.0, 6.0, 11.0, 5.0, 15.0, 17.0, 18.0, 28.0, 48.0, 51.0, 86.0, 160.0, 309.0, 595.0, 1984.0, 2612038.0, 527574.0, 1541.0, 509.0, 270.0, 139.0, 89.0, 51.0, 41.0, 27.0, 17.0, 22.0, 13.0, 12.0, 6.0, 9.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.5625, -29.687744140625, -28.81298828125, -27.938232421875, -27.0634765625, -26.188720703125, -25.31396484375, -24.439208984375, -23.564453125, -22.689697265625, -21.81494140625, -20.940185546875, -20.0654296875, -19.190673828125, -18.31591796875, -17.441162109375, -16.56640625, -15.691650390625, -14.81689453125, -13.942138671875, -13.0673828125, -12.192626953125, -11.31787109375, -10.443115234375, -9.568359375, -8.693603515625, -7.81884765625, -6.944091796875, -6.0693359375, -5.194580078125, -4.31982421875, -3.445068359375, -2.5703125, -1.695556640625, -0.82080078125, 0.053955078125, 0.9287109375, 1.803466796875, 2.67822265625, 3.552978515625, 4.427734375, 5.302490234375, 6.17724609375, 7.052001953125, 7.9267578125, 8.801513671875, 9.67626953125, 10.551025390625, 11.42578125, 12.300537109375, 13.17529296875, 14.050048828125, 14.9248046875, 15.799560546875, 16.67431640625, 17.549072265625, 18.423828125, 19.298583984375, 20.17333984375, 21.048095703125, 21.9228515625, 22.797607421875, 23.67236328125, 24.547119140625, 25.421875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 48.0, 515.0, 402.0, 46.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.54981231689453, -99.91535949707031, -97.2809066772461, -94.64645385742188, -92.01200866699219, -89.37755584716797, -86.74310302734375, -84.10865020751953, -81.47419738769531, -78.8397445678711, -76.20529174804688, -73.57083892822266, -70.93638610839844, -68.30194091796875, -65.66748809814453, -63.03303527832031, -60.398582458496094, -57.764129638671875, -55.129676818847656, -52.4952278137207, -49.860774993896484, -47.226322174072266, -44.59187316894531, -41.957420349121094, -39.322967529296875, -36.688514709472656, -34.05406188964844, -31.419612884521484, -28.785160064697266, -26.150707244873047, -23.51625633239746, -20.881805419921875, -18.247344970703125, -15.612893104553223, -12.97844123840332, -10.343989372253418, -7.709537506103516, -5.075085639953613, -2.440633773803711, 0.193817138671875, 2.8282699584960938, 5.462721824645996, 8.097173690795898, 10.7316255569458, 13.366077423095703, 16.000530242919922, 18.634981155395508, 21.269432067871094, 23.903884887695312, 26.53833770751953, 29.172788619995117, 31.807239532470703, 34.44169235229492, 37.07614517211914, 39.710594177246094, 42.34504699707031, 44.97949981689453, 47.61395263671875, 50.24840545654297, 52.88285446166992, 55.51730728149414, 58.15176010131836, 60.78620910644531, 63.42066192626953, 66.05511474609375]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 2.0, 11.0, 5.0, 9.0, 10.0, 10.0, 9.0, 14.0, 13.0, 22.0, 19.0, 21.0, 21.0, 29.0, 29.0, 28.0, 28.0, 25.0, 26.0, 36.0, 33.0, 45.0, 38.0, 44.0, 54.0, 34.0, 29.0, 41.0, 28.0, 39.0, 35.0, 30.0, 34.0, 19.0, 13.0, 17.0, 8.0, 20.0, 7.0, 14.0, 11.0, 7.0, 8.0, 8.0, 3.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-20.943878173828125, -20.30788230895996, -19.671886444091797, -19.035890579223633, -18.39989471435547, -17.763896942138672, -17.127901077270508, -16.491905212402344, -15.85590934753418, -15.219913482666016, -14.583917617797852, -13.947920799255371, -13.311924934387207, -12.675929069519043, -12.039932250976562, -11.403936386108398, -10.767940521240234, -10.13194465637207, -9.495948791503906, -8.859951972961426, -8.223956108093262, -7.587960243225098, -6.951963901519775, -6.315967559814453, -5.679971694946289, -5.043975830078125, -4.407979488372803, -3.7719833850860596, -3.1359872817993164, -2.4999911785125732, -1.86399507522583, -1.2279987335205078, -0.5920028686523438, 0.043993234634399414, 0.6799893379211426, 1.3159854412078857, 1.951981544494629, 2.587977647781372, 3.2239737510681152, 3.8599700927734375, 4.495965957641602, 5.131961822509766, 5.767958164215088, 6.40395450592041, 7.039950370788574, 7.675946235656738, 8.311943054199219, 8.947938919067383, 9.583934783935547, 10.219930648803711, 10.855926513671875, 11.491923332214355, 12.12791919708252, 12.763915061950684, 13.399911880493164, 14.035907745361328, 14.671903610229492, 15.307899475097656, 15.94389533996582, 16.579891204833984, 17.21588897705078, 17.851884841918945, 18.48788070678711, 19.123876571655273, 19.759872436523438]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 13.0, 12.0, 11.0, 8.0, 14.0, 18.0, 24.0, 19.0, 25.0, 36.0, 44.0, 48.0, 41.0, 46.0, 51.0, 44.0, 69.0, 43.0, 59.0, 37.0, 40.0, 37.0, 40.0, 49.0, 41.0, 16.0, 22.0, 26.0, 14.0, 16.0, 8.0, 9.0, 4.0, 4.0, 4.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0], "bins": [-6.41796875, -6.256072998046875, -6.09417724609375, -5.932281494140625, -5.7703857421875, -5.608489990234375, -5.44659423828125, -5.284698486328125, -5.122802734375, -4.960906982421875, -4.79901123046875, -4.637115478515625, -4.4752197265625, -4.313323974609375, -4.15142822265625, -3.989532470703125, -3.82763671875, -3.665740966796875, -3.50384521484375, -3.341949462890625, -3.1800537109375, -3.018157958984375, -2.85626220703125, -2.694366455078125, -2.532470703125, -2.370574951171875, -2.20867919921875, -2.046783447265625, -1.8848876953125, -1.722991943359375, -1.56109619140625, -1.399200439453125, -1.2373046875, -1.075408935546875, -0.91351318359375, -0.751617431640625, -0.5897216796875, -0.427825927734375, -0.26593017578125, -0.104034423828125, 0.057861328125, 0.219757080078125, 0.38165283203125, 0.543548583984375, 0.7054443359375, 0.867340087890625, 1.02923583984375, 1.191131591796875, 1.35302734375, 1.514923095703125, 1.67681884765625, 1.838714599609375, 2.0006103515625, 2.162506103515625, 2.32440185546875, 2.486297607421875, 2.648193359375, 2.810089111328125, 2.97198486328125, 3.133880615234375, 3.2957763671875, 3.457672119140625, 3.61956787109375, 3.781463623046875, 3.943359375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 3.0, 11.0, 10.0, 19.0, 24.0, 36.0, 51.0, 85.0, 85.0, 139.0, 196.0, 267.0, 386.0, 520.0, 794.0, 1642.0, 5174.0, 37487.0, 978445.0, 3035509.0, 117069.0, 10662.0, 2455.0, 1077.0, 631.0, 453.0, 285.0, 210.0, 156.0, 120.0, 75.0, 62.0, 38.0, 29.0, 20.0, 19.0, 12.0, 6.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-27.890625, -27.16064453125, -26.4306640625, -25.70068359375, -24.970703125, -24.24072265625, -23.5107421875, -22.78076171875, -22.05078125, -21.32080078125, -20.5908203125, -19.86083984375, -19.130859375, -18.40087890625, -17.6708984375, -16.94091796875, -16.2109375, -15.48095703125, -14.7509765625, -14.02099609375, -13.291015625, -12.56103515625, -11.8310546875, -11.10107421875, -10.37109375, -9.64111328125, -8.9111328125, -8.18115234375, -7.451171875, -6.72119140625, -5.9912109375, -5.26123046875, -4.53125, -3.80126953125, -3.0712890625, -2.34130859375, -1.611328125, -0.88134765625, -0.1513671875, 0.57861328125, 1.30859375, 2.03857421875, 2.7685546875, 3.49853515625, 4.228515625, 4.95849609375, 5.6884765625, 6.41845703125, 7.1484375, 7.87841796875, 8.6083984375, 9.33837890625, 10.068359375, 10.79833984375, 11.5283203125, 12.25830078125, 12.98828125, 13.71826171875, 14.4482421875, 15.17822265625, 15.908203125, 16.63818359375, 17.3681640625, 18.09814453125, 18.828125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 6.0, 10.0, 15.0, 18.0, 28.0, 49.0, 48.0, 57.0, 98.0, 164.0, 197.0, 257.0, 390.0, 512.0, 539.0, 474.0, 347.0, 241.0, 180.0, 132.0, 90.0, 78.0, 47.0, 37.0, 15.0, 17.0, 15.0, 7.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0078125, -9.697509765625, -9.38720703125, -9.076904296875, -8.7666015625, -8.456298828125, -8.14599609375, -7.835693359375, -7.525390625, -7.215087890625, -6.90478515625, -6.594482421875, -6.2841796875, -5.973876953125, -5.66357421875, -5.353271484375, -5.04296875, -4.732666015625, -4.42236328125, -4.112060546875, -3.8017578125, -3.491455078125, -3.18115234375, -2.870849609375, -2.560546875, -2.250244140625, -1.93994140625, -1.629638671875, -1.3193359375, -1.009033203125, -0.69873046875, -0.388427734375, -0.078125, 0.232177734375, 0.54248046875, 0.852783203125, 1.1630859375, 1.473388671875, 1.78369140625, 2.093994140625, 2.404296875, 2.714599609375, 3.02490234375, 3.335205078125, 3.6455078125, 3.955810546875, 4.26611328125, 4.576416015625, 4.88671875, 5.197021484375, 5.50732421875, 5.817626953125, 6.1279296875, 6.438232421875, 6.74853515625, 7.058837890625, 7.369140625, 7.679443359375, 7.98974609375, 8.300048828125, 8.6103515625, 8.920654296875, 9.23095703125, 9.541259765625, 9.8515625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 12.0, 19.0, 17.0, 42.0, 100.0, 152.0, 357.0, 839.0, 2335.0, 8567.0, 41095.0, 269639.0, 2125595.0, 1518943.0, 186666.0, 30004.0, 6527.0, 1963.0, 747.0, 306.0, 182.0, 83.0, 39.0, 18.0, 9.0, 3.0, 8.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.625, -11.271728515625, -10.91845703125, -10.565185546875, -10.2119140625, -9.858642578125, -9.50537109375, -9.152099609375, -8.798828125, -8.445556640625, -8.09228515625, -7.739013671875, -7.3857421875, -7.032470703125, -6.67919921875, -6.325927734375, -5.97265625, -5.619384765625, -5.26611328125, -4.912841796875, -4.5595703125, -4.206298828125, -3.85302734375, -3.499755859375, -3.146484375, -2.793212890625, -2.43994140625, -2.086669921875, -1.7333984375, -1.380126953125, -1.02685546875, -0.673583984375, -0.3203125, 0.032958984375, 0.38623046875, 0.739501953125, 1.0927734375, 1.446044921875, 1.79931640625, 2.152587890625, 2.505859375, 2.859130859375, 3.21240234375, 3.565673828125, 3.9189453125, 4.272216796875, 4.62548828125, 4.978759765625, 5.33203125, 5.685302734375, 6.03857421875, 6.391845703125, 6.7451171875, 7.098388671875, 7.45166015625, 7.804931640625, 8.158203125, 8.511474609375, 8.86474609375, 9.218017578125, 9.5712890625, 9.924560546875, 10.27783203125, 10.631103515625, 10.984375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 14.0, 12.0, 23.0, 33.0, 52.0, 55.0, 73.0, 68.0, 104.0, 110.0, 109.0, 92.0, 71.0, 59.0, 34.0, 35.0, 28.0, 8.0, 10.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.87713623046875, -89.54345703125, -87.20978546142578, -84.87610626220703, -82.54243469238281, -80.20875549316406, -77.87508392333984, -75.5414047241211, -73.20773315429688, -70.87405395507812, -68.5403823852539, -66.20670318603516, -63.87303161621094, -61.53935623168945, -59.20568084716797, -56.87200164794922, -54.538326263427734, -52.20465087890625, -49.870975494384766, -47.53730010986328, -45.2036247253418, -42.86994934082031, -40.53627014160156, -38.202598571777344, -35.868919372558594, -33.53524398803711, -31.201568603515625, -28.86789321899414, -26.534217834472656, -24.200542449951172, -21.866865158081055, -19.53318977355957, -17.19951629638672, -14.865840911865234, -12.53216552734375, -10.19848918914795, -7.864813804626465, -5.5311384201049805, -3.1974620819091797, -0.8637866973876953, 1.469888687133789, 3.8035643100738525, 6.137239933013916, 8.470915794372559, 10.804591178894043, 13.138266563415527, 15.471942901611328, 17.805618286132812, 20.139293670654297, 22.47296905517578, 24.806644439697266, 27.14031982421875, 29.473995208740234, 31.80767059326172, 34.14134979248047, 36.47502136230469, 38.80870056152344, 41.14237594604492, 43.476051330566406, 45.80972671508789, 48.143402099609375, 50.47707748413086, 52.810752868652344, 55.144432067871094, 57.47810363769531]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 3.0, 8.0, 4.0, 10.0, 9.0, 17.0, 19.0, 19.0, 28.0, 29.0, 26.0, 21.0, 35.0, 36.0, 49.0, 53.0, 42.0, 49.0, 53.0, 50.0, 37.0, 44.0, 33.0, 49.0, 47.0, 42.0, 28.0, 29.0, 22.0, 11.0, 14.0, 22.0, 10.0, 12.0, 9.0, 9.0, 2.0, 10.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.572113037109375, -47.25437545776367, -45.93663787841797, -44.618896484375, -43.3011589050293, -41.983421325683594, -40.665679931640625, -39.34794235229492, -38.03020477294922, -36.712467193603516, -35.39472961425781, -34.076988220214844, -32.75925064086914, -31.441513061523438, -30.1237735748291, -28.806034088134766, -27.488296508789062, -26.17055892944336, -24.852819442749023, -23.535079956054688, -22.217342376708984, -20.89960479736328, -19.581865310668945, -18.26412582397461, -16.946388244628906, -15.628649711608887, -14.310911178588867, -12.993172645568848, -11.675434112548828, -10.357695579528809, -9.039957046508789, -7.7222185134887695, -6.40447998046875, -5.0867414474487305, -3.769002914428711, -2.4512643814086914, -1.1335258483886719, 0.18421268463134766, 1.5019512176513672, 2.8196897506713867, 4.137428283691406, 5.455166816711426, 6.772905349731445, 8.090643882751465, 9.408382415771484, 10.726120948791504, 12.043859481811523, 13.361598014831543, 14.679336547851562, 15.997075080871582, 17.3148136138916, 18.632553100585938, 19.95029067993164, 21.268028259277344, 22.58576774597168, 23.903507232666016, 25.22124481201172, 26.538982391357422, 27.856721878051758, 29.174461364746094, 30.492198944091797, 31.8099365234375, 33.12767791748047, 34.44541549682617, 35.763153076171875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 4.0, 7.0, 4.0, 5.0, 10.0, 13.0, 19.0, 18.0, 23.0, 26.0, 25.0, 37.0, 36.0, 42.0, 49.0, 45.0, 53.0, 47.0, 49.0, 39.0, 51.0, 44.0, 48.0, 31.0, 47.0, 42.0, 26.0, 36.0, 24.0, 20.0, 13.0, 16.0, 9.0, 8.0, 4.0, 5.0, 8.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-91.9375, -89.36328125, -86.7890625, -84.21484375, -81.640625, -79.06640625, -76.4921875, -73.91796875, -71.34375, -68.76953125, -66.1953125, -63.62109375, -61.046875, -58.47265625, -55.8984375, -53.32421875, -50.75, -48.17578125, -45.6015625, -43.02734375, -40.453125, -37.87890625, -35.3046875, -32.73046875, -30.15625, -27.58203125, -25.0078125, -22.43359375, -19.859375, -17.28515625, -14.7109375, -12.13671875, -9.5625, -6.98828125, -4.4140625, -1.83984375, 0.734375, 3.30859375, 5.8828125, 8.45703125, 11.03125, 13.60546875, 16.1796875, 18.75390625, 21.328125, 23.90234375, 26.4765625, 29.05078125, 31.625, 34.19921875, 36.7734375, 39.34765625, 41.921875, 44.49609375, 47.0703125, 49.64453125, 52.21875, 54.79296875, 57.3671875, 59.94140625, 62.515625, 65.08984375, 67.6640625, 70.23828125, 72.8125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 12.0, 8.0, 16.0, 28.0, 36.0, 55.0, 85.0, 124.0, 189.0, 268.0, 374.0, 586.0, 814.0, 1174.0, 1761.0, 2606.0, 3660.0, 5619.0, 8409.0, 12769.0, 20089.0, 32012.0, 53175.0, 93582.0, 179974.0, 273227.0, 150337.0, 80524.0, 46364.0, 28148.0, 17638.0, 11425.0, 7557.0, 5113.0, 3437.0, 2342.0, 1658.0, 1045.0, 711.0, 527.0, 352.0, 235.0, 152.0, 112.0, 85.0, 38.0, 39.0, 23.0, 15.0, 11.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0], "bins": [-2.033203125, -1.9722747802734375, -1.911346435546875, -1.8504180908203125, -1.78948974609375, -1.7285614013671875, -1.667633056640625, -1.6067047119140625, -1.5457763671875, -1.4848480224609375, -1.423919677734375, -1.3629913330078125, -1.30206298828125, -1.2411346435546875, -1.180206298828125, -1.1192779541015625, -1.058349609375, -0.9974212646484375, -0.936492919921875, -0.8755645751953125, -0.81463623046875, -0.7537078857421875, -0.692779541015625, -0.6318511962890625, -0.5709228515625, -0.5099945068359375, -0.449066162109375, -0.3881378173828125, -0.32720947265625, -0.2662811279296875, -0.205352783203125, -0.1444244384765625, -0.08349609375, -0.0225677490234375, 0.038360595703125, 0.0992889404296875, 0.16021728515625, 0.2211456298828125, 0.282073974609375, 0.3430023193359375, 0.4039306640625, 0.4648590087890625, 0.525787353515625, 0.5867156982421875, 0.64764404296875, 0.7085723876953125, 0.769500732421875, 0.8304290771484375, 0.891357421875, 0.9522857666015625, 1.013214111328125, 1.0741424560546875, 1.13507080078125, 1.1959991455078125, 1.256927490234375, 1.3178558349609375, 1.3787841796875, 1.4397125244140625, 1.500640869140625, 1.5615692138671875, 1.62249755859375, 1.6834259033203125, 1.744354248046875, 1.8052825927734375, 1.8662109375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 8.0, 4.0, 4.0, 3.0, 8.0, 11.0, 10.0, 7.0, 12.0, 12.0, 23.0, 29.0, 23.0, 18.0, 21.0, 34.0, 33.0, 35.0, 37.0, 33.0, 35.0, 46.0, 38.0, 1067.0, 27.0, 38.0, 45.0, 33.0, 39.0, 28.0, 32.0, 30.0, 26.0, 23.0, 21.0, 23.0, 22.0, 17.0, 19.0, 15.0, 4.0, 8.0, 6.0, 5.0, 5.0, 4.0, 6.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-43.78125, -42.453125, -41.125, -39.796875, -38.46875, -37.140625, -35.8125, -34.484375, -33.15625, -31.828125, -30.5, -29.171875, -27.84375, -26.515625, -25.1875, -23.859375, -22.53125, -21.203125, -19.875, -18.546875, -17.21875, -15.890625, -14.5625, -13.234375, -11.90625, -10.578125, -9.25, -7.921875, -6.59375, -5.265625, -3.9375, -2.609375, -1.28125, 0.046875, 1.375, 2.703125, 4.03125, 5.359375, 6.6875, 8.015625, 9.34375, 10.671875, 12.0, 13.328125, 14.65625, 15.984375, 17.3125, 18.640625, 19.96875, 21.296875, 22.625, 23.953125, 25.28125, 26.609375, 27.9375, 29.265625, 30.59375, 31.921875, 33.25, 34.578125, 35.90625, 37.234375, 38.5625, 39.890625, 41.21875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 23.0, 25.0, 34.0, 33.0, 69.0, 108.0, 185.0, 254.0, 388.0, 638.0, 1022.0, 1640.0, 2629.0, 4368.0, 7470.0, 12674.0, 21963.0, 38743.0, 70736.0, 145498.0, 1386785.0, 199735.0, 89290.0, 47951.0, 26914.0, 15288.0, 8994.0, 5271.0, 3178.0, 1950.0, 1166.0, 736.0, 483.0, 301.0, 193.0, 113.0, 84.0, 66.0, 34.0, 28.0, 24.0, 12.0, 10.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6220703125, -1.5724334716796875, -1.522796630859375, -1.4731597900390625, -1.42352294921875, -1.3738861083984375, -1.324249267578125, -1.2746124267578125, -1.2249755859375, -1.1753387451171875, -1.125701904296875, -1.0760650634765625, -1.02642822265625, -0.9767913818359375, -0.927154541015625, -0.8775177001953125, -0.827880859375, -0.7782440185546875, -0.728607177734375, -0.6789703369140625, -0.62933349609375, -0.5796966552734375, -0.530059814453125, -0.4804229736328125, -0.4307861328125, -0.3811492919921875, -0.331512451171875, -0.2818756103515625, -0.23223876953125, -0.1826019287109375, -0.132965087890625, -0.0833282470703125, -0.03369140625, 0.0159454345703125, 0.065582275390625, 0.1152191162109375, 0.16485595703125, 0.2144927978515625, 0.264129638671875, 0.3137664794921875, 0.3634033203125, 0.4130401611328125, 0.462677001953125, 0.5123138427734375, 0.56195068359375, 0.6115875244140625, 0.661224365234375, 0.7108612060546875, 0.760498046875, 0.8101348876953125, 0.859771728515625, 0.9094085693359375, 0.95904541015625, 1.0086822509765625, 1.058319091796875, 1.1079559326171875, 1.1575927734375, 1.2072296142578125, 1.256866455078125, 1.3065032958984375, 1.35614013671875, 1.4057769775390625, 1.455413818359375, 1.5050506591796875, 1.5546875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 2.0, 6.0, 7.0, 8.0, 11.0, 9.0, 16.0, 18.0, 29.0, 18.0, 36.0, 57.0, 84.0, 143.0, 184.0, 101.0, 60.0, 39.0, 33.0, 20.0, 16.0, 17.0, 12.0, 9.0, 8.0, 13.0, 3.0, 5.0, 4.0, 3.0, 6.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007486343383789062, -0.0007245838642120361, -0.000700533390045166, -0.0006764829158782959, -0.0006524324417114258, -0.0006283819675445557, -0.0006043314933776855, -0.0005802810192108154, -0.0005562305450439453, -0.0005321800708770752, -0.0005081295967102051, -0.00048407912254333496, -0.00046002864837646484, -0.0004359781742095947, -0.0004119277000427246, -0.0003878772258758545, -0.0003638267517089844, -0.00033977627754211426, -0.00031572580337524414, -0.000291675329208374, -0.0002676248550415039, -0.0002435743808746338, -0.00021952390670776367, -0.00019547343254089355, -0.00017142295837402344, -0.00014737248420715332, -0.0001233220100402832, -9.927153587341309e-05, -7.522106170654297e-05, -5.117058753967285e-05, -2.7120113372802734e-05, -3.069639205932617e-06, 2.09808349609375e-05, 4.503130912780762e-05, 6.908178329467773e-05, 9.313225746154785e-05, 0.00011718273162841797, 0.00014123320579528809, 0.0001652836799621582, 0.00018933415412902832, 0.00021338462829589844, 0.00023743510246276855, 0.00026148557662963867, 0.0002855360507965088, 0.0003095865249633789, 0.000333636999130249, 0.00035768747329711914, 0.00038173794746398926, 0.0004057884216308594, 0.0004298388957977295, 0.0004538893699645996, 0.0004779398441314697, 0.0005019903182983398, 0.00052604079246521, 0.0005500912666320801, 0.0005741417407989502, 0.0005981922149658203, 0.0006222426891326904, 0.0006462931632995605, 0.0006703436374664307, 0.0006943941116333008, 0.0007184445858001709, 0.000742495059967041, 0.0007665455341339111, 0.0007905960083007812]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 8.0, 5.0, 14.0, 15.0, 21.0, 29.0, 44.0, 81.0, 106.0, 147.0, 235.0, 395.0, 666.0, 1178.0, 2278.0, 4290.0, 9518.0, 24744.0, 80080.0, 547384.0, 287878.0, 55363.0, 18510.0, 7685.0, 3528.0, 1774.0, 1012.0, 566.0, 341.0, 238.0, 127.0, 97.0, 64.0, 31.0, 27.0, 23.0, 14.0, 12.0, 7.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0031375885009765625, -0.0030421018600463867, -0.002946615219116211, -0.002851128578186035, -0.0027556419372558594, -0.0026601552963256836, -0.002564668655395508, -0.002469182014465332, -0.0023736953735351562, -0.0022782087326049805, -0.0021827220916748047, -0.002087235450744629, -0.001991748809814453, -0.0018962621688842773, -0.0018007755279541016, -0.0017052888870239258, -0.00160980224609375, -0.0015143156051635742, -0.0014188289642333984, -0.0013233423233032227, -0.0012278556823730469, -0.001132369041442871, -0.0010368824005126953, -0.0009413957595825195, -0.0008459091186523438, -0.000750422477722168, -0.0006549358367919922, -0.0005594491958618164, -0.0004639625549316406, -0.00036847591400146484, -0.00027298927307128906, -0.00017750263214111328, -8.20159912109375e-05, 1.3470649719238281e-05, 0.00010895729064941406, 0.00020444393157958984, 0.0002999305725097656, 0.0003954172134399414, 0.0004909038543701172, 0.000586390495300293, 0.0006818771362304688, 0.0007773637771606445, 0.0008728504180908203, 0.0009683370590209961, 0.0010638236999511719, 0.0011593103408813477, 0.0012547969818115234, 0.0013502836227416992, 0.001445770263671875, 0.0015412569046020508, 0.0016367435455322266, 0.0017322301864624023, 0.0018277168273925781, 0.001923203468322754, 0.0020186901092529297, 0.0021141767501831055, 0.0022096633911132812, 0.002305150032043457, 0.002400636672973633, 0.0024961233139038086, 0.0025916099548339844, 0.00268709659576416, 0.002782583236694336, 0.0028780698776245117, 0.0029735565185546875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 11.0, 14.0, 23.0, 30.0, 53.0, 110.0, 151.0, 149.0, 114.0, 93.0, 64.0, 49.0, 26.0, 14.0, 22.0, 16.0, 11.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005212380783632398, -0.00048411329044029117, -0.0004469884734135121, -0.00040986365638673306, -0.00037273886846378446, -0.00033561408054083586, -0.0002984892635140568, -0.00026136444648727775, -0.00022423965856432915, -0.00018711485608946532, -0.0001499900536146015, -0.00011286525113973767, -7.574044866487384e-05, -3.861564619001001e-05, -1.490843715146184e-06, 3.563397331163287e-05, 7.275876123458147e-05, 0.0001098835637094453, 0.00014700836618430912, 0.00018413316865917295, 0.00022125797113403678, 0.0002583827590569854, 0.00029550757608376443, 0.0003326323931105435, 0.0003697571810334921, 0.0004068819689564407, 0.00044400678598321974, 0.0004811316030099988, 0.0005182563909329474, 0.000555381178855896, 0.0005925060249865055, 0.0006296308129094541, 0.0006667557172477245, 0.0007038805051706731, 0.0007410052930936217, 0.0007781301392242312, 0.0008152549271471798, 0.0008523797150701284, 0.000889504561200738, 0.0009266293491236866, 0.0009637541370466352, 0.0010008789831772447, 0.0010380037128925323, 0.0010751285590231419, 0.0011122534051537514, 0.001149378134869039, 0.0011865029809996486, 0.0012236277107149363, 0.0012607525568455458, 0.0012978774029761553, 0.001335002132691443, 0.0013721269788220525, 0.0014092517085373402, 0.0014463765546679497, 0.0014835014007985592, 0.0015206262469291687, 0.0015577509766444564, 0.001594875822775066, 0.0016320005524903536, 0.001669125398620963, 0.0017062502447515726, 0.0017433749744668603, 0.0017804998205974698, 0.0018176245503127575, 0.001854749396443367]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 9.0, 10.0, 6.0, 8.0, 16.0, 14.0, 16.0, 16.0, 22.0, 21.0, 23.0, 22.0, 22.0, 23.0, 31.0, 32.0, 31.0, 29.0, 43.0, 36.0, 30.0, 32.0, 30.0, 36.0, 34.0, 32.0, 36.0, 29.0, 27.0, 26.0, 31.0, 18.0, 14.0, 17.0, 22.0, 17.0, 12.0, 27.0, 8.0, 10.0, 8.0, 11.0, 12.0, 8.0, 6.0, 10.0, 5.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.0006614327430725098, -0.0006406772881746292, -0.0006199218332767487, -0.0005991663783788681, -0.0005784109234809875, -0.000557655468583107, -0.0005369000136852264, -0.0005161445587873459, -0.0004953891038894653, -0.0004746336489915848, -0.0004538781940937042, -0.00043312273919582367, -0.0004123672842979431, -0.00039161182940006256, -0.000370856374502182, -0.00035010091960430145, -0.0003293454647064209, -0.00030859000980854034, -0.0002878345549106598, -0.00026707910001277924, -0.0002463236451148987, -0.00022556819021701813, -0.00020481273531913757, -0.00018405728042125702, -0.00016330182552337646, -0.0001425463706254959, -0.00012179091572761536, -0.0001010354608297348, -8.028000593185425e-05, -5.9524551033973694e-05, -3.876909613609314e-05, -1.8013641238212585e-05, 2.7418136596679688e-06, 2.3497268557548523e-05, 4.425272345542908e-05, 6.500817835330963e-05, 8.576363325119019e-05, 0.00010651908814907074, 0.0001272745430469513, 0.00014802999794483185, 0.0001687854528427124, 0.00018954090774059296, 0.0002102963626384735, 0.00023105181753635406, 0.0002518072724342346, 0.0002725627273321152, 0.00029331818222999573, 0.0003140736371278763, 0.00033482909202575684, 0.0003555845469236374, 0.00037634000182151794, 0.0003970954567193985, 0.00041785091161727905, 0.0004386063665151596, 0.00045936182141304016, 0.0004801172763109207, 0.0005008727312088013, 0.0005216281861066818, 0.0005423836410045624, 0.0005631390959024429, 0.0005838945508003235, 0.000604650005698204, 0.0006254054605960846, 0.0006461609154939651, 0.0006669163703918457]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 4.0, 7.0, 4.0, 5.0, 10.0, 13.0, 19.0, 18.0, 23.0, 26.0, 25.0, 37.0, 36.0, 42.0, 49.0, 45.0, 53.0, 47.0, 49.0, 39.0, 51.0, 44.0, 48.0, 31.0, 47.0, 42.0, 26.0, 36.0, 24.0, 20.0, 13.0, 16.0, 9.0, 8.0, 4.0, 5.0, 8.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-91.9375, -89.36328125, -86.7890625, -84.21484375, -81.640625, -79.06640625, -76.4921875, -73.91796875, -71.34375, -68.76953125, -66.1953125, -63.62109375, -61.046875, -58.47265625, -55.8984375, -53.32421875, -50.75, -48.17578125, -45.6015625, -43.02734375, -40.453125, -37.87890625, -35.3046875, -32.73046875, -30.15625, -27.58203125, -25.0078125, -22.43359375, -19.859375, -17.28515625, -14.7109375, -12.13671875, -9.5625, -6.98828125, -4.4140625, -1.83984375, 0.734375, 3.30859375, 5.8828125, 8.45703125, 11.03125, 13.60546875, 16.1796875, 18.75390625, 21.328125, 23.90234375, 26.4765625, 29.05078125, 31.625, 34.19921875, 36.7734375, 39.34765625, 41.921875, 44.49609375, 47.0703125, 49.64453125, 52.21875, 54.79296875, 57.3671875, 59.94140625, 62.515625, 65.08984375, 67.6640625, 70.23828125, 72.8125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 4.0, 6.0, 4.0, 7.0, 10.0, 10.0, 25.0, 24.0, 30.0, 41.0, 57.0, 72.0, 115.0, 147.0, 263.0, 556.0, 1436.0, 5549.0, 33997.0, 252073.0, 583496.0, 145306.0, 19511.0, 3627.0, 1046.0, 415.0, 219.0, 145.0, 93.0, 72.0, 52.0, 38.0, 31.0, 23.0, 12.0, 10.0, 9.0, 7.0, 9.0, 7.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.59375, -15.1527099609375, -14.711669921875, -14.2706298828125, -13.82958984375, -13.3885498046875, -12.947509765625, -12.5064697265625, -12.0654296875, -11.6243896484375, -11.183349609375, -10.7423095703125, -10.30126953125, -9.8602294921875, -9.419189453125, -8.9781494140625, -8.537109375, -8.0960693359375, -7.655029296875, -7.2139892578125, -6.77294921875, -6.3319091796875, -5.890869140625, -5.4498291015625, -5.0087890625, -4.5677490234375, -4.126708984375, -3.6856689453125, -3.24462890625, -2.8035888671875, -2.362548828125, -1.9215087890625, -1.48046875, -1.0394287109375, -0.598388671875, -0.1573486328125, 0.28369140625, 0.7247314453125, 1.165771484375, 1.6068115234375, 2.0478515625, 2.4888916015625, 2.929931640625, 3.3709716796875, 3.81201171875, 4.2530517578125, 4.694091796875, 5.1351318359375, 5.576171875, 6.0172119140625, 6.458251953125, 6.8992919921875, 7.34033203125, 7.7813720703125, 8.222412109375, 8.6634521484375, 9.1044921875, 9.5455322265625, 9.986572265625, 10.4276123046875, 10.86865234375, 11.3096923828125, 11.750732421875, 12.1917724609375, 12.6328125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 5.0, 7.0, 10.0, 11.0, 15.0, 21.0, 26.0, 31.0, 29.0, 52.0, 67.0, 62.0, 78.0, 72.0, 2094.0, 73.0, 64.0, 67.0, 54.0, 39.0, 43.0, 25.0, 24.0, 20.0, 23.0, 12.0, 10.0, 7.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.5, -143.78125, -139.0625, -134.34375, -129.625, -124.90625, -120.1875, -115.46875, -110.75, -106.03125, -101.3125, -96.59375, -91.875, -87.15625, -82.4375, -77.71875, -73.0, -68.28125, -63.5625, -58.84375, -54.125, -49.40625, -44.6875, -39.96875, -35.25, -30.53125, -25.8125, -21.09375, -16.375, -11.65625, -6.9375, -2.21875, 2.5, 7.21875, 11.9375, 16.65625, 21.375, 26.09375, 30.8125, 35.53125, 40.25, 44.96875, 49.6875, 54.40625, 59.125, 63.84375, 68.5625, 73.28125, 78.0, 82.71875, 87.4375, 92.15625, 96.875, 101.59375, 106.3125, 111.03125, 115.75, 120.46875, 125.1875, 129.90625, 134.625, 139.34375, 144.0625, 148.78125, 153.5]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 11.0, 4.0, 14.0, 21.0, 14.0, 27.0, 40.0, 57.0, 62.0, 107.0, 146.0, 246.0, 380.0, 759.0, 1488.0, 5189.0, 41045.0, 2666396.0, 398727.0, 24184.0, 3796.0, 1330.0, 584.0, 342.0, 210.0, 139.0, 97.0, 61.0, 59.0, 38.0, 26.0, 25.0, 16.0, 7.0, 7.0, 8.0, 9.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.203125, -15.6611328125, -15.119140625, -14.5771484375, -14.03515625, -13.4931640625, -12.951171875, -12.4091796875, -11.8671875, -11.3251953125, -10.783203125, -10.2412109375, -9.69921875, -9.1572265625, -8.615234375, -8.0732421875, -7.53125, -6.9892578125, -6.447265625, -5.9052734375, -5.36328125, -4.8212890625, -4.279296875, -3.7373046875, -3.1953125, -2.6533203125, -2.111328125, -1.5693359375, -1.02734375, -0.4853515625, 0.056640625, 0.5986328125, 1.140625, 1.6826171875, 2.224609375, 2.7666015625, 3.30859375, 3.8505859375, 4.392578125, 4.9345703125, 5.4765625, 6.0185546875, 6.560546875, 7.1025390625, 7.64453125, 8.1865234375, 8.728515625, 9.2705078125, 9.8125, 10.3544921875, 10.896484375, 11.4384765625, 11.98046875, 12.5224609375, 13.064453125, 13.6064453125, 14.1484375, 14.6904296875, 15.232421875, 15.7744140625, 16.31640625, 16.8583984375, 17.400390625, 17.9423828125, 18.484375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 9.0, 17.0, 57.0, 120.0, 254.0, 254.0, 151.0, 59.0, 23.0, 17.0, 10.0, 9.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-303.1093444824219, -293.635009765625, -284.1606750488281, -274.68634033203125, -265.2120056152344, -255.7376708984375, -246.26333618164062, -236.78900146484375, -227.31466674804688, -217.84033203125, -208.36599731445312, -198.89166259765625, -189.41732788085938, -179.9429931640625, -170.46865844726562, -160.99432373046875, -151.52000427246094, -142.04566955566406, -132.5713348388672, -123.09700012207031, -113.62266540527344, -104.14833068847656, -94.67400360107422, -85.19966888427734, -75.72533416748047, -66.2509994506836, -56.77666473388672, -47.30233383178711, -37.827999114990234, -28.35366439819336, -18.87933349609375, -9.404998779296875, 0.0693359375, 9.543669700622559, 19.018003463745117, 28.49233627319336, 37.966670989990234, 47.44100570678711, 56.91533660888672, 66.3896713256836, 75.86400604248047, 85.33834075927734, 94.81267547607422, 104.28700256347656, 113.76133728027344, 123.23567199707031, 132.7100067138672, 142.18434143066406, 151.65867614746094, 161.1330108642578, 170.6073455810547, 180.08168029785156, 189.55601501464844, 199.0303497314453, 208.50466918945312, 217.97900390625, 227.45333862304688, 236.92767333984375, 246.40200805664062, 255.8763427734375, 265.3506774902344, 274.82501220703125, 284.2993469238281, 293.773681640625, 303.2480163574219]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 12.0, 9.0, 8.0, 13.0, 11.0, 13.0, 19.0, 30.0, 26.0, 35.0, 28.0, 38.0, 38.0, 28.0, 42.0, 40.0, 39.0, 42.0, 38.0, 40.0, 42.0, 40.0, 43.0, 41.0, 39.0, 28.0, 24.0, 35.0, 29.0, 15.0, 15.0, 18.0, 13.0, 10.0, 13.0, 8.0, 6.0, 4.0, 8.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-156.87940979003906, -151.856201171875, -146.8330078125, -141.80979919433594, -136.78659057617188, -131.7633819580078, -126.74018096923828, -121.71697998046875, -116.69377136230469, -111.67056274414062, -106.6473617553711, -101.62416076660156, -96.6009521484375, -91.57774353027344, -86.5545425415039, -81.53134155273438, -76.50813293457031, -71.48492431640625, -66.46172332763672, -61.43851852416992, -56.415313720703125, -51.39210891723633, -46.36890411376953, -41.345699310302734, -36.32249450683594, -31.29928970336914, -26.276084899902344, -21.252880096435547, -16.22967529296875, -11.206470489501953, -6.183265686035156, -1.1600608825683594, 3.863128662109375, 8.886333465576172, 13.909538269042969, 18.932743072509766, 23.955947875976562, 28.97915267944336, 34.002357482910156, 39.02556228637695, 44.04876708984375, 49.07197189331055, 54.095176696777344, 59.11838150024414, 64.14158630371094, 69.164794921875, 74.18799591064453, 79.21119689941406, 84.23440551757812, 89.25761413574219, 94.28081512451172, 99.30401611328125, 104.32722473144531, 109.35043334960938, 114.3736343383789, 119.39683532714844, 124.4200439453125, 129.44325256347656, 134.46646118164062, 139.48965454101562, 144.5128631591797, 149.53607177734375, 154.55926513671875, 159.5824737548828, 164.60568237304688]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 8.0, 14.0, 18.0, 30.0, 30.0, 53.0, 56.0, 69.0, 115.0, 138.0, 159.0, 243.0, 314.0, 353.0, 437.0, 553.0, 638.0, 984.0, 1039746.0, 1083.0, 748.0, 593.0, 479.0, 391.0, 287.0, 213.0, 191.0, 153.0, 102.0, 78.0, 67.0, 62.0, 36.0, 25.0, 19.0, 17.0, 11.0, 11.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-38.89784622192383, -37.62857437133789, -36.35930252075195, -35.09002685546875, -33.82075500488281, -32.551483154296875, -31.282211303710938, -30.012939453125, -28.743667602539062, -27.474395751953125, -26.205121994018555, -24.935850143432617, -23.66657829284668, -22.39730453491211, -21.128032684326172, -19.858760833740234, -18.589487075805664, -17.320215225219727, -16.050941467285156, -14.781669616699219, -13.512397766113281, -12.243124961853027, -10.973852157592773, -9.704580307006836, -8.435307502746582, -7.166035175323486, -5.896762847900391, -4.627490043640137, -3.358217716217041, -2.0889453887939453, -0.8196725845336914, 0.4495992660522461, 1.7188720703125, 2.9881443977355957, 4.257416725158691, 5.526689529418945, 6.795961856842041, 8.065234184265137, 9.33450698852539, 10.603778839111328, 11.873051643371582, 13.142324447631836, 14.411596298217773, 15.680869102478027, 16.95014190673828, 18.21941375732422, 19.488685607910156, 20.757957458496094, 22.027231216430664, 23.2965030670166, 24.565776824951172, 25.83504867553711, 27.104320526123047, 28.373592376708984, 29.642866134643555, 30.912137985229492, 32.18141174316406, 33.45068359375, 34.71995544433594, 35.989227294921875, 37.25850296020508, 38.527774810791016, 39.79704666137695, 41.06631851196289, 42.33559036254883]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 10.0, 12.0, 33.0, 59.0, 182.0, 51454536.0, 8177.0, 84.0, 23.0, 27.0, 7.0, 5.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2281.809814453125, -2207.866455078125, -2133.9228515625, -2059.9794921875, -1986.0361328125, -1912.0926513671875, -1838.149169921875, -1764.205810546875, -1690.2623291015625, -1616.31884765625, -1542.37548828125, -1468.4320068359375, -1394.488525390625, -1320.545166015625, -1246.6016845703125, -1172.658203125, -1098.71484375, -1024.7713623046875, -950.8280029296875, -876.884521484375, -802.9411010742188, -728.9976806640625, -655.05419921875, -581.1107788085938, -507.1673583984375, -433.22393798828125, -359.2804870605469, -285.3370361328125, -211.39361572265625, -137.4501953125, -63.506744384765625, 10.43670654296875, 84.380126953125, 158.3235626220703, 232.26699829101562, 306.21044921875, 380.15386962890625, 454.0972900390625, 528.040771484375, 601.9841918945312, 675.9276123046875, 749.8710327148438, 823.814453125, 897.7579345703125, 971.7013549804688, 1045.644775390625, 1119.5882568359375, 1193.53173828125, 1267.47509765625, 1341.4185791015625, 1415.3619384765625, 1489.305419921875, 1563.248779296875, 1637.1922607421875, 1711.1357421875, 1785.0791015625, 1859.0225830078125, 1932.966064453125, 2006.909423828125, 2080.852783203125, 2154.79638671875, 2228.73974609375, 2302.68310546875, 2376.626708984375, 2450.570068359375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 6.0, 5.0, 8.0, 15.0, 19.0, 35.0, 80.0, 119.0, 165.0, 213.0, 297.0, 461.0, 803.0, 1165.0, 1776.0, 2620.0, 3816.0, 5889.0, 9121.0, 14016.0, 21174.0, 33270.0, 53917.0, 86441.0, 141644.0, 235643.0, 395484.0, 3773484.0, 611754.0, 349607.0, 209475.0, 127556.0, 77625.0, 47701.0, 29848.0, 19393.0, 12685.0, 8232.0, 5272.0, 3460.0, 2378.0, 1612.0, 1135.0, 678.0, 457.0, 303.0, 196.0, 147.0, 102.0, 72.0, 23.0, 17.0, 4.0, 6.0, 3.0, 9.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.305419921875, -0.2958412170410156, -0.28626251220703125, -0.2766838073730469, -0.2671051025390625, -0.2575263977050781, -0.24794769287109375, -0.23836898803710938, -0.228790283203125, -0.21921157836914062, -0.20963287353515625, -0.20005416870117188, -0.1904754638671875, -0.18089675903320312, -0.17131805419921875, -0.16173934936523438, -0.15216064453125, -0.14258193969726562, -0.13300323486328125, -0.12342453002929688, -0.1138458251953125, -0.10426712036132812, -0.09468841552734375, -0.08510971069335938, -0.075531005859375, -0.06595230102539062, -0.05637359619140625, -0.046794891357421875, -0.0372161865234375, -0.027637481689453125, -0.01805877685546875, -0.008480072021484375, 0.0010986328125, 0.010677337646484375, 0.02025604248046875, 0.029834747314453125, 0.0394134521484375, 0.048992156982421875, 0.05857086181640625, 0.06814956665039062, 0.077728271484375, 0.08730697631835938, 0.09688568115234375, 0.10646438598632812, 0.1160430908203125, 0.12562179565429688, 0.13520050048828125, 0.14477920532226562, 0.15435791015625, 0.16393661499023438, 0.17351531982421875, 0.18309402465820312, 0.1926727294921875, 0.20225143432617188, 0.21183013916015625, 0.22140884399414062, 0.230987548828125, 0.24056625366210938, 0.25014495849609375, 0.2597236633300781, 0.2693023681640625, 0.2788810729980469, 0.28845977783203125, 0.2980384826660156, 0.3076171875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 9.0, 9.0, 9.0, 5.0, 10.0, 20.0, 17.0, 19.0, 43.0, 21.0, 26.0, 32.0, 44.0, 39.0, 40.0, 46.0, 48.0, 63.0, 1065.0, 37.0, 50.0, 40.0, 37.0, 31.0, 38.0, 36.0, 24.0, 24.0, 28.0, 26.0, 27.0, 16.0, 10.0, 10.0, 13.0, 4.0, 3.0, 1.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.90625, -17.205810546875, -16.50537109375, -15.804931640625, -15.1044921875, -14.404052734375, -13.70361328125, -13.003173828125, -12.302734375, -11.602294921875, -10.90185546875, -10.201416015625, -9.5009765625, -8.800537109375, -8.10009765625, -7.399658203125, -6.69921875, -5.998779296875, -5.29833984375, -4.597900390625, -3.8974609375, -3.197021484375, -2.49658203125, -1.796142578125, -1.095703125, -0.395263671875, 0.30517578125, 1.005615234375, 1.7060546875, 2.406494140625, 3.10693359375, 3.807373046875, 4.5078125, 5.208251953125, 5.90869140625, 6.609130859375, 7.3095703125, 8.010009765625, 8.71044921875, 9.410888671875, 10.111328125, 10.811767578125, 11.51220703125, 12.212646484375, 12.9130859375, 13.613525390625, 14.31396484375, 15.014404296875, 15.71484375, 16.415283203125, 17.11572265625, 17.816162109375, 18.5166015625, 19.217041015625, 19.91748046875, 20.617919921875, 21.318359375, 22.018798828125, 22.71923828125, 23.419677734375, 24.1201171875, 24.820556640625, 25.52099609375, 26.221435546875, 26.921875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [8.0, 2.0, 8.0, 21.0, 22.0, 29.0, 35.0, 53.0, 89.0, 149.0, 195.0, 255.0, 363.0, 547.0, 807.0, 1201.0, 1827.0, 2784.0, 4041.0, 6229.0, 9228.0, 13565.0, 21080.0, 32238.0, 48380.0, 72720.0, 109372.0, 164375.0, 247477.0, 374141.0, 3677110.0, 502462.0, 336762.0, 222709.0, 148499.0, 98437.0, 65766.0, 43223.0, 28396.0, 18872.0, 12523.0, 8320.0, 5601.0, 3849.0, 2606.0, 1587.0, 1110.0, 823.0, 520.0, 377.0, 220.0, 143.0, 111.0, 68.0, 39.0, 22.0, 19.0, 10.0, 12.0, 7.0, 5.0, 2.0, 3.0, 2.0], "bins": [-0.2069091796875, -0.20020675659179688, -0.19350433349609375, -0.18680191040039062, -0.1800994873046875, -0.17339706420898438, -0.16669464111328125, -0.15999221801757812, -0.153289794921875, -0.14658737182617188, -0.13988494873046875, -0.13318252563476562, -0.1264801025390625, -0.11977767944335938, -0.11307525634765625, -0.10637283325195312, -0.09967041015625, -0.09296798706054688, -0.08626556396484375, -0.07956314086914062, -0.0728607177734375, -0.06615829467773438, -0.05945587158203125, -0.052753448486328125, -0.046051025390625, -0.039348602294921875, -0.03264617919921875, -0.025943756103515625, -0.0192413330078125, -0.012538909912109375, -0.00583648681640625, 0.000865936279296875, 0.007568359375, 0.014270782470703125, 0.02097320556640625, 0.027675628662109375, 0.0343780517578125, 0.041080474853515625, 0.04778289794921875, 0.054485321044921875, 0.061187744140625, 0.06789016723632812, 0.07459259033203125, 0.08129501342773438, 0.0879974365234375, 0.09469985961914062, 0.10140228271484375, 0.10810470581054688, 0.11480712890625, 0.12150955200195312, 0.12821197509765625, 0.13491439819335938, 0.1416168212890625, 0.14831924438476562, 0.15502166748046875, 0.16172409057617188, 0.168426513671875, 0.17512893676757812, 0.18183135986328125, 0.18853378295898438, 0.1952362060546875, 0.20193862915039062, 0.20864105224609375, 0.21534347534179688, 0.2220458984375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 0.0, 6.0, 3.0, 4.0, 12.0, 12.0, 10.0, 19.0, 19.0, 27.0, 21.0, 18.0, 20.0, 30.0, 41.0, 37.0, 50.0, 46.0, 51.0, 47.0, 1074.0, 40.0, 46.0, 44.0, 38.0, 28.0, 27.0, 37.0, 36.0, 32.0, 25.0, 18.0, 21.0, 19.0, 7.0, 10.0, 14.0, 9.0, 11.0, 9.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.53125, -19.84326171875, -19.1552734375, -18.46728515625, -17.779296875, -17.09130859375, -16.4033203125, -15.71533203125, -15.02734375, -14.33935546875, -13.6513671875, -12.96337890625, -12.275390625, -11.58740234375, -10.8994140625, -10.21142578125, -9.5234375, -8.83544921875, -8.1474609375, -7.45947265625, -6.771484375, -6.08349609375, -5.3955078125, -4.70751953125, -4.01953125, -3.33154296875, -2.6435546875, -1.95556640625, -1.267578125, -0.57958984375, 0.1083984375, 0.79638671875, 1.484375, 2.17236328125, 2.8603515625, 3.54833984375, 4.236328125, 4.92431640625, 5.6123046875, 6.30029296875, 6.98828125, 7.67626953125, 8.3642578125, 9.05224609375, 9.740234375, 10.42822265625, 11.1162109375, 11.80419921875, 12.4921875, 13.18017578125, 13.8681640625, 14.55615234375, 15.244140625, 15.93212890625, 16.6201171875, 17.30810546875, 17.99609375, 18.68408203125, 19.3720703125, 20.06005859375, 20.748046875, 21.43603515625, 22.1240234375, 22.81201171875, 23.5]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 1.0, 2.0, 0.0, 5.0, 7.0, 8.0, 9.0, 12.0, 7.0, 34.0, 49.0, 28.0, 53.0, 103.0, 101.0, 120.0, 183.0, 248.0, 335.0, 483.0, 570.0, 989.0, 1520.0, 2801.0, 5452.0, 12309.0, 32597.0, 98478.0, 5867391.0, 182408.0, 49820.0, 18112.0, 7548.0, 3859.0, 1874.0, 1200.0, 788.0, 491.0, 407.0, 285.0, 140.0, 129.0, 101.0, 97.0, 82.0, 62.0, 34.0, 27.0, 12.0, 18.0, 13.0, 11.0, 9.0, 13.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0], "bins": [-1.08984375, -1.05548095703125, -1.0211181640625, -0.98675537109375, -0.952392578125, -0.91802978515625, -0.8836669921875, -0.84930419921875, -0.81494140625, -0.78057861328125, -0.7462158203125, -0.71185302734375, -0.677490234375, -0.64312744140625, -0.6087646484375, -0.57440185546875, -0.5400390625, -0.50567626953125, -0.4713134765625, -0.43695068359375, -0.402587890625, -0.36822509765625, -0.3338623046875, -0.29949951171875, -0.26513671875, -0.23077392578125, -0.1964111328125, -0.16204833984375, -0.127685546875, -0.09332275390625, -0.0589599609375, -0.02459716796875, 0.009765625, 0.04412841796875, 0.0784912109375, 0.11285400390625, 0.147216796875, 0.18157958984375, 0.2159423828125, 0.25030517578125, 0.28466796875, 0.31903076171875, 0.3533935546875, 0.38775634765625, 0.422119140625, 0.45648193359375, 0.4908447265625, 0.52520751953125, 0.5595703125, 0.59393310546875, 0.6282958984375, 0.66265869140625, 0.697021484375, 0.73138427734375, 0.7657470703125, 0.80010986328125, 0.83447265625, 0.86883544921875, 0.9031982421875, 0.93756103515625, 0.971923828125, 1.00628662109375, 1.0406494140625, 1.07501220703125, 1.109375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 8.0, 6.0, 9.0, 12.0, 14.0, 8.0, 13.0, 17.0, 20.0, 24.0, 24.0, 23.0, 35.0, 39.0, 44.0, 24.0, 32.0, 43.0, 35.0, 130.0, 963.0, 41.0, 39.0, 42.0, 41.0, 38.0, 33.0, 29.0, 24.0, 32.0, 26.0, 18.0, 23.0, 24.0, 15.0, 15.0, 12.0, 13.0, 9.0, 3.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0], "bins": [-22.109375, -21.460205078125, -20.81103515625, -20.161865234375, -19.5126953125, -18.863525390625, -18.21435546875, -17.565185546875, -16.916015625, -16.266845703125, -15.61767578125, -14.968505859375, -14.3193359375, -13.670166015625, -13.02099609375, -12.371826171875, -11.72265625, -11.073486328125, -10.42431640625, -9.775146484375, -9.1259765625, -8.476806640625, -7.82763671875, -7.178466796875, -6.529296875, -5.880126953125, -5.23095703125, -4.581787109375, -3.9326171875, -3.283447265625, -2.63427734375, -1.985107421875, -1.3359375, -0.686767578125, -0.03759765625, 0.611572265625, 1.2607421875, 1.909912109375, 2.55908203125, 3.208251953125, 3.857421875, 4.506591796875, 5.15576171875, 5.804931640625, 6.4541015625, 7.103271484375, 7.75244140625, 8.401611328125, 9.05078125, 9.699951171875, 10.34912109375, 10.998291015625, 11.6474609375, 12.296630859375, 12.94580078125, 13.594970703125, 14.244140625, 14.893310546875, 15.54248046875, 16.191650390625, 16.8408203125, 17.489990234375, 18.13916015625, 18.788330078125, 19.4375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 7.0, 10.0, 7.0, 11.0, 24.0, 43.0, 121.0, 576.0, 94.0, 47.0, 20.0, 14.0, 7.0, 9.0, 0.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.609596252441406, -30.35159683227539, -28.093595504760742, -25.835594177246094, -23.577594757080078, -21.319595336914062, -19.061594009399414, -16.803592681884766, -14.54559326171875, -12.287592887878418, -10.029592514038086, -7.771592140197754, -5.513591766357422, -3.25559139251709, -0.9975910186767578, 1.2604093551635742, 3.5184097290039062, 5.776410102844238, 8.03441047668457, 10.292410850524902, 12.550411224365234, 14.808411598205566, 17.0664119720459, 19.324413299560547, 21.582412719726562, 23.840412139892578, 26.098413467407227, 28.356414794921875, 30.61441421508789, 32.872413635253906, 35.13041687011719, 37.3884162902832, 39.64640808105469, 41.9044075012207, 44.16240692138672, 46.42041015625, 48.678409576416016, 50.93640899658203, 53.19441223144531, 55.45241165161133, 57.710411071777344, 59.96841049194336, 62.226409912109375, 64.48441314697266, 66.74241638183594, 69.00041198730469, 71.25841522216797, 73.51641082763672, 75.7744140625, 78.03241729736328, 80.29041290283203, 82.54841613769531, 84.80641174316406, 87.06441497802734, 89.32241821289062, 91.58041381835938, 93.83841705322266, 96.09642028808594, 98.35441589355469, 100.61241912841797, 102.87042236328125, 105.12841796875, 107.38642120361328, 109.64441680908203, 111.90242004394531]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 6.0, 15.0, 41.0, 89.0, 128.0, 204.0, 175.0, 143.0, 95.0, 57.0, 16.0, 15.0, 8.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-142.48895263671875, -138.94940185546875, -135.40985107421875, -131.87030029296875, -128.33074951171875, -124.79119873046875, -121.25164794921875, -117.71209716796875, -114.17254638671875, -110.63299560546875, -107.09344482421875, -103.55389404296875, -100.01434326171875, -96.47479248046875, -92.93524169921875, -89.39569091796875, -85.85614776611328, -82.31659698486328, -78.77704620361328, -75.23749542236328, -71.69794464111328, -68.15839385986328, -64.61885070800781, -61.07929611206055, -57.53974533081055, -54.00019454956055, -50.46064376831055, -46.92109680175781, -43.38154602050781, -39.84199523925781, -36.30244445800781, -32.76289367675781, -29.223342895507812, -25.683792114257812, -22.144241333007812, -18.604692459106445, -15.065141677856445, -11.525590896606445, -7.986042022705078, -4.446491241455078, -0.9069404602050781, 2.6326098442077637, 6.1721601486206055, 9.711709976196289, 13.251260757446289, 16.79081153869629, 20.330360412597656, 23.869911193847656, 27.409461975097656, 30.949012756347656, 34.488563537597656, 38.028114318847656, 41.567665100097656, 45.107215881347656, 48.64676284790039, 52.18631362915039, 55.72586441040039, 59.26541519165039, 62.80496597290039, 66.34451293945312, 69.88406372070312, 73.42361450195312, 76.96316528320312, 80.50271606445312, 84.04226684570312]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 5.0, 5.0, 2.0, 7.0, 5.0, 6.0, 7.0, 9.0, 12.0, 8.0, 6.0, 18.0, 19.0, 14.0, 9.0, 18.0, 15.0, 17.0, 17.0, 7.0, 6.0, 6.0, 13.0, 21.0, 27.0, 38.0, 63.0, 76.0, 122.0, 198.0, 299.0, 411.0, 615.0, 976.0, 1463.0, 2143.0, 3053.0, 4361.0, 7366.0, 19397.0, 4128318.0, 9138.0, 5087.0, 3560.0, 2228.0, 1450.0, 1120.0, 775.0, 534.0, 378.0, 278.0, 192.0, 105.0, 85.0, 60.0, 51.0, 33.0, 17.0, 10.0, 10.0, 6.0], "bins": [-1.1142578125, -1.0884170532226562, -1.0625762939453125, -1.0367355346679688, -1.010894775390625, -0.9850540161132812, -0.9592132568359375, -0.9333724975585938, -0.90753173828125, -0.8816909790039062, -0.8558502197265625, -0.8300094604492188, -0.804168701171875, -0.7783279418945312, -0.7524871826171875, -0.7266464233398438, -0.7008056640625, -0.6749649047851562, -0.6491241455078125, -0.6232833862304688, -0.597442626953125, -0.5716018676757812, -0.5457611083984375, -0.5199203491210938, -0.49407958984375, -0.46823883056640625, -0.4423980712890625, -0.41655731201171875, -0.390716552734375, -0.36487579345703125, -0.3390350341796875, -0.31319427490234375, -0.287353515625, -0.26151275634765625, -0.2356719970703125, -0.20983123779296875, -0.183990478515625, -0.15814971923828125, -0.1323089599609375, -0.10646820068359375, -0.08062744140625, -0.05478668212890625, -0.0289459228515625, -0.00310516357421875, 0.022735595703125, 0.04857635498046875, 0.0744171142578125, 0.10025787353515625, 0.1260986328125, 0.15193939208984375, 0.1777801513671875, 0.20362091064453125, 0.229461669921875, 0.25530242919921875, 0.2811431884765625, 0.30698394775390625, 0.33282470703125, 0.35866546630859375, 0.3845062255859375, 0.41034698486328125, 0.436187744140625, 0.46202850341796875, 0.4878692626953125, 0.5137100219726562, 0.53955078125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 9.0, 5.0, 10.0, 7.0, 14.0, 12.0, 24.0, 280.0, 548.0, 21.0, 15.0, 10.0, 11.0, 11.0, 5.0, 5.0, 3.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07183837890625, -0.07016754150390625, -0.0684967041015625, -0.06682586669921875, -0.065155029296875, -0.06348419189453125, -0.0618133544921875, -0.06014251708984375, -0.0584716796875, -0.05680084228515625, -0.0551300048828125, -0.05345916748046875, -0.051788330078125, -0.05011749267578125, -0.0484466552734375, -0.04677581787109375, -0.04510498046875, -0.04343414306640625, -0.0417633056640625, -0.04009246826171875, -0.038421630859375, -0.03675079345703125, -0.0350799560546875, -0.03340911865234375, -0.03173828125, -0.03006744384765625, -0.0283966064453125, -0.02672576904296875, -0.025054931640625, -0.02338409423828125, -0.0217132568359375, -0.02004241943359375, -0.01837158203125, -0.01670074462890625, -0.0150299072265625, -0.01335906982421875, -0.011688232421875, -0.01001739501953125, -0.0083465576171875, -0.00667572021484375, -0.0050048828125, -0.00333404541015625, -0.0016632080078125, 7.62939453125e-06, 0.001678466796875, 0.00334930419921875, 0.0050201416015625, 0.00669097900390625, 0.00836181640625, 0.01003265380859375, 0.0117034912109375, 0.01337432861328125, 0.015045166015625, 0.01671600341796875, 0.0183868408203125, 0.02005767822265625, 0.021728515625, 0.02339935302734375, 0.0250701904296875, 0.02674102783203125, 0.028411865234375, 0.03008270263671875, 0.0317535400390625, 0.03342437744140625, 0.03509521484375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 8.0, 10.0, 13.0, 14.0, 24.0, 38.0, 43.0, 61.0, 83.0, 108.0, 157.0, 199.0, 266.0, 410.0, 539.0, 783.0, 1189.0, 1617.0, 2263.0, 3379.0, 5071.0, 8398.0, 14991.0, 40091.0, 4006589.0, 58468.0, 19406.0, 9832.0, 6229.0, 4309.0, 2708.0, 1929.0, 1351.0, 1003.0, 753.0, 574.0, 374.0, 265.0, 230.0, 155.0, 111.0, 71.0, 47.0, 40.0, 22.0, 22.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1427001953125, -0.1383228302001953, -0.13394546508789062, -0.12956809997558594, -0.12519073486328125, -0.12081336975097656, -0.11643600463867188, -0.11205863952636719, -0.1076812744140625, -0.10330390930175781, -0.09892654418945312, -0.09454917907714844, -0.09017181396484375, -0.08579444885253906, -0.08141708374023438, -0.07703971862792969, -0.072662353515625, -0.06828498840332031, -0.06390762329101562, -0.05953025817871094, -0.05515289306640625, -0.05077552795410156, -0.046398162841796875, -0.04202079772949219, -0.0376434326171875, -0.03326606750488281, -0.028888702392578125, -0.024511337280273438, -0.02013397216796875, -0.015756607055664062, -0.011379241943359375, -0.0070018768310546875, -0.00262451171875, 0.0017528533935546875, 0.006130218505859375, 0.010507583618164062, 0.01488494873046875, 0.019262313842773438, 0.023639678955078125, 0.028017044067382812, 0.0323944091796875, 0.03677177429199219, 0.041149139404296875, 0.04552650451660156, 0.04990386962890625, 0.05428123474121094, 0.058658599853515625, 0.06303596496582031, 0.067413330078125, 0.07179069519042969, 0.07616806030273438, 0.08054542541503906, 0.08492279052734375, 0.08930015563964844, 0.09367752075195312, 0.09805488586425781, 0.1024322509765625, 0.10680961608886719, 0.11118698120117188, 0.11556434631347656, 0.11994171142578125, 0.12431907653808594, 0.12869644165039062, 0.1330738067626953, 0.137451171875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 5.0, 4.0, 5.0, 6.0, 6.0, 7.0, 12.0, 11.0, 14.0, 9.0, 12.0, 23.0, 82.0, 3659.0, 36.0, 14.0, 12.0, 14.0, 9.0, 7.0, 5.0, 18.0, 2.0, 14.0, 11.0, 9.0, 4.0, 4.0, 9.0, 2.0, 7.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038330078125, -0.036751747131347656, -0.03517341613769531, -0.03359508514404297, -0.032016754150390625, -0.03043842315673828, -0.028860092163085938, -0.027281761169433594, -0.02570343017578125, -0.024125099182128906, -0.022546768188476562, -0.02096843719482422, -0.019390106201171875, -0.01781177520751953, -0.016233444213867188, -0.014655113220214844, -0.0130767822265625, -0.011498451232910156, -0.009920120239257812, -0.008341789245605469, -0.006763458251953125, -0.005185127258300781, -0.0036067962646484375, -0.0020284652709960938, -0.00045013427734375, 0.0011281967163085938, 0.0027065277099609375, 0.004284858703613281, 0.005863189697265625, 0.007441520690917969, 0.009019851684570312, 0.010598182678222656, 0.012176513671875, 0.013754844665527344, 0.015333175659179688, 0.01691150665283203, 0.018489837646484375, 0.02006816864013672, 0.021646499633789062, 0.023224830627441406, 0.02480316162109375, 0.026381492614746094, 0.027959823608398438, 0.02953815460205078, 0.031116485595703125, 0.03269481658935547, 0.03427314758300781, 0.035851478576660156, 0.0374298095703125, 0.039008140563964844, 0.04058647155761719, 0.04216480255126953, 0.043743133544921875, 0.04532146453857422, 0.04689979553222656, 0.048478126525878906, 0.05005645751953125, 0.051634788513183594, 0.05321311950683594, 0.05479145050048828, 0.056369781494140625, 0.05794811248779297, 0.05952644348144531, 0.061104774475097656, 0.06268310546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 102.0, 807.0, 56.0, 23.0, 11.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42133864760398865, -0.3698539137840271, -0.31836917996406555, -0.266884446144104, -0.21539971232414246, -0.1639149785041809, -0.11243024468421936, -0.06094551086425781, -0.009460777044296265, 0.04202395677566528, 0.09350869059562683, 0.14499342441558838, 0.19647815823554993, 0.24796289205551147, 0.299447625875473, 0.35093235969543457, 0.4024170935153961, 0.45390182733535767, 0.5053865909576416, 0.5568712949752808, 0.6083559989929199, 0.6598407626152039, 0.7113255262374878, 0.762810230255127, 0.8142949342727661, 0.8657796382904053, 0.9172644019126892, 0.9687491655349731, 1.0202338695526123, 1.0717185735702515, 1.1232032775878906, 1.1746881008148193, 1.226172924041748, 1.2776576280593872, 1.3291423320770264, 1.380627155303955, 1.4321118593215942, 1.4835965633392334, 1.535081386566162, 1.5865660905838013, 1.6380507946014404, 1.6895354986190796, 1.7410202026367188, 1.7925050258636475, 1.8439897298812866, 1.8954744338989258, 1.9469592571258545, 1.9984439611434937, 2.049928665161133, 2.1014134883880615, 2.152898073196411, 2.20438289642334, 2.2558674812316895, 2.307352304458618, 2.358837127685547, 2.4103217124938965, 2.461806535720825, 2.513291358947754, 2.5647759437561035, 2.6162607669830322, 2.667745590209961, 2.7192301750183105, 2.7707149982452393, 2.822199583053589, 2.8736844062805176]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 8.0, 8.0, 20.0, 28.0, 47.0, 94.0, 102.0, 129.0, 159.0, 131.0, 106.0, 69.0, 43.0, 19.0, 16.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6487737894058228, -0.6323053240776062, -0.6158367991447449, -0.5993683338165283, -0.582899808883667, -0.5664313435554504, -0.5499628782272339, -0.5334943532943726, -0.517025887966156, -0.5005574226379395, -0.4840888977050781, -0.4676204323768616, -0.45115193724632263, -0.4346834421157837, -0.41821497678756714, -0.4017464816570282, -0.38527798652648926, -0.3688094913959503, -0.3523409962654114, -0.3358725309371948, -0.3194040358066559, -0.30293554067611694, -0.2864670753479004, -0.26999858021736145, -0.2535300850868225, -0.23706158995628357, -0.22059310972690582, -0.20412462949752808, -0.18765613436698914, -0.1711876392364502, -0.15471915900707245, -0.1382506787776947, -0.12178218364715576, -0.10531369596719742, -0.08884520828723907, -0.07237672060728073, -0.05590823292732239, -0.039439745247364044, -0.0229712575674057, -0.006502769887447357, 0.009965717792510986, 0.02643420547246933, 0.04290269315242767, 0.05937118083238602, 0.07583966851234436, 0.0923081561923027, 0.10877664387226105, 0.1252451241016388, 0.14171361923217773, 0.15818211436271667, 0.17465059459209442, 0.19111907482147217, 0.2075875699520111, 0.22405606508255005, 0.2405245453119278, 0.25699302554130554, 0.2734615206718445, 0.2899300158023834, 0.30639851093292236, 0.3228669762611389, 0.33933547139167786, 0.3558039665222168, 0.37227243185043335, 0.3887409269809723, 0.40520942211151123]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 7.0, 11.0, 11.0, 10.0, 11.0, 10.0, 24.0, 25.0, 33.0, 67.0, 100.0, 190.0, 329.0, 707.0, 1530.0, 3652.0, 10069.0, 36651.0, 953156.0, 27813.0, 8397.0, 3021.0, 1349.0, 598.0, 291.0, 167.0, 112.0, 57.0, 45.0, 25.0, 14.0, 21.0, 15.0, 9.0, 10.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.50634765625, -0.4928131103515625, -0.479278564453125, -0.4657440185546875, -0.45220947265625, -0.4386749267578125, -0.425140380859375, -0.4116058349609375, -0.3980712890625, -0.3845367431640625, -0.371002197265625, -0.3574676513671875, -0.34393310546875, -0.3303985595703125, -0.316864013671875, -0.3033294677734375, -0.289794921875, -0.2762603759765625, -0.262725830078125, -0.2491912841796875, -0.23565673828125, -0.2221221923828125, -0.208587646484375, -0.1950531005859375, -0.1815185546875, -0.1679840087890625, -0.154449462890625, -0.1409149169921875, -0.12738037109375, -0.1138458251953125, -0.100311279296875, -0.0867767333984375, -0.0732421875, -0.0597076416015625, -0.046173095703125, -0.0326385498046875, -0.01910400390625, -0.0055694580078125, 0.007965087890625, 0.0214996337890625, 0.0350341796875, 0.0485687255859375, 0.062103271484375, 0.0756378173828125, 0.08917236328125, 0.1027069091796875, 0.116241455078125, 0.1297760009765625, 0.143310546875, 0.1568450927734375, 0.170379638671875, 0.1839141845703125, 0.19744873046875, 0.2109832763671875, 0.224517822265625, 0.2380523681640625, 0.2515869140625, 0.2651214599609375, 0.278656005859375, 0.2921905517578125, 0.30572509765625, 0.3192596435546875, 0.332794189453125, 0.3463287353515625, 0.35986328125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 8.0, 8.0, 13.0, 13.0, 28.0, 690.0, 132.0, 24.0, 13.0, 13.0, 11.0, 9.0, 5.0, 4.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07122802734375, -0.06956815719604492, -0.06790828704833984, -0.06624841690063477, -0.06458854675292969, -0.06292867660522461, -0.06126880645751953, -0.05960893630981445, -0.057949066162109375, -0.0562891960144043, -0.05462932586669922, -0.05296945571899414, -0.05130958557128906, -0.049649715423583984, -0.047989845275878906, -0.04632997512817383, -0.04467010498046875, -0.04301023483276367, -0.041350364685058594, -0.039690494537353516, -0.03803062438964844, -0.03637075424194336, -0.03471088409423828, -0.0330510139465332, -0.031391143798828125, -0.029731273651123047, -0.02807140350341797, -0.02641153335571289, -0.024751663208007812, -0.023091793060302734, -0.021431922912597656, -0.019772052764892578, -0.0181121826171875, -0.016452312469482422, -0.014792442321777344, -0.013132572174072266, -0.011472702026367188, -0.00981283187866211, -0.008152961730957031, -0.006493091583251953, -0.004833221435546875, -0.003173351287841797, -0.0015134811401367188, 0.00014638900756835938, 0.0018062591552734375, 0.0034661293029785156, 0.005125999450683594, 0.006785869598388672, 0.00844573974609375, 0.010105609893798828, 0.011765480041503906, 0.013425350189208984, 0.015085220336914062, 0.01674509048461914, 0.01840496063232422, 0.020064830780029297, 0.021724700927734375, 0.023384571075439453, 0.02504444122314453, 0.02670431137084961, 0.028364181518554688, 0.030024051666259766, 0.031683921813964844, 0.03334379196166992, 0.035003662109375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 0.0, 7.0, 7.0, 3.0, 10.0, 13.0, 19.0, 39.0, 40.0, 70.0, 86.0, 123.0, 157.0, 300.0, 436.0, 631.0, 980.0, 1599.0, 2707.0, 4341.0, 7200.0, 12613.0, 23867.0, 52977.0, 193349.0, 574393.0, 94603.0, 35700.0, 17396.0, 9619.0, 5821.0, 3481.0, 2224.0, 1382.0, 828.0, 525.0, 351.0, 223.0, 166.0, 85.0, 54.0, 48.0, 32.0, 14.0, 14.0, 17.0, 3.0, 0.0, 8.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0811767578125, -0.07830524444580078, -0.07543373107910156, -0.07256221771240234, -0.06969070434570312, -0.0668191909790039, -0.06394767761230469, -0.06107616424560547, -0.05820465087890625, -0.05533313751220703, -0.05246162414550781, -0.049590110778808594, -0.046718597412109375, -0.043847084045410156, -0.04097557067871094, -0.03810405731201172, -0.0352325439453125, -0.03236103057861328, -0.029489517211914062, -0.026618003845214844, -0.023746490478515625, -0.020874977111816406, -0.018003463745117188, -0.015131950378417969, -0.01226043701171875, -0.009388923645019531, -0.0065174102783203125, -0.0036458969116210938, -0.000774383544921875, 0.0020971298217773438, 0.0049686431884765625, 0.007840156555175781, 0.010711669921875, 0.013583183288574219, 0.016454696655273438, 0.019326210021972656, 0.022197723388671875, 0.025069236755371094, 0.027940750122070312, 0.03081226348876953, 0.03368377685546875, 0.03655529022216797, 0.03942680358886719, 0.042298316955566406, 0.045169830322265625, 0.048041343688964844, 0.05091285705566406, 0.05378437042236328, 0.0566558837890625, 0.05952739715576172, 0.06239891052246094, 0.06527042388916016, 0.06814193725585938, 0.0710134506225586, 0.07388496398925781, 0.07675647735595703, 0.07962799072265625, 0.08249950408935547, 0.08537101745605469, 0.0882425308227539, 0.09111404418945312, 0.09398555755615234, 0.09685707092285156, 0.09972858428955078, 0.10260009765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 7.0, 12.0, 5.0, 13.0, 15.0, 14.0, 17.0, 23.0, 31.0, 24.0, 32.0, 31.0, 39.0, 45.0, 50.0, 52.0, 50.0, 49.0, 54.0, 52.0, 46.0, 43.0, 44.0, 39.0, 34.0, 31.0, 21.0, 14.0, 18.0, 18.0, 15.0, 11.0, 10.0, 12.0, 8.0, 12.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.11492919921875, -0.11171340942382812, -0.10849761962890625, -0.10528182983398438, -0.1020660400390625, -0.09885025024414062, -0.09563446044921875, -0.09241867065429688, -0.089202880859375, -0.08598709106445312, -0.08277130126953125, -0.07955551147460938, -0.0763397216796875, -0.07312393188476562, -0.06990814208984375, -0.06669235229492188, -0.0634765625, -0.060260772705078125, -0.05704498291015625, -0.053829193115234375, -0.0506134033203125, -0.047397613525390625, -0.04418182373046875, -0.040966033935546875, -0.037750244140625, -0.034534454345703125, -0.03131866455078125, -0.028102874755859375, -0.0248870849609375, -0.021671295166015625, -0.01845550537109375, -0.015239715576171875, -0.01202392578125, -0.008808135986328125, -0.00559234619140625, -0.002376556396484375, 0.0008392333984375, 0.004055023193359375, 0.00727081298828125, 0.010486602783203125, 0.013702392578125, 0.016918182373046875, 0.02013397216796875, 0.023349761962890625, 0.0265655517578125, 0.029781341552734375, 0.03299713134765625, 0.036212921142578125, 0.0394287109375, 0.042644500732421875, 0.04586029052734375, 0.049076080322265625, 0.0522918701171875, 0.055507659912109375, 0.05872344970703125, 0.061939239501953125, 0.065155029296875, 0.06837081909179688, 0.07158660888671875, 0.07480239868164062, 0.0780181884765625, 0.08123397827148438, 0.08444976806640625, 0.08766555786132812, 0.09088134765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 1.0, 7.0, 5.0, 15.0, 25.0, 30.0, 86.0, 223.0, 533.0, 3417.0, 315995.0, 723306.0, 3944.0, 584.0, 194.0, 84.0, 45.0, 20.0, 12.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.003032684326171875, -0.0029653310775756836, -0.002897977828979492, -0.0028306245803833008, -0.0027632713317871094, -0.002695918083190918, -0.0026285648345947266, -0.002561211585998535, -0.0024938583374023438, -0.0024265050888061523, -0.002359151840209961, -0.0022917985916137695, -0.002224445343017578, -0.0021570920944213867, -0.0020897388458251953, -0.002022385597229004, -0.0019550323486328125, -0.001887679100036621, -0.0018203258514404297, -0.0017529726028442383, -0.0016856193542480469, -0.0016182661056518555, -0.001550912857055664, -0.0014835596084594727, -0.0014162063598632812, -0.0013488531112670898, -0.0012814998626708984, -0.001214146614074707, -0.0011467933654785156, -0.0010794401168823242, -0.0010120868682861328, -0.0009447336196899414, -0.00087738037109375, -0.0008100271224975586, -0.0007426738739013672, -0.0006753206253051758, -0.0006079673767089844, -0.000540614128112793, -0.00047326087951660156, -0.00040590763092041016, -0.00033855438232421875, -0.00027120113372802734, -0.00020384788513183594, -0.00013649463653564453, -6.914138793945312e-05, -1.7881393432617188e-06, 6.556510925292969e-05, 0.0001329183578491211, 0.0002002716064453125, 0.0002676248550415039, 0.0003349781036376953, 0.0004023313522338867, 0.0004696846008300781, 0.0005370378494262695, 0.0006043910980224609, 0.0006717443466186523, 0.0007390975952148438, 0.0008064508438110352, 0.0008738040924072266, 0.000941157341003418, 0.0010085105895996094, 0.0010758638381958008, 0.0011432170867919922, 0.0012105703353881836, 0.001277923583984375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 11.0, 16.0, 20.0, 33.0, 57.0, 91.0, 110.0, 123.0, 126.0, 124.0, 84.0, 70.0, 52.0, 26.0, 14.0, 10.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.947185516357422e-06, -4.702247679233551e-06, -4.45730984210968e-06, -4.212372004985809e-06, -3.9674341678619385e-06, -3.7224963307380676e-06, -3.4775584936141968e-06, -3.232620656490326e-06, -2.987682819366455e-06, -2.7427449822425842e-06, -2.4978071451187134e-06, -2.2528693079948425e-06, -2.0079314708709717e-06, -1.7629936337471008e-06, -1.51805579662323e-06, -1.2731179594993591e-06, -1.0281801223754883e-06, -7.832422852516174e-07, -5.383044481277466e-07, -2.9336661100387573e-07, -4.842877388000488e-08, 1.9650906324386597e-07, 4.414469003677368e-07, 6.863847374916077e-07, 9.313225746154785e-07, 1.1762604117393494e-06, 1.4211982488632202e-06, 1.666136085987091e-06, 1.911073923110962e-06, 2.1560117602348328e-06, 2.4009495973587036e-06, 2.6458874344825745e-06, 2.8908252716064453e-06, 3.135763108730316e-06, 3.380700945854187e-06, 3.625638782978058e-06, 3.870576620101929e-06, 4.1155144572257996e-06, 4.36045229434967e-06, 4.605390131473541e-06, 4.850327968597412e-06, 5.095265805721283e-06, 5.340203642845154e-06, 5.585141479969025e-06, 5.8300793170928955e-06, 6.075017154216766e-06, 6.319954991340637e-06, 6.564892828464508e-06, 6.809830665588379e-06, 7.05476850271225e-06, 7.299706339836121e-06, 7.5446441769599915e-06, 7.789582014083862e-06, 8.034519851207733e-06, 8.279457688331604e-06, 8.524395525455475e-06, 8.769333362579346e-06, 9.014271199703217e-06, 9.259209036827087e-06, 9.504146873950958e-06, 9.749084711074829e-06, 9.9940225481987e-06, 1.023896038532257e-05, 1.0483898222446442e-05, 1.0728836059570312e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 8.0, 7.0, 11.0, 20.0, 20.0, 38.0, 49.0, 66.0, 82.0, 156.0, 229.0, 384.0, 666.0, 1227.0, 2264.0, 4851.0, 12491.0, 45787.0, 763153.0, 175818.0, 25255.0, 8352.0, 3498.0, 1767.0, 949.0, 527.0, 289.0, 205.0, 109.0, 82.0, 46.0, 32.0, 30.0, 19.0, 19.0, 11.0, 6.0, 6.0, 4.0, 7.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003559589385986328, -0.0003426782786846161, -0.00032939761877059937, -0.00031611695885658264, -0.0003028362989425659, -0.0002895556390285492, -0.00027627497911453247, -0.00026299431920051575, -0.000249713659286499, -0.0002364329993724823, -0.00022315233945846558, -0.00020987167954444885, -0.00019659101963043213, -0.0001833103597164154, -0.00017002969980239868, -0.00015674903988838196, -0.00014346837997436523, -0.0001301877200603485, -0.00011690706014633179, -0.00010362640023231506, -9.034574031829834e-05, -7.706508040428162e-05, -6.378442049026489e-05, -5.050376057624817e-05, -3.7223100662231445e-05, -2.394244074821472e-05, -1.0661780834197998e-05, 2.6188790798187256e-06, 1.589953899383545e-05, 2.9180198907852173e-05, 4.2460858821868896e-05, 5.574151873588562e-05, 6.902217864990234e-05, 8.230283856391907e-05, 9.558349847793579e-05, 0.00010886415839195251, 0.00012214481830596924, 0.00013542547821998596, 0.00014870613813400269, 0.0001619867980480194, 0.00017526745796203613, 0.00018854811787605286, 0.00020182877779006958, 0.0002151094377040863, 0.00022839009761810303, 0.00024167075753211975, 0.0002549514174461365, 0.0002682320773601532, 0.0002815127372741699, 0.00029479339718818665, 0.00030807405710220337, 0.0003213547170162201, 0.0003346353769302368, 0.00034791603684425354, 0.00036119669675827026, 0.000374477356672287, 0.0003877580165863037, 0.00040103867650032043, 0.00041431933641433716, 0.0004275999963283539, 0.0004408806562423706, 0.00045416131615638733, 0.00046744197607040405, 0.0004807226359844208, 0.0004940032958984375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 5.0, 6.0, 3.0, 6.0, 15.0, 18.0, 23.0, 28.0, 32.0, 75.0, 102.0, 126.0, 139.0, 128.0, 100.0, 62.0, 35.0, 27.0, 22.0, 12.0, 9.0, 9.0, 6.0, 4.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005497932434082031, -0.0005358085036277771, -0.0005218237638473511, -0.000507839024066925, -0.000493854284286499, -0.000479869544506073, -0.00046588480472564697, -0.00045190006494522095, -0.0004379153251647949, -0.0004239305853843689, -0.00040994584560394287, -0.00039596110582351685, -0.0003819763660430908, -0.0003679916262626648, -0.00035400688648223877, -0.00034002214670181274, -0.0003260374069213867, -0.0003120526671409607, -0.00029806792736053467, -0.00028408318758010864, -0.0002700984477996826, -0.0002561137080192566, -0.00024212896823883057, -0.00022814422845840454, -0.00021415948867797852, -0.0002001747488975525, -0.00018619000911712646, -0.00017220526933670044, -0.00015822052955627441, -0.0001442357897758484, -0.00013025104999542236, -0.00011626631021499634, -0.00010228157043457031, -8.829683065414429e-05, -7.431209087371826e-05, -6.0327351093292236e-05, -4.634261131286621e-05, -3.2357871532440186e-05, -1.837313175201416e-05, -4.388391971588135e-06, 9.59634780883789e-06, 2.3581087589263916e-05, 3.756582736968994e-05, 5.155056715011597e-05, 6.553530693054199e-05, 7.952004671096802e-05, 9.350478649139404e-05, 0.00010748952627182007, 0.0001214742660522461, 0.00013545900583267212, 0.00014944374561309814, 0.00016342848539352417, 0.0001774132251739502, 0.00019139796495437622, 0.00020538270473480225, 0.00021936744451522827, 0.0002333521842956543, 0.0002473369240760803, 0.00026132166385650635, 0.0002753064036369324, 0.0002892911434173584, 0.0003032758831977844, 0.00031726062297821045, 0.0003312453627586365, 0.0003452301025390625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 10.0, 18.0, 67.0, 210.0, 468.0, 129.0, 43.0, 24.0, 13.0, 10.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1336874961853027, -2.0842418670654297, -2.0347962379455566, -1.9853506088256836, -1.935904860496521, -1.886459231376648, -1.837013602256775, -1.7875679731369019, -1.7381223440170288, -1.6886767148971558, -1.6392310857772827, -1.5897853374481201, -1.540339708328247, -1.490894079208374, -1.441448450088501, -1.392002820968628, -1.3425571918487549, -1.2931115627288818, -1.2436659336090088, -1.1942203044891357, -1.1447745561599731, -1.0953289270401, -1.045883297920227, -0.996437668800354, -0.9469919204711914, -0.8975462913513184, -0.8481006026268005, -0.7986549735069275, -0.7492093443870544, -0.6997636556625366, -0.6503180265426636, -0.6008723974227905, -0.5514267683029175, -0.5019811391830444, -0.452535480260849, -0.40308982133865356, -0.3536441922187805, -0.3041985332965851, -0.25475287437438965, -0.2053072452545166, -0.15586158633232117, -0.10641594231128693, -0.05697029083967209, -0.007524639368057251, 0.04192100465297699, 0.09136664867401123, 0.14081230759620667, 0.1902579367160797, 0.23970359563827515, 0.2891492545604706, 0.33859488368034363, 0.38804054260253906, 0.4374861717224121, 0.48693183064460754, 0.536377489566803, 0.585823118686676, 0.6352688074111938, 0.6847144365310669, 0.7341601252555847, 0.7836057543754578, 0.8330513834953308, 0.8824970722198486, 0.9319427013397217, 0.9813883304595947, 1.0308339595794678]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 3.0, 5.0, 2.0, 3.0, 8.0, 9.0, 8.0, 13.0, 21.0, 32.0, 46.0, 59.0, 91.0, 120.0, 146.0, 130.0, 103.0, 64.0, 35.0, 28.0, 10.0, 13.0, 8.0, 7.0, 9.0, 3.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.375314712524414, -1.323342204093933, -1.2713695764541626, -1.2193970680236816, -1.1674244403839111, -1.1154519319534302, -1.0634794235229492, -1.0115067958831787, -0.9595342874526978, -0.907561719417572, -0.8555891513824463, -0.8036166429519653, -0.7516440749168396, -0.6996715068817139, -0.6476989388465881, -0.5957263708114624, -0.5437538027763367, -0.49178123474121094, -0.4398086965084076, -0.38783612847328186, -0.3358635902404785, -0.2838910222053528, -0.23191845417022705, -0.1799459159374237, -0.12797334790229797, -0.07600079476833344, -0.0240282341837883, 0.027944326400756836, 0.07991687953472137, 0.1318894326686859, 0.18386200070381165, 0.235834538936615, 0.2878071069717407, 0.33977967500686646, 0.3917522132396698, 0.44372478127479553, 0.4956973195075989, 0.5476698875427246, 0.5996424555778503, 0.6516150236129761, 0.703587532043457, 0.7555601000785828, 0.8075326681137085, 0.8595051765441895, 0.9114777445793152, 0.9634503126144409, 1.0154228210449219, 1.0673954486846924, 1.119368076324463, 1.1713405847549438, 1.2233132123947144, 1.2752857208251953, 1.3272583484649658, 1.3792308568954468, 1.4312033653259277, 1.4831759929656982, 1.5351485013961792, 1.5871210098266602, 1.6390936374664307, 1.6910661458969116, 1.7430387735366821, 1.795011281967163, 1.8469839096069336, 1.8989564180374146, 1.9509289264678955]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 13.0, 11.0, 17.0, 44.0, 49.0, 84.0, 128.0, 255.0, 781.0, 5220.0, 4152388.0, 31020.0, 3238.0, 671.0, 199.0, 78.0, 28.0, 15.0, 16.0, 13.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.64453125, -7.46612548828125, -7.2877197265625, -7.10931396484375, -6.930908203125, -6.75250244140625, -6.5740966796875, -6.39569091796875, -6.21728515625, -6.03887939453125, -5.8604736328125, -5.68206787109375, -5.503662109375, -5.32525634765625, -5.1468505859375, -4.96844482421875, -4.7900390625, -4.61163330078125, -4.4332275390625, -4.25482177734375, -4.076416015625, -3.89801025390625, -3.7196044921875, -3.54119873046875, -3.36279296875, -3.18438720703125, -3.0059814453125, -2.82757568359375, -2.649169921875, -2.47076416015625, -2.2923583984375, -2.11395263671875, -1.935546875, -1.75714111328125, -1.5787353515625, -1.40032958984375, -1.221923828125, -1.04351806640625, -0.8651123046875, -0.68670654296875, -0.50830078125, -0.32989501953125, -0.1514892578125, 0.02691650390625, 0.205322265625, 0.38372802734375, 0.5621337890625, 0.74053955078125, 0.9189453125, 1.09735107421875, 1.2757568359375, 1.45416259765625, 1.632568359375, 1.81097412109375, 1.9893798828125, 2.16778564453125, 2.34619140625, 2.52459716796875, 2.7030029296875, 2.88140869140625, 3.059814453125, 3.23822021484375, 3.4166259765625, 3.59503173828125, 3.7734375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 8.0, 6.0, 9.0, 12.0, 16.0, 12.0, 29.0, 794.0, 31.0, 22.0, 15.0, 10.0, 13.0, 7.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06951904296875, -0.06789207458496094, -0.06626510620117188, -0.06463813781738281, -0.06301116943359375, -0.06138420104980469, -0.059757232666015625, -0.05813026428222656, -0.0565032958984375, -0.05487632751464844, -0.053249359130859375, -0.05162239074707031, -0.04999542236328125, -0.04836845397949219, -0.046741485595703125, -0.04511451721191406, -0.043487548828125, -0.04186058044433594, -0.040233612060546875, -0.03860664367675781, -0.03697967529296875, -0.03535270690917969, -0.033725738525390625, -0.03209877014160156, -0.0304718017578125, -0.028844833374023438, -0.027217864990234375, -0.025590896606445312, -0.02396392822265625, -0.022336959838867188, -0.020709991455078125, -0.019083023071289062, -0.0174560546875, -0.015829086303710938, -0.014202117919921875, -0.012575149536132812, -0.01094818115234375, -0.009321212768554688, -0.007694244384765625, -0.0060672760009765625, -0.0044403076171875, -0.0028133392333984375, -0.001186370849609375, 0.0004405975341796875, 0.00206756591796875, 0.0036945343017578125, 0.005321502685546875, 0.0069484710693359375, 0.008575439453125, 0.010202407836914062, 0.011829376220703125, 0.013456344604492188, 0.01508331298828125, 0.016710281372070312, 0.018337249755859375, 0.019964218139648438, 0.0215911865234375, 0.023218154907226562, 0.024845123291015625, 0.026472091674804688, 0.02809906005859375, 0.029726028442382812, 0.031352996826171875, 0.03297996520996094, 0.03460693359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 7.0, 12.0, 4.0, 7.0, 7.0, 21.0, 23.0, 38.0, 40.0, 72.0, 111.0, 166.0, 313.0, 499.0, 954.0, 1553.0, 2927.0, 5734.0, 12848.0, 33847.0, 155834.0, 3900736.0, 46938.0, 16502.0, 7087.0, 3419.0, 1901.0, 1100.0, 624.0, 329.0, 228.0, 122.0, 72.0, 56.0, 44.0, 21.0, 20.0, 15.0, 14.0, 16.0, 6.0, 2.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.316162109375, -0.3066215515136719, -0.29708099365234375, -0.2875404357910156, -0.2779998779296875, -0.2684593200683594, -0.25891876220703125, -0.24937820434570312, -0.239837646484375, -0.23029708862304688, -0.22075653076171875, -0.21121597290039062, -0.2016754150390625, -0.19213485717773438, -0.18259429931640625, -0.17305374145507812, -0.16351318359375, -0.15397262573242188, -0.14443206787109375, -0.13489151000976562, -0.1253509521484375, -0.11581039428710938, -0.10626983642578125, -0.09672927856445312, -0.087188720703125, -0.07764816284179688, -0.06810760498046875, -0.058567047119140625, -0.0490264892578125, -0.039485931396484375, -0.02994537353515625, -0.020404815673828125, -0.0108642578125, -0.001323699951171875, 0.00821685791015625, 0.017757415771484375, 0.0272979736328125, 0.036838531494140625, 0.04637908935546875, 0.055919647216796875, 0.065460205078125, 0.07500076293945312, 0.08454132080078125, 0.09408187866210938, 0.1036224365234375, 0.11316299438476562, 0.12270355224609375, 0.13224411010742188, 0.14178466796875, 0.15132522583007812, 0.16086578369140625, 0.17040634155273438, 0.1799468994140625, 0.18948745727539062, 0.19902801513671875, 0.20856857299804688, 0.218109130859375, 0.22764968872070312, 0.23719024658203125, 0.24673080444335938, 0.2562713623046875, 0.2658119201660156, 0.27535247802734375, 0.2848930358886719, 0.29443359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 9.0, 5.0, 3.0, 7.0, 4.0, 6.0, 7.0, 13.0, 10.0, 8.0, 12.0, 14.0, 29.0, 20.0, 21.0, 15.0, 25.0, 40.0, 3518.0, 60.0, 37.0, 29.0, 24.0, 15.0, 28.0, 17.0, 16.0, 16.0, 13.0, 9.0, 8.0, 7.0, 4.0, 6.0, 9.0, 1.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0396728515625, -0.03838634490966797, -0.03709983825683594, -0.035813331604003906, -0.034526824951171875, -0.033240318298339844, -0.03195381164550781, -0.03066730499267578, -0.02938079833984375, -0.02809429168701172, -0.026807785034179688, -0.025521278381347656, -0.024234771728515625, -0.022948265075683594, -0.021661758422851562, -0.02037525177001953, -0.0190887451171875, -0.01780223846435547, -0.016515731811523438, -0.015229225158691406, -0.013942718505859375, -0.012656211853027344, -0.011369705200195312, -0.010083198547363281, -0.00879669189453125, -0.007510185241699219, -0.0062236785888671875, -0.004937171936035156, -0.003650665283203125, -0.0023641586303710938, -0.0010776519775390625, 0.00020885467529296875, 0.001495361328125, 0.0027818679809570312, 0.0040683746337890625, 0.005354881286621094, 0.006641387939453125, 0.007927894592285156, 0.009214401245117188, 0.010500907897949219, 0.01178741455078125, 0.013073921203613281, 0.014360427856445312, 0.015646934509277344, 0.016933441162109375, 0.018219947814941406, 0.019506454467773438, 0.02079296112060547, 0.0220794677734375, 0.02336597442626953, 0.024652481079101562, 0.025938987731933594, 0.027225494384765625, 0.028512001037597656, 0.029798507690429688, 0.03108501434326172, 0.03237152099609375, 0.03365802764892578, 0.03494453430175781, 0.036231040954589844, 0.037517547607421875, 0.038804054260253906, 0.04009056091308594, 0.04137706756591797, 0.04266357421875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 17.0, 712.0, 251.0, 26.0, 6.0, 1.0, 1.0, 2.0], "bins": [-1.9284051656723022, -1.895041584968567, -1.8616780042648315, -1.8283144235610962, -1.7949507236480713, -1.761587142944336, -1.7282235622406006, -1.6948599815368652, -1.6614964008331299, -1.6281328201293945, -1.5947692394256592, -1.5614056587219238, -1.5280420780181885, -1.4946783781051636, -1.4613147974014282, -1.4279512166976929, -1.3945876359939575, -1.3612240552902222, -1.3278604745864868, -1.2944968938827515, -1.2611331939697266, -1.2277696132659912, -1.1944060325622559, -1.1610424518585205, -1.1276788711547852, -1.0943152904510498, -1.0609517097473145, -1.027588129043579, -0.994224488735199, -0.9608609080314636, -0.9274972677230835, -0.8941336870193481, -0.8607701659202576, -0.8274065852165222, -0.7940429449081421, -0.7606793642044067, -0.7273157835006714, -0.693952202796936, -0.6605886220932007, -0.6272249817848206, -0.5938614010810852, -0.5604978203773499, -0.5271341800689697, -0.4937705993652344, -0.460407018661499, -0.42704343795776367, -0.39367982745170593, -0.3603162169456482, -0.32695263624191284, -0.2935890555381775, -0.26022544503211975, -0.2268618494272232, -0.19349825382232666, -0.16013465821743011, -0.12677106261253357, -0.09340746700763702, -0.060043856501579285, -0.02668026089668274, 0.006683334708213806, 0.04004693031311035, 0.0734105259180069, 0.10677412152290344, 0.1401377171278, 0.17350131273269653, 0.20686490833759308]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 3.0, 5.0, 5.0, 10.0, 12.0, 22.0, 27.0, 32.0, 44.0, 83.0, 81.0, 88.0, 114.0, 99.0, 85.0, 78.0, 59.0, 51.0, 25.0, 19.0, 14.0, 6.0, 3.0, 5.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17440110445022583, -0.16763702034950256, -0.1608729511499405, -0.15410886704921722, -0.14734479784965515, -0.14058071374893188, -0.13381662964820862, -0.12705256044864655, -0.12028848379850388, -0.1135244071483612, -0.10676033049821854, -0.09999625384807587, -0.0932321697473526, -0.08646810054779053, -0.07970401644706726, -0.07293993979692459, -0.06617586314678192, -0.05941178649663925, -0.05264770984649658, -0.045883629471063614, -0.039119552820920944, -0.032355476170778275, -0.025591395795345306, -0.018827319145202637, -0.012063242495059967, -0.005299164913594723, 0.0014649126678705215, 0.00822899118065834, 0.01499306783080101, 0.02175714448094368, 0.028521224856376648, 0.03528530150651932, 0.04204937815666199, 0.04881345480680466, 0.05557753145694733, 0.062341611832380295, 0.06910568475723267, 0.07586976885795593, 0.0826338455080986, 0.08939792215824127, 0.09616199880838394, 0.10292607545852661, 0.10969015210866928, 0.11645422875881195, 0.12321831285953522, 0.1299823820590973, 0.13674646615982056, 0.14351055026054382, 0.1502746194601059, 0.15703870356082916, 0.16380277276039124, 0.1705668568611145, 0.17733092606067657, 0.18409501016139984, 0.19085907936096191, 0.19762316346168518, 0.20438724756240845, 0.2111513316631317, 0.2179154008626938, 0.22467948496341705, 0.23144355416297913, 0.2382076382637024, 0.24497172236442566, 0.2517358064651489, 0.2584998607635498]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 10.0, 5.0, 13.0, 15.0, 17.0, 36.0, 29.0, 49.0, 85.0, 119.0, 245.0, 388.0, 938.0, 2646.0, 8701.0, 47105.0, 961590.0, 18673.0, 4835.0, 1587.0, 635.0, 310.0, 175.0, 101.0, 80.0, 31.0, 28.0, 26.0, 16.0, 20.0, 10.0, 13.0, 7.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52392578125, -0.5094795227050781, -0.49503326416015625, -0.4805870056152344, -0.4661407470703125, -0.4516944885253906, -0.43724822998046875, -0.4228019714355469, -0.408355712890625, -0.3939094543457031, -0.37946319580078125, -0.3650169372558594, -0.3505706787109375, -0.3361244201660156, -0.32167816162109375, -0.3072319030761719, -0.29278564453125, -0.2783393859863281, -0.26389312744140625, -0.24944686889648438, -0.2350006103515625, -0.22055435180664062, -0.20610809326171875, -0.19166183471679688, -0.177215576171875, -0.16276931762695312, -0.14832305908203125, -0.13387680053710938, -0.1194305419921875, -0.10498428344726562, -0.09053802490234375, -0.07609176635742188, -0.0616455078125, -0.047199249267578125, -0.03275299072265625, -0.018306732177734375, -0.0038604736328125, 0.010585784912109375, 0.02503204345703125, 0.039478302001953125, 0.053924560546875, 0.06837081909179688, 0.08281707763671875, 0.09726333618164062, 0.1117095947265625, 0.12615585327148438, 0.14060211181640625, 0.15504837036132812, 0.16949462890625, 0.18394088745117188, 0.19838714599609375, 0.21283340454101562, 0.2272796630859375, 0.24172592163085938, 0.25617218017578125, 0.2706184387207031, 0.285064697265625, 0.2995109558105469, 0.31395721435546875, 0.3284034729003906, 0.3428497314453125, 0.3572959899902344, 0.37174224853515625, 0.3861885070800781, 0.400634765625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 3.0, 7.0, 7.0, 12.0, 17.0, 18.0, 35.0, 741.0, 85.0, 24.0, 11.0, 10.0, 8.0, 7.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06854248046875, -0.06693553924560547, -0.06532859802246094, -0.0637216567993164, -0.062114715576171875, -0.060507774353027344, -0.05890083312988281, -0.05729389190673828, -0.05568695068359375, -0.05408000946044922, -0.05247306823730469, -0.050866127014160156, -0.049259185791015625, -0.047652244567871094, -0.04604530334472656, -0.04443836212158203, -0.0428314208984375, -0.04122447967529297, -0.03961753845214844, -0.038010597229003906, -0.036403656005859375, -0.034796714782714844, -0.03318977355957031, -0.03158283233642578, -0.02997589111328125, -0.02836894989013672, -0.026762008666992188, -0.025155067443847656, -0.023548126220703125, -0.021941184997558594, -0.020334243774414062, -0.01872730255126953, -0.017120361328125, -0.015513420104980469, -0.013906478881835938, -0.012299537658691406, -0.010692596435546875, -0.009085655212402344, -0.0074787139892578125, -0.005871772766113281, -0.00426483154296875, -0.0026578903198242188, -0.0010509490966796875, 0.0005559921264648438, 0.002162933349609375, 0.0037698745727539062, 0.0053768157958984375, 0.006983757019042969, 0.0085906982421875, 0.010197639465332031, 0.011804580688476562, 0.013411521911621094, 0.015018463134765625, 0.016625404357910156, 0.018232345581054688, 0.01983928680419922, 0.02144622802734375, 0.02305316925048828, 0.024660110473632812, 0.026267051696777344, 0.027873992919921875, 0.029480934143066406, 0.031087875366210938, 0.03269481658935547, 0.0343017578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 5.0, 12.0, 8.0, 13.0, 17.0, 14.0, 26.0, 56.0, 65.0, 108.0, 149.0, 283.0, 633.0, 1601.0, 5593.0, 28189.0, 427878.0, 544104.0, 30742.0, 5937.0, 1652.0, 644.0, 311.0, 163.0, 104.0, 54.0, 46.0, 35.0, 18.0, 21.0, 16.0, 12.0, 7.0, 7.0, 9.0, 4.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.223876953125, -0.21709823608398438, -0.21031951904296875, -0.20354080200195312, -0.1967620849609375, -0.18998336791992188, -0.18320465087890625, -0.17642593383789062, -0.169647216796875, -0.16286849975585938, -0.15608978271484375, -0.14931106567382812, -0.1425323486328125, -0.13575363159179688, -0.12897491455078125, -0.12219619750976562, -0.11541748046875, -0.10863876342773438, -0.10186004638671875, -0.09508132934570312, -0.0883026123046875, -0.08152389526367188, -0.07474517822265625, -0.06796646118164062, -0.061187744140625, -0.054409027099609375, -0.04763031005859375, -0.040851593017578125, -0.0340728759765625, -0.027294158935546875, -0.02051544189453125, -0.013736724853515625, -0.0069580078125, -0.000179290771484375, 0.00659942626953125, 0.013378143310546875, 0.0201568603515625, 0.026935577392578125, 0.03371429443359375, 0.040493011474609375, 0.047271728515625, 0.054050445556640625, 0.06082916259765625, 0.06760787963867188, 0.0743865966796875, 0.08116531372070312, 0.08794403076171875, 0.09472274780273438, 0.10150146484375, 0.10828018188476562, 0.11505889892578125, 0.12183761596679688, 0.1286163330078125, 0.13539505004882812, 0.14217376708984375, 0.14895248413085938, 0.155731201171875, 0.16250991821289062, 0.16928863525390625, 0.17606735229492188, 0.1828460693359375, 0.18962478637695312, 0.19640350341796875, 0.20318222045898438, 0.2099609375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 2.0, 10.0, 7.0, 6.0, 10.0, 15.0, 16.0, 24.0, 26.0, 24.0, 25.0, 37.0, 40.0, 40.0, 38.0, 40.0, 51.0, 55.0, 57.0, 44.0, 47.0, 56.0, 59.0, 43.0, 33.0, 31.0, 31.0, 30.0, 19.0, 15.0, 13.0, 16.0, 4.0, 12.0, 7.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06732177734375, -0.06517601013183594, -0.06303024291992188, -0.06088447570800781, -0.05873870849609375, -0.05659294128417969, -0.054447174072265625, -0.05230140686035156, -0.0501556396484375, -0.04800987243652344, -0.045864105224609375, -0.04371833801269531, -0.04157257080078125, -0.03942680358886719, -0.037281036376953125, -0.03513526916503906, -0.032989501953125, -0.030843734741210938, -0.028697967529296875, -0.026552200317382812, -0.02440643310546875, -0.022260665893554688, -0.020114898681640625, -0.017969131469726562, -0.0158233642578125, -0.013677597045898438, -0.011531829833984375, -0.009386062622070312, -0.00724029541015625, -0.0050945281982421875, -0.002948760986328125, -0.0008029937744140625, 0.0013427734375, 0.0034885406494140625, 0.005634307861328125, 0.0077800750732421875, 0.00992584228515625, 0.012071609497070312, 0.014217376708984375, 0.016363143920898438, 0.0185089111328125, 0.020654678344726562, 0.022800445556640625, 0.024946212768554688, 0.02709197998046875, 0.029237747192382812, 0.031383514404296875, 0.03352928161621094, 0.035675048828125, 0.03782081604003906, 0.039966583251953125, 0.04211235046386719, 0.04425811767578125, 0.04640388488769531, 0.048549652099609375, 0.05069541931152344, 0.0528411865234375, 0.05498695373535156, 0.057132720947265625, 0.05927848815917969, 0.06142425537109375, 0.06357002258300781, 0.06571578979492188, 0.06786155700683594, 0.07000732421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 4.0, 7.0, 14.0, 21.0, 36.0, 55.0, 72.0, 144.0, 235.0, 537.0, 1197.0, 3571.0, 13871.0, 127809.0, 844439.0, 44660.0, 7805.0, 2334.0, 847.0, 397.0, 191.0, 104.0, 57.0, 39.0, 17.0, 14.0, 9.0, 8.0, 6.0, 4.0, 3.0, 5.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.006805419921875, -0.00658804178237915, -0.006370663642883301, -0.006153285503387451, -0.0059359073638916016, -0.005718529224395752, -0.005501151084899902, -0.005283772945404053, -0.005066394805908203, -0.0048490166664123535, -0.004631638526916504, -0.004414260387420654, -0.004196882247924805, -0.003979504108428955, -0.0037621259689331055, -0.003544747829437256, -0.0033273696899414062, -0.0031099915504455566, -0.002892613410949707, -0.0026752352714538574, -0.002457857131958008, -0.002240478992462158, -0.0020231008529663086, -0.001805722713470459, -0.0015883445739746094, -0.0013709664344787598, -0.0011535882949829102, -0.0009362101554870605, -0.0007188320159912109, -0.0005014538764953613, -0.0002840757369995117, -6.669759750366211e-05, 0.0001506805419921875, 0.0003680586814880371, 0.0005854368209838867, 0.0008028149604797363, 0.001020193099975586, 0.0012375712394714355, 0.0014549493789672852, 0.0016723275184631348, 0.0018897056579589844, 0.002107083797454834, 0.0023244619369506836, 0.002541840076446533, 0.002759218215942383, 0.0029765963554382324, 0.003193974494934082, 0.0034113526344299316, 0.0036287307739257812, 0.003846108913421631, 0.0040634870529174805, 0.00428086519241333, 0.00449824333190918, 0.004715621471405029, 0.004932999610900879, 0.0051503777503967285, 0.005367755889892578, 0.005585134029388428, 0.005802512168884277, 0.006019890308380127, 0.0062372684478759766, 0.006454646587371826, 0.006672024726867676, 0.006889402866363525, 0.007106781005859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 15.0, 5.0, 20.0, 25.0, 31.0, 16.0, 44.0, 33.0, 23.0, 62.0, 58.0, 76.0, 28.0, 67.0, 77.0, 33.0, 62.0, 60.0, 44.0, 21.0, 33.0, 38.0, 29.0, 9.0, 25.0, 19.0, 10.0, 8.0, 3.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.039836883544922e-06, -2.9373914003372192e-06, -2.8349459171295166e-06, -2.732500433921814e-06, -2.6300549507141113e-06, -2.5276094675064087e-06, -2.425163984298706e-06, -2.3227185010910034e-06, -2.2202730178833008e-06, -2.117827534675598e-06, -2.0153820514678955e-06, -1.912936568260193e-06, -1.8104910850524902e-06, -1.7080456018447876e-06, -1.605600118637085e-06, -1.5031546354293823e-06, -1.4007091522216797e-06, -1.298263669013977e-06, -1.1958181858062744e-06, -1.0933727025985718e-06, -9.909272193908691e-07, -8.884817361831665e-07, -7.860362529754639e-07, -6.835907697677612e-07, -5.811452865600586e-07, -4.78699803352356e-07, -3.762543201446533e-07, -2.738088369369507e-07, -1.7136335372924805e-07, -6.891787052154541e-08, 3.3527612686157227e-08, 1.3597309589385986e-07, 2.384185791015625e-07, 3.4086406230926514e-07, 4.4330954551696777e-07, 5.457550287246704e-07, 6.48200511932373e-07, 7.506459951400757e-07, 8.530914783477783e-07, 9.55536961555481e-07, 1.0579824447631836e-06, 1.1604279279708862e-06, 1.2628734111785889e-06, 1.3653188943862915e-06, 1.4677643775939941e-06, 1.5702098608016968e-06, 1.6726553440093994e-06, 1.775100827217102e-06, 1.8775463104248047e-06, 1.9799917936325073e-06, 2.08243727684021e-06, 2.1848827600479126e-06, 2.2873282432556152e-06, 2.389773726463318e-06, 2.4922192096710205e-06, 2.594664692878723e-06, 2.6971101760864258e-06, 2.7995556592941284e-06, 2.902001142501831e-06, 3.0044466257095337e-06, 3.1068921089172363e-06, 3.209337592124939e-06, 3.3117830753326416e-06, 3.4142285585403442e-06, 3.516674041748047e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 6.0, 6.0, 2.0, 8.0, 15.0, 16.0, 31.0, 41.0, 56.0, 118.0, 252.0, 610.0, 1667.0, 6121.0, 74479.0, 939650.0, 19757.0, 3681.0, 1124.0, 469.0, 199.0, 90.0, 44.0, 34.0, 21.0, 16.0, 10.0, 5.0, 7.0, 7.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0118255615234375, -0.011447429656982422, -0.011069297790527344, -0.010691165924072266, -0.010313034057617188, -0.00993490219116211, -0.009556770324707031, -0.009178638458251953, -0.008800506591796875, -0.008422374725341797, -0.008044242858886719, -0.007666110992431641, -0.0072879791259765625, -0.006909847259521484, -0.006531715393066406, -0.006153583526611328, -0.00577545166015625, -0.005397319793701172, -0.005019187927246094, -0.004641056060791016, -0.0042629241943359375, -0.0038847923278808594, -0.0035066604614257812, -0.003128528594970703, -0.002750396728515625, -0.002372264862060547, -0.0019941329956054688, -0.0016160011291503906, -0.0012378692626953125, -0.0008597373962402344, -0.00048160552978515625, -0.00010347366333007812, 0.000274658203125, 0.0006527900695800781, 0.0010309219360351562, 0.0014090538024902344, 0.0017871856689453125, 0.0021653175354003906, 0.0025434494018554688, 0.002921581268310547, 0.003299713134765625, 0.003677845001220703, 0.004055976867675781, 0.004434108734130859, 0.0048122406005859375, 0.005190372467041016, 0.005568504333496094, 0.005946636199951172, 0.00632476806640625, 0.006702899932861328, 0.007081031799316406, 0.007459163665771484, 0.007837295532226562, 0.00821542739868164, 0.008593559265136719, 0.008971691131591797, 0.009349822998046875, 0.009727954864501953, 0.010106086730957031, 0.01048421859741211, 0.010862350463867188, 0.011240482330322266, 0.011618614196777344, 0.011996746063232422, 0.0123748779296875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 5.0, 7.0, 8.0, 10.0, 22.0, 43.0, 69.0, 83.0, 136.0, 142.0, 129.0, 102.0, 68.0, 40.0, 38.0, 20.0, 10.0, 12.0, 8.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00383758544921875, -0.003719627857208252, -0.003601670265197754, -0.003483712673187256, -0.003365755081176758, -0.0032477974891662598, -0.0031298398971557617, -0.0030118823051452637, -0.0028939247131347656, -0.0027759671211242676, -0.0026580095291137695, -0.0025400519371032715, -0.0024220943450927734, -0.0023041367530822754, -0.0021861791610717773, -0.0020682215690612793, -0.0019502639770507812, -0.0018323063850402832, -0.0017143487930297852, -0.0015963912010192871, -0.001478433609008789, -0.001360476016998291, -0.001242518424987793, -0.001124560832977295, -0.0010066032409667969, -0.0008886456489562988, -0.0007706880569458008, -0.0006527304649353027, -0.0005347728729248047, -0.00041681528091430664, -0.0002988576889038086, -0.00018090009689331055, -6.29425048828125e-05, 5.501508712768555e-05, 0.0001729726791381836, 0.00029093027114868164, 0.0004088878631591797, 0.0005268454551696777, 0.0006448030471801758, 0.0007627606391906738, 0.0008807182312011719, 0.00099867582321167, 0.001116633415222168, 0.001234591007232666, 0.001352548599243164, 0.0014705061912536621, 0.0015884637832641602, 0.0017064213752746582, 0.0018243789672851562, 0.0019423365592956543, 0.0020602941513061523, 0.0021782517433166504, 0.0022962093353271484, 0.0024141669273376465, 0.0025321245193481445, 0.0026500821113586426, 0.0027680397033691406, 0.0028859972953796387, 0.0030039548873901367, 0.0031219124794006348, 0.003239870071411133, 0.003357827663421631, 0.003475785255432129, 0.003593742847442627, 0.003711700439453125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 15.0, 12.0, 21.0, 56.0, 103.0, 273.0, 277.0, 114.0, 49.0, 26.0, 17.0, 11.0, 8.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.676802396774292, -0.6569158434867859, -0.637029230594635, -0.6171426773071289, -0.597256064414978, -0.5773695111274719, -0.557482898235321, -0.5375963449478149, -0.5177097320556641, -0.49782314896583557, -0.4779365658760071, -0.4580499827861786, -0.4381633996963501, -0.418276846408844, -0.3983902633190155, -0.378503680229187, -0.3586171269416809, -0.3387305438518524, -0.3188439607620239, -0.29895737767219543, -0.27907079458236694, -0.25918424129486084, -0.23929765820503235, -0.21941107511520386, -0.19952449202537537, -0.17963790893554688, -0.15975132584571838, -0.1398647576570511, -0.1199781745672226, -0.1000915914773941, -0.08020501583814621, -0.060318440198898315, -0.040431857109069824, -0.02054527774453163, -0.0006586983799934387, 0.019227880984544754, 0.03911446034908295, 0.05900104343891144, 0.07888761907815933, 0.09877419471740723, 0.11866077780723572, 0.1385473608970642, 0.1584339439868927, 0.17832051217556, 0.1982070952653885, 0.21809367835521698, 0.23798024654388428, 0.25786682963371277, 0.27775341272354126, 0.29763999581336975, 0.31752657890319824, 0.33741316199302673, 0.3572997450828552, 0.37718629837036133, 0.3970728814601898, 0.4169594645500183, 0.4368460476398468, 0.4567326307296753, 0.4766192138195038, 0.4965057969093323, 0.5163923501968384, 0.5362789630889893, 0.5561655163764954, 0.5760520696640015, 0.5959386825561523]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 6.0, 6.0, 13.0, 10.0, 23.0, 31.0, 34.0, 53.0, 45.0, 51.0, 73.0, 63.0, 77.0, 78.0, 61.0, 74.0, 59.0, 46.0, 52.0, 33.0, 15.0, 17.0, 12.0, 11.0, 9.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5613155364990234, -0.5438988208770752, -0.5264820456504822, -0.5090653300285339, -0.4916485548019409, -0.4742318391799927, -0.45681509375572205, -0.4393983483314514, -0.4219816029071808, -0.40456485748291016, -0.3871481120586395, -0.3697313666343689, -0.35231465101242065, -0.33489787578582764, -0.3174811601638794, -0.30006441473960876, -0.28264766931533813, -0.2652309238910675, -0.24781417846679688, -0.23039744794368744, -0.2129807025194168, -0.19556395709514618, -0.17814722657203674, -0.1607304811477661, -0.14331373572349548, -0.12589699029922485, -0.10848025232553482, -0.09106351435184479, -0.07364676892757416, -0.05623002350330353, -0.038813285529613495, -0.021396547555923462, -0.003979742527008057, 0.013436999171972275, 0.030853740870952606, 0.04827048256993294, 0.06568722426891327, 0.0831039696931839, 0.10052070766687393, 0.11793744564056396, 0.1353541910648346, 0.15277093648910522, 0.17018768191337585, 0.1876044124364853, 0.20502115786075592, 0.22243790328502655, 0.239854633808136, 0.2572713792324066, 0.27468812465667725, 0.2921048700809479, 0.3095216155052185, 0.32693836092948914, 0.34435510635375977, 0.361771821975708, 0.37918856739997864, 0.39660531282424927, 0.4140220582485199, 0.4314388036727905, 0.44885554909706116, 0.4662722945213318, 0.48368901014328003, 0.501105785369873, 0.5185225009918213, 0.5359392166137695, 0.5533559918403625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 10.0, 13.0, 22.0, 40.0, 68.0, 80.0, 147.0, 344.0, 2120.0, 132294.0, 4055522.0, 2897.0, 524.0, 151.0, 30.0, 14.0, 5.0, 9.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.541015625, -3.458740234375, -3.37646484375, -3.294189453125, -3.2119140625, -3.129638671875, -3.04736328125, -2.965087890625, -2.8828125, -2.800537109375, -2.71826171875, -2.635986328125, -2.5537109375, -2.471435546875, -2.38916015625, -2.306884765625, -2.224609375, -2.142333984375, -2.06005859375, -1.977783203125, -1.8955078125, -1.813232421875, -1.73095703125, -1.648681640625, -1.56640625, -1.484130859375, -1.40185546875, -1.319580078125, -1.2373046875, -1.155029296875, -1.07275390625, -0.990478515625, -0.908203125, -0.825927734375, -0.74365234375, -0.661376953125, -0.5791015625, -0.496826171875, -0.41455078125, -0.332275390625, -0.25, -0.167724609375, -0.08544921875, -0.003173828125, 0.0791015625, 0.161376953125, 0.24365234375, 0.325927734375, 0.408203125, 0.490478515625, 0.57275390625, 0.655029296875, 0.7373046875, 0.819580078125, 0.90185546875, 0.984130859375, 1.06640625, 1.148681640625, 1.23095703125, 1.313232421875, 1.3955078125, 1.477783203125, 1.56005859375, 1.642333984375, 1.724609375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 4.0, 3.0, 20.0, 18.0, 34.0, 472.0, 355.0, 28.0, 18.0, 13.0, 5.0, 9.0, 6.0, 8.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.068359375, -0.06676816940307617, -0.06517696380615234, -0.06358575820922852, -0.06199455261230469, -0.06040334701538086, -0.05881214141845703, -0.0572209358215332, -0.055629730224609375, -0.05403852462768555, -0.05244731903076172, -0.05085611343383789, -0.04926490783691406, -0.047673702239990234, -0.046082496643066406, -0.04449129104614258, -0.04290008544921875, -0.04130887985229492, -0.039717674255371094, -0.038126468658447266, -0.03653526306152344, -0.03494405746459961, -0.03335285186767578, -0.03176164627075195, -0.030170440673828125, -0.028579235076904297, -0.02698802947998047, -0.02539682388305664, -0.023805618286132812, -0.022214412689208984, -0.020623207092285156, -0.019032001495361328, -0.0174407958984375, -0.015849590301513672, -0.014258384704589844, -0.012667179107666016, -0.011075973510742188, -0.00948476791381836, -0.007893562316894531, -0.006302356719970703, -0.004711151123046875, -0.003119945526123047, -0.0015287399291992188, 6.246566772460938e-05, 0.0016536712646484375, 0.0032448768615722656, 0.004836082458496094, 0.006427288055419922, 0.00801849365234375, 0.009609699249267578, 0.011200904846191406, 0.012792110443115234, 0.014383316040039062, 0.01597452163696289, 0.01756572723388672, 0.019156932830810547, 0.020748138427734375, 0.022339344024658203, 0.02393054962158203, 0.02552175521850586, 0.027112960815429688, 0.028704166412353516, 0.030295372009277344, 0.03188657760620117, 0.033477783203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 14.0, 11.0, 16.0, 22.0, 20.0, 40.0, 44.0, 53.0, 104.0, 170.0, 367.0, 1250.0, 6679.0, 87319.0, 4050847.0, 41500.0, 4117.0, 903.0, 284.0, 147.0, 94.0, 46.0, 46.0, 36.0, 36.0, 19.0, 8.0, 15.0, 12.0, 12.0, 6.0, 7.0, 6.0, 4.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.468505859375, -0.4525642395019531, -0.43662261962890625, -0.4206809997558594, -0.4047393798828125, -0.3887977600097656, -0.37285614013671875, -0.3569145202636719, -0.340972900390625, -0.3250312805175781, -0.30908966064453125, -0.2931480407714844, -0.2772064208984375, -0.2612648010253906, -0.24532318115234375, -0.22938156127929688, -0.21343994140625, -0.19749832153320312, -0.18155670166015625, -0.16561508178710938, -0.1496734619140625, -0.13373184204101562, -0.11779022216796875, -0.10184860229492188, -0.085906982421875, -0.06996536254882812, -0.05402374267578125, -0.038082122802734375, -0.0221405029296875, -0.006198883056640625, 0.00974273681640625, 0.025684356689453125, 0.0416259765625, 0.057567596435546875, 0.07350921630859375, 0.08945083618164062, 0.1053924560546875, 0.12133407592773438, 0.13727569580078125, 0.15321731567382812, 0.169158935546875, 0.18510055541992188, 0.20104217529296875, 0.21698379516601562, 0.2329254150390625, 0.24886703491210938, 0.26480865478515625, 0.2807502746582031, 0.29669189453125, 0.3126335144042969, 0.32857513427734375, 0.3445167541503906, 0.3604583740234375, 0.3763999938964844, 0.39234161376953125, 0.4082832336425781, 0.424224853515625, 0.4401664733886719, 0.45610809326171875, 0.4720497131347656, 0.4879913330078125, 0.5039329528808594, 0.5198745727539062, 0.5358161926269531, 0.5517578125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 4.0, 10.0, 8.0, 11.0, 7.0, 9.0, 21.0, 26.0, 29.0, 25.0, 33.0, 47.0, 58.0, 64.0, 97.0, 143.0, 725.0, 2130.0, 154.0, 92.0, 60.0, 53.0, 46.0, 43.0, 26.0, 30.0, 26.0, 20.0, 16.0, 4.0, 7.0, 10.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040740966796875, -0.03954458236694336, -0.03834819793701172, -0.03715181350708008, -0.03595542907714844, -0.0347590446472168, -0.033562660217285156, -0.032366275787353516, -0.031169891357421875, -0.029973506927490234, -0.028777122497558594, -0.027580738067626953, -0.026384353637695312, -0.025187969207763672, -0.02399158477783203, -0.02279520034790039, -0.02159881591796875, -0.02040243148803711, -0.01920604705810547, -0.018009662628173828, -0.016813278198242188, -0.015616893768310547, -0.014420509338378906, -0.013224124908447266, -0.012027740478515625, -0.010831356048583984, -0.009634971618652344, -0.008438587188720703, -0.0072422027587890625, -0.006045818328857422, -0.004849433898925781, -0.0036530494689941406, -0.0024566650390625, -0.0012602806091308594, -6.389617919921875e-05, 0.0011324882507324219, 0.0023288726806640625, 0.003525257110595703, 0.004721641540527344, 0.005918025970458984, 0.007114410400390625, 0.008310794830322266, 0.009507179260253906, 0.010703563690185547, 0.011899948120117188, 0.013096332550048828, 0.014292716979980469, 0.01548910140991211, 0.01668548583984375, 0.01788187026977539, 0.01907825469970703, 0.020274639129638672, 0.021471023559570312, 0.022667407989501953, 0.023863792419433594, 0.025060176849365234, 0.026256561279296875, 0.027452945709228516, 0.028649330139160156, 0.029845714569091797, 0.031042098999023438, 0.03223848342895508, 0.03343486785888672, 0.03463125228881836, 0.03582763671875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 14.0, 32.0, 110.0, 407.0, 299.0, 77.0, 28.0, 13.0, 6.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2762466073036194, -0.26598450541496277, -0.25572240352630615, -0.24546028673648834, -0.23519818484783173, -0.2249360829591751, -0.2146739661693573, -0.20441186428070068, -0.19414976239204407, -0.18388766050338745, -0.17362555861473083, -0.16336344182491302, -0.1531013399362564, -0.1428392380475998, -0.13257712125778198, -0.12231501936912537, -0.11205291748046875, -0.10179081559181213, -0.09152870625257492, -0.08126659691333771, -0.07100449502468109, -0.06074238941073418, -0.05048028379678726, -0.04021817445755005, -0.029956072568893433, -0.019693966954946518, -0.009431861340999603, 0.0008302442729473114, 0.011092349886894226, 0.02135445550084114, 0.031616561114788055, 0.04187867045402527, 0.05214080214500427, 0.06240290775895119, 0.0726650133728981, 0.08292712271213531, 0.09318922460079193, 0.10345132648944855, 0.11371343582868576, 0.12397554516792297, 0.1342376470565796, 0.1444997489452362, 0.15476185083389282, 0.16502396762371063, 0.17528606951236725, 0.18554817140102386, 0.19581028819084167, 0.2060723900794983, 0.2163344919681549, 0.22659659385681152, 0.23685869574546814, 0.24712081253528595, 0.25738292932510376, 0.2676450312137604, 0.277907133102417, 0.2881692349910736, 0.2984313368797302, 0.30869343876838684, 0.31895554065704346, 0.3292176425457001, 0.3394797444343567, 0.3497418761253357, 0.3600039780139923, 0.3702660799026489, 0.38052818179130554]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 10.0, 14.0, 22.0, 18.0, 22.0, 45.0, 45.0, 73.0, 69.0, 95.0, 96.0, 92.0, 68.0, 64.0, 65.0, 64.0, 42.0, 32.0, 17.0, 13.0, 4.0, 12.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18686902523040771, -0.17826081812381744, -0.16965261101722717, -0.1610444039106369, -0.15243619680404663, -0.14382797479629517, -0.1352197676897049, -0.12661156058311462, -0.11800335347652435, -0.10939514636993408, -0.10078693926334381, -0.09217872470617294, -0.08357051759958267, -0.0749623104929924, -0.06635409593582153, -0.05774588882923126, -0.04913768172264099, -0.04052947461605072, -0.03192126378417015, -0.02331305481493473, -0.01470484584569931, -0.006096638739109039, 0.00251157209277153, 0.0111197829246521, 0.01972799003124237, 0.02833619900047779, 0.03694440796971321, 0.04555261880159378, 0.05416082590818405, 0.06276903301477432, 0.07137724757194519, 0.07998545467853546, 0.08859366178512573, 0.097201868891716, 0.10581007599830627, 0.11441829055547714, 0.12302649766206741, 0.13163471221923828, 0.14024291932582855, 0.14885112643241882, 0.1574593335390091, 0.16606754064559937, 0.17467574775218964, 0.1832839548587799, 0.19189217686653137, 0.20050036907196045, 0.20910859107971191, 0.21771679818630219, 0.22632500529289246, 0.23493321239948273, 0.243541419506073, 0.25214964151382446, 0.26075783371925354, 0.269366055727005, 0.2779742479324341, 0.28658246994018555, 0.295190691947937, 0.3037989139556885, 0.31240710616111755, 0.321015328168869, 0.3296235203742981, 0.33823174238204956, 0.34683993458747864, 0.3554481565952301, 0.3640563488006592]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 2.0, 5.0, 3.0, 7.0, 12.0, 8.0, 26.0, 21.0, 33.0, 49.0, 70.0, 100.0, 125.0, 193.0, 349.0, 800.0, 1980.0, 6107.0, 47049.0, 964274.0, 20165.0, 4174.0, 1433.0, 664.0, 320.0, 197.0, 118.0, 71.0, 51.0, 43.0, 23.0, 10.0, 17.0, 14.0, 7.0, 8.0, 2.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.44140625, -0.4298973083496094, -0.41838836669921875, -0.4068794250488281, -0.3953704833984375, -0.3838615417480469, -0.37235260009765625, -0.3608436584472656, -0.349334716796875, -0.3378257751464844, -0.32631683349609375, -0.3148078918457031, -0.3032989501953125, -0.2917900085449219, -0.28028106689453125, -0.2687721252441406, -0.25726318359375, -0.24575424194335938, -0.23424530029296875, -0.22273635864257812, -0.2112274169921875, -0.19971847534179688, -0.18820953369140625, -0.17670059204101562, -0.165191650390625, -0.15368270874023438, -0.14217376708984375, -0.13066482543945312, -0.1191558837890625, -0.10764694213867188, -0.09613800048828125, -0.08462905883789062, -0.0731201171875, -0.061611175537109375, -0.05010223388671875, -0.038593292236328125, -0.0270843505859375, -0.015575408935546875, -0.00406646728515625, 0.007442474365234375, 0.018951416015625, 0.030460357666015625, 0.04196929931640625, 0.053478240966796875, 0.0649871826171875, 0.07649612426757812, 0.08800506591796875, 0.09951400756835938, 0.11102294921875, 0.12253189086914062, 0.13404083251953125, 0.14554977416992188, 0.1570587158203125, 0.16856765747070312, 0.18007659912109375, 0.19158554077148438, 0.203094482421875, 0.21460342407226562, 0.22611236572265625, 0.23762130737304688, 0.2491302490234375, 0.2606391906738281, 0.27214813232421875, 0.2836570739746094, 0.295166015625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 5.0, 18.0, 29.0, 126.0, 481.0, 241.0, 40.0, 17.0, 10.0, 10.0, 4.0, 8.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0634765625, -0.06195354461669922, -0.06043052673339844, -0.058907508850097656, -0.057384490966796875, -0.055861473083496094, -0.05433845520019531, -0.05281543731689453, -0.05129241943359375, -0.04976940155029297, -0.04824638366699219, -0.046723365783691406, -0.045200347900390625, -0.043677330017089844, -0.04215431213378906, -0.04063129425048828, -0.0391082763671875, -0.03758525848388672, -0.03606224060058594, -0.034539222717285156, -0.033016204833984375, -0.031493186950683594, -0.029970169067382812, -0.02844715118408203, -0.02692413330078125, -0.02540111541748047, -0.023878097534179688, -0.022355079650878906, -0.020832061767578125, -0.019309043884277344, -0.017786026000976562, -0.01626300811767578, -0.014739990234375, -0.013216972351074219, -0.011693954467773438, -0.010170936584472656, -0.008647918701171875, -0.007124900817871094, -0.0056018829345703125, -0.004078865051269531, -0.00255584716796875, -0.0010328292846679688, 0.0004901885986328125, 0.0020132064819335938, 0.003536224365234375, 0.005059242248535156, 0.0065822601318359375, 0.008105278015136719, 0.0096282958984375, 0.011151313781738281, 0.012674331665039062, 0.014197349548339844, 0.015720367431640625, 0.017243385314941406, 0.018766403198242188, 0.02028942108154297, 0.02181243896484375, 0.02333545684814453, 0.024858474731445312, 0.026381492614746094, 0.027904510498046875, 0.029427528381347656, 0.030950546264648438, 0.03247356414794922, 0.03399658203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 5.0, 4.0, 6.0, 6.0, 3.0, 5.0, 2.0, 10.0, 9.0, 10.0, 8.0, 13.0, 22.0, 28.0, 29.0, 42.0, 72.0, 78.0, 145.0, 227.0, 323.0, 632.0, 1303.0, 4062.0, 24422.0, 511371.0, 475486.0, 23275.0, 4027.0, 1282.0, 593.0, 330.0, 207.0, 145.0, 96.0, 58.0, 52.0, 39.0, 23.0, 29.0, 15.0, 17.0, 8.0, 11.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2001953125, -0.1939373016357422, -0.18767929077148438, -0.18142127990722656, -0.17516326904296875, -0.16890525817871094, -0.16264724731445312, -0.1563892364501953, -0.1501312255859375, -0.1438732147216797, -0.13761520385742188, -0.13135719299316406, -0.12509918212890625, -0.11884117126464844, -0.11258316040039062, -0.10632514953613281, -0.100067138671875, -0.09380912780761719, -0.08755111694335938, -0.08129310607910156, -0.07503509521484375, -0.06877708435058594, -0.06251907348632812, -0.05626106262207031, -0.0500030517578125, -0.04374504089355469, -0.037487030029296875, -0.031229019165039062, -0.02497100830078125, -0.018712997436523438, -0.012454986572265625, -0.0061969757080078125, 6.103515625e-05, 0.0063190460205078125, 0.012577056884765625, 0.018835067749023438, 0.02509307861328125, 0.03135108947753906, 0.037609100341796875, 0.04386711120605469, 0.0501251220703125, 0.05638313293457031, 0.06264114379882812, 0.06889915466308594, 0.07515716552734375, 0.08141517639160156, 0.08767318725585938, 0.09393119812011719, 0.100189208984375, 0.10644721984863281, 0.11270523071289062, 0.11896324157714844, 0.12522125244140625, 0.13147926330566406, 0.13773727416992188, 0.1439952850341797, 0.1502532958984375, 0.1565113067626953, 0.16276931762695312, 0.16902732849121094, 0.17528533935546875, 0.18154335021972656, 0.18780136108398438, 0.1940593719482422, 0.2003173828125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 11.0, 8.0, 15.0, 15.0, 16.0, 24.0, 23.0, 23.0, 28.0, 28.0, 29.0, 32.0, 28.0, 43.0, 31.0, 36.0, 36.0, 38.0, 43.0, 40.0, 37.0, 46.0, 37.0, 35.0, 33.0, 31.0, 23.0, 36.0, 17.0, 19.0, 18.0, 17.0, 14.0, 8.0, 10.0, 7.0, 12.0, 1.0, 6.0, 3.0, 6.0, 5.0, 4.0, 6.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.057708740234375, -0.05591249465942383, -0.054116249084472656, -0.052320003509521484, -0.05052375793457031, -0.04872751235961914, -0.04693126678466797, -0.0451350212097168, -0.043338775634765625, -0.04154253005981445, -0.03974628448486328, -0.03795003890991211, -0.03615379333496094, -0.034357547760009766, -0.032561302185058594, -0.030765056610107422, -0.02896881103515625, -0.027172565460205078, -0.025376319885253906, -0.023580074310302734, -0.021783828735351562, -0.01998758316040039, -0.01819133758544922, -0.016395092010498047, -0.014598846435546875, -0.012802600860595703, -0.011006355285644531, -0.00921010971069336, -0.0074138641357421875, -0.005617618560791016, -0.0038213729858398438, -0.002025127410888672, -0.0002288818359375, 0.0015673637390136719, 0.0033636093139648438, 0.005159854888916016, 0.0069561004638671875, 0.00875234603881836, 0.010548591613769531, 0.012344837188720703, 0.014141082763671875, 0.015937328338623047, 0.01773357391357422, 0.01952981948852539, 0.021326065063476562, 0.023122310638427734, 0.024918556213378906, 0.026714801788330078, 0.02851104736328125, 0.030307292938232422, 0.032103538513183594, 0.033899784088134766, 0.03569602966308594, 0.03749227523803711, 0.03928852081298828, 0.04108476638793945, 0.042881011962890625, 0.0446772575378418, 0.04647350311279297, 0.04826974868774414, 0.05006599426269531, 0.051862239837646484, 0.053658485412597656, 0.05545473098754883, 0.0572509765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 4.0, 2.0, 8.0, 10.0, 11.0, 13.0, 18.0, 26.0, 36.0, 38.0, 61.0, 108.0, 188.0, 321.0, 658.0, 1653.0, 6250.0, 45289.0, 826878.0, 149475.0, 12723.0, 2746.0, 1010.0, 419.0, 223.0, 130.0, 67.0, 67.0, 31.0, 21.0, 12.0, 12.0, 7.0, 7.0, 10.0, 4.0, 1.0, 0.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0252838134765625, -0.024460315704345703, -0.023636817932128906, -0.02281332015991211, -0.021989822387695312, -0.021166324615478516, -0.02034282684326172, -0.019519329071044922, -0.018695831298828125, -0.017872333526611328, -0.01704883575439453, -0.016225337982177734, -0.015401840209960938, -0.01457834243774414, -0.013754844665527344, -0.012931346893310547, -0.01210784912109375, -0.011284351348876953, -0.010460853576660156, -0.00963735580444336, -0.008813858032226562, -0.007990360260009766, -0.007166862487792969, -0.006343364715576172, -0.005519866943359375, -0.004696369171142578, -0.0038728713989257812, -0.0030493736267089844, -0.0022258758544921875, -0.0014023780822753906, -0.0005788803100585938, 0.0002446174621582031, 0.001068115234375, 0.0018916130065917969, 0.0027151107788085938, 0.0035386085510253906, 0.0043621063232421875, 0.005185604095458984, 0.006009101867675781, 0.006832599639892578, 0.007656097412109375, 0.008479595184326172, 0.009303092956542969, 0.010126590728759766, 0.010950088500976562, 0.01177358627319336, 0.012597084045410156, 0.013420581817626953, 0.01424407958984375, 0.015067577362060547, 0.015891075134277344, 0.01671457290649414, 0.017538070678710938, 0.018361568450927734, 0.01918506622314453, 0.020008563995361328, 0.020832061767578125, 0.021655559539794922, 0.02247905731201172, 0.023302555084228516, 0.024126052856445312, 0.02494955062866211, 0.025773048400878906, 0.026596546173095703, 0.0274200439453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 6.0, 3.0, 3.0, 6.0, 15.0, 4.0, 11.0, 9.0, 27.0, 17.0, 32.0, 32.0, 27.0, 50.0, 22.0, 47.0, 28.0, 64.0, 28.0, 63.0, 50.0, 21.0, 50.0, 31.0, 64.0, 24.0, 46.0, 34.0, 22.0, 22.0, 10.0, 28.0, 17.0, 21.0, 0.0, 18.0, 9.0, 5.0, 11.0, 2.0, 10.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.039836883544922e-06, -2.946704626083374e-06, -2.853572368621826e-06, -2.7604401111602783e-06, -2.6673078536987305e-06, -2.5741755962371826e-06, -2.4810433387756348e-06, -2.387911081314087e-06, -2.294778823852539e-06, -2.201646566390991e-06, -2.1085143089294434e-06, -2.0153820514678955e-06, -1.9222497940063477e-06, -1.8291175365447998e-06, -1.735985279083252e-06, -1.642853021621704e-06, -1.5497207641601562e-06, -1.4565885066986084e-06, -1.3634562492370605e-06, -1.2703239917755127e-06, -1.1771917343139648e-06, -1.084059476852417e-06, -9.909272193908691e-07, -8.977949619293213e-07, -8.046627044677734e-07, -7.115304470062256e-07, -6.183981895446777e-07, -5.252659320831299e-07, -4.3213367462158203e-07, -3.390014171600342e-07, -2.4586915969848633e-07, -1.5273690223693848e-07, -5.960464477539063e-08, 3.3527612686157227e-08, 1.2665987014770508e-07, 2.1979212760925293e-07, 3.129243850708008e-07, 4.0605664253234863e-07, 4.991888999938965e-07, 5.923211574554443e-07, 6.854534149169922e-07, 7.7858567237854e-07, 8.717179298400879e-07, 9.648501873016357e-07, 1.0579824447631836e-06, 1.1511147022247314e-06, 1.2442469596862793e-06, 1.3373792171478271e-06, 1.430511474609375e-06, 1.5236437320709229e-06, 1.6167759895324707e-06, 1.7099082469940186e-06, 1.8030405044555664e-06, 1.8961727619171143e-06, 1.989305019378662e-06, 2.08243727684021e-06, 2.175569534301758e-06, 2.2687017917633057e-06, 2.3618340492248535e-06, 2.4549663066864014e-06, 2.5480985641479492e-06, 2.641230821609497e-06, 2.734363079071045e-06, 2.8274953365325928e-06, 2.9206275939941406e-06]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 8.0, 9.0, 17.0, 18.0, 27.0, 46.0, 134.0, 309.0, 1047.0, 8493.0, 971368.0, 63732.0, 2411.0, 512.0, 196.0, 105.0, 45.0, 27.0, 16.0, 13.0, 6.0, 8.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0712890625, -0.06923723220825195, -0.0671854019165039, -0.06513357162475586, -0.06308174133300781, -0.061029911041259766, -0.05897808074951172, -0.05692625045776367, -0.054874420166015625, -0.05282258987426758, -0.05077075958251953, -0.048718929290771484, -0.04666709899902344, -0.04461526870727539, -0.042563438415527344, -0.0405116081237793, -0.03845977783203125, -0.0364079475402832, -0.034356117248535156, -0.03230428695678711, -0.030252456665039062, -0.028200626373291016, -0.02614879608154297, -0.024096965789794922, -0.022045135498046875, -0.019993305206298828, -0.01794147491455078, -0.015889644622802734, -0.013837814331054688, -0.01178598403930664, -0.009734153747558594, -0.007682323455810547, -0.0056304931640625, -0.003578662872314453, -0.0015268325805664062, 0.0005249977111816406, 0.0025768280029296875, 0.004628658294677734, 0.006680488586425781, 0.008732318878173828, 0.010784149169921875, 0.012835979461669922, 0.014887809753417969, 0.016939640045166016, 0.018991470336914062, 0.02104330062866211, 0.023095130920410156, 0.025146961212158203, 0.02719879150390625, 0.029250621795654297, 0.031302452087402344, 0.03335428237915039, 0.03540611267089844, 0.037457942962646484, 0.03950977325439453, 0.04156160354614258, 0.043613433837890625, 0.04566526412963867, 0.04771709442138672, 0.049768924713134766, 0.05182075500488281, 0.05387258529663086, 0.055924415588378906, 0.05797624588012695, 0.060028076171875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 9.0, 13.0, 13.0, 30.0, 39.0, 55.0, 62.0, 93.0, 123.0, 122.0, 123.0, 113.0, 65.0, 52.0, 19.0, 16.0, 12.0, 17.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017333984375, -0.01674628257751465, -0.016158580780029297, -0.015570878982543945, -0.014983177185058594, -0.014395475387573242, -0.01380777359008789, -0.013220071792602539, -0.012632369995117188, -0.012044668197631836, -0.011456966400146484, -0.010869264602661133, -0.010281562805175781, -0.00969386100769043, -0.009106159210205078, -0.008518457412719727, -0.007930755615234375, -0.0073430538177490234, -0.006755352020263672, -0.00616765022277832, -0.005579948425292969, -0.004992246627807617, -0.004404544830322266, -0.003816843032836914, -0.0032291412353515625, -0.002641439437866211, -0.0020537376403808594, -0.0014660358428955078, -0.0008783340454101562, -0.0002906322479248047, 0.0002970695495605469, 0.0008847713470458984, 0.00147247314453125, 0.0020601749420166016, 0.002647876739501953, 0.0032355785369873047, 0.0038232803344726562, 0.004410982131958008, 0.004998683929443359, 0.005586385726928711, 0.0061740875244140625, 0.006761789321899414, 0.007349491119384766, 0.007937192916870117, 0.008524894714355469, 0.00911259651184082, 0.009700298309326172, 0.010288000106811523, 0.010875701904296875, 0.011463403701782227, 0.012051105499267578, 0.01263880729675293, 0.013226509094238281, 0.013814210891723633, 0.014401912689208984, 0.014989614486694336, 0.015577316284179688, 0.01616501808166504, 0.01675271987915039, 0.017340421676635742, 0.017928123474121094, 0.018515825271606445, 0.019103527069091797, 0.01969122886657715, 0.0202789306640625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 74.0, 922.0, 17.0, 2.0], "bins": [-10.2124662399292, -10.045994758605957, -9.879522323608398, -9.713050842285156, -9.546579360961914, -9.380107879638672, -9.21363639831543, -9.047163963317871, -8.880692481994629, -8.714221000671387, -8.547748565673828, -8.381277084350586, -8.214805603027344, -8.048334121704102, -7.881862163543701, -7.715390205383301, -7.548918724060059, -7.382447242736816, -7.215975284576416, -7.049503326416016, -6.883031845092773, -6.716560363769531, -6.550088405609131, -6.3836164474487305, -6.217144966125488, -6.050673484802246, -5.884201526641846, -5.717729568481445, -5.551258087158203, -5.384786605834961, -5.2183146476745605, -5.05184268951416, -4.88537073135376, -4.718898773193359, -4.552427291870117, -4.385955810546875, -4.219483852386475, -4.053011894226074, -3.886540412902832, -3.7200686931610107, -3.5535969734191895, -3.387125253677368, -3.220653533935547, -3.0541818141937256, -2.8877100944519043, -2.721238374710083, -2.5547666549682617, -2.3882949352264404, -2.221823215484619, -2.055351495742798, -1.8888797760009766, -1.7224080562591553, -1.555936336517334, -1.3894646167755127, -1.2229928970336914, -1.0565211772918701, -0.8900494575500488, -0.7235777378082275, -0.5571060180664062, -0.39063429832458496, -0.22416257858276367, -0.05769085884094238, 0.1087808609008789, 0.2752525806427002, 0.4417243003845215]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 18.0, 24.0, 29.0, 36.0, 47.0, 60.0, 59.0, 85.0, 82.0, 93.0, 81.0, 69.0, 68.0, 62.0, 46.0, 45.0, 20.0, 18.0, 14.0, 19.0, 6.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.017906904220581, -0.9920983910560608, -0.9662898778915405, -0.9404813647270203, -0.9146728515625, -0.8888643383979797, -0.8630558252334595, -0.8372472524642944, -0.811438798904419, -0.7856302857398987, -0.7598217725753784, -0.7340132594108582, -0.7082047462463379, -0.6823962330818176, -0.6565877199172974, -0.6307791471481323, -0.6049706339836121, -0.5791621208190918, -0.5533536076545715, -0.5275450944900513, -0.501736581325531, -0.47592806816101074, -0.4501195251941681, -0.4243110120296478, -0.39850249886512756, -0.3726939857006073, -0.34688547253608704, -0.3210769295692444, -0.2952684164047241, -0.26945990324020386, -0.2436513900756836, -0.21784287691116333, -0.1920343041419983, -0.16622579097747803, -0.14041727781295776, -0.1146087497472763, -0.08880023658275604, -0.06299172341823578, -0.03718319535255432, -0.011374682188034058, 0.014433830976486206, 0.04024234786629677, 0.06605086475610733, 0.09185938537120819, 0.11766789853572845, 0.14347641170024872, 0.16928493976593018, 0.19509345293045044, 0.2209019660949707, 0.24671047925949097, 0.27251899242401123, 0.2983275055885315, 0.32413601875305176, 0.349944531917572, 0.3757530748844147, 0.40156158804893494, 0.4273701012134552, 0.45317861437797546, 0.4789871275424957, 0.5047956705093384, 0.5306041836738586, 0.5564126968383789, 0.5822212100028992, 0.6080297231674194, 0.6338382363319397]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 8.0, 21.0, 20.0, 43.0, 94.0, 174.0, 653.0, 10043.0, 4179860.0, 2754.0, 398.0, 124.0, 40.0, 20.0, 9.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.693359375, -1.6542587280273438, -1.6151580810546875, -1.5760574340820312, -1.536956787109375, -1.4978561401367188, -1.4587554931640625, -1.4196548461914062, -1.38055419921875, -1.3414535522460938, -1.3023529052734375, -1.2632522583007812, -1.224151611328125, -1.1850509643554688, -1.1459503173828125, -1.1068496704101562, -1.0677490234375, -1.0286483764648438, -0.9895477294921875, -0.9504470825195312, -0.911346435546875, -0.8722457885742188, -0.8331451416015625, -0.7940444946289062, -0.75494384765625, -0.7158432006835938, -0.6767425537109375, -0.6376419067382812, -0.598541259765625, -0.5594406127929688, -0.5203399658203125, -0.48123931884765625, -0.442138671875, -0.40303802490234375, -0.3639373779296875, -0.32483673095703125, -0.285736083984375, -0.24663543701171875, -0.2075347900390625, -0.16843414306640625, -0.12933349609375, -0.09023284912109375, -0.0511322021484375, -0.01203155517578125, 0.027069091796875, 0.06616973876953125, 0.1052703857421875, 0.14437103271484375, 0.1834716796875, 0.22257232666015625, 0.2616729736328125, 0.30077362060546875, 0.339874267578125, 0.37897491455078125, 0.4180755615234375, 0.45717620849609375, 0.49627685546875, 0.5353775024414062, 0.5744781494140625, 0.6135787963867188, 0.652679443359375, 0.6917800903320312, 0.7308807373046875, 0.7699813842773438, 0.80908203125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 15.0, 18.0, 79.0, 282.0, 358.0, 151.0, 43.0, 17.0, 8.0, 11.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.07012939453125, -0.06850957870483398, -0.06688976287841797, -0.06526994705200195, -0.06365013122558594, -0.06203031539916992, -0.060410499572753906, -0.05879068374633789, -0.057170867919921875, -0.05555105209350586, -0.053931236267089844, -0.05231142044067383, -0.05069160461425781, -0.0490717887878418, -0.04745197296142578, -0.045832157135009766, -0.04421234130859375, -0.042592525482177734, -0.04097270965576172, -0.0393528938293457, -0.03773307800292969, -0.03611326217651367, -0.034493446350097656, -0.03287363052368164, -0.031253814697265625, -0.02963399887084961, -0.028014183044433594, -0.026394367218017578, -0.024774551391601562, -0.023154735565185547, -0.02153491973876953, -0.019915103912353516, -0.0182952880859375, -0.016675472259521484, -0.015055656433105469, -0.013435840606689453, -0.011816024780273438, -0.010196208953857422, -0.008576393127441406, -0.006956577301025391, -0.005336761474609375, -0.0037169456481933594, -0.0020971298217773438, -0.0004773139953613281, 0.0011425018310546875, 0.002762317657470703, 0.004382133483886719, 0.006001949310302734, 0.00762176513671875, 0.009241580963134766, 0.010861396789550781, 0.012481212615966797, 0.014101028442382812, 0.015720844268798828, 0.017340660095214844, 0.01896047592163086, 0.020580291748046875, 0.02220010757446289, 0.023819923400878906, 0.025439739227294922, 0.027059555053710938, 0.028679370880126953, 0.03029918670654297, 0.031919002532958984, 0.033538818359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 10.0, 10.0, 8.0, 10.0, 6.0, 17.0, 19.0, 29.0, 41.0, 37.0, 99.0, 168.0, 439.0, 1386.0, 5362.0, 30939.0, 4003842.0, 133835.0, 13281.0, 3081.0, 927.0, 321.0, 159.0, 73.0, 53.0, 37.0, 13.0, 19.0, 11.0, 12.0, 6.0, 4.0, 9.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2425537109375, -0.23557472229003906, -0.22859573364257812, -0.2216167449951172, -0.21463775634765625, -0.2076587677001953, -0.20067977905273438, -0.19370079040527344, -0.1867218017578125, -0.17974281311035156, -0.17276382446289062, -0.1657848358154297, -0.15880584716796875, -0.1518268585205078, -0.14484786987304688, -0.13786888122558594, -0.130889892578125, -0.12391090393066406, -0.11693191528320312, -0.10995292663574219, -0.10297393798828125, -0.09599494934082031, -0.08901596069335938, -0.08203697204589844, -0.0750579833984375, -0.06807899475097656, -0.061100006103515625, -0.05412101745605469, -0.04714202880859375, -0.04016304016113281, -0.033184051513671875, -0.026205062866210938, -0.01922607421875, -0.012247085571289062, -0.005268096923828125, 0.0017108917236328125, 0.00868988037109375, 0.015668869018554688, 0.022647857666015625, 0.029626846313476562, 0.0366058349609375, 0.04358482360839844, 0.050563812255859375, 0.05754280090332031, 0.06452178955078125, 0.07150077819824219, 0.07847976684570312, 0.08545875549316406, 0.092437744140625, 0.09941673278808594, 0.10639572143554688, 0.11337471008300781, 0.12035369873046875, 0.1273326873779297, 0.13431167602539062, 0.14129066467285156, 0.1482696533203125, 0.15524864196777344, 0.16222763061523438, 0.1692066192626953, 0.17618560791015625, 0.1831645965576172, 0.19014358520507812, 0.19712257385253906, 0.2041015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 8.0, 3.0, 2.0, 7.0, 4.0, 8.0, 4.0, 21.0, 15.0, 17.0, 18.0, 26.0, 42.0, 74.0, 114.0, 541.0, 2688.0, 169.0, 96.0, 51.0, 25.0, 22.0, 13.0, 17.0, 12.0, 13.0, 8.0, 10.0, 4.0, 3.0, 6.0, 11.0, 6.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02978515625, -0.02876424789428711, -0.02774333953857422, -0.026722431182861328, -0.025701522827148438, -0.024680614471435547, -0.023659706115722656, -0.022638797760009766, -0.021617889404296875, -0.020596981048583984, -0.019576072692871094, -0.018555164337158203, -0.017534255981445312, -0.016513347625732422, -0.015492439270019531, -0.01447153091430664, -0.01345062255859375, -0.01242971420288086, -0.011408805847167969, -0.010387897491455078, -0.009366989135742188, -0.008346080780029297, -0.007325172424316406, -0.006304264068603516, -0.005283355712890625, -0.004262447357177734, -0.0032415390014648438, -0.002220630645751953, -0.0011997222900390625, -0.00017881393432617188, 0.0008420944213867188, 0.0018630027770996094, 0.0028839111328125, 0.0039048194885253906, 0.004925727844238281, 0.005946636199951172, 0.0069675445556640625, 0.007988452911376953, 0.009009361267089844, 0.010030269622802734, 0.011051177978515625, 0.012072086334228516, 0.013092994689941406, 0.014113903045654297, 0.015134811401367188, 0.016155719757080078, 0.01717662811279297, 0.01819753646850586, 0.01921844482421875, 0.02023935317993164, 0.02126026153564453, 0.022281169891357422, 0.023302078247070312, 0.024322986602783203, 0.025343894958496094, 0.026364803314208984, 0.027385711669921875, 0.028406620025634766, 0.029427528381347656, 0.030448436737060547, 0.03146934509277344, 0.03249025344848633, 0.03351116180419922, 0.03453207015991211, 0.035552978515625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [14.0, 996.0, 10.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11113691329956055, -0.0392327681183815, 0.032671377062797546, 0.104575514793396, 0.17647966742515564, 0.24838382005691528, 0.32028794288635254, 0.39219212532043457, 0.4640962481498718, 0.5360003709793091, 0.6079045534133911, 0.6798086762428284, 0.7517127990722656, 0.8236169815063477, 0.8955211043357849, 0.9674252867698669, 1.0393294095993042, 1.1112335920333862, 1.1831376552581787, 1.2550418376922607, 1.3269460201263428, 1.3988502025604248, 1.4707542657852173, 1.5426584482192993, 1.6145625114440918, 1.6864666938781738, 1.7583707571029663, 1.8302749395370483, 1.9021791219711304, 1.9740831851959229, 2.045987367630005, 2.117891550064087, 2.189795732498169, 2.261699914932251, 2.333604097366333, 2.405508041381836, 2.477412223815918, 2.54931640625, 2.621220588684082, 2.693124771118164, 2.765028953552246, 2.836933135986328, 2.90883731842041, 2.980741500854492, 3.052645444869995, 3.124549627304077, 3.196453809738159, 3.268357992172241, 3.340261936187744, 3.412166118621826, 3.484070301055908, 3.5559744834899902, 3.627878427505493, 3.699782609939575, 3.7716867923736572, 3.8435909748077393, 3.9154951572418213, 3.9873993396759033, 4.059303283691406, 4.131207466125488, 4.20311164855957, 4.275015830993652, 4.346920013427734, 4.418824195861816, 4.490728378295898]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 10.0, 13.0, 17.0, 33.0, 49.0, 94.0, 110.0, 127.0, 150.0, 128.0, 96.0, 55.0, 47.0, 38.0, 18.0, 13.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2729620337486267, -0.2641071677207947, -0.25525230169296265, -0.24639743566513062, -0.23754256963729858, -0.22868770360946655, -0.21983282268047333, -0.2109779566526413, -0.20212309062480927, -0.19326822459697723, -0.1844133585691452, -0.17555849254131317, -0.16670361161231995, -0.15784874558448792, -0.14899387955665588, -0.14013901352882385, -0.13128414750099182, -0.12242928147315979, -0.11357441544532776, -0.10471954196691513, -0.0958646759390831, -0.08700980991125107, -0.07815493643283844, -0.06930007040500641, -0.06044520437717438, -0.051590338349342346, -0.042735468596220016, -0.03388059884309769, -0.025025732815265656, -0.016170866787433624, -0.0073159970343112946, 0.0015388727188110352, 0.010393738746643066, 0.019248606637120247, 0.028103474527597427, 0.03695834428071976, 0.04581321030855179, 0.05466807633638382, 0.06352294981479645, 0.07237781584262848, 0.08123268187046051, 0.09008754789829254, 0.09894241392612457, 0.1077972874045372, 0.11665215343236923, 0.12550702691078186, 0.1343618929386139, 0.14321675896644592, 0.15207162499427795, 0.16092649102210999, 0.16978135704994202, 0.17863622307777405, 0.18749108910560608, 0.1963459551334381, 0.20520083606243134, 0.21405570209026337, 0.2229105681180954, 0.23176543414592743, 0.24062030017375946, 0.2494751662015915, 0.2583300471305847, 0.26718491315841675, 0.2760397791862488, 0.2848946452140808, 0.29374951124191284]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 9.0, 0.0, 3.0, 10.0, 6.0, 13.0, 12.0, 15.0, 31.0, 38.0, 56.0, 79.0, 124.0, 219.0, 411.0, 874.0, 2266.0, 9629.0, 622627.0, 399385.0, 8782.0, 2110.0, 797.0, 414.0, 219.0, 128.0, 91.0, 66.0, 47.0, 36.0, 15.0, 11.0, 10.0, 6.0, 2.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.339111328125, -0.32816314697265625, -0.3172149658203125, -0.30626678466796875, -0.295318603515625, -0.28437042236328125, -0.2734222412109375, -0.26247406005859375, -0.25152587890625, -0.24057769775390625, -0.2296295166015625, -0.21868133544921875, -0.207733154296875, -0.19678497314453125, -0.1858367919921875, -0.17488861083984375, -0.1639404296875, -0.15299224853515625, -0.1420440673828125, -0.13109588623046875, -0.120147705078125, -0.10919952392578125, -0.0982513427734375, -0.08730316162109375, -0.07635498046875, -0.06540679931640625, -0.0544586181640625, -0.04351043701171875, -0.032562255859375, -0.02161407470703125, -0.0106658935546875, 0.00028228759765625, 0.01123046875, 0.02217864990234375, 0.0331268310546875, 0.04407501220703125, 0.055023193359375, 0.06597137451171875, 0.0769195556640625, 0.08786773681640625, 0.09881591796875, 0.10976409912109375, 0.1207122802734375, 0.13166046142578125, 0.142608642578125, 0.15355682373046875, 0.1645050048828125, 0.17545318603515625, 0.1864013671875, 0.19734954833984375, 0.2082977294921875, 0.21924591064453125, 0.230194091796875, 0.24114227294921875, 0.2520904541015625, 0.26303863525390625, 0.27398681640625, 0.28493499755859375, 0.2958831787109375, 0.30683135986328125, 0.317779541015625, 0.32872772216796875, 0.3396759033203125, 0.35062408447265625, 0.361572265625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 10.0, 22.0, 40.0, 204.0, 375.0, 227.0, 66.0, 19.0, 9.0, 13.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06549072265625, -0.06395387649536133, -0.062417030334472656, -0.060880184173583984, -0.05934333801269531, -0.05780649185180664, -0.05626964569091797, -0.0547327995300293, -0.053195953369140625, -0.05165910720825195, -0.05012226104736328, -0.04858541488647461, -0.04704856872558594, -0.045511722564697266, -0.043974876403808594, -0.04243803024291992, -0.04090118408203125, -0.03936433792114258, -0.037827491760253906, -0.036290645599365234, -0.03475379943847656, -0.03321695327758789, -0.03168010711669922, -0.030143260955810547, -0.028606414794921875, -0.027069568634033203, -0.02553272247314453, -0.02399587631225586, -0.022459030151367188, -0.020922183990478516, -0.019385337829589844, -0.017848491668701172, -0.0163116455078125, -0.014774799346923828, -0.013237953186035156, -0.011701107025146484, -0.010164260864257812, -0.00862741470336914, -0.007090568542480469, -0.005553722381591797, -0.004016876220703125, -0.002480030059814453, -0.0009431838989257812, 0.0005936622619628906, 0.0021305084228515625, 0.0036673545837402344, 0.005204200744628906, 0.006741046905517578, 0.00827789306640625, 0.009814739227294922, 0.011351585388183594, 0.012888431549072266, 0.014425277709960938, 0.01596212387084961, 0.01749897003173828, 0.019035816192626953, 0.020572662353515625, 0.022109508514404297, 0.02364635467529297, 0.02518320083618164, 0.026720046997070312, 0.028256893157958984, 0.029793739318847656, 0.03133058547973633, 0.032867431640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 5.0, 5.0, 7.0, 11.0, 14.0, 12.0, 23.0, 28.0, 31.0, 44.0, 57.0, 95.0, 135.0, 259.0, 427.0, 947.0, 3402.0, 29165.0, 759658.0, 238073.0, 12474.0, 1949.0, 741.0, 342.0, 213.0, 115.0, 93.0, 51.0, 40.0, 28.0, 20.0, 17.0, 14.0, 12.0, 11.0, 9.0, 10.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2294921875, -0.22270965576171875, -0.2159271240234375, -0.20914459228515625, -0.202362060546875, -0.19557952880859375, -0.1887969970703125, -0.18201446533203125, -0.17523193359375, -0.16844940185546875, -0.1616668701171875, -0.15488433837890625, -0.148101806640625, -0.14131927490234375, -0.1345367431640625, -0.12775421142578125, -0.1209716796875, -0.11418914794921875, -0.1074066162109375, -0.10062408447265625, -0.093841552734375, -0.08705902099609375, -0.0802764892578125, -0.07349395751953125, -0.06671142578125, -0.05992889404296875, -0.0531463623046875, -0.04636383056640625, -0.039581298828125, -0.03279876708984375, -0.0260162353515625, -0.01923370361328125, -0.012451171875, -0.00566864013671875, 0.0011138916015625, 0.00789642333984375, 0.014678955078125, 0.02146148681640625, 0.0282440185546875, 0.03502655029296875, 0.04180908203125, 0.04859161376953125, 0.0553741455078125, 0.06215667724609375, 0.068939208984375, 0.07572174072265625, 0.0825042724609375, 0.08928680419921875, 0.0960693359375, 0.10285186767578125, 0.1096343994140625, 0.11641693115234375, 0.123199462890625, 0.12998199462890625, 0.1367645263671875, 0.14354705810546875, 0.15032958984375, 0.15711212158203125, 0.1638946533203125, 0.17067718505859375, 0.177459716796875, 0.18424224853515625, 0.1910247802734375, 0.19780731201171875, 0.20458984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 8.0, 12.0, 7.0, 11.0, 16.0, 14.0, 16.0, 28.0, 23.0, 23.0, 38.0, 39.0, 37.0, 36.0, 45.0, 45.0, 46.0, 47.0, 45.0, 52.0, 50.0, 46.0, 37.0, 28.0, 32.0, 32.0, 32.0, 31.0, 20.0, 19.0, 19.0, 13.0, 14.0, 8.0, 9.0, 3.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0670166015625, -0.06479549407958984, -0.06257438659667969, -0.06035327911376953, -0.058132171630859375, -0.05591106414794922, -0.05368995666503906, -0.051468849182128906, -0.04924774169921875, -0.047026634216308594, -0.04480552673339844, -0.04258441925048828, -0.040363311767578125, -0.03814220428466797, -0.03592109680175781, -0.033699989318847656, -0.0314788818359375, -0.029257774353027344, -0.027036666870117188, -0.02481555938720703, -0.022594451904296875, -0.02037334442138672, -0.018152236938476562, -0.015931129455566406, -0.01371002197265625, -0.011488914489746094, -0.009267807006835938, -0.007046699523925781, -0.004825592041015625, -0.0026044845581054688, -0.0003833770751953125, 0.0018377304077148438, 0.004058837890625, 0.006279945373535156, 0.008501052856445312, 0.010722160339355469, 0.012943267822265625, 0.015164375305175781, 0.017385482788085938, 0.019606590270996094, 0.02182769775390625, 0.024048805236816406, 0.026269912719726562, 0.02849102020263672, 0.030712127685546875, 0.03293323516845703, 0.03515434265136719, 0.037375450134277344, 0.0395965576171875, 0.041817665100097656, 0.04403877258300781, 0.04625988006591797, 0.048480987548828125, 0.05070209503173828, 0.05292320251464844, 0.055144309997558594, 0.05736541748046875, 0.059586524963378906, 0.06180763244628906, 0.06402873992919922, 0.06624984741210938, 0.06847095489501953, 0.07069206237792969, 0.07291316986083984, 0.07513427734375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 14.0, 19.0, 33.0, 51.0, 118.0, 278.0, 949.0, 6723.0, 869387.0, 166310.0, 3577.0, 656.0, 196.0, 88.0, 51.0, 24.0, 15.0, 18.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0670166015625, -0.06497764587402344, -0.06293869018554688, -0.06089973449707031, -0.05886077880859375, -0.05682182312011719, -0.054782867431640625, -0.05274391174316406, -0.0507049560546875, -0.04866600036621094, -0.046627044677734375, -0.04458808898925781, -0.04254913330078125, -0.04051017761230469, -0.038471221923828125, -0.03643226623535156, -0.034393310546875, -0.03235435485839844, -0.030315399169921875, -0.028276443481445312, -0.02623748779296875, -0.024198532104492188, -0.022159576416015625, -0.020120620727539062, -0.0180816650390625, -0.016042709350585938, -0.014003753662109375, -0.011964797973632812, -0.00992584228515625, -0.007886886596679688, -0.005847930908203125, -0.0038089752197265625, -0.00177001953125, 0.0002689361572265625, 0.002307891845703125, 0.0043468475341796875, 0.00638580322265625, 0.008424758911132812, 0.010463714599609375, 0.012502670288085938, 0.0145416259765625, 0.016580581665039062, 0.018619537353515625, 0.020658493041992188, 0.02269744873046875, 0.024736404418945312, 0.026775360107421875, 0.028814315795898438, 0.030853271484375, 0.03289222717285156, 0.034931182861328125, 0.03697013854980469, 0.03900909423828125, 0.04104804992675781, 0.043087005615234375, 0.04512596130371094, 0.0471649169921875, 0.04920387268066406, 0.051242828369140625, 0.05328178405761719, 0.05532073974609375, 0.05735969543457031, 0.059398651123046875, 0.06143760681152344, 0.0634765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 11.0, 21.0, 25.0, 50.0, 66.0, 90.0, 121.0, 148.0, 111.0, 111.0, 74.0, 49.0, 39.0, 25.0, 15.0, 9.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.238719940185547e-06, -8.926726877689362e-06, -8.614733815193176e-06, -8.302740752696991e-06, -7.990747690200806e-06, -7.67875462770462e-06, -7.366761565208435e-06, -7.05476850271225e-06, -6.7427754402160645e-06, -6.430782377719879e-06, -6.118789315223694e-06, -5.8067962527275085e-06, -5.494803190231323e-06, -5.182810127735138e-06, -4.870817065238953e-06, -4.558824002742767e-06, -4.246830940246582e-06, -3.934837877750397e-06, -3.6228448152542114e-06, -3.310851752758026e-06, -2.998858690261841e-06, -2.6868656277656555e-06, -2.3748725652694702e-06, -2.062879502773285e-06, -1.7508864402770996e-06, -1.4388933777809143e-06, -1.126900315284729e-06, -8.149072527885437e-07, -5.029141902923584e-07, -1.909211277961731e-07, 1.210719347000122e-07, 4.330649971961975e-07, 7.450580596923828e-07, 1.0570511221885681e-06, 1.3690441846847534e-06, 1.6810372471809387e-06, 1.993030309677124e-06, 2.3050233721733093e-06, 2.6170164346694946e-06, 2.92900949716568e-06, 3.2410025596618652e-06, 3.5529956221580505e-06, 3.864988684654236e-06, 4.176981747150421e-06, 4.4889748096466064e-06, 4.800967872142792e-06, 5.112960934638977e-06, 5.424953997135162e-06, 5.736947059631348e-06, 6.048940122127533e-06, 6.360933184623718e-06, 6.6729262471199036e-06, 6.984919309616089e-06, 7.296912372112274e-06, 7.6089054346084595e-06, 7.920898497104645e-06, 8.23289155960083e-06, 8.544884622097015e-06, 8.8568776845932e-06, 9.168870747089386e-06, 9.480863809585571e-06, 9.792856872081757e-06, 1.0104849934577942e-05, 1.0416842997074127e-05, 1.0728836059570312e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 1.0, 0.0, 6.0, 3.0, 9.0, 9.0, 10.0, 18.0, 26.0, 28.0, 62.0, 91.0, 166.0, 346.0, 961.0, 4545.0, 67351.0, 946744.0, 23895.0, 2911.0, 722.0, 266.0, 126.0, 81.0, 51.0, 35.0, 28.0, 14.0, 15.0, 7.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.052520751953125, -0.05084562301635742, -0.049170494079589844, -0.047495365142822266, -0.04582023620605469, -0.04414510726928711, -0.04246997833251953, -0.04079484939575195, -0.039119720458984375, -0.0374445915222168, -0.03576946258544922, -0.03409433364868164, -0.03241920471191406, -0.030744075775146484, -0.029068946838378906, -0.027393817901611328, -0.02571868896484375, -0.024043560028076172, -0.022368431091308594, -0.020693302154541016, -0.019018173217773438, -0.01734304428100586, -0.01566791534423828, -0.013992786407470703, -0.012317657470703125, -0.010642528533935547, -0.008967399597167969, -0.007292270660400391, -0.0056171417236328125, -0.003942012786865234, -0.0022668838500976562, -0.0005917549133300781, 0.0010833740234375, 0.002758502960205078, 0.004433631896972656, 0.006108760833740234, 0.0077838897705078125, 0.00945901870727539, 0.011134147644042969, 0.012809276580810547, 0.014484405517578125, 0.016159534454345703, 0.01783466339111328, 0.01950979232788086, 0.021184921264648438, 0.022860050201416016, 0.024535179138183594, 0.026210308074951172, 0.02788543701171875, 0.029560565948486328, 0.031235694885253906, 0.032910823822021484, 0.03458595275878906, 0.03626108169555664, 0.03793621063232422, 0.0396113395690918, 0.041286468505859375, 0.04296159744262695, 0.04463672637939453, 0.04631185531616211, 0.04798698425292969, 0.049662113189697266, 0.051337242126464844, 0.05301237106323242, 0.0546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 8.0, 13.0, 11.0, 15.0, 25.0, 31.0, 34.0, 47.0, 82.0, 77.0, 97.0, 97.0, 101.0, 60.0, 76.0, 60.0, 38.0, 23.0, 21.0, 13.0, 10.0, 11.0, 4.0, 10.0, 3.0, 2.0, 5.0, 1.0, 1.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.017669677734375, -0.017124652862548828, -0.016579627990722656, -0.016034603118896484, -0.015489578247070312, -0.01494455337524414, -0.014399528503417969, -0.013854503631591797, -0.013309478759765625, -0.012764453887939453, -0.012219429016113281, -0.01167440414428711, -0.011129379272460938, -0.010584354400634766, -0.010039329528808594, -0.009494304656982422, -0.00894927978515625, -0.008404254913330078, -0.007859230041503906, -0.007314205169677734, -0.0067691802978515625, -0.006224155426025391, -0.005679130554199219, -0.005134105682373047, -0.004589080810546875, -0.004044055938720703, -0.0034990310668945312, -0.0029540061950683594, -0.0024089813232421875, -0.0018639564514160156, -0.0013189315795898438, -0.0007739067077636719, -0.0002288818359375, 0.0003161430358886719, 0.0008611679077148438, 0.0014061927795410156, 0.0019512176513671875, 0.0024962425231933594, 0.0030412673950195312, 0.003586292266845703, 0.004131317138671875, 0.004676342010498047, 0.005221366882324219, 0.005766391754150391, 0.0063114166259765625, 0.006856441497802734, 0.007401466369628906, 0.007946491241455078, 0.00849151611328125, 0.009036540985107422, 0.009581565856933594, 0.010126590728759766, 0.010671615600585938, 0.01121664047241211, 0.011761665344238281, 0.012306690216064453, 0.012851715087890625, 0.013396739959716797, 0.013941764831542969, 0.01448678970336914, 0.015031814575195312, 0.015576839447021484, 0.016121864318847656, 0.016666889190673828, 0.0172119140625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 9.0, 19.0, 187.0, 740.0, 55.0, 6.0, 0.0, 2.0], "bins": [-4.710071563720703, -4.63070011138916, -4.551328659057617, -4.471957206726074, -4.392585754394531, -4.3132147789001465, -4.2338433265686035, -4.1544718742370605, -4.075100421905518, -3.9957289695739746, -3.9163575172424316, -3.8369863033294678, -3.757614850997925, -3.678243398666382, -3.598872184753418, -3.519500732421875, -3.440129280090332, -3.360757827758789, -3.281386375427246, -3.2020151615142822, -3.1226437091827393, -3.0432722568511963, -2.9639010429382324, -2.8845295906066895, -2.8051581382751465, -2.7257866859436035, -2.6464152336120605, -2.5670440196990967, -2.4876725673675537, -2.4083011150360107, -2.328929901123047, -2.249558448791504, -2.170186996459961, -2.090815544128418, -2.011444091796875, -1.9320728778839111, -1.8527014255523682, -1.7733299732208252, -1.6939586400985718, -1.6145873069763184, -1.5352157354354858, -1.4558444023132324, -1.3764729499816895, -1.2971014976501465, -1.217730164527893, -1.1383588314056396, -1.0589873790740967, -0.9796159863471985, -0.9002445936203003, -0.8208732008934021, -0.7415018081665039, -0.6621304154396057, -0.5827590227127075, -0.5033876299858093, -0.42401623725891113, -0.34464484453201294, -0.26527345180511475, -0.18590205907821655, -0.10653066635131836, -0.027159273624420166, 0.05221211910247803, 0.13158351182937622, 0.21095490455627441, 0.2903262972831726, 0.3696976900100708]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 8.0, 15.0, 12.0, 23.0, 20.0, 30.0, 27.0, 41.0, 35.0, 46.0, 48.0, 53.0, 76.0, 71.0, 60.0, 54.0, 58.0, 58.0, 47.0, 42.0, 34.0, 33.0, 28.0, 17.0, 15.0, 11.0, 11.0, 9.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5025835633277893, -0.484005868434906, -0.4654281735420227, -0.4468504786491394, -0.4282727837562561, -0.4096950888633728, -0.3911173939704895, -0.3725396990776062, -0.3539620041847229, -0.3353843092918396, -0.3168066143989563, -0.298228919506073, -0.2796512246131897, -0.2610735297203064, -0.2424958348274231, -0.2239181399345398, -0.2053404450416565, -0.1867627501487732, -0.1681850552558899, -0.1496073603630066, -0.1310296654701233, -0.11245197057723999, -0.09387427568435669, -0.07529658079147339, -0.05671888589859009, -0.03814119100570679, -0.019563496112823486, -0.0009858012199401855, 0.017591893672943115, 0.036169588565826416, 0.05474728345870972, 0.07332497835159302, 0.0919027328491211, 0.1104804277420044, 0.1290581226348877, 0.147635817527771, 0.1662135124206543, 0.1847912073135376, 0.2033689022064209, 0.2219465970993042, 0.2405242919921875, 0.2591019868850708, 0.2776796817779541, 0.2962573766708374, 0.3148350715637207, 0.333412766456604, 0.3519904613494873, 0.3705681562423706, 0.3891458511352539, 0.4077235460281372, 0.4263012409210205, 0.4448789358139038, 0.4634566307067871, 0.4820343255996704, 0.5006120204925537, 0.519189715385437, 0.5377674102783203, 0.5563451051712036, 0.5749228000640869, 0.5935004949569702, 0.6120781898498535, 0.6306558847427368, 0.6492335796356201, 0.6678112745285034, 0.6863889694213867]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 9.0, 12.0, 15.0, 35.0, 64.0, 134.0, 457.0, 4143.0, 4184657.0, 4071.0, 475.0, 129.0, 39.0, 13.0, 13.0, 7.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9248046875, -0.9040184020996094, -0.8832321166992188, -0.8624458312988281, -0.8416595458984375, -0.8208732604980469, -0.8000869750976562, -0.7793006896972656, -0.758514404296875, -0.7377281188964844, -0.7169418334960938, -0.6961555480957031, -0.6753692626953125, -0.6545829772949219, -0.6337966918945312, -0.6130104064941406, -0.59222412109375, -0.5714378356933594, -0.5506515502929688, -0.5298652648925781, -0.5090789794921875, -0.4882926940917969, -0.46750640869140625, -0.4467201232910156, -0.425933837890625, -0.4051475524902344, -0.38436126708984375, -0.3635749816894531, -0.3427886962890625, -0.3220024108886719, -0.30121612548828125, -0.2804298400878906, -0.2596435546875, -0.23885726928710938, -0.21807098388671875, -0.19728469848632812, -0.1764984130859375, -0.15571212768554688, -0.13492584228515625, -0.11413955688476562, -0.093353271484375, -0.07256698608398438, -0.05178070068359375, -0.030994415283203125, -0.0102081298828125, 0.010578155517578125, 0.03136444091796875, 0.052150726318359375, 0.07293701171875, 0.09372329711914062, 0.11450958251953125, 0.13529586791992188, 0.1560821533203125, 0.17686843872070312, 0.19765472412109375, 0.21844100952148438, 0.239227294921875, 0.2600135803222656, 0.28079986572265625, 0.3015861511230469, 0.3223724365234375, 0.3431587219238281, 0.36394500732421875, 0.3847312927246094, 0.405517578125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 13.0, 33.0, 107.0, 236.0, 299.0, 191.0, 64.0, 25.0, 10.0, 7.0, 5.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.069091796875, -0.06749773025512695, -0.0659036636352539, -0.06430959701538086, -0.06271553039550781, -0.061121463775634766, -0.05952739715576172, -0.05793333053588867, -0.056339263916015625, -0.05474519729614258, -0.05315113067626953, -0.051557064056396484, -0.04996299743652344, -0.04836893081665039, -0.046774864196777344, -0.0451807975769043, -0.04358673095703125, -0.0419926643371582, -0.040398597717285156, -0.03880453109741211, -0.03721046447753906, -0.035616397857666016, -0.03402233123779297, -0.03242826461791992, -0.030834197998046875, -0.029240131378173828, -0.02764606475830078, -0.026051998138427734, -0.024457931518554688, -0.02286386489868164, -0.021269798278808594, -0.019675731658935547, -0.0180816650390625, -0.016487598419189453, -0.014893531799316406, -0.01329946517944336, -0.011705398559570312, -0.010111331939697266, -0.008517265319824219, -0.006923198699951172, -0.005329132080078125, -0.003735065460205078, -0.0021409988403320312, -0.0005469322204589844, 0.0010471343994140625, 0.0026412010192871094, 0.004235267639160156, 0.005829334259033203, 0.00742340087890625, 0.009017467498779297, 0.010611534118652344, 0.01220560073852539, 0.013799667358398438, 0.015393733978271484, 0.01698780059814453, 0.018581867218017578, 0.020175933837890625, 0.021770000457763672, 0.02336406707763672, 0.024958133697509766, 0.026552200317382812, 0.02814626693725586, 0.029740333557128906, 0.03133440017700195, 0.032928466796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 11.0, 17.0, 10.0, 38.0, 54.0, 105.0, 249.0, 633.0, 1805.0, 6439.0, 49280.0, 4082744.0, 44453.0, 5811.0, 1478.0, 533.0, 276.0, 133.0, 79.0, 40.0, 21.0, 14.0, 13.0, 16.0, 4.0, 6.0, 0.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.197021484375, -0.19190216064453125, -0.1867828369140625, -0.18166351318359375, -0.176544189453125, -0.17142486572265625, -0.1663055419921875, -0.16118621826171875, -0.15606689453125, -0.15094757080078125, -0.1458282470703125, -0.14070892333984375, -0.135589599609375, -0.13047027587890625, -0.1253509521484375, -0.12023162841796875, -0.1151123046875, -0.10999298095703125, -0.1048736572265625, -0.09975433349609375, -0.094635009765625, -0.08951568603515625, -0.0843963623046875, -0.07927703857421875, -0.07415771484375, -0.06903839111328125, -0.0639190673828125, -0.05879974365234375, -0.053680419921875, -0.04856109619140625, -0.0434417724609375, -0.03832244873046875, -0.033203125, -0.02808380126953125, -0.0229644775390625, -0.01784515380859375, -0.012725830078125, -0.00760650634765625, -0.0024871826171875, 0.00263214111328125, 0.00775146484375, 0.01287078857421875, 0.0179901123046875, 0.02310943603515625, 0.028228759765625, 0.03334808349609375, 0.0384674072265625, 0.04358673095703125, 0.0487060546875, 0.05382537841796875, 0.0589447021484375, 0.06406402587890625, 0.069183349609375, 0.07430267333984375, 0.0794219970703125, 0.08454132080078125, 0.08966064453125, 0.09477996826171875, 0.0998992919921875, 0.10501861572265625, 0.110137939453125, 0.11525726318359375, 0.1203765869140625, 0.12549591064453125, 0.130615234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 9.0, 4.0, 3.0, 6.0, 3.0, 13.0, 13.0, 23.0, 22.0, 43.0, 78.0, 199.0, 2912.0, 458.0, 116.0, 59.0, 30.0, 24.0, 14.0, 11.0, 5.0, 9.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0278778076171875, -0.0267946720123291, -0.025711536407470703, -0.024628400802612305, -0.023545265197753906, -0.022462129592895508, -0.02137899398803711, -0.02029585838317871, -0.019212722778320312, -0.018129587173461914, -0.017046451568603516, -0.015963315963745117, -0.014880180358886719, -0.01379704475402832, -0.012713909149169922, -0.011630773544311523, -0.010547637939453125, -0.009464502334594727, -0.008381366729736328, -0.00729823112487793, -0.006215095520019531, -0.005131959915161133, -0.004048824310302734, -0.002965688705444336, -0.0018825531005859375, -0.0007994174957275391, 0.0002837181091308594, 0.0013668537139892578, 0.0024499893188476562, 0.0035331249237060547, 0.004616260528564453, 0.0056993961334228516, 0.00678253173828125, 0.007865667343139648, 0.008948802947998047, 0.010031938552856445, 0.011115074157714844, 0.012198209762573242, 0.01328134536743164, 0.014364480972290039, 0.015447616577148438, 0.016530752182006836, 0.017613887786865234, 0.018697023391723633, 0.01978015899658203, 0.02086329460144043, 0.021946430206298828, 0.023029565811157227, 0.024112701416015625, 0.025195837020874023, 0.026278972625732422, 0.02736210823059082, 0.02844524383544922, 0.029528379440307617, 0.030611515045166016, 0.031694650650024414, 0.03277778625488281, 0.03386092185974121, 0.03494405746459961, 0.03602719306945801, 0.037110328674316406, 0.038193464279174805, 0.0392765998840332, 0.0403597354888916, 0.04144287109375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 27.0, 131.0, 656.0, 168.0, 18.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10392990708351135, -0.09312894940376282, -0.08232798427343369, -0.07152701914310455, -0.06072606146335602, -0.049925100058317184, -0.03912413865327835, -0.02832317352294922, -0.017522215843200684, -0.00672125443816185, 0.004079706966876984, 0.014880668371915817, 0.02568162977695465, 0.036482591181993484, 0.04728355258703232, 0.05808451771736145, 0.06888547539710999, 0.07968643307685852, 0.09048739820718765, 0.10128836333751678, 0.11208932101726532, 0.12289027869701385, 0.13369125127792358, 0.14449220895767212, 0.15529316663742065, 0.1660941243171692, 0.17689508199691772, 0.18769605457782745, 0.198497012257576, 0.20929796993732452, 0.22009894251823425, 0.2308999001979828, 0.2417008876800537, 0.25250184535980225, 0.2633028030395508, 0.2741037607192993, 0.28490471839904785, 0.2957057058811188, 0.3065066635608673, 0.31730762124061584, 0.3281085789203644, 0.3389095366001129, 0.34971049427986145, 0.36051145195961, 0.3713124394416809, 0.38211339712142944, 0.392914354801178, 0.4037153124809265, 0.41451627016067505, 0.4253172278404236, 0.4361181855201721, 0.44691914319992065, 0.4577201008796692, 0.4685210883617401, 0.47932204604148865, 0.4901230037212372, 0.5009239912033081, 0.5117249488830566, 0.5225259065628052, 0.5333268642425537, 0.5441278219223022, 0.5549287796020508, 0.5657297372817993, 0.5765306949615479, 0.5873316526412964]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 2.0, 10.0, 12.0, 21.0, 24.0, 28.0, 38.0, 59.0, 53.0, 59.0, 72.0, 87.0, 82.0, 78.0, 68.0, 69.0, 56.0, 50.0, 40.0, 31.0, 24.0, 12.0, 13.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09586948156356812, -0.0916474238038063, -0.0874253660440445, -0.08320330828428268, -0.07898125052452087, -0.07475919276475906, -0.07053713500499725, -0.06631507724523544, -0.06209301948547363, -0.05787096172571182, -0.05364890396595001, -0.0494268462061882, -0.04520478844642639, -0.04098273068666458, -0.03676067292690277, -0.03253861516714096, -0.02831655740737915, -0.02409449964761734, -0.01987244188785553, -0.01565038412809372, -0.01142832636833191, -0.007206268608570099, -0.0029842108488082886, 0.0012378469109535217, 0.005459904670715332, 0.009681962430477142, 0.013904020190238953, 0.018126077950000763, 0.022348135709762573, 0.026570193469524384, 0.030792251229286194, 0.035014308989048004, 0.039236366748809814, 0.043458424508571625, 0.047680482268333435, 0.051902540028095245, 0.056124597787857056, 0.060346655547618866, 0.06456871330738068, 0.06879077106714249, 0.0730128288269043, 0.07723488658666611, 0.08145694434642792, 0.08567900210618973, 0.08990105986595154, 0.09412311762571335, 0.09834517538547516, 0.10256723314523697, 0.10678929090499878, 0.11101134866476059, 0.1152334064245224, 0.11945546418428421, 0.12367752194404602, 0.12789958715438843, 0.13212163746356964, 0.13634368777275085, 0.14056575298309326, 0.14478781819343567, 0.14900986850261688, 0.1532319188117981, 0.1574539840221405, 0.1616760492324829, 0.16589809954166412, 0.17012014985084534, 0.17434221506118774]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 3.0, 1.0, 5.0, 6.0, 3.0, 16.0, 6.0, 14.0, 9.0, 15.0, 31.0, 41.0, 65.0, 94.0, 122.0, 197.0, 326.0, 626.0, 1236.0, 2975.0, 12965.0, 422508.0, 586310.0, 14930.0, 3179.0, 1298.0, 614.0, 319.0, 201.0, 131.0, 70.0, 61.0, 37.0, 36.0, 20.0, 17.0, 15.0, 13.0, 9.0, 9.0, 7.0, 3.0, 8.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.182861328125, -0.1771526336669922, -0.17144393920898438, -0.16573524475097656, -0.16002655029296875, -0.15431785583496094, -0.14860916137695312, -0.1429004669189453, -0.1371917724609375, -0.1314830780029297, -0.12577438354492188, -0.12006568908691406, -0.11435699462890625, -0.10864830017089844, -0.10293960571289062, -0.09723091125488281, -0.091522216796875, -0.08581352233886719, -0.08010482788085938, -0.07439613342285156, -0.06868743896484375, -0.06297874450683594, -0.057270050048828125, -0.05156135559082031, -0.0458526611328125, -0.04014396667480469, -0.034435272216796875, -0.028726577758789062, -0.02301788330078125, -0.017309188842773438, -0.011600494384765625, -0.0058917999267578125, -0.00018310546875, 0.0055255889892578125, 0.011234283447265625, 0.016942977905273438, 0.02265167236328125, 0.028360366821289062, 0.034069061279296875, 0.03977775573730469, 0.0454864501953125, 0.05119514465332031, 0.056903839111328125, 0.06261253356933594, 0.06832122802734375, 0.07402992248535156, 0.07973861694335938, 0.08544731140136719, 0.091156005859375, 0.09686470031738281, 0.10257339477539062, 0.10828208923339844, 0.11399078369140625, 0.11969947814941406, 0.12540817260742188, 0.1311168670654297, 0.1368255615234375, 0.1425342559814453, 0.14824295043945312, 0.15395164489746094, 0.15966033935546875, 0.16536903381347656, 0.17107772827148438, 0.1767864227294922, 0.1824951171875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 10.0, 8.0, 43.0, 114.0, 246.0, 305.0, 167.0, 58.0, 24.0, 10.0, 4.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.06610107421875, -0.06457233428955078, -0.06304359436035156, -0.061514854431152344, -0.059986114501953125, -0.058457374572753906, -0.05692863464355469, -0.05539989471435547, -0.05387115478515625, -0.05234241485595703, -0.05081367492675781, -0.049284934997558594, -0.047756195068359375, -0.046227455139160156, -0.04469871520996094, -0.04316997528076172, -0.0416412353515625, -0.04011249542236328, -0.03858375549316406, -0.037055015563964844, -0.035526275634765625, -0.033997535705566406, -0.03246879577636719, -0.03094005584716797, -0.02941131591796875, -0.02788257598876953, -0.026353836059570312, -0.024825096130371094, -0.023296356201171875, -0.021767616271972656, -0.020238876342773438, -0.01871013641357422, -0.017181396484375, -0.01565265655517578, -0.014123916625976562, -0.012595176696777344, -0.011066436767578125, -0.009537696838378906, -0.008008956909179688, -0.006480216979980469, -0.00495147705078125, -0.0034227371215820312, -0.0018939971923828125, -0.00036525726318359375, 0.001163482666015625, 0.0026922225952148438, 0.0042209625244140625, 0.005749702453613281, 0.0072784423828125, 0.008807182312011719, 0.010335922241210938, 0.011864662170410156, 0.013393402099609375, 0.014922142028808594, 0.016450881958007812, 0.01797962188720703, 0.01950836181640625, 0.02103710174560547, 0.022565841674804688, 0.024094581604003906, 0.025623321533203125, 0.027152061462402344, 0.028680801391601562, 0.03020954132080078, 0.03173828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 12.0, 12.0, 9.0, 17.0, 13.0, 20.0, 27.0, 39.0, 54.0, 68.0, 108.0, 167.0, 326.0, 669.0, 1894.0, 8193.0, 64663.0, 804528.0, 148602.0, 14308.0, 2851.0, 887.0, 418.0, 246.0, 130.0, 65.0, 51.0, 44.0, 19.0, 16.0, 11.0, 15.0, 6.0, 5.0, 6.0, 9.0, 8.0, 5.0, 8.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.1458740234375, -0.1416645050048828, -0.13745498657226562, -0.13324546813964844, -0.12903594970703125, -0.12482643127441406, -0.12061691284179688, -0.11640739440917969, -0.1121978759765625, -0.10798835754394531, -0.10377883911132812, -0.09956932067871094, -0.09535980224609375, -0.09115028381347656, -0.08694076538085938, -0.08273124694824219, -0.078521728515625, -0.07431221008300781, -0.07010269165039062, -0.06589317321777344, -0.06168365478515625, -0.05747413635253906, -0.053264617919921875, -0.04905509948730469, -0.0448455810546875, -0.04063606262207031, -0.036426544189453125, -0.03221702575683594, -0.02800750732421875, -0.023797988891601562, -0.019588470458984375, -0.015378952026367188, -0.01116943359375, -0.0069599151611328125, -0.002750396728515625, 0.0014591217041015625, 0.00566864013671875, 0.009878158569335938, 0.014087677001953125, 0.018297195434570312, 0.0225067138671875, 0.026716232299804688, 0.030925750732421875, 0.03513526916503906, 0.03934478759765625, 0.04355430603027344, 0.047763824462890625, 0.05197334289550781, 0.056182861328125, 0.06039237976074219, 0.06460189819335938, 0.06881141662597656, 0.07302093505859375, 0.07723045349121094, 0.08143997192382812, 0.08564949035644531, 0.0898590087890625, 0.09406852722167969, 0.09827804565429688, 0.10248756408691406, 0.10669708251953125, 0.11090660095214844, 0.11511611938476562, 0.11932563781738281, 0.12353515625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 7.0, 5.0, 7.0, 10.0, 6.0, 6.0, 5.0, 8.0, 17.0, 7.0, 16.0, 22.0, 28.0, 35.0, 15.0, 31.0, 42.0, 36.0, 51.0, 53.0, 48.0, 44.0, 52.0, 41.0, 41.0, 48.0, 30.0, 25.0, 29.0, 28.0, 35.0, 30.0, 24.0, 21.0, 20.0, 14.0, 16.0, 11.0, 10.0, 9.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056427001953125, -0.0544896125793457, -0.052552223205566406, -0.05061483383178711, -0.04867744445800781, -0.046740055084228516, -0.04480266571044922, -0.04286527633666992, -0.040927886962890625, -0.03899049758911133, -0.03705310821533203, -0.035115718841552734, -0.03317832946777344, -0.03124094009399414, -0.029303550720214844, -0.027366161346435547, -0.02542877197265625, -0.023491382598876953, -0.021553993225097656, -0.01961660385131836, -0.017679214477539062, -0.015741825103759766, -0.013804435729980469, -0.011867046356201172, -0.009929656982421875, -0.007992267608642578, -0.006054878234863281, -0.004117488861083984, -0.0021800994873046875, -0.00024271011352539062, 0.0016946792602539062, 0.003632068634033203, 0.0055694580078125, 0.007506847381591797, 0.009444236755371094, 0.01138162612915039, 0.013319015502929688, 0.015256404876708984, 0.01719379425048828, 0.019131183624267578, 0.021068572998046875, 0.023005962371826172, 0.02494335174560547, 0.026880741119384766, 0.028818130493164062, 0.03075551986694336, 0.032692909240722656, 0.03463029861450195, 0.03656768798828125, 0.03850507736206055, 0.040442466735839844, 0.04237985610961914, 0.04431724548339844, 0.046254634857177734, 0.04819202423095703, 0.05012941360473633, 0.052066802978515625, 0.05400419235229492, 0.05594158172607422, 0.057878971099853516, 0.05981636047363281, 0.06175374984741211, 0.0636911392211914, 0.0656285285949707, 0.06756591796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 6.0, 6.0, 9.0, 6.0, 15.0, 16.0, 20.0, 40.0, 40.0, 77.0, 101.0, 153.0, 282.0, 407.0, 695.0, 1397.0, 3081.0, 8693.0, 35645.0, 346716.0, 575894.0, 56107.0, 11538.0, 3806.0, 1616.0, 818.0, 483.0, 297.0, 172.0, 113.0, 80.0, 52.0, 33.0, 28.0, 24.0, 17.0, 11.0, 15.0, 9.0, 3.0, 7.0, 7.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01100921630859375, -0.01060330867767334, -0.01019740104675293, -0.00979149341583252, -0.00938558578491211, -0.0089796781539917, -0.008573770523071289, -0.008167862892150879, -0.007761955261230469, -0.007356047630310059, -0.0069501399993896484, -0.006544232368469238, -0.006138324737548828, -0.005732417106628418, -0.005326509475708008, -0.004920601844787598, -0.0045146942138671875, -0.004108786582946777, -0.003702878952026367, -0.003296971321105957, -0.002891063690185547, -0.0024851560592651367, -0.0020792484283447266, -0.0016733407974243164, -0.0012674331665039062, -0.0008615255355834961, -0.00045561790466308594, -4.971027374267578e-05, 0.0003561973571777344, 0.0007621049880981445, 0.0011680126190185547, 0.0015739202499389648, 0.001979827880859375, 0.002385735511779785, 0.0027916431427001953, 0.0031975507736206055, 0.0036034584045410156, 0.004009366035461426, 0.004415273666381836, 0.004821181297302246, 0.005227088928222656, 0.005632996559143066, 0.0060389041900634766, 0.006444811820983887, 0.006850719451904297, 0.007256627082824707, 0.007662534713745117, 0.008068442344665527, 0.008474349975585938, 0.008880257606506348, 0.009286165237426758, 0.009692072868347168, 0.010097980499267578, 0.010503888130187988, 0.010909795761108398, 0.011315703392028809, 0.011721611022949219, 0.012127518653869629, 0.012533426284790039, 0.01293933391571045, 0.01334524154663086, 0.01375114917755127, 0.01415705680847168, 0.01456296443939209, 0.0149688720703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 5.0, 11.0, 22.0, 15.0, 25.0, 43.0, 36.0, 62.0, 98.0, 96.0, 108.0, 78.0, 109.0, 74.0, 53.0, 48.0, 19.0, 26.0, 18.0, 5.0, 6.0, 4.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.225440979003906e-06, -7.95070081949234e-06, -7.675960659980774e-06, -7.401220500469208e-06, -7.126480340957642e-06, -6.8517401814460754e-06, -6.577000021934509e-06, -6.302259862422943e-06, -6.027519702911377e-06, -5.752779543399811e-06, -5.478039383888245e-06, -5.2032992243766785e-06, -4.928559064865112e-06, -4.653818905353546e-06, -4.37907874584198e-06, -4.104338586330414e-06, -3.829598426818848e-06, -3.5548582673072815e-06, -3.2801181077957153e-06, -3.005377948284149e-06, -2.730637788772583e-06, -2.455897629261017e-06, -2.1811574697494507e-06, -1.9064173102378845e-06, -1.6316771507263184e-06, -1.3569369912147522e-06, -1.082196831703186e-06, -8.074566721916199e-07, -5.327165126800537e-07, -2.5797635316848755e-07, 1.6763806343078613e-08, 2.915039658546448e-07, 5.662441253662109e-07, 8.409842848777771e-07, 1.1157244443893433e-06, 1.3904646039009094e-06, 1.6652047634124756e-06, 1.9399449229240417e-06, 2.214685082435608e-06, 2.489425241947174e-06, 2.7641654014587402e-06, 3.0389055609703064e-06, 3.3136457204818726e-06, 3.5883858799934387e-06, 3.863126039505005e-06, 4.137866199016571e-06, 4.412606358528137e-06, 4.687346518039703e-06, 4.9620866775512695e-06, 5.236826837062836e-06, 5.511566996574402e-06, 5.786307156085968e-06, 6.061047315597534e-06, 6.3357874751091e-06, 6.6105276346206665e-06, 6.885267794132233e-06, 7.160007953643799e-06, 7.434748113155365e-06, 7.709488272666931e-06, 7.984228432178497e-06, 8.258968591690063e-06, 8.53370875120163e-06, 8.808448910713196e-06, 9.083189070224762e-06, 9.357929229736328e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 10.0, 8.0, 11.0, 20.0, 33.0, 47.0, 93.0, 166.0, 455.0, 1603.0, 13613.0, 895335.0, 131307.0, 4427.0, 872.0, 280.0, 123.0, 60.0, 34.0, 17.0, 16.0, 8.0, 6.0, 1.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033172607421875, -0.031978607177734375, -0.03078460693359375, -0.029590606689453125, -0.0283966064453125, -0.027202606201171875, -0.02600860595703125, -0.024814605712890625, -0.02362060546875, -0.022426605224609375, -0.02123260498046875, -0.020038604736328125, -0.0188446044921875, -0.017650604248046875, -0.01645660400390625, -0.015262603759765625, -0.014068603515625, -0.012874603271484375, -0.01168060302734375, -0.010486602783203125, -0.0092926025390625, -0.008098602294921875, -0.00690460205078125, -0.005710601806640625, -0.0045166015625, -0.003322601318359375, -0.00212860107421875, -0.000934600830078125, 0.0002593994140625, 0.001453399658203125, 0.00264739990234375, 0.003841400146484375, 0.005035400390625, 0.006229400634765625, 0.00742340087890625, 0.008617401123046875, 0.0098114013671875, 0.011005401611328125, 0.01219940185546875, 0.013393402099609375, 0.01458740234375, 0.015781402587890625, 0.01697540283203125, 0.018169403076171875, 0.0193634033203125, 0.020557403564453125, 0.02175140380859375, 0.022945404052734375, 0.024139404296875, 0.025333404541015625, 0.02652740478515625, 0.027721405029296875, 0.0289154052734375, 0.030109405517578125, 0.03130340576171875, 0.032497406005859375, 0.03369140625, 0.034885406494140625, 0.03607940673828125, 0.037273406982421875, 0.0384674072265625, 0.039661407470703125, 0.04085540771484375, 0.042049407958984375, 0.043243408203125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 6.0, 5.0, 11.0, 10.0, 17.0, 24.0, 38.0, 62.0, 74.0, 106.0, 105.0, 108.0, 121.0, 82.0, 68.0, 42.0, 42.0, 22.0, 21.0, 9.0, 9.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0208740234375, -0.020327329635620117, -0.019780635833740234, -0.01923394203186035, -0.01868724822998047, -0.018140554428100586, -0.017593860626220703, -0.01704716682434082, -0.016500473022460938, -0.015953779220581055, -0.015407085418701172, -0.014860391616821289, -0.014313697814941406, -0.013767004013061523, -0.01322031021118164, -0.012673616409301758, -0.012126922607421875, -0.011580228805541992, -0.01103353500366211, -0.010486841201782227, -0.009940147399902344, -0.009393453598022461, -0.008846759796142578, -0.008300065994262695, -0.0077533721923828125, -0.00720667839050293, -0.006659984588623047, -0.006113290786743164, -0.005566596984863281, -0.0050199031829833984, -0.004473209381103516, -0.003926515579223633, -0.00337982177734375, -0.002833127975463867, -0.0022864341735839844, -0.0017397403717041016, -0.0011930465698242188, -0.0006463527679443359, -9.965896606445312e-05, 0.0004470348358154297, 0.0009937286376953125, 0.0015404224395751953, 0.002087116241455078, 0.002633810043334961, 0.0031805038452148438, 0.0037271976470947266, 0.004273891448974609, 0.004820585250854492, 0.005367279052734375, 0.005913972854614258, 0.006460666656494141, 0.0070073604583740234, 0.007554054260253906, 0.008100748062133789, 0.008647441864013672, 0.009194135665893555, 0.009740829467773438, 0.01028752326965332, 0.010834217071533203, 0.011380910873413086, 0.011927604675292969, 0.012474298477172852, 0.013020992279052734, 0.013567686080932617, 0.0141143798828125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 24.0, 68.0, 145.0, 437.0, 219.0, 60.0, 25.0, 12.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0], "bins": [-1.2920843362808228, -1.2675726413726807, -1.2430609464645386, -1.2185492515563965, -1.1940375566482544, -1.1695258617401123, -1.1450140476226807, -1.1205024719238281, -1.0959906578063965, -1.0714789628982544, -1.0469672679901123, -1.0224555730819702, -0.9979438185691833, -0.9734321236610413, -0.9489204287528992, -0.9244087338447571, -0.8998970985412598, -0.8753854036331177, -0.8508737087249756, -0.8263620138168335, -0.8018502593040466, -0.7773385643959045, -0.7528268694877625, -0.7283151745796204, -0.7038034200668335, -0.6792917251586914, -0.6547800302505493, -0.6302683353424072, -0.6057565808296204, -0.5812448859214783, -0.5567331910133362, -0.5322214961051941, -0.507709801197052, -0.4831981062889099, -0.45868638157844543, -0.43417468667030334, -0.40966299176216125, -0.3851512670516968, -0.3606395721435547, -0.3361278772354126, -0.3116161823272705, -0.2871044874191284, -0.26259276270866394, -0.23808106780052185, -0.21356937289237976, -0.18905766308307648, -0.1645459532737732, -0.1400342583656311, -0.11552253365516663, -0.09101083129644394, -0.06649912893772125, -0.04198741912841797, -0.017475716769695282, 0.007035985589027405, 0.03154769539833069, 0.05605939030647278, 0.08057110011577606, 0.10508280247449875, 0.12959450483322144, 0.15410621464252472, 0.178617924451828, 0.2031296193599701, 0.22764132916927338, 0.25215303897857666, 0.27666473388671875]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 5.0, 13.0, 10.0, 16.0, 14.0, 22.0, 39.0, 40.0, 55.0, 32.0, 48.0, 47.0, 50.0, 57.0, 64.0, 56.0, 58.0, 48.0, 51.0, 41.0, 46.0, 40.0, 35.0, 22.0, 21.0, 18.0, 11.0, 5.0, 7.0, 7.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39217329025268555, -0.37799152731895447, -0.3638097941875458, -0.3496280312538147, -0.3354462683200836, -0.3212645351886749, -0.30708277225494385, -0.29290103912353516, -0.2787192761898041, -0.264537513256073, -0.2503557801246643, -0.23617401719093323, -0.22199226915836334, -0.20781052112579346, -0.19362875819206238, -0.1794470101594925, -0.1652652472257614, -0.15108349919319153, -0.13690173625946045, -0.12271998822689056, -0.10853824019432068, -0.0943564847111702, -0.08017472922801971, -0.06599298119544983, -0.05181122571229935, -0.03762947395443916, -0.02344772033393383, -0.009265966713428497, 0.004915785044431686, 0.01909753680229187, 0.03327929228544235, 0.04746104031801224, 0.06164279580116272, 0.0758245512843132, 0.09000629931688309, 0.10418805480003357, 0.11836980283260345, 0.13255155086517334, 0.14673331379890442, 0.1609150618314743, 0.1750968098640442, 0.18927855789661407, 0.20346032083034515, 0.21764206886291504, 0.23182381689548492, 0.2460055649280548, 0.2601873278617859, 0.2743690609931946, 0.28855085372924805, 0.3027326166629791, 0.3169143497943878, 0.3310961127281189, 0.34527787566185, 0.35945960879325867, 0.37364137172698975, 0.38782310485839844, 0.4020048677921295, 0.4161866307258606, 0.4303683638572693, 0.44455012679100037, 0.45873188972473145, 0.47291362285614014, 0.4870953857898712, 0.5012771487236023, 0.515458881855011]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 9.0, 11.0, 16.0, 38.0, 108.0, 385.0, 11551.0, 4181290.0, 647.0, 143.0, 43.0, 14.0, 10.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.78955078125, -0.7716712951660156, -0.7537918090820312, -0.7359123229980469, -0.7180328369140625, -0.7001533508300781, -0.6822738647460938, -0.6643943786621094, -0.646514892578125, -0.6286354064941406, -0.6107559204101562, -0.5928764343261719, -0.5749969482421875, -0.5571174621582031, -0.5392379760742188, -0.5213584899902344, -0.50347900390625, -0.4855995178222656, -0.46772003173828125, -0.4498405456542969, -0.4319610595703125, -0.4140815734863281, -0.39620208740234375, -0.3783226013183594, -0.360443115234375, -0.3425636291503906, -0.32468414306640625, -0.3068046569824219, -0.2889251708984375, -0.2710456848144531, -0.25316619873046875, -0.23528671264648438, -0.2174072265625, -0.19952774047851562, -0.18164825439453125, -0.16376876831054688, -0.1458892822265625, -0.12800979614257812, -0.11013031005859375, -0.09225082397460938, -0.074371337890625, -0.056491851806640625, -0.03861236572265625, -0.020732879638671875, -0.0028533935546875, 0.015026092529296875, 0.03290557861328125, 0.050785064697265625, 0.06866455078125, 0.08654403686523438, 0.10442352294921875, 0.12230300903320312, 0.1401824951171875, 0.15806198120117188, 0.17594146728515625, 0.19382095336914062, 0.211700439453125, 0.22957992553710938, 0.24745941162109375, 0.2653388977050781, 0.2832183837890625, 0.3010978698730469, 0.31897735595703125, 0.3368568420410156, 0.354736328125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 7.0, 14.0, 26.0, 90.0, 170.0, 298.0, 210.0, 107.0, 42.0, 16.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0677490234375, -0.06619644165039062, -0.06464385986328125, -0.06309127807617188, -0.0615386962890625, -0.059986114501953125, -0.05843353271484375, -0.056880950927734375, -0.055328369140625, -0.053775787353515625, -0.05222320556640625, -0.050670623779296875, -0.0491180419921875, -0.047565460205078125, -0.04601287841796875, -0.044460296630859375, -0.04290771484375, -0.041355133056640625, -0.03980255126953125, -0.038249969482421875, -0.0366973876953125, -0.035144805908203125, -0.03359222412109375, -0.032039642333984375, -0.030487060546875, -0.028934478759765625, -0.02738189697265625, -0.025829315185546875, -0.0242767333984375, -0.022724151611328125, -0.02117156982421875, -0.019618988037109375, -0.01806640625, -0.016513824462890625, -0.01496124267578125, -0.013408660888671875, -0.0118560791015625, -0.010303497314453125, -0.00875091552734375, -0.007198333740234375, -0.005645751953125, -0.004093170166015625, -0.00254058837890625, -0.000988006591796875, 0.0005645751953125, 0.002117156982421875, 0.00366973876953125, 0.005222320556640625, 0.00677490234375, 0.008327484130859375, 0.00988006591796875, 0.011432647705078125, 0.0129852294921875, 0.014537811279296875, 0.01609039306640625, 0.017642974853515625, 0.019195556640625, 0.020748138427734375, 0.02230072021484375, 0.023853302001953125, 0.0254058837890625, 0.026958465576171875, 0.02851104736328125, 0.030063629150390625, 0.0316162109375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 9.0, 20.0, 13.0, 30.0, 79.0, 143.0, 233.0, 447.0, 838.0, 1969.0, 5790.0, 31160.0, 3998348.0, 137459.0, 11954.0, 3112.0, 1230.0, 618.0, 323.0, 163.0, 121.0, 75.0, 59.0, 26.0, 15.0, 6.0, 9.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08978271484375, -0.08733844757080078, -0.08489418029785156, -0.08244991302490234, -0.08000564575195312, -0.0775613784790039, -0.07511711120605469, -0.07267284393310547, -0.07022857666015625, -0.06778430938720703, -0.06534004211425781, -0.0628957748413086, -0.060451507568359375, -0.058007240295410156, -0.05556297302246094, -0.05311870574951172, -0.0506744384765625, -0.04823017120361328, -0.04578590393066406, -0.043341636657714844, -0.040897369384765625, -0.038453102111816406, -0.03600883483886719, -0.03356456756591797, -0.03112030029296875, -0.02867603302001953, -0.026231765747070312, -0.023787498474121094, -0.021343231201171875, -0.018898963928222656, -0.016454696655273438, -0.014010429382324219, -0.011566162109375, -0.009121894836425781, -0.0066776275634765625, -0.004233360290527344, -0.001789093017578125, 0.0006551742553710938, 0.0030994415283203125, 0.005543708801269531, 0.00798797607421875, 0.010432243347167969, 0.012876510620117188, 0.015320777893066406, 0.017765045166015625, 0.020209312438964844, 0.022653579711914062, 0.02509784698486328, 0.0275421142578125, 0.02998638153076172, 0.03243064880371094, 0.034874916076660156, 0.037319183349609375, 0.039763450622558594, 0.04220771789550781, 0.04465198516845703, 0.04709625244140625, 0.04954051971435547, 0.05198478698730469, 0.054429054260253906, 0.056873321533203125, 0.059317588806152344, 0.06176185607910156, 0.06420612335205078, 0.066650390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 8.0, 8.0, 19.0, 22.0, 44.0, 86.0, 309.0, 2904.0, 409.0, 123.0, 39.0, 21.0, 19.0, 14.0, 11.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0172576904296875, -0.0165555477142334, -0.015853404998779297, -0.015151262283325195, -0.014449119567871094, -0.013746976852416992, -0.01304483413696289, -0.012342691421508789, -0.011640548706054688, -0.010938405990600586, -0.010236263275146484, -0.009534120559692383, -0.008831977844238281, -0.00812983512878418, -0.007427692413330078, -0.0067255496978759766, -0.006023406982421875, -0.0053212642669677734, -0.004619121551513672, -0.00391697883605957, -0.0032148361206054688, -0.002512693405151367, -0.0018105506896972656, -0.001108407974243164, -0.0004062652587890625, 0.00029587745666503906, 0.0009980201721191406, 0.0017001628875732422, 0.0024023056030273438, 0.0031044483184814453, 0.003806591033935547, 0.0045087337493896484, 0.00521087646484375, 0.0059130191802978516, 0.006615161895751953, 0.007317304611206055, 0.008019447326660156, 0.008721590042114258, 0.00942373275756836, 0.010125875473022461, 0.010828018188476562, 0.011530160903930664, 0.012232303619384766, 0.012934446334838867, 0.013636589050292969, 0.01433873176574707, 0.015040874481201172, 0.015743017196655273, 0.016445159912109375, 0.017147302627563477, 0.017849445343017578, 0.01855158805847168, 0.01925373077392578, 0.019955873489379883, 0.020658016204833984, 0.021360158920288086, 0.022062301635742188, 0.02276444435119629, 0.02346658706665039, 0.024168729782104492, 0.024870872497558594, 0.025573015213012695, 0.026275157928466797, 0.0269773006439209, 0.027679443359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 27.0, 943.0, 47.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09849897027015686, -0.07691660523414612, -0.055334243923425674, -0.03375188261270523, -0.012169517576694489, 0.009412847459316254, 0.0309952050447464, 0.05257757008075714, 0.07415993511676788, 0.09574230015277863, 0.11732466518878937, 0.13890701532363892, 0.16048938035964966, 0.1820717453956604, 0.20365411043167114, 0.22523647546768188, 0.24681884050369263, 0.26840120553970337, 0.2899835705757141, 0.31156593561172485, 0.3331483006477356, 0.35473066568374634, 0.3763130307197571, 0.3978953957557678, 0.41947776079177856, 0.4410601258277893, 0.46264249086380005, 0.4842248558998108, 0.5058072209358215, 0.5273895859718323, 0.548971951007843, 0.5705543160438538, 0.5921366810798645, 0.6137190461158752, 0.635301411151886, 0.6568837761878967, 0.6784661412239075, 0.7000485062599182, 0.721630871295929, 0.7432132363319397, 0.7647956013679504, 0.7863779664039612, 0.8079603314399719, 0.8295426964759827, 0.8511250615119934, 0.8727074265480042, 0.8942897915840149, 0.9158721566200256, 0.9374544620513916, 0.9590368270874023, 0.9806191921234131, 1.0022015571594238, 1.0237839221954346, 1.0453662872314453, 1.066948652267456, 1.0885310173034668, 1.1101133823394775, 1.1316957473754883, 1.153278112411499, 1.1748604774475098, 1.1964428424835205, 1.2180252075195312, 1.239607572555542, 1.2611899375915527, 1.2827723026275635]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 11.0, 12.0, 12.0, 20.0, 21.0, 29.0, 34.0, 42.0, 51.0, 34.0, 51.0, 58.0, 71.0, 65.0, 61.0, 61.0, 61.0, 61.0, 40.0, 47.0, 39.0, 31.0, 18.0, 13.0, 11.0, 10.0, 8.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0], "bins": [-0.08346837759017944, -0.08139237016439438, -0.07931636273860931, -0.07724035531282425, -0.07516434788703918, -0.07308834046125412, -0.07101233303546906, -0.06893632560968399, -0.06686031818389893, -0.06478431075811386, -0.0627083033323288, -0.06063229590654373, -0.05855628848075867, -0.0564802810549736, -0.05440427362918854, -0.05232826620340347, -0.05025225877761841, -0.048176251351833344, -0.04610024392604828, -0.044024236500263214, -0.04194822907447815, -0.039872221648693085, -0.03779621422290802, -0.035720206797122955, -0.03364419937133789, -0.031568191945552826, -0.02949218451976776, -0.027416177093982697, -0.025340169668197632, -0.023264162242412567, -0.021188154816627502, -0.019112147390842438, -0.017036139965057373, -0.014960132539272308, -0.012884125113487244, -0.010808117687702179, -0.008732110261917114, -0.0066561028361320496, -0.004580095410346985, -0.00250408798456192, -0.00042808055877685547, 0.0016479268670082092, 0.003723934292793274, 0.005799941718578339, 0.007875949144363403, 0.009951956570148468, 0.012027963995933533, 0.014103971421718597, 0.016179978847503662, 0.018255986273288727, 0.02033199369907379, 0.022408001124858856, 0.02448400855064392, 0.026560015976428986, 0.02863602340221405, 0.030712030827999115, 0.03278803825378418, 0.034864045679569244, 0.03694005310535431, 0.039016060531139374, 0.04109206795692444, 0.0431680753827095, 0.04524408280849457, 0.04732009023427963, 0.0493960976600647]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 7.0, 9.0, 7.0, 12.0, 14.0, 20.0, 28.0, 34.0, 27.0, 48.0, 83.0, 127.0, 249.0, 421.0, 797.0, 1954.0, 6389.0, 71478.0, 913734.0, 44416.0, 5291.0, 1675.0, 713.0, 374.0, 229.0, 148.0, 76.0, 49.0, 29.0, 23.0, 16.0, 20.0, 10.0, 12.0, 12.0, 6.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1431884765625, -0.1383228302001953, -0.13345718383789062, -0.12859153747558594, -0.12372589111328125, -0.11886024475097656, -0.11399459838867188, -0.10912895202636719, -0.1042633056640625, -0.09939765930175781, -0.09453201293945312, -0.08966636657714844, -0.08480072021484375, -0.07993507385253906, -0.07506942749023438, -0.07020378112792969, -0.065338134765625, -0.06047248840332031, -0.055606842041015625, -0.05074119567871094, -0.04587554931640625, -0.04100990295410156, -0.036144256591796875, -0.03127861022949219, -0.0264129638671875, -0.021547317504882812, -0.016681671142578125, -0.011816024780273438, -0.00695037841796875, -0.0020847320556640625, 0.002780914306640625, 0.0076465606689453125, 0.01251220703125, 0.017377853393554688, 0.022243499755859375, 0.027109146118164062, 0.03197479248046875, 0.03684043884277344, 0.041706085205078125, 0.04657173156738281, 0.0514373779296875, 0.05630302429199219, 0.061168670654296875, 0.06603431701660156, 0.07089996337890625, 0.07576560974121094, 0.08063125610351562, 0.08549690246582031, 0.090362548828125, 0.09522819519042969, 0.10009384155273438, 0.10495948791503906, 0.10982513427734375, 0.11469078063964844, 0.11955642700195312, 0.12442207336425781, 0.1292877197265625, 0.1341533660888672, 0.13901901245117188, 0.14388465881347656, 0.14875030517578125, 0.15361595153808594, 0.15848159790039062, 0.1633472442626953, 0.168212890625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 8.0, 5.0, 10.0, 31.0, 85.0, 186.0, 280.0, 214.0, 117.0, 36.0, 14.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06683349609375, -0.06530237197875977, -0.06377124786376953, -0.0622401237487793, -0.06070899963378906, -0.05917787551879883, -0.057646751403808594, -0.05611562728881836, -0.054584503173828125, -0.05305337905883789, -0.051522254943847656, -0.04999113082885742, -0.04846000671386719, -0.04692888259887695, -0.04539775848388672, -0.043866634368896484, -0.04233551025390625, -0.040804386138916016, -0.03927326202392578, -0.03774213790893555, -0.03621101379394531, -0.03467988967895508, -0.033148765563964844, -0.03161764144897461, -0.030086517333984375, -0.02855539321899414, -0.027024269104003906, -0.025493144989013672, -0.023962020874023438, -0.022430896759033203, -0.02089977264404297, -0.019368648529052734, -0.0178375244140625, -0.016306400299072266, -0.014775276184082031, -0.013244152069091797, -0.011713027954101562, -0.010181903839111328, -0.008650779724121094, -0.007119655609130859, -0.005588531494140625, -0.004057407379150391, -0.0025262832641601562, -0.0009951591491699219, 0.0005359649658203125, 0.002067089080810547, 0.0035982131958007812, 0.005129337310791016, 0.00666046142578125, 0.008191585540771484, 0.009722709655761719, 0.011253833770751953, 0.012784957885742188, 0.014316082000732422, 0.015847206115722656, 0.01737833023071289, 0.018909454345703125, 0.02044057846069336, 0.021971702575683594, 0.023502826690673828, 0.025033950805664062, 0.026565074920654297, 0.02809619903564453, 0.029627323150634766, 0.031158447265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [6.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 2.0, 4.0, 10.0, 7.0, 7.0, 11.0, 20.0, 20.0, 15.0, 31.0, 77.0, 77.0, 196.0, 345.0, 767.0, 2148.0, 8973.0, 60304.0, 741152.0, 207396.0, 20632.0, 4065.0, 1160.0, 489.0, 244.0, 128.0, 78.0, 45.0, 33.0, 17.0, 17.0, 17.0, 13.0, 8.0, 14.0, 4.0, 7.0, 4.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09271240234375, -0.0891103744506836, -0.08550834655761719, -0.08190631866455078, -0.07830429077148438, -0.07470226287841797, -0.07110023498535156, -0.06749820709228516, -0.06389617919921875, -0.060294151306152344, -0.05669212341308594, -0.05309009552001953, -0.049488067626953125, -0.04588603973388672, -0.04228401184082031, -0.038681983947753906, -0.0350799560546875, -0.031477928161621094, -0.027875900268554688, -0.02427387237548828, -0.020671844482421875, -0.01706981658935547, -0.013467788696289062, -0.009865760803222656, -0.00626373291015625, -0.0026617050170898438, 0.0009403228759765625, 0.004542350769042969, 0.008144378662109375, 0.011746406555175781, 0.015348434448242188, 0.018950462341308594, 0.022552490234375, 0.026154518127441406, 0.029756546020507812, 0.03335857391357422, 0.036960601806640625, 0.04056262969970703, 0.04416465759277344, 0.047766685485839844, 0.05136871337890625, 0.054970741271972656, 0.05857276916503906, 0.06217479705810547, 0.06577682495117188, 0.06937885284423828, 0.07298088073730469, 0.0765829086303711, 0.0801849365234375, 0.0837869644165039, 0.08738899230957031, 0.09099102020263672, 0.09459304809570312, 0.09819507598876953, 0.10179710388183594, 0.10539913177490234, 0.10900115966796875, 0.11260318756103516, 0.11620521545410156, 0.11980724334716797, 0.12340927124023438, 0.12701129913330078, 0.1306133270263672, 0.1342153549194336, 0.1378173828125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 1.0, 5.0, 7.0, 6.0, 11.0, 12.0, 12.0, 16.0, 16.0, 14.0, 27.0, 14.0, 34.0, 39.0, 35.0, 45.0, 33.0, 51.0, 40.0, 65.0, 55.0, 44.0, 59.0, 42.0, 48.0, 40.0, 46.0, 25.0, 27.0, 21.0, 14.0, 19.0, 19.0, 11.0, 10.0, 6.0, 11.0, 4.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 6.0], "bins": [-0.08001708984375, -0.07792472839355469, -0.07583236694335938, -0.07374000549316406, -0.07164764404296875, -0.06955528259277344, -0.06746292114257812, -0.06537055969238281, -0.0632781982421875, -0.06118583679199219, -0.059093475341796875, -0.05700111389160156, -0.05490875244140625, -0.05281639099121094, -0.050724029541015625, -0.04863166809082031, -0.046539306640625, -0.04444694519042969, -0.042354583740234375, -0.04026222229003906, -0.03816986083984375, -0.03607749938964844, -0.033985137939453125, -0.03189277648925781, -0.0298004150390625, -0.027708053588867188, -0.025615692138671875, -0.023523330688476562, -0.02143096923828125, -0.019338607788085938, -0.017246246337890625, -0.015153884887695312, -0.0130615234375, -0.010969161987304688, -0.008876800537109375, -0.0067844390869140625, -0.00469207763671875, -0.0025997161865234375, -0.000507354736328125, 0.0015850067138671875, 0.0036773681640625, 0.0057697296142578125, 0.007862091064453125, 0.009954452514648438, 0.01204681396484375, 0.014139175415039062, 0.016231536865234375, 0.018323898315429688, 0.020416259765625, 0.022508621215820312, 0.024600982666015625, 0.026693344116210938, 0.02878570556640625, 0.030878067016601562, 0.032970428466796875, 0.03506278991699219, 0.0371551513671875, 0.03924751281738281, 0.041339874267578125, 0.04343223571777344, 0.04552459716796875, 0.04761695861816406, 0.049709320068359375, 0.05180168151855469, 0.05389404296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 6.0, 9.0, 8.0, 13.0, 7.0, 12.0, 17.0, 23.0, 30.0, 39.0, 46.0, 62.0, 89.0, 168.0, 284.0, 570.0, 1229.0, 3628.0, 14028.0, 93302.0, 710414.0, 193151.0, 22903.0, 5212.0, 1706.0, 679.0, 348.0, 188.0, 115.0, 72.0, 53.0, 33.0, 24.0, 14.0, 21.0, 16.0, 6.0, 11.0, 4.0, 3.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0146636962890625, -0.014227867126464844, -0.013792037963867188, -0.013356208801269531, -0.012920379638671875, -0.012484550476074219, -0.012048721313476562, -0.011612892150878906, -0.01117706298828125, -0.010741233825683594, -0.010305404663085938, -0.009869575500488281, -0.009433746337890625, -0.008997917175292969, -0.008562088012695312, -0.008126258850097656, -0.0076904296875, -0.007254600524902344, -0.0068187713623046875, -0.006382942199707031, -0.005947113037109375, -0.005511283874511719, -0.0050754547119140625, -0.004639625549316406, -0.00420379638671875, -0.0037679672241210938, -0.0033321380615234375, -0.0028963088989257812, -0.002460479736328125, -0.0020246505737304688, -0.0015888214111328125, -0.0011529922485351562, -0.0007171630859375, -0.00028133392333984375, 0.0001544952392578125, 0.0005903244018554688, 0.001026153564453125, 0.0014619827270507812, 0.0018978118896484375, 0.0023336410522460938, 0.00276947021484375, 0.0032052993774414062, 0.0036411285400390625, 0.004076957702636719, 0.004512786865234375, 0.004948616027832031, 0.0053844451904296875, 0.005820274353027344, 0.006256103515625, 0.006691932678222656, 0.0071277618408203125, 0.007563591003417969, 0.007999420166015625, 0.008435249328613281, 0.008871078491210938, 0.009306907653808594, 0.00974273681640625, 0.010178565979003906, 0.010614395141601562, 0.011050224304199219, 0.011486053466796875, 0.011921882629394531, 0.012357711791992188, 0.012793540954589844, 0.0132293701171875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 1.0, 2.0, 6.0, 9.0, 5.0, 13.0, 9.0, 21.0, 28.0, 18.0, 40.0, 38.0, 46.0, 78.0, 68.0, 80.0, 93.0, 59.0, 57.0, 79.0, 45.0, 33.0, 47.0, 23.0, 18.0, 18.0, 13.0, 8.0, 8.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-8.046627044677734e-06, -7.847324013710022e-06, -7.64802098274231e-06, -7.448717951774597e-06, -7.249414920806885e-06, -7.050111889839172e-06, -6.85080885887146e-06, -6.6515058279037476e-06, -6.452202796936035e-06, -6.252899765968323e-06, -6.05359673500061e-06, -5.854293704032898e-06, -5.6549906730651855e-06, -5.455687642097473e-06, -5.256384611129761e-06, -5.057081580162048e-06, -4.857778549194336e-06, -4.6584755182266235e-06, -4.459172487258911e-06, -4.259869456291199e-06, -4.060566425323486e-06, -3.861263394355774e-06, -3.6619603633880615e-06, -3.462657332420349e-06, -3.2633543014526367e-06, -3.0640512704849243e-06, -2.864748239517212e-06, -2.6654452085494995e-06, -2.466142177581787e-06, -2.2668391466140747e-06, -2.0675361156463623e-06, -1.86823308467865e-06, -1.6689300537109375e-06, -1.469627022743225e-06, -1.2703239917755127e-06, -1.0710209608078003e-06, -8.717179298400879e-07, -6.724148988723755e-07, -4.731118679046631e-07, -2.738088369369507e-07, -7.450580596923828e-08, 1.2479722499847412e-07, 3.241002559661865e-07, 5.234032869338989e-07, 7.227063179016113e-07, 9.220093488693237e-07, 1.1213123798370361e-06, 1.3206154108047485e-06, 1.519918441772461e-06, 1.7192214727401733e-06, 1.9185245037078857e-06, 2.117827534675598e-06, 2.3171305656433105e-06, 2.516433596611023e-06, 2.7157366275787354e-06, 2.9150396585464478e-06, 3.11434268951416e-06, 3.3136457204818726e-06, 3.512948751449585e-06, 3.7122517824172974e-06, 3.91155481338501e-06, 4.110857844352722e-06, 4.3101608753204346e-06, 4.509463906288147e-06, 4.708766937255859e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 7.0, 5.0, 5.0, 16.0, 28.0, 41.0, 83.0, 165.0, 476.0, 1639.0, 14826.0, 886902.0, 138532.0, 4377.0, 883.0, 309.0, 119.0, 52.0, 32.0, 28.0, 8.0, 9.0, 5.0, 11.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033782958984375, -0.032752037048339844, -0.03172111511230469, -0.03069019317626953, -0.029659271240234375, -0.02862834930419922, -0.027597427368164062, -0.026566505432128906, -0.02553558349609375, -0.024504661560058594, -0.023473739624023438, -0.02244281768798828, -0.021411895751953125, -0.02038097381591797, -0.019350051879882812, -0.018319129943847656, -0.0172882080078125, -0.016257286071777344, -0.015226364135742188, -0.014195442199707031, -0.013164520263671875, -0.012133598327636719, -0.011102676391601562, -0.010071754455566406, -0.00904083251953125, -0.008009910583496094, -0.0069789886474609375, -0.005948066711425781, -0.004917144775390625, -0.0038862228393554688, -0.0028553009033203125, -0.0018243789672851562, -0.00079345703125, 0.00023746490478515625, 0.0012683868408203125, 0.0022993087768554688, 0.003330230712890625, 0.004361152648925781, 0.0053920745849609375, 0.006422996520996094, 0.00745391845703125, 0.008484840393066406, 0.009515762329101562, 0.010546684265136719, 0.011577606201171875, 0.012608528137207031, 0.013639450073242188, 0.014670372009277344, 0.0157012939453125, 0.016732215881347656, 0.017763137817382812, 0.01879405975341797, 0.019824981689453125, 0.02085590362548828, 0.021886825561523438, 0.022917747497558594, 0.02394866943359375, 0.024979591369628906, 0.026010513305664062, 0.02704143524169922, 0.028072357177734375, 0.02910327911376953, 0.030134201049804688, 0.031165122985839844, 0.032196044921875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 4.0, 4.0, 8.0, 17.0, 23.0, 23.0, 42.0, 56.0, 110.0, 127.0, 173.0, 137.0, 114.0, 71.0, 28.0, 24.0, 27.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02081298828125, -0.020172834396362305, -0.01953268051147461, -0.018892526626586914, -0.01825237274169922, -0.017612218856811523, -0.016972064971923828, -0.016331911087036133, -0.015691757202148438, -0.015051603317260742, -0.014411449432373047, -0.013771295547485352, -0.013131141662597656, -0.012490987777709961, -0.011850833892822266, -0.01121068000793457, -0.010570526123046875, -0.00993037223815918, -0.009290218353271484, -0.008650064468383789, -0.008009910583496094, -0.0073697566986083984, -0.006729602813720703, -0.006089448928833008, -0.0054492950439453125, -0.004809141159057617, -0.004168987274169922, -0.0035288333892822266, -0.0028886795043945312, -0.002248525619506836, -0.0016083717346191406, -0.0009682178497314453, -0.00032806396484375, 0.0003120899200439453, 0.0009522438049316406, 0.001592397689819336, 0.0022325515747070312, 0.0028727054595947266, 0.003512859344482422, 0.004153013229370117, 0.0047931671142578125, 0.005433320999145508, 0.006073474884033203, 0.0067136287689208984, 0.007353782653808594, 0.007993936538696289, 0.008634090423583984, 0.00927424430847168, 0.009914398193359375, 0.01055455207824707, 0.011194705963134766, 0.011834859848022461, 0.012475013732910156, 0.013115167617797852, 0.013755321502685547, 0.014395475387573242, 0.015035629272460938, 0.015675783157348633, 0.016315937042236328, 0.016956090927124023, 0.01759624481201172, 0.018236398696899414, 0.01887655258178711, 0.019516706466674805, 0.0201568603515625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 12.0, 24.0, 34.0, 69.0, 145.0, 377.0, 194.0, 79.0, 36.0, 14.0, 4.0, 7.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9426975250244141, -0.9224910140037537, -0.902284562587738, -0.8820780515670776, -0.861871600151062, -0.8416650891304016, -0.821458637714386, -0.8012521266937256, -0.78104567527771, -0.7608391642570496, -0.7406327128410339, -0.7204262018203735, -0.7002197504043579, -0.6800132393836975, -0.6598067879676819, -0.6396002769470215, -0.6193938255310059, -0.5991873145103455, -0.5789808630943298, -0.5587743520736694, -0.5385679006576538, -0.5183613896369934, -0.4981549382209778, -0.4779484272003174, -0.457741916179657, -0.43753543496131897, -0.41732895374298096, -0.39712247252464294, -0.37691599130630493, -0.3567095100879669, -0.3365030288696289, -0.3162965178489685, -0.2960900664329529, -0.27588358521461487, -0.25567710399627686, -0.23547062277793884, -0.21526414155960083, -0.19505766034126282, -0.1748511642217636, -0.1546446830034256, -0.13443820178508759, -0.11423172056674957, -0.09402523934841156, -0.07381875067949295, -0.05361226946115494, -0.033405788242816925, -0.013199299573898315, 0.007007181644439697, 0.02721366286277771, 0.04742014408111572, 0.06762662529945374, 0.08783311396837234, 0.10803959518671036, 0.12824606895446777, 0.14845256507396698, 0.168659046292305, 0.188865527510643, 0.20907200872898102, 0.22927848994731903, 0.24948498606681824, 0.26969146728515625, 0.28989794850349426, 0.3101044297218323, 0.3303109109401703, 0.3505173921585083]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 2.0, 9.0, 13.0, 12.0, 19.0, 24.0, 24.0, 38.0, 21.0, 39.0, 40.0, 53.0, 51.0, 53.0, 63.0, 60.0, 55.0, 44.0, 62.0, 63.0, 45.0, 36.0, 30.0, 30.0, 18.0, 20.0, 19.0, 6.0, 6.0, 9.0, 4.0, 3.0, 4.0, 4.0, 7.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47787147760391235, -0.46428751945495605, -0.45070359110832214, -0.43711966276168823, -0.42353570461273193, -0.40995174646377563, -0.3963678181171417, -0.3827838897705078, -0.3691999316215515, -0.3556159734725952, -0.3420320451259613, -0.3284481167793274, -0.3148641586303711, -0.3012802004814148, -0.2876962721347809, -0.274112343788147, -0.2605283856391907, -0.24694444239139557, -0.23336049914360046, -0.21977655589580536, -0.20619261264801025, -0.19260866940021515, -0.17902472615242004, -0.16544078290462494, -0.15185683965682983, -0.13827289640903473, -0.12468895316123962, -0.11110500991344452, -0.09752106666564941, -0.08393712341785431, -0.0703531801700592, -0.0567692369222641, -0.043185293674468994, -0.02960135042667389, -0.016017407178878784, -0.002433463931083679, 0.011150479316711426, 0.02473442256450653, 0.038318365812301636, 0.05190230906009674, 0.06548625230789185, 0.07907019555568695, 0.09265413880348206, 0.10623808205127716, 0.11982202529907227, 0.13340596854686737, 0.14698991179466248, 0.16057385504245758, 0.17415779829025269, 0.1877417415380478, 0.2013256847858429, 0.214909628033638, 0.2284935712814331, 0.2420775145292282, 0.2556614577770233, 0.2692453861236572, 0.2828293442726135, 0.2964133024215698, 0.30999723076820374, 0.32358115911483765, 0.33716511726379395, 0.35074907541275024, 0.36433300375938416, 0.37791693210601807, 0.39150089025497437]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 9.0, 5.0, 5.0, 9.0, 20.0, 18.0, 37.0, 82.0, 165.0, 310.0, 917.0, 6135.0, 4138933.0, 44621.0, 2206.0, 460.0, 168.0, 80.0, 40.0, 25.0, 15.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.364013671875, -0.3558788299560547, -0.3477439880371094, -0.33960914611816406, -0.33147430419921875, -0.32333946228027344, -0.3152046203613281, -0.3070697784423828, -0.2989349365234375, -0.2908000946044922, -0.2826652526855469, -0.27453041076660156, -0.26639556884765625, -0.25826072692871094, -0.2501258850097656, -0.2419910430908203, -0.233856201171875, -0.2257213592529297, -0.21758651733398438, -0.20945167541503906, -0.20131683349609375, -0.19318199157714844, -0.18504714965820312, -0.1769123077392578, -0.1687774658203125, -0.1606426239013672, -0.15250778198242188, -0.14437294006347656, -0.13623809814453125, -0.12810325622558594, -0.11996841430664062, -0.11183357238769531, -0.10369873046875, -0.09556388854980469, -0.08742904663085938, -0.07929420471191406, -0.07115936279296875, -0.06302452087402344, -0.054889678955078125, -0.04675483703613281, -0.0386199951171875, -0.030485153198242188, -0.022350311279296875, -0.014215469360351562, -0.00608062744140625, 0.0020542144775390625, 0.010189056396484375, 0.018323898315429688, 0.026458740234375, 0.03459358215332031, 0.042728424072265625, 0.05086326599121094, 0.05899810791015625, 0.06713294982910156, 0.07526779174804688, 0.08340263366699219, 0.0915374755859375, 0.09967231750488281, 0.10780715942382812, 0.11594200134277344, 0.12407684326171875, 0.13221168518066406, 0.14034652709960938, 0.1484813690185547, 0.1566162109375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 14.0, 31.0, 94.0, 186.0, 259.0, 211.0, 124.0, 42.0, 15.0, 10.0, 2.0, 7.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06903076171875, -0.06745004653930664, -0.06586933135986328, -0.06428861618041992, -0.06270790100097656, -0.0611271858215332, -0.059546470642089844, -0.057965755462646484, -0.056385040283203125, -0.054804325103759766, -0.053223609924316406, -0.05164289474487305, -0.05006217956542969, -0.04848146438598633, -0.04690074920654297, -0.04532003402709961, -0.04373931884765625, -0.04215860366821289, -0.04057788848876953, -0.03899717330932617, -0.03741645812988281, -0.03583574295043945, -0.034255027770996094, -0.032674312591552734, -0.031093597412109375, -0.029512882232666016, -0.027932167053222656, -0.026351451873779297, -0.024770736694335938, -0.023190021514892578, -0.02160930633544922, -0.02002859115600586, -0.0184478759765625, -0.01686716079711914, -0.015286445617675781, -0.013705730438232422, -0.012125015258789062, -0.010544300079345703, -0.008963584899902344, -0.007382869720458984, -0.005802154541015625, -0.004221439361572266, -0.0026407241821289062, -0.0010600090026855469, 0.0005207061767578125, 0.002101421356201172, 0.0036821365356445312, 0.005262851715087891, 0.00684356689453125, 0.00842428207397461, 0.010004997253417969, 0.011585712432861328, 0.013166427612304688, 0.014747142791748047, 0.016327857971191406, 0.017908573150634766, 0.019489288330078125, 0.021070003509521484, 0.022650718688964844, 0.024231433868408203, 0.025812149047851562, 0.027392864227294922, 0.02897357940673828, 0.03055429458618164, 0.032135009765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 11.0, 16.0, 23.0, 48.0, 103.0, 268.0, 676.0, 2584.0, 21387.0, 4114351.0, 49130.0, 4244.0, 861.0, 288.0, 127.0, 67.0, 42.0, 21.0, 10.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.2232666015625, -0.2174854278564453, -0.21170425415039062, -0.20592308044433594, -0.20014190673828125, -0.19436073303222656, -0.18857955932617188, -0.1827983856201172, -0.1770172119140625, -0.1712360382080078, -0.16545486450195312, -0.15967369079589844, -0.15389251708984375, -0.14811134338378906, -0.14233016967773438, -0.1365489959716797, -0.130767822265625, -0.12498664855957031, -0.11920547485351562, -0.11342430114746094, -0.10764312744140625, -0.10186195373535156, -0.09608078002929688, -0.09029960632324219, -0.0845184326171875, -0.07873725891113281, -0.07295608520507812, -0.06717491149902344, -0.06139373779296875, -0.05561256408691406, -0.049831390380859375, -0.04405021667480469, -0.03826904296875, -0.03248786926269531, -0.026706695556640625, -0.020925521850585938, -0.01514434814453125, -0.009363174438476562, -0.003582000732421875, 0.0021991729736328125, 0.0079803466796875, 0.013761520385742188, 0.019542694091796875, 0.025323867797851562, 0.03110504150390625, 0.03688621520996094, 0.042667388916015625, 0.04844856262207031, 0.054229736328125, 0.06001091003417969, 0.06579208374023438, 0.07157325744628906, 0.07735443115234375, 0.08313560485839844, 0.08891677856445312, 0.09469795227050781, 0.1004791259765625, 0.10626029968261719, 0.11204147338867188, 0.11782264709472656, 0.12360382080078125, 0.12938499450683594, 0.13516616821289062, 0.1409473419189453, 0.146728515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 15.0, 15.0, 19.0, 45.0, 103.0, 454.0, 2935.0, 291.0, 81.0, 42.0, 14.0, 13.0, 13.0, 6.0, 2.0, 9.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04827880859375, -0.04638099670410156, -0.044483184814453125, -0.04258537292480469, -0.04068756103515625, -0.03878974914550781, -0.036891937255859375, -0.03499412536621094, -0.0330963134765625, -0.031198501586914062, -0.029300689697265625, -0.027402877807617188, -0.02550506591796875, -0.023607254028320312, -0.021709442138671875, -0.019811630249023438, -0.017913818359375, -0.016016006469726562, -0.014118194580078125, -0.012220382690429688, -0.01032257080078125, -0.008424758911132812, -0.006526947021484375, -0.0046291351318359375, -0.0027313232421875, -0.0008335113525390625, 0.001064300537109375, 0.0029621124267578125, 0.00485992431640625, 0.0067577362060546875, 0.008655548095703125, 0.010553359985351562, 0.012451171875, 0.014348983764648438, 0.016246795654296875, 0.018144607543945312, 0.02004241943359375, 0.021940231323242188, 0.023838043212890625, 0.025735855102539062, 0.0276336669921875, 0.029531478881835938, 0.031429290771484375, 0.03332710266113281, 0.03522491455078125, 0.03712272644042969, 0.039020538330078125, 0.04091835021972656, 0.042816162109375, 0.04471397399902344, 0.046611785888671875, 0.04850959777832031, 0.05040740966796875, 0.05230522155761719, 0.054203033447265625, 0.05610084533691406, 0.0579986572265625, 0.05989646911621094, 0.061794281005859375, 0.06369209289550781, 0.06558990478515625, 0.06748771667480469, 0.06938552856445312, 0.07128334045410156, 0.07318115234375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 18.0, 119.0, 737.0, 106.0, 15.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5696476101875305, -0.551016628742218, -0.5323857069015503, -0.5137547254562378, -0.49512380361557007, -0.47649282217025757, -0.45786187052726746, -0.43923091888427734, -0.42059996724128723, -0.4019690155982971, -0.383338063955307, -0.3647071123123169, -0.3460761308670044, -0.32744520902633667, -0.30881422758102417, -0.29018327593803406, -0.27155232429504395, -0.25292137265205383, -0.23429042100906372, -0.21565945446491241, -0.1970285028219223, -0.1783975511789322, -0.15976658463478088, -0.14113563299179077, -0.12250468134880066, -0.10387372970581055, -0.08524277061223984, -0.06661181151866913, -0.047980859875679016, -0.029349908232688904, -0.010718949139118195, 0.007912009954452515, 0.02654290199279785, 0.04517385736107826, 0.06380481272935867, 0.08243577182292938, 0.1010667234659195, 0.1196976751089096, 0.1383286416530609, 0.15695959329605103, 0.17559054493904114, 0.19422149658203125, 0.21285244822502136, 0.23148341476917267, 0.250114381313324, 0.2687453031539917, 0.2873762845993042, 0.3060072362422943, 0.3246381878852844, 0.34326913952827454, 0.36190009117126465, 0.38053104281425476, 0.3991619944572449, 0.4177929759025574, 0.4364239275455475, 0.4550548791885376, 0.4736858308315277, 0.4923167824745178, 0.5109477639198303, 0.529578685760498, 0.5482096672058105, 0.5668405890464783, 0.5854715704917908, 0.6041024923324585, 0.622733473777771]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 22.0, 21.0, 41.0, 68.0, 82.0, 115.0, 117.0, 91.0, 109.0, 110.0, 65.0, 55.0, 41.0, 24.0, 20.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.274170458316803, -0.266547828912735, -0.258925199508667, -0.2513025999069214, -0.2436799705028534, -0.2360573410987854, -0.2284347116947174, -0.2208120971918106, -0.2131894826889038, -0.20556685328483582, -0.19794423878192902, -0.19032160937786102, -0.18269899487495422, -0.17507636547088623, -0.16745373606681824, -0.15983112156391144, -0.15220849215984344, -0.14458586275577545, -0.13696324825286865, -0.12934061884880066, -0.12171800434589386, -0.11409537494182587, -0.10647275298833847, -0.09885013103485107, -0.09122750908136368, -0.08360488712787628, -0.07598226517438889, -0.06835964322090149, -0.060737017542123795, -0.0531143955886364, -0.045491769909858704, -0.03786914795637131, -0.03024652600288391, -0.022623904049396515, -0.01500128023326397, -0.007378656417131424, 0.0002439655363559723, 0.007866587489843369, 0.015489213168621063, 0.02311183512210846, 0.030734457075595856, 0.03835707902908325, 0.04597970098257065, 0.05360232666134834, 0.06122494861483574, 0.06884756684303284, 0.07647019624710083, 0.08409281820058823, 0.09171544015407562, 0.09933806210756302, 0.10696068406105042, 0.11458331346511841, 0.12220592796802521, 0.1298285573720932, 0.137451171875, 0.145073801279068, 0.152696430683136, 0.16031906008720398, 0.16794167459011078, 0.17556430399417877, 0.18318691849708557, 0.19080954790115356, 0.19843217730522156, 0.20605479180812836, 0.21367740631103516]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 8.0, 3.0, 13.0, 19.0, 22.0, 23.0, 35.0, 55.0, 70.0, 125.0, 216.0, 409.0, 864.0, 2146.0, 7425.0, 135682.0, 873565.0, 21627.0, 3596.0, 1342.0, 595.0, 286.0, 148.0, 85.0, 52.0, 41.0, 28.0, 20.0, 15.0, 12.0, 6.0, 8.0, 1.0, 3.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2181396484375, -0.21137428283691406, -0.20460891723632812, -0.1978435516357422, -0.19107818603515625, -0.1843128204345703, -0.17754745483398438, -0.17078208923339844, -0.1640167236328125, -0.15725135803222656, -0.15048599243164062, -0.1437206268310547, -0.13695526123046875, -0.1301898956298828, -0.12342453002929688, -0.11665916442871094, -0.109893798828125, -0.10312843322753906, -0.09636306762695312, -0.08959770202636719, -0.08283233642578125, -0.07606697082519531, -0.06930160522460938, -0.06253623962402344, -0.0557708740234375, -0.04900550842285156, -0.042240142822265625, -0.03547477722167969, -0.02870941162109375, -0.021944046020507812, -0.015178680419921875, -0.008413314819335938, -0.00164794921875, 0.0051174163818359375, 0.011882781982421875, 0.018648147583007812, 0.02541351318359375, 0.03217887878417969, 0.038944244384765625, 0.04570960998535156, 0.0524749755859375, 0.05924034118652344, 0.06600570678710938, 0.07277107238769531, 0.07953643798828125, 0.08630180358886719, 0.09306716918945312, 0.09983253479003906, 0.106597900390625, 0.11336326599121094, 0.12012863159179688, 0.1268939971923828, 0.13365936279296875, 0.1404247283935547, 0.14719009399414062, 0.15395545959472656, 0.1607208251953125, 0.16748619079589844, 0.17425155639648438, 0.1810169219970703, 0.18778228759765625, 0.1945476531982422, 0.20131301879882812, 0.20807838439941406, 0.21484375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 0.0, 2.0, 2.0, 9.0, 20.0, 45.0, 119.0, 219.0, 246.0, 183.0, 99.0, 25.0, 16.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0655517578125, -0.06403994560241699, -0.06252813339233398, -0.06101632118225098, -0.05950450897216797, -0.05799269676208496, -0.05648088455200195, -0.054969072341918945, -0.05345726013183594, -0.05194544792175293, -0.05043363571166992, -0.048921823501586914, -0.047410011291503906, -0.0458981990814209, -0.04438638687133789, -0.04287457466125488, -0.041362762451171875, -0.03985095024108887, -0.03833913803100586, -0.03682732582092285, -0.035315513610839844, -0.033803701400756836, -0.03229188919067383, -0.03078007698059082, -0.029268264770507812, -0.027756452560424805, -0.026244640350341797, -0.02473282814025879, -0.02322101593017578, -0.021709203720092773, -0.020197391510009766, -0.018685579299926758, -0.01717376708984375, -0.015661954879760742, -0.014150142669677734, -0.012638330459594727, -0.011126518249511719, -0.009614706039428711, -0.008102893829345703, -0.006591081619262695, -0.0050792694091796875, -0.0035674571990966797, -0.002055644989013672, -0.0005438327789306641, 0.0009679794311523438, 0.0024797916412353516, 0.003991603851318359, 0.005503416061401367, 0.007015228271484375, 0.008527040481567383, 0.01003885269165039, 0.011550664901733398, 0.013062477111816406, 0.014574289321899414, 0.016086101531982422, 0.01759791374206543, 0.019109725952148438, 0.020621538162231445, 0.022133350372314453, 0.02364516258239746, 0.02515697479248047, 0.026668787002563477, 0.028180599212646484, 0.029692411422729492, 0.0312042236328125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 6.0, 4.0, 2.0, 14.0, 7.0, 12.0, 6.0, 17.0, 25.0, 26.0, 32.0, 62.0, 86.0, 162.0, 376.0, 1104.0, 4223.0, 20725.0, 148935.0, 724564.0, 124557.0, 17837.0, 3862.0, 1024.0, 395.0, 164.0, 86.0, 55.0, 34.0, 26.0, 22.0, 23.0, 11.0, 20.0, 7.0, 5.0, 6.0, 9.0, 4.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.11279296875, -0.10951995849609375, -0.1062469482421875, -0.10297393798828125, -0.099700927734375, -0.09642791748046875, -0.0931549072265625, -0.08988189697265625, -0.08660888671875, -0.08333587646484375, -0.0800628662109375, -0.07678985595703125, -0.073516845703125, -0.07024383544921875, -0.0669708251953125, -0.06369781494140625, -0.0604248046875, -0.05715179443359375, -0.0538787841796875, -0.05060577392578125, -0.047332763671875, -0.04405975341796875, -0.0407867431640625, -0.03751373291015625, -0.03424072265625, -0.03096771240234375, -0.0276947021484375, -0.02442169189453125, -0.021148681640625, -0.01787567138671875, -0.0146026611328125, -0.01132965087890625, -0.008056640625, -0.00478363037109375, -0.0015106201171875, 0.00176239013671875, 0.005035400390625, 0.00830841064453125, 0.0115814208984375, 0.01485443115234375, 0.01812744140625, 0.02140045166015625, 0.0246734619140625, 0.02794647216796875, 0.031219482421875, 0.03449249267578125, 0.0377655029296875, 0.04103851318359375, 0.0443115234375, 0.04758453369140625, 0.0508575439453125, 0.05413055419921875, 0.057403564453125, 0.06067657470703125, 0.0639495849609375, 0.06722259521484375, 0.07049560546875, 0.07376861572265625, 0.0770416259765625, 0.08031463623046875, 0.083587646484375, 0.08686065673828125, 0.0901336669921875, 0.09340667724609375, 0.0966796875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 6.0, 4.0, 7.0, 4.0, 10.0, 11.0, 14.0, 13.0, 24.0, 15.0, 25.0, 33.0, 31.0, 38.0, 36.0, 44.0, 41.0, 35.0, 39.0, 42.0, 50.0, 48.0, 41.0, 47.0, 41.0, 44.0, 25.0, 42.0, 32.0, 30.0, 23.0, 21.0, 15.0, 8.0, 9.0, 9.0, 12.0, 6.0, 4.0, 4.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05853271484375, -0.05655097961425781, -0.054569244384765625, -0.05258750915527344, -0.05060577392578125, -0.04862403869628906, -0.046642303466796875, -0.04466056823730469, -0.0426788330078125, -0.04069709777832031, -0.038715362548828125, -0.03673362731933594, -0.03475189208984375, -0.03277015686035156, -0.030788421630859375, -0.028806686401367188, -0.026824951171875, -0.024843215942382812, -0.022861480712890625, -0.020879745483398438, -0.01889801025390625, -0.016916275024414062, -0.014934539794921875, -0.012952804565429688, -0.0109710693359375, -0.008989334106445312, -0.007007598876953125, -0.0050258636474609375, -0.00304412841796875, -0.0010623931884765625, 0.000919342041015625, 0.0029010772705078125, 0.0048828125, 0.0068645477294921875, 0.008846282958984375, 0.010828018188476562, 0.01280975341796875, 0.014791488647460938, 0.016773223876953125, 0.018754959106445312, 0.0207366943359375, 0.022718429565429688, 0.024700164794921875, 0.026681900024414062, 0.02866363525390625, 0.030645370483398438, 0.032627105712890625, 0.03460884094238281, 0.036590576171875, 0.03857231140136719, 0.040554046630859375, 0.04253578186035156, 0.04451751708984375, 0.04649925231933594, 0.048480987548828125, 0.05046272277832031, 0.0524444580078125, 0.05442619323730469, 0.056407928466796875, 0.05838966369628906, 0.06037139892578125, 0.06235313415527344, 0.06433486938476562, 0.06631660461425781, 0.06829833984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 11.0, 19.0, 15.0, 31.0, 64.0, 128.0, 340.0, 971.0, 3679.0, 28725.0, 927322.0, 79277.0, 5795.0, 1335.0, 444.0, 162.0, 98.0, 52.0, 21.0, 18.0, 11.0, 10.0, 4.0, 5.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04803466796875, -0.046607017517089844, -0.04517936706542969, -0.04375171661376953, -0.042324066162109375, -0.04089641571044922, -0.03946876525878906, -0.038041114807128906, -0.03661346435546875, -0.035185813903808594, -0.03375816345214844, -0.03233051300048828, -0.030902862548828125, -0.02947521209716797, -0.028047561645507812, -0.026619911193847656, -0.0251922607421875, -0.023764610290527344, -0.022336959838867188, -0.02090930938720703, -0.019481658935546875, -0.01805400848388672, -0.016626358032226562, -0.015198707580566406, -0.01377105712890625, -0.012343406677246094, -0.010915756225585938, -0.009488105773925781, -0.008060455322265625, -0.006632804870605469, -0.0052051544189453125, -0.0037775039672851562, -0.002349853515625, -0.0009222030639648438, 0.0005054473876953125, 0.0019330978393554688, 0.003360748291015625, 0.004788398742675781, 0.0062160491943359375, 0.007643699645996094, 0.00907135009765625, 0.010499000549316406, 0.011926651000976562, 0.013354301452636719, 0.014781951904296875, 0.01620960235595703, 0.017637252807617188, 0.019064903259277344, 0.0204925537109375, 0.021920204162597656, 0.023347854614257812, 0.02477550506591797, 0.026203155517578125, 0.02763080596923828, 0.029058456420898438, 0.030486106872558594, 0.03191375732421875, 0.033341407775878906, 0.03476905822753906, 0.03619670867919922, 0.037624359130859375, 0.03905200958251953, 0.04047966003417969, 0.041907310485839844, 0.0433349609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 3.0, 9.0, 13.0, 10.0, 29.0, 41.0, 92.0, 132.0, 216.0, 176.0, 113.0, 63.0, 40.0, 19.0, 12.0, 9.0, 6.0, 4.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806020736694336e-05, -1.7432495951652527e-05, -1.6804784536361694e-05, -1.6177073121070862e-05, -1.554936170578003e-05, -1.4921650290489197e-05, -1.4293938875198364e-05, -1.3666227459907532e-05, -1.30385160446167e-05, -1.2410804629325867e-05, -1.1783093214035034e-05, -1.1155381798744202e-05, -1.0527670383453369e-05, -9.899958968162537e-06, -9.272247552871704e-06, -8.644536137580872e-06, -8.016824722290039e-06, -7.3891133069992065e-06, -6.761401891708374e-06, -6.1336904764175415e-06, -5.505979061126709e-06, -4.8782676458358765e-06, -4.250556230545044e-06, -3.6228448152542114e-06, -2.995133399963379e-06, -2.3674219846725464e-06, -1.7397105693817139e-06, -1.1119991540908813e-06, -4.842877388000488e-07, 1.434236764907837e-07, 7.711350917816162e-07, 1.3988465070724487e-06, 2.0265579223632812e-06, 2.6542693376541138e-06, 3.2819807529449463e-06, 3.909692168235779e-06, 4.537403583526611e-06, 5.165114998817444e-06, 5.792826414108276e-06, 6.420537829399109e-06, 7.048249244689941e-06, 7.675960659980774e-06, 8.303672075271606e-06, 8.931383490562439e-06, 9.559094905853271e-06, 1.0186806321144104e-05, 1.0814517736434937e-05, 1.1442229151725769e-05, 1.2069940567016602e-05, 1.2697651982307434e-05, 1.3325363397598267e-05, 1.3953074812889099e-05, 1.4580786228179932e-05, 1.5208497643470764e-05, 1.5836209058761597e-05, 1.646392047405243e-05, 1.7091631889343262e-05, 1.7719343304634094e-05, 1.8347054719924927e-05, 1.897476613521576e-05, 1.9602477550506592e-05, 2.0230188965797424e-05, 2.0857900381088257e-05, 2.148561179637909e-05, 2.2113323211669922e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 12.0, 19.0, 36.0, 98.0, 257.0, 865.0, 7045.0, 968891.0, 68395.0, 2180.0, 453.0, 170.0, 70.0, 29.0, 14.0, 9.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05718994140625, -0.05488014221191406, -0.052570343017578125, -0.05026054382324219, -0.04795074462890625, -0.04564094543457031, -0.043331146240234375, -0.04102134704589844, -0.0387115478515625, -0.03640174865722656, -0.034091949462890625, -0.03178215026855469, -0.02947235107421875, -0.027162551879882812, -0.024852752685546875, -0.022542953491210938, -0.020233154296875, -0.017923355102539062, -0.015613555908203125, -0.013303756713867188, -0.01099395751953125, -0.008684158325195312, -0.006374359130859375, -0.0040645599365234375, -0.0017547607421875, 0.0005550384521484375, 0.002864837646484375, 0.0051746368408203125, 0.00748443603515625, 0.009794235229492188, 0.012104034423828125, 0.014413833618164062, 0.0167236328125, 0.019033432006835938, 0.021343231201171875, 0.023653030395507812, 0.02596282958984375, 0.028272628784179688, 0.030582427978515625, 0.03289222717285156, 0.0352020263671875, 0.03751182556152344, 0.039821624755859375, 0.04213142395019531, 0.04444122314453125, 0.04675102233886719, 0.049060821533203125, 0.05137062072753906, 0.053680419921875, 0.05599021911621094, 0.058300018310546875, 0.06060981750488281, 0.06291961669921875, 0.06522941589355469, 0.06753921508789062, 0.06984901428222656, 0.0721588134765625, 0.07446861267089844, 0.07677841186523438, 0.07908821105957031, 0.08139801025390625, 0.08370780944824219, 0.08601760864257812, 0.08832740783691406, 0.09063720703125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 10.0, 20.0, 26.0, 84.0, 173.0, 244.0, 243.0, 102.0, 50.0, 24.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055023193359375, -0.053601741790771484, -0.05218029022216797, -0.05075883865356445, -0.04933738708496094, -0.04791593551635742, -0.046494483947753906, -0.04507303237915039, -0.043651580810546875, -0.04223012924194336, -0.040808677673339844, -0.03938722610473633, -0.03796577453613281, -0.0365443229675293, -0.03512287139892578, -0.033701419830322266, -0.03227996826171875, -0.030858516693115234, -0.02943706512451172, -0.028015613555908203, -0.026594161987304688, -0.025172710418701172, -0.023751258850097656, -0.02232980728149414, -0.020908355712890625, -0.01948690414428711, -0.018065452575683594, -0.016644001007080078, -0.015222549438476562, -0.013801097869873047, -0.012379646301269531, -0.010958194732666016, -0.0095367431640625, -0.008115291595458984, -0.006693840026855469, -0.005272388458251953, -0.0038509368896484375, -0.002429485321044922, -0.0010080337524414062, 0.0004134178161621094, 0.001834869384765625, 0.0032563209533691406, 0.004677772521972656, 0.006099224090576172, 0.0075206756591796875, 0.008942127227783203, 0.010363578796386719, 0.011785030364990234, 0.01320648193359375, 0.014627933502197266, 0.01604938507080078, 0.017470836639404297, 0.018892288208007812, 0.020313739776611328, 0.021735191345214844, 0.02315664291381836, 0.024578094482421875, 0.02599954605102539, 0.027420997619628906, 0.028842449188232422, 0.030263900756835938, 0.03168535232543945, 0.03310680389404297, 0.034528255462646484, 0.03594970703125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 5.0, 10.0, 9.0, 19.0, 17.0, 40.0, 95.0, 163.0, 237.0, 167.0, 108.0, 73.0, 18.0, 15.0, 9.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.7336355447769165, -0.7186530828475952, -0.7036706209182739, -0.6886882185935974, -0.6737057566642761, -0.6587232947349548, -0.6437408328056335, -0.6287583708763123, -0.6137759685516357, -0.5987935066223145, -0.5838110446929932, -0.5688286423683167, -0.5538461804389954, -0.5388637185096741, -0.5238812565803528, -0.5088987946510315, -0.4939163327217102, -0.4789338707923889, -0.46395143866539, -0.4489689767360687, -0.4339865446090698, -0.41900408267974854, -0.40402162075042725, -0.38903915882110596, -0.37405672669410706, -0.35907426476478577, -0.34409183263778687, -0.3291093707084656, -0.3141269087791443, -0.2991444766521454, -0.2841620147228241, -0.2691795825958252, -0.2541970908641815, -0.23921464383602142, -0.22423219680786133, -0.20924973487854004, -0.19426728785037994, -0.17928484082221985, -0.16430237889289856, -0.14931993186473846, -0.13433748483657837, -0.11935503780841827, -0.10437258332967758, -0.08939012885093689, -0.0744076818227768, -0.0594252347946167, -0.04444278031587601, -0.029460325837135315, -0.01447787880897522, 0.000504571944475174, 0.015487022697925568, 0.03046947345137596, 0.045451924204826355, 0.06043437123298645, 0.07541682571172714, 0.09039928019046783, 0.10538172721862793, 0.12036417424678802, 0.13534662127494812, 0.1503290832042694, 0.1653115302324295, 0.1802939772605896, 0.1952764391899109, 0.21025888621807098, 0.22524133324623108]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 10.0, 6.0, 20.0, 19.0, 14.0, 23.0, 16.0, 20.0, 31.0, 37.0, 39.0, 32.0, 41.0, 60.0, 56.0, 53.0, 51.0, 64.0, 47.0, 55.0, 61.0, 34.0, 36.0, 23.0, 21.0, 30.0, 24.0, 12.0, 13.0, 13.0, 8.0, 7.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.37186551094055176, -0.3591202199459076, -0.3463749289512634, -0.33362966775894165, -0.3208843767642975, -0.3081390857696533, -0.29539379477500916, -0.282648503780365, -0.2699032425880432, -0.25715795159339905, -0.24441267549991608, -0.2316673845052719, -0.21892210841178894, -0.20617681741714478, -0.1934315264225006, -0.18068625032901764, -0.16794095933437347, -0.1551956683397293, -0.14245039224624634, -0.12970510125160217, -0.1169598251581192, -0.10421453416347504, -0.09146925061941147, -0.0787239670753479, -0.06597868353128433, -0.053233399987220764, -0.040488116443157196, -0.02774282917380333, -0.014997545629739761, -0.0022522583603858948, 0.010493025183677673, 0.02323830872774124, 0.03598359227180481, 0.04872887581586838, 0.061474159359931946, 0.07421945035457611, 0.08696472644805908, 0.09971001744270325, 0.11245530098676682, 0.12520058453083038, 0.13794586062431335, 0.15069115161895752, 0.1634364277124405, 0.17618171870708466, 0.18892699480056763, 0.2016722857952118, 0.21441757678985596, 0.22716285288333893, 0.2399081438779831, 0.25265341997146606, 0.26539871096611023, 0.2781440019607544, 0.29088929295539856, 0.3036345839500427, 0.3163798451423645, 0.32912513613700867, 0.34187042713165283, 0.354615718126297, 0.36736100912094116, 0.38010627031326294, 0.3928515613079071, 0.40559685230255127, 0.41834214329719543, 0.4310874342918396, 0.4438326954841614]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 9.0, 8.0, 10.0, 24.0, 61.0, 128.0, 413.0, 1799.0, 4166144.0, 24526.0, 759.0, 213.0, 93.0, 32.0, 22.0, 10.0, 2.0, 5.0, 1.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.53955078125, -0.5272350311279297, -0.5149192810058594, -0.5026035308837891, -0.49028778076171875, -0.47797203063964844, -0.4656562805175781, -0.4533405303955078, -0.4410247802734375, -0.4287090301513672, -0.4163932800292969, -0.40407752990722656, -0.39176177978515625, -0.37944602966308594, -0.3671302795410156, -0.3548145294189453, -0.342498779296875, -0.3301830291748047, -0.3178672790527344, -0.30555152893066406, -0.29323577880859375, -0.28092002868652344, -0.2686042785644531, -0.2562885284423828, -0.2439727783203125, -0.2316570281982422, -0.21934127807617188, -0.20702552795410156, -0.19470977783203125, -0.18239402770996094, -0.17007827758789062, -0.1577625274658203, -0.14544677734375, -0.1331310272216797, -0.12081527709960938, -0.10849952697753906, -0.09618377685546875, -0.08386802673339844, -0.07155227661132812, -0.05923652648925781, -0.0469207763671875, -0.03460502624511719, -0.022289276123046875, -0.009973526000976562, 0.00234222412109375, 0.014657974243164062, 0.026973724365234375, 0.03928947448730469, 0.051605224609375, 0.06392097473144531, 0.07623672485351562, 0.08855247497558594, 0.10086822509765625, 0.11318397521972656, 0.12549972534179688, 0.1378154754638672, 0.1501312255859375, 0.1624469757080078, 0.17476272583007812, 0.18707847595214844, 0.19939422607421875, 0.21170997619628906, 0.22402572631835938, 0.2363414764404297, 0.2486572265625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 4.0, 8.0, 18.0, 49.0, 115.0, 180.0, 231.0, 176.0, 111.0, 59.0, 26.0, 14.0, 6.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.067138671875, -0.0655980110168457, -0.0640573501586914, -0.06251668930053711, -0.06097602844238281, -0.059435367584228516, -0.05789470672607422, -0.05635404586791992, -0.054813385009765625, -0.05327272415161133, -0.05173206329345703, -0.050191402435302734, -0.04865074157714844, -0.04711008071899414, -0.045569419860839844, -0.04402875900268555, -0.04248809814453125, -0.04094743728637695, -0.039406776428222656, -0.03786611557006836, -0.03632545471191406, -0.034784793853759766, -0.03324413299560547, -0.03170347213745117, -0.030162811279296875, -0.028622150421142578, -0.02708148956298828, -0.025540828704833984, -0.024000167846679688, -0.02245950698852539, -0.020918846130371094, -0.019378185272216797, -0.0178375244140625, -0.016296863555908203, -0.014756202697753906, -0.01321554183959961, -0.011674880981445312, -0.010134220123291016, -0.008593559265136719, -0.007052898406982422, -0.005512237548828125, -0.003971576690673828, -0.0024309158325195312, -0.0008902549743652344, 0.0006504058837890625, 0.0021910667419433594, 0.0037317276000976562, 0.005272388458251953, 0.00681304931640625, 0.008353710174560547, 0.009894371032714844, 0.01143503189086914, 0.012975692749023438, 0.014516353607177734, 0.01605701446533203, 0.017597675323486328, 0.019138336181640625, 0.020678997039794922, 0.02221965789794922, 0.023760318756103516, 0.025300979614257812, 0.02684164047241211, 0.028382301330566406, 0.029922962188720703, 0.031463623046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 2.0, 4.0, 7.0, 21.0, 27.0, 32.0, 69.0, 116.0, 244.0, 531.0, 1612.0, 7181.0, 86197.0, 4050819.0, 39730.0, 5412.0, 1342.0, 538.0, 207.0, 83.0, 48.0, 23.0, 21.0, 13.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08416748046875, -0.08120155334472656, -0.07823562622070312, -0.07526969909667969, -0.07230377197265625, -0.06933784484863281, -0.06637191772460938, -0.06340599060058594, -0.0604400634765625, -0.05747413635253906, -0.054508209228515625, -0.05154228210449219, -0.04857635498046875, -0.04561042785644531, -0.042644500732421875, -0.03967857360839844, -0.036712646484375, -0.03374671936035156, -0.030780792236328125, -0.027814865112304688, -0.02484893798828125, -0.021883010864257812, -0.018917083740234375, -0.015951156616210938, -0.0129852294921875, -0.010019302368164062, -0.007053375244140625, -0.0040874481201171875, -0.00112152099609375, 0.0018444061279296875, 0.004810333251953125, 0.0077762603759765625, 0.0107421875, 0.013708114624023438, 0.016674041748046875, 0.019639968872070312, 0.02260589599609375, 0.025571823120117188, 0.028537750244140625, 0.03150367736816406, 0.0344696044921875, 0.03743553161621094, 0.040401458740234375, 0.04336738586425781, 0.04633331298828125, 0.04929924011230469, 0.052265167236328125, 0.05523109436035156, 0.058197021484375, 0.06116294860839844, 0.06412887573242188, 0.06709480285644531, 0.07006072998046875, 0.07302665710449219, 0.07599258422851562, 0.07895851135253906, 0.0819244384765625, 0.08489036560058594, 0.08785629272460938, 0.09082221984863281, 0.09378814697265625, 0.09675407409667969, 0.09972000122070312, 0.10268592834472656, 0.10565185546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 12.0, 18.0, 28.0, 69.0, 193.0, 1041.0, 2338.0, 184.0, 83.0, 23.0, 21.0, 14.0, 14.0, 10.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034271240234375, -0.03326582908630371, -0.03226041793823242, -0.03125500679016113, -0.030249595642089844, -0.029244184494018555, -0.028238773345947266, -0.027233362197875977, -0.026227951049804688, -0.0252225399017334, -0.02421712875366211, -0.02321171760559082, -0.02220630645751953, -0.021200895309448242, -0.020195484161376953, -0.019190073013305664, -0.018184661865234375, -0.017179250717163086, -0.016173839569091797, -0.015168428421020508, -0.014163017272949219, -0.01315760612487793, -0.01215219497680664, -0.011146783828735352, -0.010141372680664062, -0.009135961532592773, -0.008130550384521484, -0.007125139236450195, -0.006119728088378906, -0.005114316940307617, -0.004108905792236328, -0.003103494644165039, -0.00209808349609375, -0.001092672348022461, -8.726119995117188e-05, 0.0009181499481201172, 0.0019235610961914062, 0.0029289722442626953, 0.003934383392333984, 0.0049397945404052734, 0.0059452056884765625, 0.0069506168365478516, 0.00795602798461914, 0.00896143913269043, 0.009966850280761719, 0.010972261428833008, 0.011977672576904297, 0.012983083724975586, 0.013988494873046875, 0.014993906021118164, 0.015999317169189453, 0.017004728317260742, 0.01801013946533203, 0.01901555061340332, 0.02002096176147461, 0.0210263729095459, 0.022031784057617188, 0.023037195205688477, 0.024042606353759766, 0.025048017501831055, 0.026053428649902344, 0.027058839797973633, 0.028064250946044922, 0.02906966209411621, 0.0300750732421875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 20.0, 126.0, 573.0, 246.0, 38.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.46880942583084106, -0.45833492279052734, -0.44786038994789124, -0.4373858869075775, -0.4269113540649414, -0.4164368510246277, -0.40596234798431396, -0.39548784494400024, -0.38501331210136414, -0.3745388090610504, -0.3640642762184143, -0.3535897731781006, -0.34311527013778687, -0.33264073729515076, -0.32216623425483704, -0.3116917014122009, -0.3012171983718872, -0.2907426953315735, -0.2802681624889374, -0.26979365944862366, -0.25931912660598755, -0.24884462356567383, -0.2383701205253601, -0.2278956025838852, -0.21742108464241028, -0.20694656670093536, -0.19647204875946045, -0.18599754571914673, -0.17552302777767181, -0.1650485098361969, -0.15457400679588318, -0.14409948885440826, -0.13362495601177216, -0.12315043807029724, -0.11267592757940292, -0.1022014170885086, -0.09172689914703369, -0.08125238120555878, -0.07077787071466446, -0.06030336022377014, -0.04982884228229523, -0.03935432806611061, -0.028879813849925995, -0.01840529963374138, -0.007930785417556763, 0.0025437287986278534, 0.01301824301481247, 0.023492753505706787, 0.0339672714471817, 0.04444178566336632, 0.054916299879550934, 0.06539081037044525, 0.07586532831192017, 0.08633984625339508, 0.0968143567442894, 0.10728886723518372, 0.11776338517665863, 0.12823790311813354, 0.13871240615844727, 0.14918692409992218, 0.1596614420413971, 0.170135959982872, 0.18061047792434692, 0.19108498096466064, 0.20155949890613556]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 6.0, 5.0, 7.0, 22.0, 25.0, 33.0, 47.0, 55.0, 70.0, 68.0, 76.0, 63.0, 80.0, 80.0, 77.0, 74.0, 57.0, 40.0, 35.0, 28.0, 16.0, 13.0, 13.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.13694745302200317, -0.13360752165317535, -0.13026759028434753, -0.12692765891551971, -0.1235877275466919, -0.12024779617786407, -0.11690786480903625, -0.11356793344020844, -0.11022800207138062, -0.1068880707025528, -0.10354813933372498, -0.10020820796489716, -0.09686827659606934, -0.09352834522724152, -0.0901884138584137, -0.08684848248958588, -0.08350855112075806, -0.08016861975193024, -0.07682868838310242, -0.0734887570142746, -0.07014882564544678, -0.06680889427661896, -0.06346896290779114, -0.06012903153896332, -0.0567891001701355, -0.05344916880130768, -0.05010923743247986, -0.04676930606365204, -0.04342937469482422, -0.0400894433259964, -0.03674951195716858, -0.03340958058834076, -0.03006964921951294, -0.02672971785068512, -0.0233897864818573, -0.02004985511302948, -0.01670992374420166, -0.01336999237537384, -0.01003006100654602, -0.006690129637718201, -0.003350198268890381, -1.0266900062561035e-05, 0.003329664468765259, 0.006669595837593079, 0.010009527206420898, 0.013349458575248718, 0.016689389944076538, 0.020029321312904358, 0.023369252681732178, 0.026709184050559998, 0.030049115419387817, 0.03338904678821564, 0.03672897815704346, 0.04006890952587128, 0.0434088408946991, 0.046748772263526917, 0.050088703632354736, 0.053428635001182556, 0.056768566370010376, 0.060108497738838196, 0.06344842910766602, 0.06678836047649384, 0.07012829184532166, 0.07346822321414948, 0.0768081545829773]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 10.0, 10.0, 10.0, 22.0, 30.0, 38.0, 34.0, 76.0, 113.0, 221.0, 334.0, 716.0, 1537.0, 4216.0, 25085.0, 743343.0, 254455.0, 12849.0, 2909.0, 1179.0, 571.0, 295.0, 162.0, 93.0, 70.0, 45.0, 39.0, 17.0, 14.0, 12.0, 11.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.181396484375, -0.17551612854003906, -0.16963577270507812, -0.1637554168701172, -0.15787506103515625, -0.1519947052001953, -0.14611434936523438, -0.14023399353027344, -0.1343536376953125, -0.12847328186035156, -0.12259292602539062, -0.11671257019042969, -0.11083221435546875, -0.10495185852050781, -0.09907150268554688, -0.09319114685058594, -0.087310791015625, -0.08143043518066406, -0.07555007934570312, -0.06966972351074219, -0.06378936767578125, -0.05790901184082031, -0.052028656005859375, -0.04614830017089844, -0.0402679443359375, -0.03438758850097656, -0.028507232666015625, -0.022626876831054688, -0.01674652099609375, -0.010866165161132812, -0.004985809326171875, 0.0008945465087890625, 0.00677490234375, 0.012655258178710938, 0.018535614013671875, 0.024415969848632812, 0.03029632568359375, 0.03617668151855469, 0.042057037353515625, 0.04793739318847656, 0.0538177490234375, 0.05969810485839844, 0.06557846069335938, 0.07145881652832031, 0.07733917236328125, 0.08321952819824219, 0.08909988403320312, 0.09498023986816406, 0.100860595703125, 0.10674095153808594, 0.11262130737304688, 0.11850166320800781, 0.12438201904296875, 0.1302623748779297, 0.13614273071289062, 0.14202308654785156, 0.1479034423828125, 0.15378379821777344, 0.15966415405273438, 0.1655445098876953, 0.17142486572265625, 0.1773052215576172, 0.18318557739257812, 0.18906593322753906, 0.1949462890625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 11.0, 20.0, 32.0, 107.0, 162.0, 230.0, 192.0, 117.0, 70.0, 32.0, 11.0, 8.0, 5.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06585693359375, -0.06435227394104004, -0.06284761428833008, -0.06134295463562012, -0.059838294982910156, -0.058333635330200195, -0.056828975677490234, -0.05532431602478027, -0.05381965637207031, -0.05231499671936035, -0.05081033706665039, -0.04930567741394043, -0.04780101776123047, -0.04629635810852051, -0.04479169845581055, -0.043287038803100586, -0.041782379150390625, -0.040277719497680664, -0.0387730598449707, -0.03726840019226074, -0.03576374053955078, -0.03425908088684082, -0.03275442123413086, -0.0312497615814209, -0.029745101928710938, -0.028240442276000977, -0.026735782623291016, -0.025231122970581055, -0.023726463317871094, -0.022221803665161133, -0.020717144012451172, -0.01921248435974121, -0.01770782470703125, -0.01620316505432129, -0.014698505401611328, -0.013193845748901367, -0.011689186096191406, -0.010184526443481445, -0.008679866790771484, -0.0071752071380615234, -0.0056705474853515625, -0.0041658878326416016, -0.0026612281799316406, -0.0011565685272216797, 0.00034809112548828125, 0.0018527507781982422, 0.003357410430908203, 0.004862070083618164, 0.006366729736328125, 0.007871389389038086, 0.009376049041748047, 0.010880708694458008, 0.012385368347167969, 0.01389002799987793, 0.01539468765258789, 0.01689934730529785, 0.018404006958007812, 0.019908666610717773, 0.021413326263427734, 0.022917985916137695, 0.024422645568847656, 0.025927305221557617, 0.027431964874267578, 0.02893662452697754, 0.0304412841796875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 3.0, 8.0, 7.0, 10.0, 14.0, 9.0, 13.0, 17.0, 23.0, 34.0, 42.0, 61.0, 84.0, 174.0, 354.0, 729.0, 2010.0, 6977.0, 33028.0, 256805.0, 645553.0, 82118.0, 14502.0, 3653.0, 1210.0, 495.0, 195.0, 131.0, 68.0, 54.0, 48.0, 27.0, 24.0, 24.0, 15.0, 9.0, 7.0, 5.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1019287109375, -0.0989522933959961, -0.09597587585449219, -0.09299945831298828, -0.09002304077148438, -0.08704662322998047, -0.08407020568847656, -0.08109378814697266, -0.07811737060546875, -0.07514095306396484, -0.07216453552246094, -0.06918811798095703, -0.06621170043945312, -0.06323528289794922, -0.06025886535644531, -0.057282447814941406, -0.0543060302734375, -0.051329612731933594, -0.04835319519042969, -0.04537677764892578, -0.042400360107421875, -0.03942394256591797, -0.03644752502441406, -0.033471107482910156, -0.03049468994140625, -0.027518272399902344, -0.024541854858398438, -0.02156543731689453, -0.018589019775390625, -0.015612602233886719, -0.012636184692382812, -0.009659767150878906, -0.006683349609375, -0.0037069320678710938, -0.0007305145263671875, 0.0022459030151367188, 0.005222320556640625, 0.008198738098144531, 0.011175155639648438, 0.014151573181152344, 0.01712799072265625, 0.020104408264160156, 0.023080825805664062, 0.02605724334716797, 0.029033660888671875, 0.03201007843017578, 0.03498649597167969, 0.037962913513183594, 0.0409393310546875, 0.043915748596191406, 0.04689216613769531, 0.04986858367919922, 0.052845001220703125, 0.05582141876220703, 0.05879783630371094, 0.061774253845214844, 0.06475067138671875, 0.06772708892822266, 0.07070350646972656, 0.07367992401123047, 0.07665634155273438, 0.07963275909423828, 0.08260917663574219, 0.0855855941772461, 0.08856201171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 8.0, 10.0, 14.0, 13.0, 20.0, 29.0, 31.0, 37.0, 28.0, 26.0, 26.0, 39.0, 37.0, 50.0, 46.0, 42.0, 49.0, 49.0, 48.0, 44.0, 45.0, 42.0, 31.0, 27.0, 25.0, 28.0, 29.0, 20.0, 15.0, 13.0, 17.0, 11.0, 10.0, 10.0, 4.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059326171875, -0.057312965393066406, -0.05529975891113281, -0.05328655242919922, -0.051273345947265625, -0.04926013946533203, -0.04724693298339844, -0.045233726501464844, -0.04322052001953125, -0.041207313537597656, -0.03919410705566406, -0.03718090057373047, -0.035167694091796875, -0.03315448760986328, -0.031141281127929688, -0.029128074645996094, -0.0271148681640625, -0.025101661682128906, -0.023088455200195312, -0.02107524871826172, -0.019062042236328125, -0.01704883575439453, -0.015035629272460938, -0.013022422790527344, -0.01100921630859375, -0.008996009826660156, -0.0069828033447265625, -0.004969596862792969, -0.002956390380859375, -0.0009431838989257812, 0.0010700225830078125, 0.0030832290649414062, 0.005096435546875, 0.007109642028808594, 0.009122848510742188, 0.011136054992675781, 0.013149261474609375, 0.015162467956542969, 0.017175674438476562, 0.019188880920410156, 0.02120208740234375, 0.023215293884277344, 0.025228500366210938, 0.02724170684814453, 0.029254913330078125, 0.03126811981201172, 0.03328132629394531, 0.035294532775878906, 0.0373077392578125, 0.039320945739746094, 0.04133415222167969, 0.04334735870361328, 0.045360565185546875, 0.04737377166748047, 0.04938697814941406, 0.051400184631347656, 0.05341339111328125, 0.055426597595214844, 0.05743980407714844, 0.05945301055908203, 0.061466217041015625, 0.06347942352294922, 0.06549263000488281, 0.0675058364868164, 0.06951904296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 6.0, 17.0, 21.0, 31.0, 44.0, 49.0, 93.0, 142.0, 277.0, 491.0, 919.0, 1950.0, 4811.0, 14739.0, 62551.0, 349190.0, 481840.0, 99182.0, 20864.0, 6377.0, 2378.0, 1140.0, 597.0, 295.0, 190.0, 104.0, 82.0, 50.0, 30.0, 27.0, 15.0, 8.0, 6.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.016845703125, -0.016366243362426758, -0.015886783599853516, -0.015407323837280273, -0.014927864074707031, -0.014448404312133789, -0.013968944549560547, -0.013489484786987305, -0.013010025024414062, -0.01253056526184082, -0.012051105499267578, -0.011571645736694336, -0.011092185974121094, -0.010612726211547852, -0.01013326644897461, -0.009653806686401367, -0.009174346923828125, -0.008694887161254883, -0.00821542739868164, -0.0077359676361083984, -0.007256507873535156, -0.006777048110961914, -0.006297588348388672, -0.00581812858581543, -0.0053386688232421875, -0.004859209060668945, -0.004379749298095703, -0.003900289535522461, -0.0034208297729492188, -0.0029413700103759766, -0.0024619102478027344, -0.001982450485229492, -0.00150299072265625, -0.0010235309600830078, -0.0005440711975097656, -6.461143493652344e-05, 0.00041484832763671875, 0.0008943080902099609, 0.0013737678527832031, 0.0018532276153564453, 0.0023326873779296875, 0.0028121471405029297, 0.003291606903076172, 0.003771066665649414, 0.004250526428222656, 0.0047299861907958984, 0.005209445953369141, 0.005688905715942383, 0.006168365478515625, 0.006647825241088867, 0.007127285003662109, 0.0076067447662353516, 0.008086204528808594, 0.008565664291381836, 0.009045124053955078, 0.00952458381652832, 0.010004043579101562, 0.010483503341674805, 0.010962963104248047, 0.011442422866821289, 0.011921882629394531, 0.012401342391967773, 0.012880802154541016, 0.013360261917114258, 0.0138397216796875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 1.0, 11.0, 9.0, 12.0, 16.0, 6.0, 20.0, 24.0, 27.0, 30.0, 41.0, 42.0, 61.0, 74.0, 77.0, 105.0, 87.0, 62.0, 59.0, 56.0, 32.0, 27.0, 20.0, 15.0, 15.0, 13.0, 9.0, 4.0, 4.0, 7.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2755393981933594e-05, -1.2396834790706635e-05, -1.2038275599479675e-05, -1.1679716408252716e-05, -1.1321157217025757e-05, -1.0962598025798798e-05, -1.0604038834571838e-05, -1.0245479643344879e-05, -9.88692045211792e-06, -9.52836126089096e-06, -9.169802069664001e-06, -8.811242878437042e-06, -8.452683687210083e-06, -8.094124495983124e-06, -7.735565304756165e-06, -7.377006113529205e-06, -7.018446922302246e-06, -6.659887731075287e-06, -6.301328539848328e-06, -5.942769348621368e-06, -5.584210157394409e-06, -5.22565096616745e-06, -4.867091774940491e-06, -4.5085325837135315e-06, -4.149973392486572e-06, -3.791414201259613e-06, -3.432855010032654e-06, -3.0742958188056946e-06, -2.7157366275787354e-06, -2.357177436351776e-06, -1.998618245124817e-06, -1.6400590538978577e-06, -1.2814998626708984e-06, -9.229406714439392e-07, -5.6438148021698e-07, -2.0582228899002075e-07, 1.5273690223693848e-07, 5.112960934638977e-07, 8.698552846908569e-07, 1.2284144759178162e-06, 1.5869736671447754e-06, 1.9455328583717346e-06, 2.304092049598694e-06, 2.662651240825653e-06, 3.0212104320526123e-06, 3.3797696232795715e-06, 3.7383288145065308e-06, 4.09688800573349e-06, 4.455447196960449e-06, 4.8140063881874084e-06, 5.172565579414368e-06, 5.531124770641327e-06, 5.889683961868286e-06, 6.248243153095245e-06, 6.606802344322205e-06, 6.965361535549164e-06, 7.323920726776123e-06, 7.682479918003082e-06, 8.041039109230042e-06, 8.399598300457e-06, 8.75815749168396e-06, 9.11671668291092e-06, 9.475275874137878e-06, 9.833835065364838e-06, 1.0192394256591797e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 4.0, 7.0, 6.0, 6.0, 13.0, 21.0, 30.0, 22.0, 57.0, 108.0, 150.0, 359.0, 922.0, 3107.0, 16013.0, 151147.0, 734291.0, 123969.0, 13771.0, 2929.0, 847.0, 331.0, 151.0, 92.0, 65.0, 34.0, 28.0, 17.0, 13.0, 9.0, 13.0, 3.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0248565673828125, -0.024155616760253906, -0.023454666137695312, -0.02275371551513672, -0.022052764892578125, -0.02135181427001953, -0.020650863647460938, -0.019949913024902344, -0.01924896240234375, -0.018548011779785156, -0.017847061157226562, -0.01714611053466797, -0.016445159912109375, -0.01574420928955078, -0.015043258666992188, -0.014342308044433594, -0.013641357421875, -0.012940406799316406, -0.012239456176757812, -0.011538505554199219, -0.010837554931640625, -0.010136604309082031, -0.009435653686523438, -0.008734703063964844, -0.00803375244140625, -0.007332801818847656, -0.0066318511962890625, -0.005930900573730469, -0.005229949951171875, -0.004528999328613281, -0.0038280487060546875, -0.0031270980834960938, -0.0024261474609375, -0.0017251968383789062, -0.0010242462158203125, -0.00032329559326171875, 0.000377655029296875, 0.0010786056518554688, 0.0017795562744140625, 0.0024805068969726562, 0.00318145751953125, 0.0038824081420898438, 0.0045833587646484375, 0.005284309387207031, 0.005985260009765625, 0.006686210632324219, 0.0073871612548828125, 0.008088111877441406, 0.0087890625, 0.009490013122558594, 0.010190963745117188, 0.010891914367675781, 0.011592864990234375, 0.012293815612792969, 0.012994766235351562, 0.013695716857910156, 0.01439666748046875, 0.015097618103027344, 0.015798568725585938, 0.01649951934814453, 0.017200469970703125, 0.01790142059326172, 0.018602371215820312, 0.019303321838378906, 0.0200042724609375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 9.0, 14.0, 18.0, 17.0, 14.0, 25.0, 35.0, 41.0, 34.0, 53.0, 74.0, 69.0, 82.0, 68.0, 58.0, 61.0, 68.0, 42.0, 41.0, 26.0, 40.0, 28.0, 17.0, 9.0, 7.0, 6.0, 10.0, 5.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0128173828125, -0.012379169464111328, -0.011940956115722656, -0.011502742767333984, -0.011064529418945312, -0.01062631607055664, -0.010188102722167969, -0.009749889373779297, -0.009311676025390625, -0.008873462677001953, -0.008435249328613281, -0.00799703598022461, -0.0075588226318359375, -0.007120609283447266, -0.006682395935058594, -0.006244182586669922, -0.00580596923828125, -0.005367755889892578, -0.004929542541503906, -0.004491329193115234, -0.0040531158447265625, -0.0036149024963378906, -0.0031766891479492188, -0.002738475799560547, -0.002300262451171875, -0.0018620491027832031, -0.0014238357543945312, -0.0009856224060058594, -0.0005474090576171875, -0.00010919570922851562, 0.00032901763916015625, 0.0007672309875488281, 0.0012054443359375, 0.0016436576843261719, 0.0020818710327148438, 0.0025200843811035156, 0.0029582977294921875, 0.0033965110778808594, 0.0038347244262695312, 0.004272937774658203, 0.004711151123046875, 0.005149364471435547, 0.005587577819824219, 0.006025791168212891, 0.0064640045166015625, 0.006902217864990234, 0.007340431213378906, 0.007778644561767578, 0.00821685791015625, 0.008655071258544922, 0.009093284606933594, 0.009531497955322266, 0.009969711303710938, 0.01040792465209961, 0.010846138000488281, 0.011284351348876953, 0.011722564697265625, 0.012160778045654297, 0.012598991394042969, 0.01303720474243164, 0.013475418090820312, 0.013913631439208984, 0.014351844787597656, 0.014790058135986328, 0.015228271484375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 14.0, 66.0, 223.0, 515.0, 146.0, 28.0, 6.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7088868618011475, -1.669607162475586, -1.6303274631500244, -1.591047763824463, -1.551768183708191, -1.5124884843826294, -1.4732087850570679, -1.4339290857315063, -1.3946493864059448, -1.3553696870803833, -1.3160899877548218, -1.2768104076385498, -1.2375307083129883, -1.1982510089874268, -1.1589713096618652, -1.1196916103363037, -1.0804119110107422, -1.0411322116851807, -1.0018525123596191, -0.9625728726387024, -0.9232931733131409, -0.8840135335922241, -0.8447338342666626, -0.8054541349411011, -0.7661745548248291, -0.7268948554992676, -0.6876152157783508, -0.6483355164527893, -0.6090558171272278, -0.569776177406311, -0.5304964780807495, -0.491216778755188, -0.45193707942962646, -0.41265740990638733, -0.3733777105808258, -0.33409804105758667, -0.29481834173202515, -0.255538672208786, -0.21625900268554688, -0.17697930335998535, -0.13769963383674622, -0.09841994941234589, -0.059140272438526154, -0.01986059546470642, 0.01941908895969391, 0.05869877338409424, 0.09797844290733337, 0.1372581422328949, 0.17653781175613403, 0.21581749618053436, 0.2550971806049347, 0.29437685012817383, 0.33365654945373535, 0.3729362189769745, 0.4122158885002136, 0.45149558782577515, 0.4907752573490143, 0.5300549268722534, 0.5693346261978149, 0.6086143255233765, 0.6478939652442932, 0.6871736645698547, 0.7264533042907715, 0.765733003616333, 0.8050127029418945]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 3.0, 5.0, 8.0, 7.0, 7.0, 15.0, 12.0, 9.0, 21.0, 19.0, 25.0, 26.0, 30.0, 18.0, 40.0, 25.0, 41.0, 41.0, 35.0, 31.0, 32.0, 34.0, 49.0, 35.0, 47.0, 40.0, 34.0, 35.0, 31.0, 33.0, 34.0, 27.0, 23.0, 16.0, 19.0, 18.0, 15.0, 9.0, 2.0, 11.0, 5.0, 6.0, 3.0, 4.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.3317323327064514, -0.3220420777797699, -0.312351793050766, -0.3026615381240845, -0.29297128319740295, -0.28328102827072144, -0.27359074354171753, -0.263900488615036, -0.2542102336883545, -0.24451996386051178, -0.23482970893383026, -0.22513943910598755, -0.21544918417930603, -0.20575891435146332, -0.1960686445236206, -0.1863783895969391, -0.17668811976909637, -0.16699784994125366, -0.15730759501457214, -0.14761732518672943, -0.1379270702600479, -0.1282368004322052, -0.11854653805494308, -0.10885627567768097, -0.09916601330041885, -0.08947575092315674, -0.07978548854589462, -0.07009522616863251, -0.06040496006608009, -0.05071469768881798, -0.041024431586265564, -0.03133416920900345, -0.021643906831741333, -0.011953643523156643, -0.002263380214571953, 0.007426884025335312, 0.017117146402597427, 0.026807408779859543, 0.03649767488241196, 0.04618793725967407, 0.05587819963693619, 0.0655684620141983, 0.07525872439146042, 0.08494898676872253, 0.09463925659656525, 0.10432951152324677, 0.11401978135108948, 0.12371004372835159, 0.1334003061056137, 0.14309057593345642, 0.15278083086013794, 0.16247110068798065, 0.17216135561466217, 0.18185162544250488, 0.1915418803691864, 0.2012321501970291, 0.21092242002487183, 0.22061268985271454, 0.23030294477939606, 0.23999321460723877, 0.2496834695339203, 0.2593737244606018, 0.2690640091896057, 0.27875426411628723, 0.28844451904296875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 0.0, 1.0, 10.0, 5.0, 17.0, 18.0, 33.0, 73.0, 110.0, 234.0, 677.0, 3167.0, 100868.0, 4081788.0, 5833.0, 931.0, 270.0, 112.0, 47.0, 37.0, 18.0, 11.0, 5.0, 5.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.408447265625, -0.3989830017089844, -0.38951873779296875, -0.3800544738769531, -0.3705902099609375, -0.3611259460449219, -0.35166168212890625, -0.3421974182128906, -0.332733154296875, -0.3232688903808594, -0.31380462646484375, -0.3043403625488281, -0.2948760986328125, -0.2854118347167969, -0.27594757080078125, -0.2664833068847656, -0.25701904296875, -0.24755477905273438, -0.23809051513671875, -0.22862625122070312, -0.2191619873046875, -0.20969772338867188, -0.20023345947265625, -0.19076919555664062, -0.181304931640625, -0.17184066772460938, -0.16237640380859375, -0.15291213989257812, -0.1434478759765625, -0.13398361206054688, -0.12451934814453125, -0.11505508422851562, -0.1055908203125, -0.09612655639648438, -0.08666229248046875, -0.07719802856445312, -0.0677337646484375, -0.058269500732421875, -0.04880523681640625, -0.039340972900390625, -0.029876708984375, -0.020412445068359375, -0.01094818115234375, -0.001483917236328125, 0.0079803466796875, 0.017444610595703125, 0.02690887451171875, 0.036373138427734375, 0.04583740234375, 0.055301666259765625, 0.06476593017578125, 0.07423019409179688, 0.0836944580078125, 0.09315872192382812, 0.10262298583984375, 0.11208724975585938, 0.121551513671875, 0.13101577758789062, 0.14048004150390625, 0.14994430541992188, 0.1594085693359375, 0.16887283325195312, 0.17833709716796875, 0.18780136108398438, 0.197265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 0.0, 1.0, 4.0, 11.0, 25.0, 56.0, 104.0, 151.0, 190.0, 175.0, 126.0, 82.0, 40.0, 18.0, 12.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06890869140625, -0.06733465194702148, -0.06576061248779297, -0.06418657302856445, -0.06261253356933594, -0.06103849411010742, -0.059464454650878906, -0.05789041519165039, -0.056316375732421875, -0.05474233627319336, -0.053168296813964844, -0.05159425735473633, -0.05002021789550781, -0.0484461784362793, -0.04687213897705078, -0.045298099517822266, -0.04372406005859375, -0.042150020599365234, -0.04057598114013672, -0.0390019416809082, -0.03742790222167969, -0.03585386276245117, -0.034279823303222656, -0.03270578384399414, -0.031131744384765625, -0.02955770492553711, -0.027983665466308594, -0.026409626007080078, -0.024835586547851562, -0.023261547088623047, -0.02168750762939453, -0.020113468170166016, -0.0185394287109375, -0.016965389251708984, -0.015391349792480469, -0.013817310333251953, -0.012243270874023438, -0.010669231414794922, -0.009095191955566406, -0.007521152496337891, -0.005947113037109375, -0.004373073577880859, -0.0027990341186523438, -0.0012249946594238281, 0.0003490447998046875, 0.0019230842590332031, 0.0034971237182617188, 0.005071163177490234, 0.00664520263671875, 0.008219242095947266, 0.009793281555175781, 0.011367321014404297, 0.012941360473632812, 0.014515399932861328, 0.016089439392089844, 0.01766347885131836, 0.019237518310546875, 0.02081155776977539, 0.022385597229003906, 0.023959636688232422, 0.025533676147460938, 0.027107715606689453, 0.02868175506591797, 0.030255794525146484, 0.031829833984375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 9.0, 10.0, 14.0, 20.0, 35.0, 55.0, 99.0, 227.0, 465.0, 946.0, 2758.0, 10615.0, 109099.0, 3992752.0, 63766.0, 8789.0, 2515.0, 1014.0, 491.0, 294.0, 139.0, 79.0, 34.0, 21.0, 13.0, 9.0, 1.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12286376953125, -0.11958026885986328, -0.11629676818847656, -0.11301326751708984, -0.10972976684570312, -0.1064462661743164, -0.10316276550292969, -0.09987926483154297, -0.09659576416015625, -0.09331226348876953, -0.09002876281738281, -0.0867452621459961, -0.08346176147460938, -0.08017826080322266, -0.07689476013183594, -0.07361125946044922, -0.0703277587890625, -0.06704425811767578, -0.06376075744628906, -0.060477256774902344, -0.057193756103515625, -0.053910255432128906, -0.05062675476074219, -0.04734325408935547, -0.04405975341796875, -0.04077625274658203, -0.03749275207519531, -0.034209251403808594, -0.030925750732421875, -0.027642250061035156, -0.024358749389648438, -0.02107524871826172, -0.017791748046875, -0.014508247375488281, -0.011224746704101562, -0.007941246032714844, -0.004657745361328125, -0.0013742446899414062, 0.0019092559814453125, 0.005192756652832031, 0.00847625732421875, 0.011759757995605469, 0.015043258666992188, 0.018326759338378906, 0.021610260009765625, 0.024893760681152344, 0.028177261352539062, 0.03146076202392578, 0.0347442626953125, 0.03802776336669922, 0.04131126403808594, 0.044594764709472656, 0.047878265380859375, 0.051161766052246094, 0.05444526672363281, 0.05772876739501953, 0.06101226806640625, 0.06429576873779297, 0.06757926940917969, 0.0708627700805664, 0.07414627075195312, 0.07742977142333984, 0.08071327209472656, 0.08399677276611328, 0.0872802734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 4.0, 6.0, 8.0, 10.0, 26.0, 32.0, 50.0, 112.0, 293.0, 1947.0, 1159.0, 215.0, 75.0, 37.0, 29.0, 16.0, 18.0, 10.0, 6.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0298309326171875, -0.028531312942504883, -0.027231693267822266, -0.02593207359313965, -0.02463245391845703, -0.023332834243774414, -0.022033214569091797, -0.02073359489440918, -0.019433975219726562, -0.018134355545043945, -0.016834735870361328, -0.015535116195678711, -0.014235496520996094, -0.012935876846313477, -0.01163625717163086, -0.010336637496948242, -0.009037017822265625, -0.007737398147583008, -0.006437778472900391, -0.0051381587982177734, -0.0038385391235351562, -0.002538919448852539, -0.0012392997741699219, 6.031990051269531e-05, 0.0013599395751953125, 0.0026595592498779297, 0.003959178924560547, 0.005258798599243164, 0.006558418273925781, 0.007858037948608398, 0.009157657623291016, 0.010457277297973633, 0.01175689697265625, 0.013056516647338867, 0.014356136322021484, 0.0156557559967041, 0.01695537567138672, 0.018254995346069336, 0.019554615020751953, 0.02085423469543457, 0.022153854370117188, 0.023453474044799805, 0.024753093719482422, 0.02605271339416504, 0.027352333068847656, 0.028651952743530273, 0.02995157241821289, 0.03125119209289551, 0.032550811767578125, 0.03385043144226074, 0.03515005111694336, 0.03644967079162598, 0.037749290466308594, 0.03904891014099121, 0.04034852981567383, 0.041648149490356445, 0.04294776916503906, 0.04424738883972168, 0.0455470085144043, 0.046846628189086914, 0.04814624786376953, 0.04944586753845215, 0.050745487213134766, 0.05204510688781738, 0.0533447265625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 10.0, 13.0, 97.0, 387.0, 370.0, 88.0, 27.0, 11.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18876919150352478, -0.17548301815986633, -0.16219684481620789, -0.14891065657138824, -0.1356244832277298, -0.12233830988407135, -0.1090521290898323, -0.09576594829559326, -0.08247977495193481, -0.06919360160827637, -0.05590742081403732, -0.04262124374508858, -0.02933506667613983, -0.016048893332481384, -0.00276271253824234, 0.010523468255996704, 0.02380964159965515, 0.0370958186686039, 0.05038199573755264, 0.06366817653179169, 0.07695434987545013, 0.09024052321910858, 0.10352670401334763, 0.11681288480758667, 0.13009905815124512, 0.14338523149490356, 0.156671404838562, 0.16995759308338165, 0.1832437664270401, 0.19652993977069855, 0.2098161280155182, 0.22310230135917664, 0.2363884449005127, 0.24967461824417114, 0.2629607915878296, 0.27624696493148804, 0.2895331382751465, 0.30281931161880493, 0.31610551476478577, 0.3293916881084442, 0.34267786145210266, 0.3559640347957611, 0.36925020813941956, 0.382536381483078, 0.39582258462905884, 0.4091087579727173, 0.42239493131637573, 0.4356811046600342, 0.4489672780036926, 0.4622534513473511, 0.4755396246910095, 0.48882579803466797, 0.5021119713783264, 0.5153981447219849, 0.5286843180656433, 0.5419704914093018, 0.555256724357605, 0.5685428977012634, 0.5818290710449219, 0.5951152443885803, 0.6084014177322388, 0.6216875910758972, 0.6349737644195557, 0.6482599973678589, 0.6615461111068726]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 7.0, 16.0, 26.0, 36.0, 55.0, 55.0, 74.0, 97.0, 87.0, 91.0, 106.0, 88.0, 81.0, 60.0, 39.0, 28.0, 17.0, 15.0, 12.0, 6.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20231229066848755, -0.19489799439907074, -0.18748369812965393, -0.18006941676139832, -0.1726551204919815, -0.1652408242225647, -0.1578265279531479, -0.15041223168373108, -0.14299795031547546, -0.13558365404605865, -0.12816935777664185, -0.12075506895780563, -0.11334078013896942, -0.10592648386955261, -0.0985121876001358, -0.091097891330719, -0.08368359506130219, -0.07626929879188538, -0.06885500997304916, -0.061440713703632355, -0.054026421159505844, -0.046612128615379333, -0.039197832345962524, -0.031783539801836014, -0.024369247257709503, -0.016954954713582993, -0.009540660306811333, -0.002126365900039673, 0.005287926644086838, 0.012702219188213348, 0.020116515457630157, 0.027530808001756668, 0.03494510054588318, 0.04235939309000969, 0.0497736856341362, 0.05718798190355301, 0.06460227072238922, 0.07201656699180603, 0.07943086326122284, 0.08684515953063965, 0.09425944834947586, 0.10167374461889267, 0.10908803343772888, 0.11650232970714569, 0.1239166259765625, 0.13133090734481812, 0.13874521851539612, 0.14615949988365173, 0.15357379615306854, 0.16098809242248535, 0.16840238869190216, 0.17581668496131897, 0.18323096632957458, 0.1906452625989914, 0.1980595588684082, 0.205473855137825, 0.21288815140724182, 0.22030244767665863, 0.22771674394607544, 0.23513102531433105, 0.24254532158374786, 0.24995961785316467, 0.2573739290237427, 0.2647882103919983, 0.2722024917602539]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 12.0, 7.0, 5.0, 5.0, 22.0, 31.0, 57.0, 75.0, 153.0, 276.0, 597.0, 1450.0, 4474.0, 31672.0, 818987.0, 176222.0, 10335.0, 2443.0, 864.0, 348.0, 190.0, 108.0, 67.0, 49.0, 38.0, 20.0, 12.0, 9.0, 9.0, 6.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1978759765625, -0.1921825408935547, -0.18648910522460938, -0.18079566955566406, -0.17510223388671875, -0.16940879821777344, -0.16371536254882812, -0.1580219268798828, -0.1523284912109375, -0.1466350555419922, -0.14094161987304688, -0.13524818420410156, -0.12955474853515625, -0.12386131286621094, -0.11816787719726562, -0.11247444152832031, -0.106781005859375, -0.10108757019042969, -0.09539413452148438, -0.08970069885253906, -0.08400726318359375, -0.07831382751464844, -0.07262039184570312, -0.06692695617675781, -0.0612335205078125, -0.05554008483886719, -0.049846649169921875, -0.04415321350097656, -0.03845977783203125, -0.03276634216308594, -0.027072906494140625, -0.021379470825195312, -0.01568603515625, -0.009992599487304688, -0.004299163818359375, 0.0013942718505859375, 0.00708770751953125, 0.012781143188476562, 0.018474578857421875, 0.024168014526367188, 0.0298614501953125, 0.03555488586425781, 0.041248321533203125, 0.04694175720214844, 0.05263519287109375, 0.05832862854003906, 0.06402206420898438, 0.06971549987792969, 0.075408935546875, 0.08110237121582031, 0.08679580688476562, 0.09248924255371094, 0.09818267822265625, 0.10387611389160156, 0.10956954956054688, 0.11526298522949219, 0.1209564208984375, 0.1266498565673828, 0.13234329223632812, 0.13803672790527344, 0.14373016357421875, 0.14942359924316406, 0.15511703491210938, 0.1608104705810547, 0.16650390625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 1.0, 3.0, 12.0, 20.0, 48.0, 78.0, 126.0, 169.0, 180.0, 150.0, 96.0, 55.0, 36.0, 13.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06396484375, -0.062483787536621094, -0.06100273132324219, -0.05952167510986328, -0.058040618896484375, -0.05655956268310547, -0.05507850646972656, -0.053597450256347656, -0.05211639404296875, -0.050635337829589844, -0.04915428161621094, -0.04767322540283203, -0.046192169189453125, -0.04471111297607422, -0.04323005676269531, -0.041749000549316406, -0.0402679443359375, -0.038786888122558594, -0.03730583190917969, -0.03582477569580078, -0.034343719482421875, -0.03286266326904297, -0.03138160705566406, -0.029900550842285156, -0.02841949462890625, -0.026938438415527344, -0.025457382202148438, -0.02397632598876953, -0.022495269775390625, -0.02101421356201172, -0.019533157348632812, -0.018052101135253906, -0.016571044921875, -0.015089988708496094, -0.013608932495117188, -0.012127876281738281, -0.010646820068359375, -0.009165763854980469, -0.0076847076416015625, -0.006203651428222656, -0.00472259521484375, -0.0032415390014648438, -0.0017604827880859375, -0.00027942657470703125, 0.001201629638671875, 0.0026826858520507812, 0.0041637420654296875, 0.005644798278808594, 0.0071258544921875, 0.008606910705566406, 0.010087966918945312, 0.011569023132324219, 0.013050079345703125, 0.014531135559082031, 0.016012191772460938, 0.017493247985839844, 0.01897430419921875, 0.020455360412597656, 0.021936416625976562, 0.02341747283935547, 0.024898529052734375, 0.02637958526611328, 0.027860641479492188, 0.029341697692871094, 0.03082275390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 5.0, 9.0, 14.0, 22.0, 30.0, 53.0, 94.0, 119.0, 190.0, 349.0, 712.0, 1676.0, 5467.0, 27492.0, 241835.0, 682405.0, 71735.0, 11137.0, 2927.0, 1105.0, 496.0, 248.0, 132.0, 85.0, 58.0, 40.0, 42.0, 25.0, 13.0, 11.0, 11.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.11669921875, -0.11329174041748047, -0.10988426208496094, -0.1064767837524414, -0.10306930541992188, -0.09966182708740234, -0.09625434875488281, -0.09284687042236328, -0.08943939208984375, -0.08603191375732422, -0.08262443542480469, -0.07921695709228516, -0.07580947875976562, -0.0724020004272461, -0.06899452209472656, -0.06558704376220703, -0.0621795654296875, -0.05877208709716797, -0.05536460876464844, -0.051957130432128906, -0.048549652099609375, -0.045142173767089844, -0.04173469543457031, -0.03832721710205078, -0.03491973876953125, -0.03151226043701172, -0.028104782104492188, -0.024697303771972656, -0.021289825439453125, -0.017882347106933594, -0.014474868774414062, -0.011067390441894531, -0.007659912109375, -0.004252433776855469, -0.0008449554443359375, 0.0025625228881835938, 0.005970001220703125, 0.009377479553222656, 0.012784957885742188, 0.01619243621826172, 0.01959991455078125, 0.02300739288330078, 0.026414871215820312, 0.029822349548339844, 0.033229827880859375, 0.036637306213378906, 0.04004478454589844, 0.04345226287841797, 0.0468597412109375, 0.05026721954345703, 0.05367469787597656, 0.057082176208496094, 0.060489654541015625, 0.06389713287353516, 0.06730461120605469, 0.07071208953857422, 0.07411956787109375, 0.07752704620361328, 0.08093452453613281, 0.08434200286865234, 0.08774948120117188, 0.0911569595336914, 0.09456443786621094, 0.09797191619873047, 0.10137939453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 9.0, 7.0, 9.0, 19.0, 18.0, 10.0, 19.0, 29.0, 24.0, 31.0, 37.0, 44.0, 45.0, 64.0, 53.0, 83.0, 67.0, 53.0, 61.0, 58.0, 48.0, 41.0, 30.0, 26.0, 34.0, 30.0, 13.0, 15.0, 6.0, 8.0, 1.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08245849609375, -0.07952690124511719, -0.07659530639648438, -0.07366371154785156, -0.07073211669921875, -0.06780052185058594, -0.06486892700195312, -0.06193733215332031, -0.0590057373046875, -0.05607414245605469, -0.053142547607421875, -0.05021095275878906, -0.04727935791015625, -0.04434776306152344, -0.041416168212890625, -0.03848457336425781, -0.035552978515625, -0.03262138366699219, -0.029689788818359375, -0.026758193969726562, -0.02382659912109375, -0.020895004272460938, -0.017963409423828125, -0.015031814575195312, -0.0121002197265625, -0.009168624877929688, -0.006237030029296875, -0.0033054351806640625, -0.00037384033203125, 0.0025577545166015625, 0.005489349365234375, 0.008420944213867188, 0.0113525390625, 0.014284133911132812, 0.017215728759765625, 0.020147323608398438, 0.02307891845703125, 0.026010513305664062, 0.028942108154296875, 0.03187370300292969, 0.0348052978515625, 0.03773689270019531, 0.040668487548828125, 0.04360008239746094, 0.04653167724609375, 0.04946327209472656, 0.052394866943359375, 0.05532646179199219, 0.058258056640625, 0.06118965148925781, 0.06412124633789062, 0.06705284118652344, 0.06998443603515625, 0.07291603088378906, 0.07584762573242188, 0.07877922058105469, 0.0817108154296875, 0.08464241027832031, 0.08757400512695312, 0.09050559997558594, 0.09343719482421875, 0.09636878967285156, 0.09930038452148438, 0.10223197937011719, 0.10516357421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 7.0, 3.0, 16.0, 20.0, 20.0, 36.0, 37.0, 58.0, 127.0, 222.0, 366.0, 748.0, 1530.0, 3680.0, 11208.0, 51219.0, 507324.0, 413189.0, 42514.0, 9951.0, 3391.0, 1378.0, 646.0, 325.0, 190.0, 114.0, 64.0, 40.0, 26.0, 20.0, 18.0, 12.0, 10.0, 6.0, 7.0, 2.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.022369384765625, -0.021596670150756836, -0.020823955535888672, -0.020051240921020508, -0.019278526306152344, -0.01850581169128418, -0.017733097076416016, -0.01696038246154785, -0.016187667846679688, -0.015414953231811523, -0.01464223861694336, -0.013869524002075195, -0.013096809387207031, -0.012324094772338867, -0.011551380157470703, -0.010778665542602539, -0.010005950927734375, -0.009233236312866211, -0.008460521697998047, -0.007687807083129883, -0.006915092468261719, -0.006142377853393555, -0.005369663238525391, -0.0045969486236572266, -0.0038242340087890625, -0.0030515193939208984, -0.0022788047790527344, -0.0015060901641845703, -0.0007333755493164062, 3.933906555175781e-05, 0.0008120536804199219, 0.001584768295288086, 0.00235748291015625, 0.003130197525024414, 0.003902912139892578, 0.004675626754760742, 0.005448341369628906, 0.00622105598449707, 0.006993770599365234, 0.0077664852142333984, 0.008539199829101562, 0.009311914443969727, 0.01008462905883789, 0.010857343673706055, 0.011630058288574219, 0.012402772903442383, 0.013175487518310547, 0.013948202133178711, 0.014720916748046875, 0.015493631362915039, 0.016266345977783203, 0.017039060592651367, 0.01781177520751953, 0.018584489822387695, 0.01935720443725586, 0.020129919052124023, 0.020902633666992188, 0.02167534828186035, 0.022448062896728516, 0.02322077751159668, 0.023993492126464844, 0.024766206741333008, 0.025538921356201172, 0.026311635971069336, 0.0270843505859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 6.0, 11.0, 9.0, 19.0, 24.0, 50.0, 173.0, 284.0, 250.0, 90.0, 36.0, 15.0, 16.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.820657730102539e-05, -3.7219375371932983e-05, -3.6232173442840576e-05, -3.524497151374817e-05, -3.425776958465576e-05, -3.3270567655563354e-05, -3.228336572647095e-05, -3.129616379737854e-05, -3.0308961868286133e-05, -2.9321759939193726e-05, -2.833455801010132e-05, -2.734735608100891e-05, -2.6360154151916504e-05, -2.5372952222824097e-05, -2.438575029373169e-05, -2.3398548364639282e-05, -2.2411346435546875e-05, -2.1424144506454468e-05, -2.043694257736206e-05, -1.9449740648269653e-05, -1.8462538719177246e-05, -1.747533679008484e-05, -1.648813486099243e-05, -1.5500932931900024e-05, -1.4513731002807617e-05, -1.352652907371521e-05, -1.2539327144622803e-05, -1.1552125215530396e-05, -1.0564923286437988e-05, -9.577721357345581e-06, -8.590519428253174e-06, -7.603317499160767e-06, -6.616115570068359e-06, -5.628913640975952e-06, -4.641711711883545e-06, -3.6545097827911377e-06, -2.6673078536987305e-06, -1.6801059246063232e-06, -6.92903995513916e-07, 2.942979335784912e-07, 1.2814998626708984e-06, 2.2687017917633057e-06, 3.255903720855713e-06, 4.24310564994812e-06, 5.230307579040527e-06, 6.2175095081329346e-06, 7.204711437225342e-06, 8.191913366317749e-06, 9.179115295410156e-06, 1.0166317224502563e-05, 1.115351915359497e-05, 1.2140721082687378e-05, 1.3127923011779785e-05, 1.4115124940872192e-05, 1.51023268699646e-05, 1.6089528799057007e-05, 1.7076730728149414e-05, 1.806393265724182e-05, 1.905113458633423e-05, 2.0038336515426636e-05, 2.1025538444519043e-05, 2.201274037361145e-05, 2.2999942302703857e-05, 2.3987144231796265e-05, 2.4974346160888672e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 6.0, 6.0, 13.0, 17.0, 26.0, 48.0, 61.0, 88.0, 206.0, 346.0, 809.0, 2476.0, 9910.0, 65308.0, 741409.0, 200026.0, 21023.0, 4363.0, 1306.0, 527.0, 257.0, 90.0, 71.0, 47.0, 34.0, 23.0, 13.0, 9.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0218353271484375, -0.020986318588256836, -0.020137310028076172, -0.019288301467895508, -0.018439292907714844, -0.01759028434753418, -0.016741275787353516, -0.01589226722717285, -0.015043258666992188, -0.014194250106811523, -0.01334524154663086, -0.012496232986450195, -0.011647224426269531, -0.010798215866088867, -0.009949207305908203, -0.009100198745727539, -0.008251190185546875, -0.007402181625366211, -0.006553173065185547, -0.005704164505004883, -0.004855155944824219, -0.004006147384643555, -0.0031571388244628906, -0.0023081302642822266, -0.0014591217041015625, -0.0006101131439208984, 0.00023889541625976562, 0.0010879039764404297, 0.0019369125366210938, 0.002785921096801758, 0.003634929656982422, 0.004483938217163086, 0.00533294677734375, 0.006181955337524414, 0.007030963897705078, 0.007879972457885742, 0.008728981018066406, 0.00957798957824707, 0.010426998138427734, 0.011276006698608398, 0.012125015258789062, 0.012974023818969727, 0.01382303237915039, 0.014672040939331055, 0.015521049499511719, 0.016370058059692383, 0.017219066619873047, 0.01806807518005371, 0.018917083740234375, 0.01976609230041504, 0.020615100860595703, 0.021464109420776367, 0.02231311798095703, 0.023162126541137695, 0.02401113510131836, 0.024860143661499023, 0.025709152221679688, 0.02655816078186035, 0.027407169342041016, 0.02825617790222168, 0.029105186462402344, 0.029954195022583008, 0.030803203582763672, 0.031652212142944336, 0.032501220703125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 3.0, 11.0, 8.0, 7.0, 17.0, 14.0, 25.0, 26.0, 42.0, 46.0, 64.0, 56.0, 89.0, 86.0, 90.0, 75.0, 85.0, 63.0, 34.0, 37.0, 17.0, 19.0, 23.0, 8.0, 16.0, 9.0, 8.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0191192626953125, -0.01856088638305664, -0.01800251007080078, -0.017444133758544922, -0.016885757446289062, -0.016327381134033203, -0.015769004821777344, -0.015210628509521484, -0.014652252197265625, -0.014093875885009766, -0.013535499572753906, -0.012977123260498047, -0.012418746948242188, -0.011860370635986328, -0.011301994323730469, -0.01074361801147461, -0.01018524169921875, -0.00962686538696289, -0.009068489074707031, -0.008510112762451172, -0.007951736450195312, -0.007393360137939453, -0.006834983825683594, -0.006276607513427734, -0.005718231201171875, -0.005159854888916016, -0.004601478576660156, -0.004043102264404297, -0.0034847259521484375, -0.002926349639892578, -0.0023679733276367188, -0.0018095970153808594, -0.001251220703125, -0.0006928443908691406, -0.00013446807861328125, 0.0004239082336425781, 0.0009822845458984375, 0.0015406608581542969, 0.0020990371704101562, 0.0026574134826660156, 0.003215789794921875, 0.0037741661071777344, 0.004332542419433594, 0.004890918731689453, 0.0054492950439453125, 0.006007671356201172, 0.006566047668457031, 0.007124423980712891, 0.00768280029296875, 0.00824117660522461, 0.008799552917480469, 0.009357929229736328, 0.009916305541992188, 0.010474681854248047, 0.011033058166503906, 0.011591434478759766, 0.012149810791015625, 0.012708187103271484, 0.013266563415527344, 0.013824939727783203, 0.014383316040039062, 0.014941692352294922, 0.015500068664550781, 0.01605844497680664, 0.0166168212890625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 10.0, 33.0, 90.0, 367.0, 354.0, 107.0, 39.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7725279331207275, -1.7333259582519531, -1.6941239833831787, -1.6549220085144043, -1.6157200336456299, -1.576518177986145, -1.5373162031173706, -1.4981142282485962, -1.4589122533798218, -1.4197102785110474, -1.380508303642273, -1.3413063287734985, -1.3021044731140137, -1.2629024982452393, -1.2237005233764648, -1.1844985485076904, -1.145296573638916, -1.1060945987701416, -1.0668926239013672, -1.0276906490325928, -0.9884887337684631, -0.9492867588996887, -0.9100848436355591, -0.8708828687667847, -0.8316808938980103, -0.7924789190292358, -0.7532769441604614, -0.7140750288963318, -0.6748730540275574, -0.635671079158783, -0.5964691638946533, -0.5572671890258789, -0.5180652141571045, -0.4788632392883301, -0.43966129422187805, -0.400459349155426, -0.3612573742866516, -0.3220553994178772, -0.28285345435142517, -0.24365150928497314, -0.20444953441619873, -0.1652475744485855, -0.1260456144809723, -0.08684365451335907, -0.04764169454574585, -0.00843973457813263, 0.03076222538948059, 0.06996417045593262, 0.10916614532470703, 0.14836810529232025, 0.18757006525993347, 0.2267720252275467, 0.2659739851951599, 0.3051759600639343, 0.34437790513038635, 0.3835798501968384, 0.4227818250656128, 0.4619837999343872, 0.5011857748031616, 0.5403876900672913, 0.5795896649360657, 0.6187916398048401, 0.6579935550689697, 0.6971955299377441, 0.7363975048065186]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 5.0, 5.0, 5.0, 14.0, 13.0, 9.0, 15.0, 16.0, 23.0, 19.0, 20.0, 31.0, 37.0, 36.0, 38.0, 32.0, 36.0, 36.0, 38.0, 33.0, 45.0, 35.0, 32.0, 38.0, 41.0, 34.0, 34.0, 29.0, 30.0, 30.0, 25.0, 27.0, 16.0, 25.0, 16.0, 22.0, 9.0, 15.0, 5.0, 9.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.3731423616409302, -0.3618837296962738, -0.35062506794929504, -0.33936643600463867, -0.3281077742576599, -0.31684914231300354, -0.3055904805660248, -0.2943318486213684, -0.28307318687438965, -0.2718145549297333, -0.2605558931827545, -0.24929724633693695, -0.23803859949111938, -0.22677995264530182, -0.21552130579948425, -0.20426267385482788, -0.19300402700901031, -0.18174538016319275, -0.17048673331737518, -0.15922808647155762, -0.14796943962574005, -0.13671079277992249, -0.1254521608352661, -0.11419350653886795, -0.10293485969305038, -0.09167621284723282, -0.08041756600141525, -0.06915892660617828, -0.05790027603507042, -0.04664162918925285, -0.035382986068725586, -0.02412433922290802, -0.012865692377090454, -0.0016070464625954628, 0.009651599451899529, 0.020910244435071945, 0.03216889128088951, 0.04342753812670708, 0.054686181247234344, 0.06594482809305191, 0.07720347493886948, 0.08846212178468704, 0.09972076863050461, 0.11097940802574158, 0.12223805487155914, 0.1334967017173767, 0.14475534856319427, 0.15601399540901184, 0.1672726422548294, 0.17853128910064697, 0.18978993594646454, 0.2010485827922821, 0.21230722963809967, 0.22356587648391724, 0.2348245084285736, 0.24608317017555237, 0.25734180212020874, 0.2686004340648651, 0.27985909581184387, 0.29111772775650024, 0.302376389503479, 0.3136350214481354, 0.32489368319511414, 0.3361523151397705, 0.34741097688674927]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 7.0, 15.0, 12.0, 18.0, 21.0, 46.0, 50.0, 81.0, 109.0, 261.0, 460.0, 1052.0, 3276.0, 16199.0, 3301639.0, 851125.0, 15072.0, 3066.0, 926.0, 393.0, 194.0, 100.0, 53.0, 39.0, 19.0, 16.0, 9.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2017822265625, -0.19719409942626953, -0.19260597229003906, -0.1880178451538086, -0.18342971801757812, -0.17884159088134766, -0.1742534637451172, -0.16966533660888672, -0.16507720947265625, -0.16048908233642578, -0.1559009552001953, -0.15131282806396484, -0.14672470092773438, -0.1421365737915039, -0.13754844665527344, -0.13296031951904297, -0.1283721923828125, -0.12378406524658203, -0.11919593811035156, -0.1146078109741211, -0.11001968383789062, -0.10543155670166016, -0.10084342956542969, -0.09625530242919922, -0.09166717529296875, -0.08707904815673828, -0.08249092102050781, -0.07790279388427734, -0.07331466674804688, -0.0687265396118164, -0.06413841247558594, -0.05955028533935547, -0.054962158203125, -0.05037403106689453, -0.04578590393066406, -0.041197776794433594, -0.036609649658203125, -0.032021522521972656, -0.027433395385742188, -0.02284526824951172, -0.01825714111328125, -0.013669013977050781, -0.009080886840820312, -0.004492759704589844, 9.5367431640625e-05, 0.004683494567871094, 0.009271621704101562, 0.013859748840332031, 0.0184478759765625, 0.02303600311279297, 0.027624130249023438, 0.032212257385253906, 0.036800384521484375, 0.041388511657714844, 0.04597663879394531, 0.05056476593017578, 0.05515289306640625, 0.05974102020263672, 0.06432914733886719, 0.06891727447509766, 0.07350540161132812, 0.0780935287475586, 0.08268165588378906, 0.08726978302001953, 0.09185791015625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 16.0, 32.0, 43.0, 102.0, 110.0, 134.0, 159.0, 141.0, 92.0, 72.0, 47.0, 25.0, 11.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0682373046875, -0.0666959285736084, -0.0651545524597168, -0.0636131763458252, -0.062071800231933594, -0.06053042411804199, -0.05898904800415039, -0.05744767189025879, -0.05590629577636719, -0.054364919662475586, -0.052823543548583984, -0.05128216743469238, -0.04974079132080078, -0.04819941520690918, -0.04665803909301758, -0.04511666297912598, -0.043575286865234375, -0.04203391075134277, -0.04049253463745117, -0.03895115852355957, -0.03740978240966797, -0.03586840629577637, -0.034327030181884766, -0.032785654067993164, -0.031244277954101562, -0.02970290184020996, -0.02816152572631836, -0.026620149612426758, -0.025078773498535156, -0.023537397384643555, -0.021996021270751953, -0.02045464515686035, -0.01891326904296875, -0.01737189292907715, -0.015830516815185547, -0.014289140701293945, -0.012747764587402344, -0.011206388473510742, -0.00966501235961914, -0.008123636245727539, -0.0065822601318359375, -0.005040884017944336, -0.0034995079040527344, -0.001958131790161133, -0.00041675567626953125, 0.0011246204376220703, 0.002665996551513672, 0.0042073726654052734, 0.005748748779296875, 0.0072901248931884766, 0.008831501007080078, 0.01037287712097168, 0.011914253234863281, 0.013455629348754883, 0.014997005462646484, 0.016538381576538086, 0.018079757690429688, 0.01962113380432129, 0.02116250991821289, 0.022703886032104492, 0.024245262145996094, 0.025786638259887695, 0.027328014373779297, 0.0288693904876709, 0.0304107666015625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 13.0, 17.0, 32.0, 47.0, 96.0, 175.0, 480.0, 1115.0, 3366.0, 13973.0, 193051.0, 3928642.0, 41795.0, 7555.0, 2315.0, 873.0, 345.0, 188.0, 87.0, 49.0, 25.0, 15.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.111083984375, -0.10784244537353516, -0.10460090637207031, -0.10135936737060547, -0.09811782836914062, -0.09487628936767578, -0.09163475036621094, -0.0883932113647461, -0.08515167236328125, -0.0819101333618164, -0.07866859436035156, -0.07542705535888672, -0.07218551635742188, -0.06894397735595703, -0.06570243835449219, -0.062460899353027344, -0.0592193603515625, -0.055977821350097656, -0.05273628234863281, -0.04949474334716797, -0.046253204345703125, -0.04301166534423828, -0.03977012634277344, -0.036528587341308594, -0.03328704833984375, -0.030045509338378906, -0.026803970336914062, -0.02356243133544922, -0.020320892333984375, -0.01707935333251953, -0.013837814331054688, -0.010596275329589844, -0.007354736328125, -0.004113197326660156, -0.0008716583251953125, 0.0023698806762695312, 0.005611419677734375, 0.008852958679199219, 0.012094497680664062, 0.015336036682128906, 0.01857757568359375, 0.021819114685058594, 0.025060653686523438, 0.02830219268798828, 0.031543731689453125, 0.03478527069091797, 0.03802680969238281, 0.041268348693847656, 0.0445098876953125, 0.047751426696777344, 0.05099296569824219, 0.05423450469970703, 0.057476043701171875, 0.06071758270263672, 0.06395912170410156, 0.0672006607055664, 0.07044219970703125, 0.0736837387084961, 0.07692527770996094, 0.08016681671142578, 0.08340835571289062, 0.08664989471435547, 0.08989143371582031, 0.09313297271728516, 0.09637451171875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 10.0, 13.0, 14.0, 30.0, 44.0, 92.0, 239.0, 1333.0, 1875.0, 214.0, 82.0, 40.0, 20.0, 15.0, 6.0, 3.0, 2.0, 8.0, 8.0, 3.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.029296875, -0.028171062469482422, -0.027045249938964844, -0.025919437408447266, -0.024793624877929688, -0.02366781234741211, -0.02254199981689453, -0.021416187286376953, -0.020290374755859375, -0.019164562225341797, -0.01803874969482422, -0.01691293716430664, -0.015787124633789062, -0.014661312103271484, -0.013535499572753906, -0.012409687042236328, -0.01128387451171875, -0.010158061981201172, -0.009032249450683594, -0.007906436920166016, -0.0067806243896484375, -0.005654811859130859, -0.004528999328613281, -0.003403186798095703, -0.002277374267578125, -0.0011515617370605469, -2.574920654296875e-05, 0.0011000633239746094, 0.0022258758544921875, 0.0033516883850097656, 0.004477500915527344, 0.005603313446044922, 0.0067291259765625, 0.007854938507080078, 0.008980751037597656, 0.010106563568115234, 0.011232376098632812, 0.01235818862915039, 0.013484001159667969, 0.014609813690185547, 0.015735626220703125, 0.016861438751220703, 0.01798725128173828, 0.01911306381225586, 0.020238876342773438, 0.021364688873291016, 0.022490501403808594, 0.023616313934326172, 0.02474212646484375, 0.025867938995361328, 0.026993751525878906, 0.028119564056396484, 0.029245376586914062, 0.03037118911743164, 0.03149700164794922, 0.0326228141784668, 0.033748626708984375, 0.03487443923950195, 0.03600025177001953, 0.03712606430053711, 0.03825187683105469, 0.039377689361572266, 0.040503501892089844, 0.04162931442260742, 0.042755126953125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 11.0, 36.0, 180.0, 401.0, 278.0, 75.0, 16.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13715097308158875, -0.12664353847503662, -0.1161361038684845, -0.10562866926193237, -0.09512123465538025, -0.08461380004882812, -0.074106365442276, -0.06359893083572388, -0.05309149622917175, -0.04258406162261963, -0.032076627016067505, -0.02156919240951538, -0.011061757802963257, -0.0005543231964111328, 0.009953111410140991, 0.020460546016693115, 0.03096798062324524, 0.04147541522979736, 0.05198284983634949, 0.06249028444290161, 0.07299771904945374, 0.08350515365600586, 0.09401258826255798, 0.10452002286911011, 0.11502745747566223, 0.12553489208221436, 0.13604232668876648, 0.1465497612953186, 0.15705719590187073, 0.16756463050842285, 0.17807206511497498, 0.1885794997215271, 0.19908690452575684, 0.20959433913230896, 0.22010177373886108, 0.2306092083454132, 0.24111664295196533, 0.25162407755851746, 0.2621315121650696, 0.2726389467716217, 0.28314638137817383, 0.29365381598472595, 0.3041612505912781, 0.3146686851978302, 0.3251761198043823, 0.33568355441093445, 0.3461909890174866, 0.3566984236240387, 0.3672058582305908, 0.37771329283714294, 0.38822072744369507, 0.3987281620502472, 0.4092355966567993, 0.41974303126335144, 0.43025046586990356, 0.4407579004764557, 0.4512653350830078, 0.46177276968955994, 0.47228020429611206, 0.4827876389026642, 0.4932950735092163, 0.5038025379180908, 0.5143099427223206, 0.5248173475265503, 0.5353248119354248]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 9.0, 8.0, 14.0, 28.0, 41.0, 43.0, 57.0, 62.0, 101.0, 81.0, 89.0, 68.0, 77.0, 78.0, 55.0, 61.0, 38.0, 27.0, 24.0, 17.0, 12.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17221498489379883, -0.16678152978420258, -0.16134808957576752, -0.15591463446617126, -0.1504811942577362, -0.14504773914813995, -0.1396142840385437, -0.13418084383010864, -0.12874740362167358, -0.12331395596265793, -0.11788050830364227, -0.11244705319404602, -0.10701361298561096, -0.10158015787601471, -0.09614671021699905, -0.0907132625579834, -0.08527980744838715, -0.07984635978937149, -0.07441291213035583, -0.06897945702075958, -0.06354601681232452, -0.05811256542801857, -0.052679114043712616, -0.04724566638469696, -0.041812218725681305, -0.03637877106666565, -0.030945321545004845, -0.02551187202334404, -0.020078424364328384, -0.014644976705312729, -0.009211525321006775, -0.0037780776619911194, 0.0016553699970245361, 0.007088818587362766, 0.012522267177700996, 0.0179557166993618, 0.023389164358377457, 0.028822612017393112, 0.034256063401699066, 0.03968951106071472, 0.04512295871973038, 0.05055640637874603, 0.05598985403776169, 0.06142330542206764, 0.0668567568063736, 0.07229019701480865, 0.07772365212440491, 0.08315709978342056, 0.08859054744243622, 0.09402399510145187, 0.09945744276046753, 0.10489089787006378, 0.11032433807849884, 0.11575779318809509, 0.12119124084711075, 0.1266246885061264, 0.13205814361572266, 0.1374915987253189, 0.14292503893375397, 0.14835849404335022, 0.15379193425178528, 0.15922538936138153, 0.16465884447097778, 0.17009228467941284, 0.1755257248878479]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 18.0, 24.0, 24.0, 25.0, 40.0, 59.0, 124.0, 262.0, 552.0, 1388.0, 4773.0, 41602.0, 816406.0, 169074.0, 10439.0, 2139.0, 835.0, 372.0, 179.0, 79.0, 45.0, 27.0, 19.0, 16.0, 7.0, 4.0, 7.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 4.0], "bins": [-0.2215576171875, -0.2163705825805664, -0.2111835479736328, -0.20599651336669922, -0.20080947875976562, -0.19562244415283203, -0.19043540954589844, -0.18524837493896484, -0.18006134033203125, -0.17487430572509766, -0.16968727111816406, -0.16450023651123047, -0.15931320190429688, -0.15412616729736328, -0.1489391326904297, -0.1437520980834961, -0.1385650634765625, -0.1333780288696289, -0.1281909942626953, -0.12300395965576172, -0.11781692504882812, -0.11262989044189453, -0.10744285583496094, -0.10225582122802734, -0.09706878662109375, -0.09188175201416016, -0.08669471740722656, -0.08150768280029297, -0.07632064819335938, -0.07113361358642578, -0.06594657897949219, -0.060759544372558594, -0.055572509765625, -0.050385475158691406, -0.04519844055175781, -0.04001140594482422, -0.034824371337890625, -0.02963733673095703, -0.024450302124023438, -0.019263267517089844, -0.01407623291015625, -0.008889198303222656, -0.0037021636962890625, 0.0014848709106445312, 0.006671905517578125, 0.011858940124511719, 0.017045974731445312, 0.022233009338378906, 0.0274200439453125, 0.032607078552246094, 0.03779411315917969, 0.04298114776611328, 0.048168182373046875, 0.05335521697998047, 0.05854225158691406, 0.06372928619384766, 0.06891632080078125, 0.07410335540771484, 0.07929039001464844, 0.08447742462158203, 0.08966445922851562, 0.09485149383544922, 0.10003852844238281, 0.1052255630493164, 0.11041259765625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 9.0, 26.0, 39.0, 76.0, 100.0, 123.0, 155.0, 131.0, 117.0, 78.0, 65.0, 31.0, 22.0, 10.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0643310546875, -0.06286096572875977, -0.06139087677001953, -0.0599207878112793, -0.05845069885253906, -0.05698060989379883, -0.055510520935058594, -0.05404043197631836, -0.052570343017578125, -0.05110025405883789, -0.049630165100097656, -0.04816007614135742, -0.04668998718261719, -0.04521989822387695, -0.04374980926513672, -0.042279720306396484, -0.04080963134765625, -0.039339542388916016, -0.03786945343017578, -0.03639936447143555, -0.03492927551269531, -0.03345918655395508, -0.031989097595214844, -0.03051900863647461, -0.029048919677734375, -0.02757883071899414, -0.026108741760253906, -0.024638652801513672, -0.023168563842773438, -0.021698474884033203, -0.02022838592529297, -0.018758296966552734, -0.0172882080078125, -0.015818119049072266, -0.014348030090332031, -0.012877941131591797, -0.011407852172851562, -0.009937763214111328, -0.008467674255371094, -0.006997585296630859, -0.005527496337890625, -0.004057407379150391, -0.0025873184204101562, -0.0011172294616699219, 0.0003528594970703125, 0.0018229484558105469, 0.0032930374145507812, 0.004763126373291016, 0.00623321533203125, 0.007703304290771484, 0.009173393249511719, 0.010643482208251953, 0.012113571166992188, 0.013583660125732422, 0.015053749084472656, 0.01652383804321289, 0.017993927001953125, 0.01946401596069336, 0.020934104919433594, 0.022404193878173828, 0.023874282836914062, 0.025344371795654297, 0.02681446075439453, 0.028284549713134766, 0.029754638671875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 4.0, 8.0, 10.0, 14.0, 19.0, 41.0, 49.0, 91.0, 145.0, 225.0, 535.0, 1347.0, 5557.0, 35117.0, 460628.0, 498796.0, 37625.0, 5698.0, 1459.0, 537.0, 267.0, 130.0, 73.0, 61.0, 36.0, 22.0, 19.0, 10.0, 6.0, 8.0, 7.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1005859375, -0.09686279296875, -0.0931396484375, -0.08941650390625, -0.085693359375, -0.08197021484375, -0.0782470703125, -0.07452392578125, -0.07080078125, -0.06707763671875, -0.0633544921875, -0.05963134765625, -0.055908203125, -0.05218505859375, -0.0484619140625, -0.04473876953125, -0.041015625, -0.03729248046875, -0.0335693359375, -0.02984619140625, -0.026123046875, -0.02239990234375, -0.0186767578125, -0.01495361328125, -0.01123046875, -0.00750732421875, -0.0037841796875, -6.103515625e-05, 0.003662109375, 0.00738525390625, 0.0111083984375, 0.01483154296875, 0.0185546875, 0.02227783203125, 0.0260009765625, 0.02972412109375, 0.033447265625, 0.03717041015625, 0.0408935546875, 0.04461669921875, 0.04833984375, 0.05206298828125, 0.0557861328125, 0.05950927734375, 0.063232421875, 0.06695556640625, 0.0706787109375, 0.07440185546875, 0.078125, 0.08184814453125, 0.0855712890625, 0.08929443359375, 0.093017578125, 0.09674072265625, 0.1004638671875, 0.10418701171875, 0.10791015625, 0.11163330078125, 0.1153564453125, 0.11907958984375, 0.122802734375, 0.12652587890625, 0.1302490234375, 0.13397216796875, 0.1376953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 10.0, 12.0, 10.0, 16.0, 21.0, 31.0, 33.0, 36.0, 55.0, 55.0, 90.0, 80.0, 74.0, 55.0, 67.0, 61.0, 55.0, 43.0, 45.0, 48.0, 32.0, 20.0, 13.0, 11.0, 3.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13525390625, -0.13157081604003906, -0.12788772583007812, -0.12420463562011719, -0.12052154541015625, -0.11683845520019531, -0.11315536499023438, -0.10947227478027344, -0.1057891845703125, -0.10210609436035156, -0.09842300415039062, -0.09473991394042969, -0.09105682373046875, -0.08737373352050781, -0.08369064331054688, -0.08000755310058594, -0.076324462890625, -0.07264137268066406, -0.06895828247070312, -0.06527519226074219, -0.06159210205078125, -0.05790901184082031, -0.054225921630859375, -0.05054283142089844, -0.0468597412109375, -0.04317665100097656, -0.039493560791015625, -0.03581047058105469, -0.03212738037109375, -0.028444290161132812, -0.024761199951171875, -0.021078109741210938, -0.01739501953125, -0.013711929321289062, -0.010028839111328125, -0.0063457489013671875, -0.00266265869140625, 0.0010204315185546875, 0.004703521728515625, 0.008386611938476562, 0.0120697021484375, 0.015752792358398438, 0.019435882568359375, 0.023118972778320312, 0.02680206298828125, 0.030485153198242188, 0.034168243408203125, 0.03785133361816406, 0.041534423828125, 0.04521751403808594, 0.048900604248046875, 0.05258369445800781, 0.05626678466796875, 0.05994987487792969, 0.06363296508789062, 0.06731605529785156, 0.0709991455078125, 0.07468223571777344, 0.07836532592773438, 0.08204841613769531, 0.08573150634765625, 0.08941459655761719, 0.09309768676757812, 0.09678077697753906, 0.1004638671875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 12.0, 22.0, 27.0, 40.0, 89.0, 166.0, 399.0, 2156.0, 36379.0, 952604.0, 53141.0, 2602.0, 512.0, 201.0, 96.0, 47.0, 27.0, 14.0, 4.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052825927734375, -0.05083608627319336, -0.04884624481201172, -0.04685640335083008, -0.04486656188964844, -0.0428767204284668, -0.040886878967285156, -0.038897037506103516, -0.036907196044921875, -0.034917354583740234, -0.032927513122558594, -0.030937671661376953, -0.028947830200195312, -0.026957988739013672, -0.02496814727783203, -0.02297830581665039, -0.02098846435546875, -0.01899862289428711, -0.01700878143310547, -0.015018939971923828, -0.013029098510742188, -0.011039257049560547, -0.009049415588378906, -0.007059574127197266, -0.005069732666015625, -0.0030798912048339844, -0.0010900497436523438, 0.0008997917175292969, 0.0028896331787109375, 0.004879474639892578, 0.006869316101074219, 0.00885915756225586, 0.0108489990234375, 0.01283884048461914, 0.014828681945800781, 0.016818523406982422, 0.018808364868164062, 0.020798206329345703, 0.022788047790527344, 0.024777889251708984, 0.026767730712890625, 0.028757572174072266, 0.030747413635253906, 0.03273725509643555, 0.03472709655761719, 0.03671693801879883, 0.03870677947998047, 0.04069662094116211, 0.04268646240234375, 0.04467630386352539, 0.04666614532470703, 0.04865598678588867, 0.05064582824707031, 0.05263566970825195, 0.054625511169433594, 0.056615352630615234, 0.058605194091796875, 0.060595035552978516, 0.06258487701416016, 0.0645747184753418, 0.06656455993652344, 0.06855440139770508, 0.07054424285888672, 0.07253408432006836, 0.07452392578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 6.0, 4.0, 11.0, 9.0, 16.0, 24.0, 57.0, 100.0, 199.0, 217.0, 166.0, 68.0, 37.0, 19.0, 10.0, 12.0, 15.0, 6.0, 3.0, 4.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.314018249511719e-05, -3.2335519790649414e-05, -3.153085708618164e-05, -3.072619438171387e-05, -2.9921531677246094e-05, -2.911686897277832e-05, -2.8312206268310547e-05, -2.7507543563842773e-05, -2.6702880859375e-05, -2.5898218154907227e-05, -2.5093555450439453e-05, -2.428889274597168e-05, -2.3484230041503906e-05, -2.2679567337036133e-05, -2.187490463256836e-05, -2.1070241928100586e-05, -2.0265579223632812e-05, -1.946091651916504e-05, -1.8656253814697266e-05, -1.7851591110229492e-05, -1.704692840576172e-05, -1.6242265701293945e-05, -1.5437602996826172e-05, -1.4632940292358398e-05, -1.3828277587890625e-05, -1.3023614883422852e-05, -1.2218952178955078e-05, -1.1414289474487305e-05, -1.0609626770019531e-05, -9.804964065551758e-06, -9.000301361083984e-06, -8.195638656616211e-06, -7.3909759521484375e-06, -6.586313247680664e-06, -5.781650543212891e-06, -4.976987838745117e-06, -4.172325134277344e-06, -3.3676624298095703e-06, -2.562999725341797e-06, -1.7583370208740234e-06, -9.5367431640625e-07, -1.4901161193847656e-07, 6.556510925292969e-07, 1.4603137969970703e-06, 2.2649765014648438e-06, 3.069639205932617e-06, 3.874301910400391e-06, 4.678964614868164e-06, 5.4836273193359375e-06, 6.288290023803711e-06, 7.092952728271484e-06, 7.897615432739258e-06, 8.702278137207031e-06, 9.506940841674805e-06, 1.0311603546142578e-05, 1.1116266250610352e-05, 1.1920928955078125e-05, 1.2725591659545898e-05, 1.3530254364013672e-05, 1.4334917068481445e-05, 1.5139579772949219e-05, 1.5944242477416992e-05, 1.6748905181884766e-05, 1.755356788635254e-05, 1.8358230590820312e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 7.0, 13.0, 21.0, 24.0, 60.0, 102.0, 164.0, 456.0, 2073.0, 25064.0, 889820.0, 124268.0, 5122.0, 824.0, 239.0, 129.0, 75.0, 44.0, 15.0, 6.0, 16.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0347900390625, -0.03325843811035156, -0.031726837158203125, -0.030195236206054688, -0.02866363525390625, -0.027132034301757812, -0.025600433349609375, -0.024068832397460938, -0.0225372314453125, -0.021005630493164062, -0.019474029541015625, -0.017942428588867188, -0.01641082763671875, -0.014879226684570312, -0.013347625732421875, -0.011816024780273438, -0.010284423828125, -0.008752822875976562, -0.007221221923828125, -0.0056896209716796875, -0.00415802001953125, -0.0026264190673828125, -0.001094818115234375, 0.0004367828369140625, 0.0019683837890625, 0.0034999847412109375, 0.005031585693359375, 0.0065631866455078125, 0.00809478759765625, 0.009626388549804688, 0.011157989501953125, 0.012689590454101562, 0.01422119140625, 0.015752792358398438, 0.017284393310546875, 0.018815994262695312, 0.02034759521484375, 0.021879196166992188, 0.023410797119140625, 0.024942398071289062, 0.0264739990234375, 0.028005599975585938, 0.029537200927734375, 0.031068801879882812, 0.03260040283203125, 0.03413200378417969, 0.035663604736328125, 0.03719520568847656, 0.038726806640625, 0.04025840759277344, 0.041790008544921875, 0.04332160949707031, 0.04485321044921875, 0.04638481140136719, 0.047916412353515625, 0.04944801330566406, 0.0509796142578125, 0.05251121520996094, 0.054042816162109375, 0.05557441711425781, 0.05710601806640625, 0.05863761901855469, 0.060169219970703125, 0.06170082092285156, 0.063232421875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 8.0, 8.0, 17.0, 24.0, 35.0, 88.0, 111.0, 179.0, 189.0, 134.0, 96.0, 39.0, 27.0, 18.0, 11.0, 10.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.060333251953125, -0.059105634689331055, -0.05787801742553711, -0.056650400161743164, -0.05542278289794922, -0.05419516563415527, -0.05296754837036133, -0.05173993110656738, -0.05051231384277344, -0.04928469657897949, -0.04805707931518555, -0.0468294620513916, -0.045601844787597656, -0.04437422752380371, -0.043146610260009766, -0.04191899299621582, -0.040691375732421875, -0.03946375846862793, -0.038236141204833984, -0.03700852394104004, -0.035780906677246094, -0.03455328941345215, -0.0333256721496582, -0.03209805488586426, -0.030870437622070312, -0.029642820358276367, -0.028415203094482422, -0.027187585830688477, -0.02595996856689453, -0.024732351303100586, -0.02350473403930664, -0.022277116775512695, -0.02104949951171875, -0.019821882247924805, -0.01859426498413086, -0.017366647720336914, -0.01613903045654297, -0.014911413192749023, -0.013683795928955078, -0.012456178665161133, -0.011228561401367188, -0.010000944137573242, -0.008773326873779297, -0.0075457096099853516, -0.006318092346191406, -0.005090475082397461, -0.0038628578186035156, -0.0026352405548095703, -0.001407623291015625, -0.0001800060272216797, 0.0010476112365722656, 0.002275228500366211, 0.0035028457641601562, 0.0047304630279541016, 0.005958080291748047, 0.007185697555541992, 0.008413314819335938, 0.009640932083129883, 0.010868549346923828, 0.012096166610717773, 0.013323783874511719, 0.014551401138305664, 0.01577901840209961, 0.017006635665893555, 0.0182342529296875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 18.0, 16.0, 71.0, 160.0, 248.0, 246.0, 127.0, 55.0, 27.0, 21.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6741114854812622, -0.6517782807350159, -0.6294451355934143, -0.607111930847168, -0.5847787857055664, -0.5624455809593201, -0.5401124358177185, -0.5177792310714722, -0.4954460859298706, -0.47311291098594666, -0.4507797360420227, -0.42844656109809875, -0.4061133861541748, -0.38378021121025085, -0.3614470362663269, -0.33911383152008057, -0.3167806565761566, -0.29444748163223267, -0.2721143066883087, -0.24978113174438477, -0.22744795680046082, -0.20511478185653687, -0.18278159201145172, -0.16044841706752777, -0.13811524212360382, -0.11578206717967987, -0.09344889223575592, -0.07111570984125137, -0.04878253489732742, -0.026449359953403473, -0.004116177558898926, 0.018216997385025024, 0.040550172328948975, 0.06288334727287292, 0.08521652221679688, 0.10754970461130142, 0.12988287210464478, 0.15221604704856873, 0.17454923689365387, 0.19688241183757782, 0.21921558678150177, 0.24154876172542572, 0.26388195157051086, 0.2862151265144348, 0.30854830145835876, 0.3308814764022827, 0.35321465134620667, 0.3755478262901306, 0.39788100123405457, 0.4202141761779785, 0.44254735112190247, 0.4648805260658264, 0.48721370100975037, 0.5095468759536743, 0.5318800806999207, 0.5542132258415222, 0.5765464305877686, 0.5988796353340149, 0.6212127804756165, 0.6435459852218628, 0.6658791303634644, 0.6882123351097107, 0.7105454802513123, 0.7328786849975586, 0.7552118301391602]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 9.0, 5.0, 8.0, 5.0, 15.0, 5.0, 8.0, 17.0, 23.0, 14.0, 14.0, 26.0, 32.0, 26.0, 39.0, 25.0, 36.0, 38.0, 43.0, 37.0, 38.0, 40.0, 35.0, 25.0, 47.0, 38.0, 37.0, 29.0, 27.0, 24.0, 35.0, 28.0, 26.0, 27.0, 24.0, 19.0, 12.0, 14.0, 6.0, 7.0, 4.0, 8.0, 7.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.315432608127594, -0.30483388900756836, -0.29423514008522034, -0.2836364209651947, -0.2730376720428467, -0.26243895292282104, -0.2518402338027954, -0.24124149978160858, -0.23064276576042175, -0.22004403173923492, -0.2094452977180481, -0.19884657859802246, -0.18824784457683563, -0.1776491105556488, -0.16705039143562317, -0.15645165741443634, -0.1458529233932495, -0.13525418937206268, -0.12465546280145645, -0.11405673623085022, -0.10345800220966339, -0.09285926818847656, -0.08226054161787033, -0.0716618150472641, -0.06106308102607727, -0.05046435073018074, -0.03986562043428421, -0.02926689013838768, -0.01866815984249115, -0.00806942954659462, 0.0025293007493019104, 0.013128027319908142, 0.02372676134109497, 0.0343254916369915, 0.04492422193288803, 0.05552295222878456, 0.06612168252468109, 0.07672041654586792, 0.08731914311647415, 0.09791786968708038, 0.10851660370826721, 0.11911533772945404, 0.12971407175064087, 0.1403127908706665, 0.15091152489185333, 0.16151025891304016, 0.1721089780330658, 0.18270771205425262, 0.19330644607543945, 0.20390518009662628, 0.2145039141178131, 0.22510263323783875, 0.23570136725902557, 0.2463001012802124, 0.25689882040023804, 0.26749753952026367, 0.2780962884426117, 0.28869500756263733, 0.29929375648498535, 0.309892475605011, 0.3204911947250366, 0.33108994364738464, 0.3416886627674103, 0.3522874116897583, 0.36288613080978394]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 8.0, 15.0, 19.0, 22.0, 41.0, 106.0, 155.0, 389.0, 886.0, 2786.0, 20516.0, 4088995.0, 73555.0, 4650.0, 1245.0, 451.0, 197.0, 106.0, 44.0, 25.0, 16.0, 12.0, 5.0, 10.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32470703125, -0.3163108825683594, -0.30791473388671875, -0.2995185852050781, -0.2911224365234375, -0.2827262878417969, -0.27433013916015625, -0.2659339904785156, -0.257537841796875, -0.24914169311523438, -0.24074554443359375, -0.23234939575195312, -0.2239532470703125, -0.21555709838867188, -0.20716094970703125, -0.19876480102539062, -0.19036865234375, -0.18197250366210938, -0.17357635498046875, -0.16518020629882812, -0.1567840576171875, -0.14838790893554688, -0.13999176025390625, -0.13159561157226562, -0.123199462890625, -0.11480331420898438, -0.10640716552734375, -0.09801101684570312, -0.0896148681640625, -0.08121871948242188, -0.07282257080078125, -0.06442642211914062, -0.0560302734375, -0.047634124755859375, -0.03923797607421875, -0.030841827392578125, -0.0224456787109375, -0.014049530029296875, -0.00565338134765625, 0.002742767333984375, 0.011138916015625, 0.019535064697265625, 0.02793121337890625, 0.036327362060546875, 0.0447235107421875, 0.053119659423828125, 0.06151580810546875, 0.06991195678710938, 0.07830810546875, 0.08670425415039062, 0.09510040283203125, 0.10349655151367188, 0.1118927001953125, 0.12028884887695312, 0.12868499755859375, 0.13708114624023438, 0.145477294921875, 0.15387344360351562, 0.16226959228515625, 0.17066574096679688, 0.1790618896484375, 0.18745803833007812, 0.19585418701171875, 0.20425033569335938, 0.212646484375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 7.0, 16.0, 19.0, 27.0, 62.0, 72.0, 106.0, 117.0, 113.0, 128.0, 97.0, 82.0, 60.0, 34.0, 29.0, 12.0, 11.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0660400390625, -0.06455755233764648, -0.06307506561279297, -0.06159257888793945, -0.06011009216308594, -0.05862760543823242, -0.057145118713378906, -0.05566263198852539, -0.054180145263671875, -0.05269765853881836, -0.051215171813964844, -0.04973268508911133, -0.04825019836425781, -0.0467677116394043, -0.04528522491455078, -0.043802738189697266, -0.04232025146484375, -0.040837764739990234, -0.03935527801513672, -0.0378727912902832, -0.03639030456542969, -0.03490781784057617, -0.033425331115722656, -0.03194284439086914, -0.030460357666015625, -0.02897787094116211, -0.027495384216308594, -0.026012897491455078, -0.024530410766601562, -0.023047924041748047, -0.02156543731689453, -0.020082950592041016, -0.0186004638671875, -0.017117977142333984, -0.01563549041748047, -0.014153003692626953, -0.012670516967773438, -0.011188030242919922, -0.009705543518066406, -0.00822305679321289, -0.006740570068359375, -0.005258083343505859, -0.0037755966186523438, -0.002293109893798828, -0.0008106231689453125, 0.0006718635559082031, 0.0021543502807617188, 0.0036368370056152344, 0.00511932373046875, 0.006601810455322266, 0.008084297180175781, 0.009566783905029297, 0.011049270629882812, 0.012531757354736328, 0.014014244079589844, 0.01549673080444336, 0.016979217529296875, 0.01846170425415039, 0.019944190979003906, 0.021426677703857422, 0.022909164428710938, 0.024391651153564453, 0.02587413787841797, 0.027356624603271484, 0.028839111328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 3.0, 10.0, 16.0, 25.0, 46.0, 75.0, 129.0, 253.0, 541.0, 1233.0, 2828.0, 8873.0, 44899.0, 3456983.0, 633688.0, 32375.0, 7452.0, 2689.0, 1079.0, 521.0, 252.0, 150.0, 72.0, 38.0, 15.0, 11.0, 4.0, 8.0, 1.0, 5.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1282958984375, -0.12491130828857422, -0.12152671813964844, -0.11814212799072266, -0.11475753784179688, -0.1113729476928711, -0.10798835754394531, -0.10460376739501953, -0.10121917724609375, -0.09783458709716797, -0.09444999694824219, -0.0910654067993164, -0.08768081665039062, -0.08429622650146484, -0.08091163635253906, -0.07752704620361328, -0.0741424560546875, -0.07075786590576172, -0.06737327575683594, -0.06398868560791016, -0.060604095458984375, -0.057219505310058594, -0.05383491516113281, -0.05045032501220703, -0.04706573486328125, -0.04368114471435547, -0.04029655456542969, -0.036911964416503906, -0.033527374267578125, -0.030142784118652344, -0.026758193969726562, -0.02337360382080078, -0.019989013671875, -0.01660442352294922, -0.013219833374023438, -0.009835243225097656, -0.006450653076171875, -0.0030660629272460938, 0.0003185272216796875, 0.0037031173706054688, 0.00708770751953125, 0.010472297668457031, 0.013856887817382812, 0.017241477966308594, 0.020626068115234375, 0.024010658264160156, 0.027395248413085938, 0.03077983856201172, 0.0341644287109375, 0.03754901885986328, 0.04093360900878906, 0.044318199157714844, 0.047702789306640625, 0.051087379455566406, 0.05447196960449219, 0.05785655975341797, 0.06124114990234375, 0.06462574005126953, 0.06801033020019531, 0.0713949203491211, 0.07477951049804688, 0.07816410064697266, 0.08154869079589844, 0.08493328094482422, 0.08831787109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 4.0, 7.0, 8.0, 10.0, 19.0, 49.0, 76.0, 141.0, 328.0, 2386.0, 540.0, 189.0, 96.0, 58.0, 34.0, 29.0, 8.0, 17.0, 12.0, 6.0, 7.0, 7.0, 9.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.024566650390625, -0.02353191375732422, -0.022497177124023438, -0.021462440490722656, -0.020427703857421875, -0.019392967224121094, -0.018358230590820312, -0.01732349395751953, -0.01628875732421875, -0.015254020690917969, -0.014219284057617188, -0.013184547424316406, -0.012149810791015625, -0.011115074157714844, -0.010080337524414062, -0.009045600891113281, -0.0080108642578125, -0.006976127624511719, -0.0059413909912109375, -0.004906654357910156, -0.003871917724609375, -0.0028371810913085938, -0.0018024444580078125, -0.0007677078247070312, 0.00026702880859375, 0.0013017654418945312, 0.0023365020751953125, 0.0033712387084960938, 0.004405975341796875, 0.005440711975097656, 0.0064754486083984375, 0.007510185241699219, 0.008544921875, 0.009579658508300781, 0.010614395141601562, 0.011649131774902344, 0.012683868408203125, 0.013718605041503906, 0.014753341674804688, 0.01578807830810547, 0.01682281494140625, 0.01785755157470703, 0.018892288208007812, 0.019927024841308594, 0.020961761474609375, 0.021996498107910156, 0.023031234741210938, 0.02406597137451172, 0.0251007080078125, 0.02613544464111328, 0.027170181274414062, 0.028204917907714844, 0.029239654541015625, 0.030274391174316406, 0.03130912780761719, 0.03234386444091797, 0.03337860107421875, 0.03441333770751953, 0.03544807434082031, 0.036482810974121094, 0.037517547607421875, 0.038552284240722656, 0.03958702087402344, 0.04062175750732422, 0.041656494140625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 10.0, 41.0, 228.0, 432.0, 212.0, 53.0, 13.0, 6.0, 6.0, 3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10773447155952454, -0.09327729791402817, -0.0788201242685318, -0.06436295062303543, -0.04990577697753906, -0.035448603332042694, -0.020991429686546326, -0.006534256041049957, 0.007922917604446411, 0.02238009124994278, 0.03683726489543915, 0.051294438540935516, 0.06575161218643188, 0.08020878583192825, 0.09466595947742462, 0.10912313312292099, 0.12358030676841736, 0.13803747296333313, 0.1524946540594101, 0.16695183515548706, 0.18140900135040283, 0.1958661675453186, 0.21032334864139557, 0.22478052973747253, 0.2392376959323883, 0.2536948621273041, 0.26815205812454224, 0.282609224319458, 0.2970663905143738, 0.31152355670928955, 0.3259807229042053, 0.3404379189014435, 0.35489511489868164, 0.3693522810935974, 0.3838094472885132, 0.39826664328575134, 0.4127238094806671, 0.4271809756755829, 0.44163817167282104, 0.4560953378677368, 0.4705525040626526, 0.48500967025756836, 0.49946683645248413, 0.5139240026473999, 0.5283812284469604, 0.5428383946418762, 0.557295560836792, 0.5717527270317078, 0.5862098932266235, 0.6006670594215393, 0.6151242256164551, 0.6295813918113708, 0.6440385580062866, 0.6584957838058472, 0.6729529500007629, 0.6874101161956787, 0.7018672823905945, 0.7163244485855103, 0.730781614780426, 0.7452387809753418, 0.7596960067749023, 0.7741531729698181, 0.7886103391647339, 0.8030675053596497, 0.8175246715545654]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 11.0, 13.0, 19.0, 27.0, 59.0, 50.0, 85.0, 83.0, 80.0, 75.0, 89.0, 75.0, 76.0, 54.0, 56.0, 46.0, 35.0, 23.0, 18.0, 11.0, 5.0, 3.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1710517406463623, -0.16449570655822754, -0.15793967247009277, -0.151383638381958, -0.14482758939266205, -0.13827155530452728, -0.13171552121639252, -0.12515948712825775, -0.11860344558954239, -0.11204741150140762, -0.10549136996269226, -0.0989353358745575, -0.09237930178642273, -0.08582326024770737, -0.0792672261595726, -0.07271118462085724, -0.06615515053272247, -0.05959911271929741, -0.053043074905872345, -0.04648704081773758, -0.039931003004312515, -0.03337496519088745, -0.026818931102752686, -0.02026289328932762, -0.013706855475902557, -0.007150818593800068, -0.0005947817116975784, 0.005961254239082336, 0.0125172920525074, 0.019073329865932465, 0.02562936395406723, 0.032185401767492294, 0.03874143958091736, 0.04529747739434242, 0.05185351520776749, 0.05840954929590225, 0.06496559083461761, 0.07152162492275238, 0.07807765901088715, 0.08463369309902191, 0.09118973463773727, 0.09774576872587204, 0.1043018102645874, 0.11085784435272217, 0.11741387844085693, 0.1239699199795723, 0.13052594661712646, 0.13708199560642242, 0.1436380296945572, 0.15019406378269196, 0.15675009787082672, 0.16330614686012268, 0.16986218094825745, 0.1764182150363922, 0.18297424912452698, 0.18953028321266174, 0.1960863173007965, 0.20264235138893127, 0.20919838547706604, 0.2157544195652008, 0.22231046855449677, 0.22886650264263153, 0.2354225367307663, 0.24197857081890106, 0.24853461980819702]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 5.0, 6.0, 8.0, 16.0, 13.0, 34.0, 40.0, 81.0, 71.0, 173.0, 337.0, 629.0, 1437.0, 3816.0, 14155.0, 90346.0, 617774.0, 274664.0, 33681.0, 6937.0, 2271.0, 998.0, 439.0, 232.0, 122.0, 76.0, 62.0, 38.0, 28.0, 12.0, 12.0, 14.0, 8.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1392822265625, -0.13515567779541016, -0.1310291290283203, -0.12690258026123047, -0.12277603149414062, -0.11864948272705078, -0.11452293395996094, -0.1103963851928711, -0.10626983642578125, -0.1021432876586914, -0.09801673889160156, -0.09389019012451172, -0.08976364135742188, -0.08563709259033203, -0.08151054382324219, -0.07738399505615234, -0.0732574462890625, -0.06913089752197266, -0.06500434875488281, -0.06087779998779297, -0.056751251220703125, -0.05262470245361328, -0.04849815368652344, -0.044371604919433594, -0.04024505615234375, -0.036118507385253906, -0.03199195861816406, -0.02786540985107422, -0.023738861083984375, -0.01961231231689453, -0.015485763549804688, -0.011359214782714844, -0.007232666015625, -0.0031061172485351562, 0.0010204315185546875, 0.005146980285644531, 0.009273529052734375, 0.013400077819824219, 0.017526626586914062, 0.021653175354003906, 0.02577972412109375, 0.029906272888183594, 0.03403282165527344, 0.03815937042236328, 0.042285919189453125, 0.04641246795654297, 0.05053901672363281, 0.054665565490722656, 0.0587921142578125, 0.06291866302490234, 0.06704521179199219, 0.07117176055908203, 0.07529830932617188, 0.07942485809326172, 0.08355140686035156, 0.0876779556274414, 0.09180450439453125, 0.0959310531616211, 0.10005760192871094, 0.10418415069580078, 0.10831069946289062, 0.11243724822998047, 0.11656379699707031, 0.12069034576416016, 0.12481689453125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 5.0, 6.0, 15.0, 23.0, 25.0, 45.0, 59.0, 91.0, 101.0, 107.0, 119.0, 99.0, 93.0, 69.0, 46.0, 46.0, 23.0, 12.0, 12.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.062042236328125, -0.06060457229614258, -0.059166908264160156, -0.057729244232177734, -0.05629158020019531, -0.05485391616821289, -0.05341625213623047, -0.05197858810424805, -0.050540924072265625, -0.0491032600402832, -0.04766559600830078, -0.04622793197631836, -0.04479026794433594, -0.043352603912353516, -0.041914939880371094, -0.04047727584838867, -0.03903961181640625, -0.03760194778442383, -0.036164283752441406, -0.034726619720458984, -0.03328895568847656, -0.03185129165649414, -0.03041362762451172, -0.028975963592529297, -0.027538299560546875, -0.026100635528564453, -0.02466297149658203, -0.02322530746459961, -0.021787643432617188, -0.020349979400634766, -0.018912315368652344, -0.017474651336669922, -0.0160369873046875, -0.014599323272705078, -0.013161659240722656, -0.011723995208740234, -0.010286331176757812, -0.00884866714477539, -0.007411003112792969, -0.005973339080810547, -0.004535675048828125, -0.003098011016845703, -0.0016603469848632812, -0.00022268295288085938, 0.0012149810791015625, 0.0026526451110839844, 0.004090309143066406, 0.005527973175048828, 0.00696563720703125, 0.008403301239013672, 0.009840965270996094, 0.011278629302978516, 0.012716293334960938, 0.01415395736694336, 0.015591621398925781, 0.017029285430908203, 0.018466949462890625, 0.019904613494873047, 0.02134227752685547, 0.02277994155883789, 0.024217605590820312, 0.025655269622802734, 0.027092933654785156, 0.028530597686767578, 0.02996826171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 11.0, 10.0, 5.0, 7.0, 8.0, 21.0, 27.0, 44.0, 67.0, 118.0, 170.0, 262.0, 499.0, 892.0, 1870.0, 4594.0, 13399.0, 48031.0, 250860.0, 561587.0, 122924.0, 27764.0, 8691.0, 3396.0, 1455.0, 748.0, 427.0, 245.0, 143.0, 108.0, 44.0, 56.0, 18.0, 18.0, 16.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.116455078125, -0.11333274841308594, -0.11021041870117188, -0.10708808898925781, -0.10396575927734375, -0.10084342956542969, -0.09772109985351562, -0.09459877014160156, -0.0914764404296875, -0.08835411071777344, -0.08523178100585938, -0.08210945129394531, -0.07898712158203125, -0.07586479187011719, -0.07274246215820312, -0.06962013244628906, -0.066497802734375, -0.06337547302246094, -0.060253143310546875, -0.05713081359863281, -0.05400848388671875, -0.05088615417480469, -0.047763824462890625, -0.04464149475097656, -0.0415191650390625, -0.03839683532714844, -0.035274505615234375, -0.03215217590332031, -0.02902984619140625, -0.025907516479492188, -0.022785186767578125, -0.019662857055664062, -0.01654052734375, -0.013418197631835938, -0.010295867919921875, -0.0071735382080078125, -0.00405120849609375, -0.0009288787841796875, 0.002193450927734375, 0.0053157806396484375, 0.0084381103515625, 0.011560440063476562, 0.014682769775390625, 0.017805099487304688, 0.02092742919921875, 0.024049758911132812, 0.027172088623046875, 0.030294418334960938, 0.033416748046875, 0.03653907775878906, 0.039661407470703125, 0.04278373718261719, 0.04590606689453125, 0.04902839660644531, 0.052150726318359375, 0.05527305603027344, 0.0583953857421875, 0.06151771545410156, 0.06464004516601562, 0.06776237487792969, 0.07088470458984375, 0.07400703430175781, 0.07712936401367188, 0.08025169372558594, 0.0833740234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 16.0, 17.0, 16.0, 12.0, 34.0, 46.0, 35.0, 47.0, 49.0, 60.0, 66.0, 68.0, 68.0, 74.0, 61.0, 55.0, 50.0, 45.0, 38.0, 22.0, 27.0, 20.0, 20.0, 12.0, 9.0, 8.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.12329292297363281, -0.11853408813476562, -0.11377525329589844, -0.10901641845703125, -0.10425758361816406, -0.09949874877929688, -0.09473991394042969, -0.0899810791015625, -0.08522224426269531, -0.08046340942382812, -0.07570457458496094, -0.07094573974609375, -0.06618690490722656, -0.061428070068359375, -0.05666923522949219, -0.051910400390625, -0.04715156555175781, -0.042392730712890625, -0.03763389587402344, -0.03287506103515625, -0.028116226196289062, -0.023357391357421875, -0.018598556518554688, -0.0138397216796875, -0.009080886840820312, -0.004322052001953125, 0.0004367828369140625, 0.00519561767578125, 0.009954452514648438, 0.014713287353515625, 0.019472122192382812, 0.02423095703125, 0.028989791870117188, 0.033748626708984375, 0.03850746154785156, 0.04326629638671875, 0.04802513122558594, 0.052783966064453125, 0.05754280090332031, 0.0623016357421875, 0.06706047058105469, 0.07181930541992188, 0.07657814025878906, 0.08133697509765625, 0.08609580993652344, 0.09085464477539062, 0.09561347961425781, 0.100372314453125, 0.10513114929199219, 0.10988998413085938, 0.11464881896972656, 0.11940765380859375, 0.12416648864746094, 0.12892532348632812, 0.1336841583251953, 0.1384429931640625, 0.1432018280029297, 0.14796066284179688, 0.15271949768066406, 0.15747833251953125, 0.16223716735839844, 0.16699600219726562, 0.1717548370361328, 0.176513671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 7.0, 10.0, 14.0, 15.0, 21.0, 30.0, 54.0, 73.0, 131.0, 225.0, 352.0, 585.0, 1100.0, 2053.0, 4019.0, 9078.0, 26000.0, 160591.0, 733935.0, 78376.0, 17871.0, 6934.0, 3223.0, 1638.0, 876.0, 523.0, 329.0, 163.0, 117.0, 76.0, 42.0, 31.0, 22.0, 12.0, 8.0, 8.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054656982421875, -0.053110599517822266, -0.05156421661376953, -0.0500178337097168, -0.04847145080566406, -0.04692506790161133, -0.045378684997558594, -0.04383230209350586, -0.042285919189453125, -0.04073953628540039, -0.039193153381347656, -0.03764677047729492, -0.03610038757324219, -0.03455400466918945, -0.03300762176513672, -0.031461238861083984, -0.02991485595703125, -0.028368473052978516, -0.02682209014892578, -0.025275707244873047, -0.023729324340820312, -0.022182941436767578, -0.020636558532714844, -0.01909017562866211, -0.017543792724609375, -0.01599740982055664, -0.014451026916503906, -0.012904644012451172, -0.011358261108398438, -0.009811878204345703, -0.008265495300292969, -0.006719112396240234, -0.0051727294921875, -0.0036263465881347656, -0.0020799636840820312, -0.0005335807800292969, 0.0010128021240234375, 0.002559185028076172, 0.004105567932128906, 0.005651950836181641, 0.007198333740234375, 0.00874471664428711, 0.010291099548339844, 0.011837482452392578, 0.013383865356445312, 0.014930248260498047, 0.01647663116455078, 0.018023014068603516, 0.01956939697265625, 0.021115779876708984, 0.02266216278076172, 0.024208545684814453, 0.025754928588867188, 0.027301311492919922, 0.028847694396972656, 0.03039407730102539, 0.031940460205078125, 0.03348684310913086, 0.035033226013183594, 0.03657960891723633, 0.03812599182128906, 0.0396723747253418, 0.04121875762939453, 0.042765140533447266, 0.0443115234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 1.0, 10.0, 10.0, 8.0, 13.0, 18.0, 17.0, 16.0, 23.0, 32.0, 25.0, 46.0, 81.0, 67.0, 82.0, 90.0, 108.0, 82.0, 56.0, 43.0, 26.0, 18.0, 21.0, 23.0, 19.0, 17.0, 7.0, 7.0, 11.0, 7.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2218952178955078e-05, -1.1787749826908112e-05, -1.1356547474861145e-05, -1.0925345122814178e-05, -1.0494142770767212e-05, -1.0062940418720245e-05, -9.631738066673279e-06, -9.200535714626312e-06, -8.769333362579346e-06, -8.338131010532379e-06, -7.906928658485413e-06, -7.475726306438446e-06, -7.0445239543914795e-06, -6.613321602344513e-06, -6.182119250297546e-06, -5.75091689825058e-06, -5.319714546203613e-06, -4.888512194156647e-06, -4.45730984210968e-06, -4.026107490062714e-06, -3.594905138015747e-06, -3.1637027859687805e-06, -2.732500433921814e-06, -2.3012980818748474e-06, -1.8700957298278809e-06, -1.4388933777809143e-06, -1.0076910257339478e-06, -5.764886736869812e-07, -1.4528632164001465e-07, 2.859160304069519e-07, 7.171183824539185e-07, 1.148320734500885e-06, 1.5795230865478516e-06, 2.010725438594818e-06, 2.4419277906417847e-06, 2.8731301426887512e-06, 3.3043324947357178e-06, 3.7355348467826843e-06, 4.166737198829651e-06, 4.5979395508766174e-06, 5.029141902923584e-06, 5.4603442549705505e-06, 5.891546607017517e-06, 6.322748959064484e-06, 6.75395131111145e-06, 7.185153663158417e-06, 7.616356015205383e-06, 8.04755836725235e-06, 8.478760719299316e-06, 8.909963071346283e-06, 9.34116542339325e-06, 9.772367775440216e-06, 1.0203570127487183e-05, 1.063477247953415e-05, 1.1065974831581116e-05, 1.1497177183628082e-05, 1.1928379535675049e-05, 1.2359581887722015e-05, 1.2790784239768982e-05, 1.3221986591815948e-05, 1.3653188943862915e-05, 1.4084391295909882e-05, 1.4515593647956848e-05, 1.4946796000003815e-05, 1.537799835205078e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 6.0, 8.0, 4.0, 16.0, 13.0, 31.0, 34.0, 41.0, 80.0, 117.0, 235.0, 488.0, 1336.0, 3756.0, 13341.0, 89238.0, 803768.0, 113146.0, 15873.0, 4240.0, 1544.0, 622.0, 280.0, 143.0, 69.0, 43.0, 33.0, 18.0, 10.0, 8.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06707763671875, -0.06513595581054688, -0.06319427490234375, -0.061252593994140625, -0.0593109130859375, -0.057369232177734375, -0.05542755126953125, -0.053485870361328125, -0.051544189453125, -0.049602508544921875, -0.04766082763671875, -0.045719146728515625, -0.0437774658203125, -0.041835784912109375, -0.03989410400390625, -0.037952423095703125, -0.0360107421875, -0.034069061279296875, -0.03212738037109375, -0.030185699462890625, -0.0282440185546875, -0.026302337646484375, -0.02436065673828125, -0.022418975830078125, -0.020477294921875, -0.018535614013671875, -0.01659393310546875, -0.014652252197265625, -0.0127105712890625, -0.010768890380859375, -0.00882720947265625, -0.006885528564453125, -0.00494384765625, -0.003002166748046875, -0.00106048583984375, 0.000881195068359375, 0.0028228759765625, 0.004764556884765625, 0.00670623779296875, 0.008647918701171875, 0.010589599609375, 0.012531280517578125, 0.01447296142578125, 0.016414642333984375, 0.0183563232421875, 0.020298004150390625, 0.02223968505859375, 0.024181365966796875, 0.026123046875, 0.028064727783203125, 0.03000640869140625, 0.031948089599609375, 0.0338897705078125, 0.035831451416015625, 0.03777313232421875, 0.039714813232421875, 0.041656494140625, 0.043598175048828125, 0.04553985595703125, 0.047481536865234375, 0.0494232177734375, 0.051364898681640625, 0.05330657958984375, 0.055248260498046875, 0.05718994140625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 8.0, 5.0, 8.0, 12.0, 17.0, 28.0, 39.0, 54.0, 59.0, 106.0, 144.0, 114.0, 103.0, 57.0, 62.0, 35.0, 28.0, 21.0, 21.0, 13.0, 5.0, 6.0, 8.0, 5.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043182373046875, -0.04152059555053711, -0.03985881805419922, -0.03819704055786133, -0.03653526306152344, -0.03487348556518555, -0.033211708068847656, -0.031549930572509766, -0.029888153076171875, -0.028226375579833984, -0.026564598083496094, -0.024902820587158203, -0.023241043090820312, -0.021579265594482422, -0.01991748809814453, -0.01825571060180664, -0.01659393310546875, -0.01493215560913086, -0.013270378112792969, -0.011608600616455078, -0.009946823120117188, -0.008285045623779297, -0.006623268127441406, -0.004961490631103516, -0.003299713134765625, -0.0016379356384277344, 2.384185791015625e-05, 0.0016856193542480469, 0.0033473968505859375, 0.005009174346923828, 0.006670951843261719, 0.00833272933959961, 0.0099945068359375, 0.01165628433227539, 0.013318061828613281, 0.014979839324951172, 0.016641616821289062, 0.018303394317626953, 0.019965171813964844, 0.021626949310302734, 0.023288726806640625, 0.024950504302978516, 0.026612281799316406, 0.028274059295654297, 0.029935836791992188, 0.03159761428833008, 0.03325939178466797, 0.03492116928100586, 0.03658294677734375, 0.03824472427368164, 0.03990650177001953, 0.04156827926635742, 0.04323005676269531, 0.0448918342590332, 0.046553611755371094, 0.048215389251708984, 0.049877166748046875, 0.051538944244384766, 0.053200721740722656, 0.05486249923706055, 0.05652427673339844, 0.05818605422973633, 0.05984783172607422, 0.06150960922241211, 0.06317138671875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 10.0, 24.0, 47.0, 109.0, 168.0, 267.0, 200.0, 92.0, 46.0, 20.0, 9.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5806005001068115, -1.5362108945846558, -1.4918211698532104, -1.4474315643310547, -1.4030418395996094, -1.3586522340774536, -1.3142626285552979, -1.2698729038238525, -1.2254832983016968, -1.181093692779541, -1.1367039680480957, -1.09231436252594, -1.0479247570037842, -1.0035350322723389, -0.9591454267501831, -0.9147557616233826, -0.870366096496582, -0.8259764313697815, -0.781586766242981, -0.7371971607208252, -0.6928074955940247, -0.6484178304672241, -0.6040282249450684, -0.5596385598182678, -0.5152488946914673, -0.47085922956466675, -0.4264695942401886, -0.38207995891571045, -0.3376902937889099, -0.2933006286621094, -0.24891099333763123, -0.20452135801315308, -0.16013169288635254, -0.1157420426607132, -0.07135239243507385, -0.02696274220943451, 0.017426908016204834, 0.06181655824184418, 0.10620620846748352, 0.15059584379196167, 0.1949855089187622, 0.23937515914440155, 0.2837648093700409, 0.32815444469451904, 0.3725441098213196, 0.4169337749481201, 0.46132341027259827, 0.5057130455970764, 0.550102710723877, 0.5944923758506775, 0.638882040977478, 0.6832716464996338, 0.7276613116264343, 0.7720509767532349, 0.8164405822753906, 0.8608302474021912, 0.9052199125289917, 0.9496095776557922, 0.9939992427825928, 1.0383888483047485, 1.0827784538269043, 1.1271681785583496, 1.1715577840805054, 1.2159473896026611, 1.2603371143341064]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 4.0, 8.0, 12.0, 14.0, 9.0, 11.0, 13.0, 26.0, 28.0, 21.0, 31.0, 39.0, 26.0, 25.0, 36.0, 48.0, 38.0, 42.0, 52.0, 52.0, 52.0, 35.0, 37.0, 47.0, 33.0, 40.0, 27.0, 24.0, 31.0, 20.0, 20.0, 19.0, 14.0, 10.0, 12.0, 9.0, 6.0, 6.0, 6.0, 2.0, 4.0, 1.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.752295732498169, -0.7290474772453308, -0.7057992219924927, -0.6825509071350098, -0.6593026518821716, -0.6360543966293335, -0.6128060817718506, -0.5895578265190125, -0.5663095712661743, -0.5430613160133362, -0.519813060760498, -0.49656474590301514, -0.473316490650177, -0.45006823539733887, -0.42681995034217834, -0.4035716652870178, -0.3803234100341797, -0.35707515478134155, -0.33382686972618103, -0.3105785846710205, -0.2873303294181824, -0.26408207416534424, -0.24083378911018372, -0.2175855189561844, -0.19433724880218506, -0.17108897864818573, -0.1478407084941864, -0.12459243834018707, -0.10134416818618774, -0.07809589803218842, -0.05484762787818909, -0.03159935772418976, -0.008351147174835205, 0.014897122979164124, 0.03814539313316345, 0.06139366328716278, 0.08464193344116211, 0.10789020359516144, 0.13113847374916077, 0.1543867439031601, 0.17763501405715942, 0.20088328421115875, 0.22413155436515808, 0.2473798245191574, 0.27062809467315674, 0.2938763499259949, 0.3171246349811554, 0.3403729200363159, 0.36362117528915405, 0.3868694305419922, 0.4101177155971527, 0.43336600065231323, 0.45661425590515137, 0.4798625111579895, 0.5031107664108276, 0.5263590812683105, 0.5496073365211487, 0.5728555917739868, 0.5961039066314697, 0.6193521618843079, 0.642600417137146, 0.6658486723899841, 0.6890969276428223, 0.7123452425003052, 0.7355934977531433]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 4.0, 5.0, 10.0, 13.0, 18.0, 14.0, 27.0, 63.0, 76.0, 149.0, 218.0, 412.0, 857.0, 1744.0, 4786.0, 19554.0, 221974.0, 3871193.0, 58511.0, 9387.0, 2837.0, 1187.0, 547.0, 277.0, 158.0, 101.0, 47.0, 37.0, 24.0, 12.0, 9.0, 7.0, 5.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.23828125, -0.23250770568847656, -0.22673416137695312, -0.2209606170654297, -0.21518707275390625, -0.2094135284423828, -0.20363998413085938, -0.19786643981933594, -0.1920928955078125, -0.18631935119628906, -0.18054580688476562, -0.1747722625732422, -0.16899871826171875, -0.1632251739501953, -0.15745162963867188, -0.15167808532714844, -0.145904541015625, -0.14013099670410156, -0.13435745239257812, -0.1285839080810547, -0.12281036376953125, -0.11703681945800781, -0.11126327514648438, -0.10548973083496094, -0.0997161865234375, -0.09394264221191406, -0.08816909790039062, -0.08239555358886719, -0.07662200927734375, -0.07084846496582031, -0.06507492065429688, -0.05930137634277344, -0.05352783203125, -0.04775428771972656, -0.041980743408203125, -0.03620719909667969, -0.03043365478515625, -0.024660110473632812, -0.018886566162109375, -0.013113021850585938, -0.0073394775390625, -0.0015659332275390625, 0.004207611083984375, 0.009981155395507812, 0.01575469970703125, 0.021528244018554688, 0.027301788330078125, 0.03307533264160156, 0.038848876953125, 0.04462242126464844, 0.050395965576171875, 0.05616950988769531, 0.06194305419921875, 0.06771659851074219, 0.07349014282226562, 0.07926368713378906, 0.0850372314453125, 0.09081077575683594, 0.09658432006835938, 0.10235786437988281, 0.10813140869140625, 0.11390495300292969, 0.11967849731445312, 0.12545204162597656, 0.1312255859375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 7.0, 2.0, 8.0, 7.0, 23.0, 20.0, 32.0, 41.0, 57.0, 58.0, 78.0, 61.0, 91.0, 92.0, 93.0, 79.0, 56.0, 56.0, 48.0, 28.0, 30.0, 18.0, 7.0, 6.0, 7.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.06597900390625, -0.06444501876831055, -0.0629110336303711, -0.06137704849243164, -0.05984306335449219, -0.058309078216552734, -0.05677509307861328, -0.05524110794067383, -0.053707122802734375, -0.05217313766479492, -0.05063915252685547, -0.049105167388916016, -0.04757118225097656, -0.04603719711303711, -0.044503211975097656, -0.0429692268371582, -0.04143524169921875, -0.0399012565612793, -0.038367271423339844, -0.03683328628540039, -0.03529930114746094, -0.033765316009521484, -0.03223133087158203, -0.030697345733642578, -0.029163360595703125, -0.027629375457763672, -0.02609539031982422, -0.024561405181884766, -0.023027420043945312, -0.02149343490600586, -0.019959449768066406, -0.018425464630126953, -0.0168914794921875, -0.015357494354248047, -0.013823509216308594, -0.01228952407836914, -0.010755538940429688, -0.009221553802490234, -0.007687568664550781, -0.006153583526611328, -0.004619598388671875, -0.003085613250732422, -0.0015516281127929688, -1.7642974853515625e-05, 0.0015163421630859375, 0.0030503273010253906, 0.004584312438964844, 0.006118297576904297, 0.00765228271484375, 0.009186267852783203, 0.010720252990722656, 0.01225423812866211, 0.013788223266601562, 0.015322208404541016, 0.01685619354248047, 0.018390178680419922, 0.019924163818359375, 0.021458148956298828, 0.02299213409423828, 0.024526119232177734, 0.026060104370117188, 0.02759408950805664, 0.029128074645996094, 0.030662059783935547, 0.032196044921875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 10.0, 24.0, 25.0, 38.0, 38.0, 61.0, 121.0, 210.0, 281.0, 511.0, 929.0, 1818.0, 4237.0, 12154.0, 45010.0, 339438.0, 3611995.0, 136889.0, 26223.0, 8103.0, 3010.0, 1415.0, 709.0, 389.0, 224.0, 132.0, 100.0, 47.0, 41.0, 32.0, 17.0, 14.0, 6.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11956787109375, -0.11608314514160156, -0.11259841918945312, -0.10911369323730469, -0.10562896728515625, -0.10214424133300781, -0.09865951538085938, -0.09517478942871094, -0.0916900634765625, -0.08820533752441406, -0.08472061157226562, -0.08123588562011719, -0.07775115966796875, -0.07426643371582031, -0.07078170776367188, -0.06729698181152344, -0.063812255859375, -0.06032752990722656, -0.056842803955078125, -0.05335807800292969, -0.04987335205078125, -0.04638862609863281, -0.042903900146484375, -0.03941917419433594, -0.0359344482421875, -0.03244972229003906, -0.028964996337890625, -0.025480270385742188, -0.02199554443359375, -0.018510818481445312, -0.015026092529296875, -0.011541366577148438, -0.008056640625, -0.0045719146728515625, -0.001087188720703125, 0.0023975372314453125, 0.00588226318359375, 0.009366989135742188, 0.012851715087890625, 0.016336441040039062, 0.0198211669921875, 0.023305892944335938, 0.026790618896484375, 0.030275344848632812, 0.03376007080078125, 0.03724479675292969, 0.040729522705078125, 0.04421424865722656, 0.047698974609375, 0.05118370056152344, 0.054668426513671875, 0.05815315246582031, 0.06163787841796875, 0.06512260437011719, 0.06860733032226562, 0.07209205627441406, 0.0755767822265625, 0.07906150817871094, 0.08254623413085938, 0.08603096008300781, 0.08951568603515625, 0.09300041198730469, 0.09648513793945312, 0.09996986389160156, 0.10345458984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 15.0, 13.0, 15.0, 29.0, 52.0, 117.0, 330.0, 2562.0, 527.0, 160.0, 100.0, 49.0, 32.0, 28.0, 9.0, 10.0, 8.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0634765625, -0.06089973449707031, -0.058322906494140625, -0.05574607849121094, -0.05316925048828125, -0.05059242248535156, -0.048015594482421875, -0.04543876647949219, -0.0428619384765625, -0.04028511047363281, -0.037708282470703125, -0.03513145446777344, -0.03255462646484375, -0.029977798461914062, -0.027400970458984375, -0.024824142456054688, -0.022247314453125, -0.019670486450195312, -0.017093658447265625, -0.014516830444335938, -0.01194000244140625, -0.009363174438476562, -0.006786346435546875, -0.0042095184326171875, -0.0016326904296875, 0.0009441375732421875, 0.003520965576171875, 0.0060977935791015625, 0.00867462158203125, 0.011251449584960938, 0.013828277587890625, 0.016405105590820312, 0.01898193359375, 0.021558761596679688, 0.024135589599609375, 0.026712417602539062, 0.02928924560546875, 0.03186607360839844, 0.034442901611328125, 0.03701972961425781, 0.0395965576171875, 0.04217338562011719, 0.044750213623046875, 0.04732704162597656, 0.04990386962890625, 0.05248069763183594, 0.055057525634765625, 0.05763435363769531, 0.060211181640625, 0.06278800964355469, 0.06536483764648438, 0.06794166564941406, 0.07051849365234375, 0.07309532165527344, 0.07567214965820312, 0.07824897766113281, 0.0808258056640625, 0.08340263366699219, 0.08597946166992188, 0.08855628967285156, 0.09113311767578125, 0.09370994567871094, 0.09628677368164062, 0.09886360168457031, 0.1014404296875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 10.0, 14.0, 41.0, 130.0, 235.0, 279.0, 178.0, 65.0, 32.0, 6.0, 9.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2674475312232971, -0.24943660199642181, -0.2314256727695465, -0.2134147584438324, -0.1954038292169571, -0.1773928999900818, -0.15938198566436768, -0.14137105643749237, -0.12336012721061707, -0.10534919798374176, -0.08733827620744705, -0.06932735443115234, -0.05131642520427704, -0.03330549597740173, -0.015294574201107025, 0.002716347575187683, 0.02072727680206299, 0.038738202303647995, 0.056749127805233, 0.07476004958152771, 0.09277097880840302, 0.11078190803527832, 0.12879282236099243, 0.14680375158786774, 0.16481468081474304, 0.18282561004161835, 0.20083653926849365, 0.21884745359420776, 0.23685838282108307, 0.2548693120479584, 0.2728802263736725, 0.290891170501709, 0.3089020252227783, 0.32691293954849243, 0.34492388367652893, 0.36293479800224304, 0.38094574213027954, 0.39895665645599365, 0.41696757078170776, 0.4349784851074219, 0.4529894292354584, 0.4710003435611725, 0.489011287689209, 0.5070222020149231, 0.5250331163406372, 0.5430440902709961, 0.5610550045967102, 0.5790659189224243, 0.5970768332481384, 0.6150877475738525, 0.6330986618995667, 0.6511096358299255, 0.6691205501556396, 0.6871314644813538, 0.7051423788070679, 0.723153293132782, 0.7411642074584961, 0.7591751217842102, 0.7771860361099243, 0.7951970100402832, 0.8132079243659973, 0.8312188386917114, 0.8492297530174255, 0.8672406673431396, 0.8852516412734985]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 10.0, 8.0, 21.0, 19.0, 25.0, 39.0, 32.0, 54.0, 73.0, 69.0, 63.0, 80.0, 77.0, 65.0, 65.0, 48.0, 41.0, 50.0, 34.0, 36.0, 22.0, 20.0, 9.0, 12.0, 16.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.285880446434021, -0.2766280770301819, -0.2673757076263428, -0.25812333822250366, -0.24887096881866455, -0.23961859941482544, -0.23036621510982513, -0.22111384570598602, -0.2118614763021469, -0.2026091068983078, -0.1933567374944687, -0.18410436809062958, -0.17485198378562927, -0.16559961438179016, -0.15634724497795105, -0.14709487557411194, -0.13784250617027283, -0.12859013676643372, -0.1193377673625946, -0.1100853905081749, -0.10083302110433578, -0.09158065170049667, -0.08232827484607697, -0.07307590544223785, -0.06382353603839874, -0.05457116663455963, -0.04531879350543022, -0.03606642037630081, -0.0268140509724617, -0.01756168156862259, -0.00830930843949318, 0.0009430646896362305, 0.010195434093475342, 0.019447805359959602, 0.028700176626443863, 0.03795254975557327, 0.047204919159412384, 0.056457288563251495, 0.0657096654176712, 0.07496203482151031, 0.08421440422534943, 0.09346677362918854, 0.10271914303302765, 0.11197151988744736, 0.12122388929128647, 0.13047626614570618, 0.1397286355495453, 0.1489810049533844, 0.1582333743572235, 0.16748574376106262, 0.17673811316490173, 0.18599048256874084, 0.19524285197257996, 0.20449522137641907, 0.21374760568141937, 0.22299997508525848, 0.2322523444890976, 0.2415047138929367, 0.250757098197937, 0.2600094676017761, 0.26926183700561523, 0.27851420640945435, 0.28776657581329346, 0.29701894521713257, 0.3062713146209717]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 17.0, 29.0, 25.0, 46.0, 55.0, 117.0, 191.0, 428.0, 876.0, 2366.0, 7144.0, 28771.0, 161458.0, 619962.0, 182789.0, 32067.0, 7826.0, 2495.0, 928.0, 459.0, 210.0, 98.0, 61.0, 44.0, 24.0, 18.0, 15.0, 8.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186279296875, -0.18055343627929688, -0.17482757568359375, -0.16910171508789062, -0.1633758544921875, -0.15764999389648438, -0.15192413330078125, -0.14619827270507812, -0.140472412109375, -0.13474655151367188, -0.12902069091796875, -0.12329483032226562, -0.1175689697265625, -0.11184310913085938, -0.10611724853515625, -0.10039138793945312, -0.09466552734375, -0.08893966674804688, -0.08321380615234375, -0.07748794555664062, -0.0717620849609375, -0.06603622436523438, -0.06031036376953125, -0.054584503173828125, -0.048858642578125, -0.043132781982421875, -0.03740692138671875, -0.031681060791015625, -0.0259552001953125, -0.020229339599609375, -0.01450347900390625, -0.008777618408203125, -0.0030517578125, 0.002674102783203125, 0.00839996337890625, 0.014125823974609375, 0.0198516845703125, 0.025577545166015625, 0.03130340576171875, 0.037029266357421875, 0.042755126953125, 0.048480987548828125, 0.05420684814453125, 0.059932708740234375, 0.0656585693359375, 0.07138442993164062, 0.07711029052734375, 0.08283615112304688, 0.08856201171875, 0.09428787231445312, 0.10001373291015625, 0.10573959350585938, 0.1114654541015625, 0.11719131469726562, 0.12291717529296875, 0.12864303588867188, 0.134368896484375, 0.14009475708007812, 0.14582061767578125, 0.15154647827148438, 0.1572723388671875, 0.16299819946289062, 0.16872406005859375, 0.17444992065429688, 0.18017578125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 5.0, 2.0, 10.0, 18.0, 21.0, 26.0, 30.0, 43.0, 51.0, 57.0, 68.0, 89.0, 84.0, 68.0, 71.0, 88.0, 61.0, 50.0, 50.0, 29.0, 29.0, 17.0, 12.0, 10.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.060943603515625, -0.05945444107055664, -0.05796527862548828, -0.05647611618041992, -0.05498695373535156, -0.0534977912902832, -0.052008628845214844, -0.050519466400146484, -0.049030303955078125, -0.047541141510009766, -0.046051979064941406, -0.04456281661987305, -0.04307365417480469, -0.04158449172973633, -0.04009532928466797, -0.03860616683959961, -0.03711700439453125, -0.03562784194946289, -0.03413867950439453, -0.03264951705932617, -0.031160354614257812, -0.029671192169189453, -0.028182029724121094, -0.026692867279052734, -0.025203704833984375, -0.023714542388916016, -0.022225379943847656, -0.020736217498779297, -0.019247055053710938, -0.017757892608642578, -0.01626873016357422, -0.01477956771850586, -0.0132904052734375, -0.01180124282836914, -0.010312080383300781, -0.008822917938232422, -0.0073337554931640625, -0.005844593048095703, -0.004355430603027344, -0.0028662681579589844, -0.001377105712890625, 0.00011205673217773438, 0.0016012191772460938, 0.003090381622314453, 0.0045795440673828125, 0.006068706512451172, 0.007557868957519531, 0.00904703140258789, 0.01053619384765625, 0.01202535629272461, 0.013514518737792969, 0.015003681182861328, 0.016492843627929688, 0.017982006072998047, 0.019471168518066406, 0.020960330963134766, 0.022449493408203125, 0.023938655853271484, 0.025427818298339844, 0.026916980743408203, 0.028406143188476562, 0.029895305633544922, 0.03138446807861328, 0.03287363052368164, 0.03436279296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 5.0, 12.0, 17.0, 16.0, 21.0, 32.0, 67.0, 80.0, 120.0, 243.0, 344.0, 659.0, 1375.0, 3201.0, 8664.0, 26862.0, 118285.0, 565469.0, 252833.0, 47867.0, 13733.0, 4705.0, 1826.0, 890.0, 484.0, 280.0, 160.0, 92.0, 62.0, 43.0, 35.0, 16.0, 13.0, 11.0, 2.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.194580078125, -0.18897438049316406, -0.18336868286132812, -0.1777629852294922, -0.17215728759765625, -0.1665515899658203, -0.16094589233398438, -0.15534019470214844, -0.1497344970703125, -0.14412879943847656, -0.13852310180664062, -0.1329174041748047, -0.12731170654296875, -0.12170600891113281, -0.11610031127929688, -0.11049461364746094, -0.104888916015625, -0.09928321838378906, -0.09367752075195312, -0.08807182312011719, -0.08246612548828125, -0.07686042785644531, -0.07125473022460938, -0.06564903259277344, -0.0600433349609375, -0.05443763732910156, -0.048831939697265625, -0.04322624206542969, -0.03762054443359375, -0.03201484680175781, -0.026409149169921875, -0.020803451538085938, -0.01519775390625, -0.009592056274414062, -0.003986358642578125, 0.0016193389892578125, 0.00722503662109375, 0.012830734252929688, 0.018436431884765625, 0.024042129516601562, 0.0296478271484375, 0.03525352478027344, 0.040859222412109375, 0.04646492004394531, 0.05207061767578125, 0.05767631530761719, 0.06328201293945312, 0.06888771057128906, 0.074493408203125, 0.08009910583496094, 0.08570480346679688, 0.09131050109863281, 0.09691619873046875, 0.10252189636230469, 0.10812759399414062, 0.11373329162597656, 0.1193389892578125, 0.12494468688964844, 0.13055038452148438, 0.1361560821533203, 0.14176177978515625, 0.1473674774169922, 0.15297317504882812, 0.15857887268066406, 0.1641845703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 5.0, 11.0, 13.0, 13.0, 13.0, 22.0, 27.0, 23.0, 31.0, 48.0, 34.0, 54.0, 54.0, 43.0, 41.0, 63.0, 60.0, 55.0, 68.0, 48.0, 38.0, 48.0, 43.0, 32.0, 25.0, 18.0, 17.0, 18.0, 12.0, 4.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.244384765625, -0.2371063232421875, -0.229827880859375, -0.2225494384765625, -0.21527099609375, -0.2079925537109375, -0.200714111328125, -0.1934356689453125, -0.1861572265625, -0.1788787841796875, -0.171600341796875, -0.1643218994140625, -0.15704345703125, -0.1497650146484375, -0.142486572265625, -0.1352081298828125, -0.1279296875, -0.1206512451171875, -0.113372802734375, -0.1060943603515625, -0.09881591796875, -0.0915374755859375, -0.084259033203125, -0.0769805908203125, -0.0697021484375, -0.0624237060546875, -0.055145263671875, -0.0478668212890625, -0.04058837890625, -0.0333099365234375, -0.026031494140625, -0.0187530517578125, -0.011474609375, -0.0041961669921875, 0.003082275390625, 0.0103607177734375, 0.01763916015625, 0.0249176025390625, 0.032196044921875, 0.0394744873046875, 0.0467529296875, 0.0540313720703125, 0.061309814453125, 0.0685882568359375, 0.07586669921875, 0.0831451416015625, 0.090423583984375, 0.0977020263671875, 0.10498046875, 0.1122589111328125, 0.119537353515625, 0.1268157958984375, 0.13409423828125, 0.1413726806640625, 0.148651123046875, 0.1559295654296875, 0.1632080078125, 0.1704864501953125, 0.177764892578125, 0.1850433349609375, 0.19232177734375, 0.1996002197265625, 0.206878662109375, 0.2141571044921875, 0.221435546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 15.0, 15.0, 15.0, 29.0, 36.0, 52.0, 73.0, 97.0, 163.0, 259.0, 459.0, 778.0, 1538.0, 3143.0, 7827.0, 26748.0, 204044.0, 707684.0, 70636.0, 14764.0, 5241.0, 2245.0, 1069.0, 548.0, 338.0, 236.0, 142.0, 93.0, 72.0, 51.0, 31.0, 28.0, 9.0, 14.0, 12.0, 10.0, 6.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.116943359375, -0.11371994018554688, -0.11049652099609375, -0.10727310180664062, -0.1040496826171875, -0.10082626342773438, -0.09760284423828125, -0.09437942504882812, -0.091156005859375, -0.08793258666992188, -0.08470916748046875, -0.08148574829101562, -0.0782623291015625, -0.07503890991210938, -0.07181549072265625, -0.06859207153320312, -0.06536865234375, -0.062145233154296875, -0.05892181396484375, -0.055698394775390625, -0.0524749755859375, -0.049251556396484375, -0.04602813720703125, -0.042804718017578125, -0.039581298828125, -0.036357879638671875, -0.03313446044921875, -0.029911041259765625, -0.0266876220703125, -0.023464202880859375, -0.02024078369140625, -0.017017364501953125, -0.0137939453125, -0.010570526123046875, -0.00734710693359375, -0.004123687744140625, -0.0009002685546875, 0.002323150634765625, 0.00554656982421875, 0.008769989013671875, 0.011993408203125, 0.015216827392578125, 0.01844024658203125, 0.021663665771484375, 0.0248870849609375, 0.028110504150390625, 0.03133392333984375, 0.034557342529296875, 0.03778076171875, 0.041004180908203125, 0.04422760009765625, 0.047451019287109375, 0.0506744384765625, 0.053897857666015625, 0.05712127685546875, 0.060344696044921875, 0.063568115234375, 0.06679153442382812, 0.07001495361328125, 0.07323837280273438, 0.0764617919921875, 0.07968521118164062, 0.08290863037109375, 0.08613204956054688, 0.08935546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 7.0, 3.0, 9.0, 17.0, 13.0, 20.0, 39.0, 66.0, 73.0, 100.0, 148.0, 129.0, 115.0, 85.0, 41.0, 35.0, 28.0, 19.0, 10.0, 7.0, 4.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.282857894897461e-05, -2.2036954760551453e-05, -2.1245330572128296e-05, -2.045370638370514e-05, -1.9662082195281982e-05, -1.8870458006858826e-05, -1.807883381843567e-05, -1.7287209630012512e-05, -1.6495585441589355e-05, -1.57039612531662e-05, -1.4912337064743042e-05, -1.4120712876319885e-05, -1.3329088687896729e-05, -1.2537464499473572e-05, -1.1745840311050415e-05, -1.0954216122627258e-05, -1.0162591934204102e-05, -9.370967745780945e-06, -8.579343557357788e-06, -7.787719368934631e-06, -6.996095180511475e-06, -6.204470992088318e-06, -5.412846803665161e-06, -4.621222615242004e-06, -3.829598426818848e-06, -3.037974238395691e-06, -2.246350049972534e-06, -1.4547258615493774e-06, -6.631016731262207e-07, 1.2852251529693604e-07, 9.201467037200928e-07, 1.7117708921432495e-06, 2.5033950805664062e-06, 3.295019268989563e-06, 4.08664345741272e-06, 4.8782676458358765e-06, 5.669891834259033e-06, 6.46151602268219e-06, 7.253140211105347e-06, 8.044764399528503e-06, 8.83638858795166e-06, 9.628012776374817e-06, 1.0419636964797974e-05, 1.121126115322113e-05, 1.2002885341644287e-05, 1.2794509530067444e-05, 1.35861337184906e-05, 1.4377757906913757e-05, 1.5169382095336914e-05, 1.596100628376007e-05, 1.6752630472183228e-05, 1.7544254660606384e-05, 1.833587884902954e-05, 1.9127503037452698e-05, 1.9919127225875854e-05, 2.071075141429901e-05, 2.1502375602722168e-05, 2.2293999791145325e-05, 2.308562397956848e-05, 2.3877248167991638e-05, 2.4668872356414795e-05, 2.546049654483795e-05, 2.625212073326111e-05, 2.7043744921684265e-05, 2.7835369110107422e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 3.0, 4.0, 11.0, 9.0, 17.0, 22.0, 34.0, 47.0, 82.0, 146.0, 217.0, 377.0, 662.0, 1252.0, 2668.0, 7222.0, 39536.0, 770325.0, 201941.0, 15655.0, 4365.0, 1803.0, 930.0, 465.0, 286.0, 148.0, 107.0, 53.0, 46.0, 40.0, 23.0, 15.0, 10.0, 16.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.150390625, -0.1463003158569336, -0.1422100067138672, -0.13811969757080078, -0.13402938842773438, -0.12993907928466797, -0.12584877014160156, -0.12175846099853516, -0.11766815185546875, -0.11357784271240234, -0.10948753356933594, -0.10539722442626953, -0.10130691528320312, -0.09721660614013672, -0.09312629699707031, -0.0890359878540039, -0.0849456787109375, -0.0808553695678711, -0.07676506042480469, -0.07267475128173828, -0.06858444213867188, -0.06449413299560547, -0.06040382385253906, -0.056313514709472656, -0.05222320556640625, -0.048132896423339844, -0.04404258728027344, -0.03995227813720703, -0.035861968994140625, -0.03177165985107422, -0.027681350708007812, -0.023591041564941406, -0.019500732421875, -0.015410423278808594, -0.011320114135742188, -0.007229804992675781, -0.003139495849609375, 0.0009508132934570312, 0.0050411224365234375, 0.009131431579589844, 0.01322174072265625, 0.017312049865722656, 0.021402359008789062, 0.02549266815185547, 0.029582977294921875, 0.03367328643798828, 0.03776359558105469, 0.041853904724121094, 0.0459442138671875, 0.050034523010253906, 0.05412483215332031, 0.05821514129638672, 0.062305450439453125, 0.06639575958251953, 0.07048606872558594, 0.07457637786865234, 0.07866668701171875, 0.08275699615478516, 0.08684730529785156, 0.09093761444091797, 0.09502792358398438, 0.09911823272705078, 0.10320854187011719, 0.1072988510131836, 0.11138916015625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 0.0, 3.0, 4.0, 10.0, 9.0, 20.0, 36.0, 67.0, 149.0, 228.0, 200.0, 108.0, 70.0, 36.0, 19.0, 13.0, 14.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1624755859375, -0.1564311981201172, -0.15038681030273438, -0.14434242248535156, -0.13829803466796875, -0.13225364685058594, -0.12620925903320312, -0.12016487121582031, -0.1141204833984375, -0.10807609558105469, -0.10203170776367188, -0.09598731994628906, -0.08994293212890625, -0.08389854431152344, -0.07785415649414062, -0.07180976867675781, -0.065765380859375, -0.05972099304199219, -0.053676605224609375, -0.04763221740722656, -0.04158782958984375, -0.03554344177246094, -0.029499053955078125, -0.023454666137695312, -0.0174102783203125, -0.011365890502929688, -0.005321502685546875, 0.0007228851318359375, 0.00676727294921875, 0.012811660766601562, 0.018856048583984375, 0.024900436401367188, 0.03094482421875, 0.03698921203613281, 0.043033599853515625, 0.04907798767089844, 0.05512237548828125, 0.06116676330566406, 0.06721115112304688, 0.07325553894042969, 0.0792999267578125, 0.08534431457519531, 0.09138870239257812, 0.09743309020996094, 0.10347747802734375, 0.10952186584472656, 0.11556625366210938, 0.12161064147949219, 0.127655029296875, 0.1336994171142578, 0.13974380493164062, 0.14578819274902344, 0.15183258056640625, 0.15787696838378906, 0.16392135620117188, 0.1699657440185547, 0.1760101318359375, 0.1820545196533203, 0.18809890747070312, 0.19414329528808594, 0.20018768310546875, 0.20623207092285156, 0.21227645874023438, 0.2183208465576172, 0.224365234375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 6.0, 6.0, 11.0, 6.0, 13.0, 24.0, 42.0, 69.0, 126.0, 181.0, 189.0, 152.0, 86.0, 43.0, 18.0, 25.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9360122680664062, -1.877883791923523, -1.81975519657135, -1.7616267204284668, -1.7034982442855835, -1.6453697681427002, -1.5872411727905273, -1.529112696647644, -1.4709842205047607, -1.4128557443618774, -1.3547271490097046, -1.2965986728668213, -1.238470196723938, -1.1803417205810547, -1.1222131252288818, -1.0640846490859985, -1.0059561729431152, -0.9478276371955872, -0.8896991610527039, -0.8315706253051758, -0.7734421491622925, -0.7153136134147644, -0.6571850776672363, -0.599056601524353, -0.5409280061721802, -0.4827995002269745, -0.4246709942817688, -0.3665424585342407, -0.3084139823913574, -0.25028544664382935, -0.19215694069862366, -0.13402843475341797, -0.07589995861053467, -0.01777144894003868, 0.040357060730457306, 0.09848557412624359, 0.15661408007144928, 0.21474260091781616, 0.27287110686302185, 0.33099961280822754, 0.3891281187534332, 0.4472566246986389, 0.505385160446167, 0.5635136365890503, 0.6216421723365784, 0.6797707080841064, 0.7378991842269897, 0.796027660369873, 0.8541561961174011, 0.9122847318649292, 0.9704132080078125, 1.0285416841506958, 1.0866702795028687, 1.144798755645752, 1.2029272317886353, 1.2610557079315186, 1.3191843032836914, 1.3773127794265747, 1.4354413747787476, 1.4935698509216309, 1.5516983270645142, 1.6098268032073975, 1.6679553985595703, 1.7260838747024536, 1.784212350845337]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 14.0, 12.0, 12.0, 10.0, 17.0, 20.0, 24.0, 30.0, 29.0, 35.0, 37.0, 30.0, 52.0, 59.0, 48.0, 44.0, 64.0, 57.0, 51.0, 52.0, 39.0, 42.0, 34.0, 34.0, 26.0, 22.0, 23.0, 13.0, 13.0, 12.0, 8.0, 9.0, 2.0, 3.0, 1.0, 3.0, 6.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.576378583908081, -1.5293853282928467, -1.4823921918869019, -1.4353989362716675, -1.3884057998657227, -1.3414125442504883, -1.294419288635254, -1.2474260330200195, -1.2004328966140747, -1.1534396409988403, -1.1064465045928955, -1.0594532489776611, -1.0124599933624268, -0.9654668569564819, -0.9184736013412476, -0.871480405330658, -0.8244872093200684, -0.7774940133094788, -0.7305008172988892, -0.6835075616836548, -0.6365143656730652, -0.5895211696624756, -0.5425279140472412, -0.4955347180366516, -0.448541522026062, -0.4015483260154724, -0.3545551002025604, -0.30756187438964844, -0.26056867837905884, -0.21357546746730804, -0.16658225655555725, -0.11958903074264526, -0.07259595394134521, -0.02560274302959442, 0.021390467882156372, 0.06838367879390717, 0.11537688970565796, 0.16237010061740875, 0.20936331152915955, 0.25635653734207153, 0.30334973335266113, 0.35034292936325073, 0.3973361551761627, 0.4443293809890747, 0.4913225769996643, 0.5383157730102539, 0.5853090286254883, 0.6323022246360779, 0.6792954206466675, 0.7262886166572571, 0.7732818126678467, 0.820275068283081, 0.8672682642936707, 0.9142614603042603, 0.9612547159194946, 1.0082478523254395, 1.0552411079406738, 1.1022343635559082, 1.149227499961853, 1.1962207555770874, 1.2432138919830322, 1.2902071475982666, 1.337200403213501, 1.3841936588287354, 1.4311867952346802]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 8.0, 11.0, 20.0, 30.0, 40.0, 58.0, 100.0, 216.0, 457.0, 1432.0, 5358.0, 43699.0, 4110863.0, 26125.0, 4009.0, 995.0, 416.0, 182.0, 98.0, 57.0, 42.0, 20.0, 15.0, 9.0, 7.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.415771484375, -0.40435028076171875, -0.3929290771484375, -0.38150787353515625, -0.370086669921875, -0.35866546630859375, -0.3472442626953125, -0.33582305908203125, -0.32440185546875, -0.31298065185546875, -0.3015594482421875, -0.29013824462890625, -0.278717041015625, -0.26729583740234375, -0.2558746337890625, -0.24445343017578125, -0.2330322265625, -0.22161102294921875, -0.2101898193359375, -0.19876861572265625, -0.187347412109375, -0.17592620849609375, -0.1645050048828125, -0.15308380126953125, -0.14166259765625, -0.13024139404296875, -0.1188201904296875, -0.10739898681640625, -0.095977783203125, -0.08455657958984375, -0.0731353759765625, -0.06171417236328125, -0.05029296875, -0.03887176513671875, -0.0274505615234375, -0.01602935791015625, -0.004608154296875, 0.00681304931640625, 0.0182342529296875, 0.02965545654296875, 0.04107666015625, 0.05249786376953125, 0.0639190673828125, 0.07534027099609375, 0.086761474609375, 0.09818267822265625, 0.1096038818359375, 0.12102508544921875, 0.1324462890625, 0.14386749267578125, 0.1552886962890625, 0.16670989990234375, 0.178131103515625, 0.18955230712890625, 0.2009735107421875, 0.21239471435546875, 0.22381591796875, 0.23523712158203125, 0.2466583251953125, 0.25807952880859375, 0.269500732421875, 0.28092193603515625, 0.2923431396484375, 0.30376434326171875, 0.315185546875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 13.0, 16.0, 16.0, 23.0, 38.0, 38.0, 52.0, 49.0, 58.0, 80.0, 60.0, 74.0, 84.0, 75.0, 68.0, 41.0, 58.0, 49.0, 22.0, 14.0, 17.0, 17.0, 10.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0736083984375, -0.07158041000366211, -0.06955242156982422, -0.06752443313598633, -0.06549644470214844, -0.06346845626831055, -0.061440467834472656, -0.059412479400634766, -0.057384490966796875, -0.055356502532958984, -0.053328514099121094, -0.0513005256652832, -0.04927253723144531, -0.04724454879760742, -0.04521656036376953, -0.04318857192993164, -0.04116058349609375, -0.03913259506225586, -0.03710460662841797, -0.03507661819458008, -0.03304862976074219, -0.031020641326904297, -0.028992652893066406, -0.026964664459228516, -0.024936676025390625, -0.022908687591552734, -0.020880699157714844, -0.018852710723876953, -0.016824722290039062, -0.014796733856201172, -0.012768745422363281, -0.01074075698852539, -0.0087127685546875, -0.006684780120849609, -0.004656791687011719, -0.002628803253173828, -0.0006008148193359375, 0.0014271736145019531, 0.0034551620483398438, 0.005483150482177734, 0.007511138916015625, 0.009539127349853516, 0.011567115783691406, 0.013595104217529297, 0.015623092651367188, 0.017651081085205078, 0.01967906951904297, 0.02170705795288086, 0.02373504638671875, 0.02576303482055664, 0.02779102325439453, 0.029819011688232422, 0.03184700012207031, 0.0338749885559082, 0.035902976989746094, 0.037930965423583984, 0.039958953857421875, 0.041986942291259766, 0.044014930725097656, 0.04604291915893555, 0.04807090759277344, 0.05009889602661133, 0.05212688446044922, 0.05415487289428711, 0.056182861328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 8.0, 12.0, 15.0, 15.0, 18.0, 36.0, 57.0, 70.0, 116.0, 181.0, 261.0, 329.0, 549.0, 852.0, 1281.0, 2197.0, 4170.0, 8665.0, 22996.0, 105596.0, 3958081.0, 57375.0, 16313.0, 6747.0, 3332.0, 1780.0, 1135.0, 706.0, 403.0, 320.0, 237.0, 137.0, 95.0, 65.0, 38.0, 30.0, 16.0, 13.0, 16.0, 8.0, 7.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1966552734375, -0.19017410278320312, -0.18369293212890625, -0.17721176147460938, -0.1707305908203125, -0.16424942016601562, -0.15776824951171875, -0.15128707885742188, -0.144805908203125, -0.13832473754882812, -0.13184356689453125, -0.12536239624023438, -0.1188812255859375, -0.11240005493164062, -0.10591888427734375, -0.09943771362304688, -0.09295654296875, -0.08647537231445312, -0.07999420166015625, -0.07351303100585938, -0.0670318603515625, -0.060550689697265625, -0.05406951904296875, -0.047588348388671875, -0.041107177734375, -0.034626007080078125, -0.02814483642578125, -0.021663665771484375, -0.0151824951171875, -0.008701324462890625, -0.00222015380859375, 0.004261016845703125, 0.0107421875, 0.017223358154296875, 0.02370452880859375, 0.030185699462890625, 0.0366668701171875, 0.043148040771484375, 0.04962921142578125, 0.056110382080078125, 0.062591552734375, 0.06907272338867188, 0.07555389404296875, 0.08203506469726562, 0.0885162353515625, 0.09499740600585938, 0.10147857666015625, 0.10795974731445312, 0.11444091796875, 0.12092208862304688, 0.12740325927734375, 0.13388442993164062, 0.1403656005859375, 0.14684677124023438, 0.15332794189453125, 0.15980911254882812, 0.166290283203125, 0.17277145385742188, 0.17925262451171875, 0.18573379516601562, 0.1922149658203125, 0.19869613647460938, 0.20517730712890625, 0.21165847778320312, 0.2181396484375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 5.0, 4.0, 6.0, 16.0, 10.0, 25.0, 16.0, 68.0, 438.0, 3299.0, 75.0, 39.0, 29.0, 12.0, 11.0, 6.0, 8.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07440185546875, -0.07239246368408203, -0.07038307189941406, -0.0683736801147461, -0.06636428833007812, -0.06435489654541016, -0.06234550476074219, -0.06033611297607422, -0.05832672119140625, -0.05631732940673828, -0.05430793762207031, -0.052298545837402344, -0.050289154052734375, -0.048279762268066406, -0.04627037048339844, -0.04426097869873047, -0.0422515869140625, -0.04024219512939453, -0.03823280334472656, -0.036223411560058594, -0.034214019775390625, -0.032204627990722656, -0.030195236206054688, -0.02818584442138672, -0.02617645263671875, -0.02416706085205078, -0.022157669067382812, -0.020148277282714844, -0.018138885498046875, -0.016129493713378906, -0.014120101928710938, -0.012110710144042969, -0.010101318359375, -0.008091926574707031, -0.0060825347900390625, -0.004073143005371094, -0.002063751220703125, -5.435943603515625e-05, 0.0019550323486328125, 0.003964424133300781, 0.00597381591796875, 0.007983207702636719, 0.009992599487304688, 0.012001991271972656, 0.014011383056640625, 0.016020774841308594, 0.018030166625976562, 0.02003955841064453, 0.0220489501953125, 0.02405834197998047, 0.026067733764648438, 0.028077125549316406, 0.030086517333984375, 0.032095909118652344, 0.03410530090332031, 0.03611469268798828, 0.03812408447265625, 0.04013347625732422, 0.04214286804199219, 0.044152259826660156, 0.046161651611328125, 0.048171043395996094, 0.05018043518066406, 0.05218982696533203, 0.05419921875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 11.0, 9.0, 13.0, 12.0, 24.0, 40.0, 52.0, 72.0, 118.0, 111.0, 111.0, 130.0, 86.0, 73.0, 48.0, 35.0, 20.0, 17.0, 11.0, 6.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2768574059009552, -0.27058255672454834, -0.2643077075481415, -0.25803282856941223, -0.25175797939300537, -0.2454831302165985, -0.23920828104019165, -0.2329334169626236, -0.22665856778621674, -0.22038371860980988, -0.21410885453224182, -0.20783400535583496, -0.2015591412782669, -0.19528429210186005, -0.189009428024292, -0.18273457884788513, -0.17645972967147827, -0.1701848804950714, -0.16391001641750336, -0.1576351672410965, -0.15136030316352844, -0.14508545398712158, -0.13881060481071472, -0.13253574073314667, -0.1262608766555786, -0.11998602002859116, -0.1137111634016037, -0.10743631422519684, -0.10116145759820938, -0.09488660097122192, -0.08861174434423447, -0.08233688771724701, -0.07606203854084015, -0.06978718191385269, -0.06351232528686523, -0.057237472385168076, -0.05096261948347092, -0.04468776285648346, -0.038412906229496, -0.03213805332779884, -0.025863196700811386, -0.019588341936469078, -0.013313486240804195, -0.007038630545139313, -0.0007637757807970047, 0.005511078983545303, 0.01178593561053276, 0.01806078851222992, 0.024335645139217377, 0.030610499903559685, 0.03688535466790199, 0.04316021129488945, 0.04943506419658661, 0.055709920823574066, 0.06198477745056152, 0.06825962662696838, 0.07453449070453644, 0.0808093473315239, 0.08708420395851135, 0.09335905313491821, 0.09963390976190567, 0.10590876638889313, 0.11218362301588058, 0.11845847964286804, 0.1247333288192749]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 17.0, 11.0, 14.0, 16.0, 22.0, 28.0, 32.0, 31.0, 38.0, 38.0, 46.0, 33.0, 40.0, 46.0, 64.0, 46.0, 46.0, 47.0, 46.0, 49.0, 29.0, 40.0, 35.0, 28.0, 24.0, 19.0, 14.0, 24.0, 14.0, 10.0, 11.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0963703989982605, -0.09280478954315186, -0.08923918753862381, -0.08567357808351517, -0.08210797607898712, -0.07854236662387848, -0.07497675716876984, -0.0714111477136612, -0.06784554570913315, -0.0642799362540245, -0.06071433424949646, -0.05714872479438782, -0.05358311906456947, -0.05001751333475113, -0.04645190387964249, -0.04288629814982414, -0.0393206924200058, -0.035755086690187454, -0.03218948096036911, -0.028623871505260468, -0.025058265775442123, -0.02149266004562378, -0.017927052453160286, -0.014361444860696793, -0.010795839130878448, -0.00723023246973753, -0.003664625808596611, -9.901914745569229e-05, 0.0034665875136852264, 0.0070321932435035706, 0.010597800835967064, 0.014163408428430557, 0.0177290141582489, 0.021294619888067245, 0.02486022748053074, 0.028425835072994232, 0.031991440802812576, 0.03555704653263092, 0.03912265598773956, 0.04268826171755791, 0.04625386744737625, 0.049819473177194595, 0.05338507890701294, 0.05695068836212158, 0.060516294091939926, 0.06408189982175827, 0.06764750927686691, 0.07121311128139496, 0.0747787207365036, 0.07834433019161224, 0.08190993219614029, 0.08547554165124893, 0.08904114365577698, 0.09260675311088562, 0.09617236256599426, 0.0997379720211029, 0.10330357402563095, 0.1068691834807396, 0.11043478548526764, 0.11400039494037628, 0.11756600439548492, 0.12113160640001297, 0.12469721585512161, 0.12826281785964966, 0.1318284273147583]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 11.0, 10.0, 19.0, 43.0, 42.0, 77.0, 142.0, 224.0, 363.0, 657.0, 1369.0, 3236.0, 8038.0, 24562.0, 82741.0, 319546.0, 426116.0, 127044.0, 35066.0, 11337.0, 4196.0, 1763.0, 805.0, 459.0, 245.0, 148.0, 94.0, 64.0, 43.0, 28.0, 17.0, 8.0, 9.0, 4.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.17724609375, -0.17071914672851562, -0.16419219970703125, -0.15766525268554688, -0.1511383056640625, -0.14461135864257812, -0.13808441162109375, -0.13155746459960938, -0.125030517578125, -0.11850357055664062, -0.11197662353515625, -0.10544967651367188, -0.0989227294921875, -0.09239578247070312, -0.08586883544921875, -0.07934188842773438, -0.07281494140625, -0.06628799438476562, -0.05976104736328125, -0.053234100341796875, -0.0467071533203125, -0.040180206298828125, -0.03365325927734375, -0.027126312255859375, -0.020599365234375, -0.014072418212890625, -0.00754547119140625, -0.001018524169921875, 0.0055084228515625, 0.012035369873046875, 0.01856231689453125, 0.025089263916015625, 0.0316162109375, 0.038143157958984375, 0.04467010498046875, 0.051197052001953125, 0.0577239990234375, 0.06425094604492188, 0.07077789306640625, 0.07730484008789062, 0.083831787109375, 0.09035873413085938, 0.09688568115234375, 0.10341262817382812, 0.1099395751953125, 0.11646652221679688, 0.12299346923828125, 0.12952041625976562, 0.13604736328125, 0.14257431030273438, 0.14910125732421875, 0.15562820434570312, 0.1621551513671875, 0.16868209838867188, 0.17520904541015625, 0.18173599243164062, 0.188262939453125, 0.19478988647460938, 0.20131683349609375, 0.20784378051757812, 0.2143707275390625, 0.22089767456054688, 0.22742462158203125, 0.23395156860351562, 0.240478515625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 2.0, 5.0, 10.0, 12.0, 19.0, 31.0, 42.0, 43.0, 49.0, 38.0, 58.0, 82.0, 77.0, 81.0, 69.0, 73.0, 72.0, 56.0, 34.0, 41.0, 26.0, 23.0, 20.0, 14.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.078125, -0.07590866088867188, -0.07369232177734375, -0.07147598266601562, -0.0692596435546875, -0.06704330444335938, -0.06482696533203125, -0.06261062622070312, -0.060394287109375, -0.058177947998046875, -0.05596160888671875, -0.053745269775390625, -0.0515289306640625, -0.049312591552734375, -0.04709625244140625, -0.044879913330078125, -0.04266357421875, -0.040447235107421875, -0.03823089599609375, -0.036014556884765625, -0.0337982177734375, -0.031581878662109375, -0.02936553955078125, -0.027149200439453125, -0.024932861328125, -0.022716522216796875, -0.02050018310546875, -0.018283843994140625, -0.0160675048828125, -0.013851165771484375, -0.01163482666015625, -0.009418487548828125, -0.0072021484375, -0.004985809326171875, -0.00276947021484375, -0.000553131103515625, 0.0016632080078125, 0.003879547119140625, 0.00609588623046875, 0.008312225341796875, 0.010528564453125, 0.012744903564453125, 0.01496124267578125, 0.017177581787109375, 0.0193939208984375, 0.021610260009765625, 0.02382659912109375, 0.026042938232421875, 0.02825927734375, 0.030475616455078125, 0.03269195556640625, 0.034908294677734375, 0.0371246337890625, 0.039340972900390625, 0.04155731201171875, 0.043773651123046875, 0.045989990234375, 0.048206329345703125, 0.05042266845703125, 0.052639007568359375, 0.0548553466796875, 0.057071685791015625, 0.05928802490234375, 0.061504364013671875, 0.063720703125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 3.0, 3.0, 4.0, 6.0, 13.0, 28.0, 30.0, 63.0, 72.0, 109.0, 195.0, 350.0, 586.0, 1254.0, 2698.0, 6715.0, 20195.0, 86208.0, 541808.0, 313672.0, 51467.0, 13932.0, 4830.0, 2102.0, 984.0, 461.0, 249.0, 174.0, 107.0, 84.0, 47.0, 34.0, 17.0, 16.0, 12.0, 8.0, 5.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.343994140625, -0.3343963623046875, -0.324798583984375, -0.3152008056640625, -0.30560302734375, -0.2960052490234375, -0.286407470703125, -0.2768096923828125, -0.2672119140625, -0.2576141357421875, -0.248016357421875, -0.2384185791015625, -0.22882080078125, -0.2192230224609375, -0.209625244140625, -0.2000274658203125, -0.1904296875, -0.1808319091796875, -0.171234130859375, -0.1616363525390625, -0.15203857421875, -0.1424407958984375, -0.132843017578125, -0.1232452392578125, -0.1136474609375, -0.1040496826171875, -0.094451904296875, -0.0848541259765625, -0.07525634765625, -0.0656585693359375, -0.056060791015625, -0.0464630126953125, -0.036865234375, -0.0272674560546875, -0.017669677734375, -0.0080718994140625, 0.00152587890625, 0.0111236572265625, 0.020721435546875, 0.0303192138671875, 0.0399169921875, 0.0495147705078125, 0.059112548828125, 0.0687103271484375, 0.07830810546875, 0.0879058837890625, 0.097503662109375, 0.1071014404296875, 0.11669921875, 0.1262969970703125, 0.135894775390625, 0.1454925537109375, 0.15509033203125, 0.1646881103515625, 0.174285888671875, 0.1838836669921875, 0.1934814453125, 0.2030792236328125, 0.212677001953125, 0.2222747802734375, 0.23187255859375, 0.2414703369140625, 0.251068115234375, 0.2606658935546875, 0.270263671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 5.0, 11.0, 15.0, 9.0, 11.0, 20.0, 29.0, 38.0, 36.0, 37.0, 47.0, 50.0, 55.0, 68.0, 64.0, 63.0, 62.0, 55.0, 49.0, 53.0, 55.0, 34.0, 25.0, 20.0, 14.0, 16.0, 15.0, 10.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.355712890625, -0.3414115905761719, -0.32711029052734375, -0.3128089904785156, -0.2985076904296875, -0.2842063903808594, -0.26990509033203125, -0.2556037902832031, -0.241302490234375, -0.22700119018554688, -0.21269989013671875, -0.19839859008789062, -0.1840972900390625, -0.16979598999023438, -0.15549468994140625, -0.14119338989257812, -0.12689208984375, -0.11259078979492188, -0.09828948974609375, -0.08398818969726562, -0.0696868896484375, -0.055385589599609375, -0.04108428955078125, -0.026782989501953125, -0.012481689453125, 0.001819610595703125, 0.01612091064453125, 0.030422210693359375, 0.0447235107421875, 0.059024810791015625, 0.07332611083984375, 0.08762741088867188, 0.1019287109375, 0.11623001098632812, 0.13053131103515625, 0.14483261108398438, 0.1591339111328125, 0.17343521118164062, 0.18773651123046875, 0.20203781127929688, 0.216339111328125, 0.23064041137695312, 0.24494171142578125, 0.2592430114746094, 0.2735443115234375, 0.2878456115722656, 0.30214691162109375, 0.3164482116699219, 0.33074951171875, 0.3450508117675781, 0.35935211181640625, 0.3736534118652344, 0.3879547119140625, 0.4022560119628906, 0.41655731201171875, 0.4308586120605469, 0.445159912109375, 0.4594612121582031, 0.47376251220703125, 0.4880638122558594, 0.5023651123046875, 0.5166664123535156, 0.5309677124023438, 0.5452690124511719, 0.5595703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 10.0, 7.0, 13.0, 22.0, 19.0, 25.0, 28.0, 47.0, 75.0, 84.0, 138.0, 178.0, 307.0, 508.0, 819.0, 1568.0, 3142.0, 8703.0, 46143.0, 763352.0, 194161.0, 18700.0, 5226.0, 2373.0, 1091.0, 612.0, 376.0, 239.0, 169.0, 120.0, 77.0, 57.0, 37.0, 26.0, 23.0, 16.0, 17.0, 13.0, 6.0, 7.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2486572265625, -0.24057579040527344, -0.23249435424804688, -0.2244129180908203, -0.21633148193359375, -0.2082500457763672, -0.20016860961914062, -0.19208717346191406, -0.1840057373046875, -0.17592430114746094, -0.16784286499023438, -0.1597614288330078, -0.15167999267578125, -0.1435985565185547, -0.13551712036132812, -0.12743568420410156, -0.119354248046875, -0.11127281188964844, -0.10319137573242188, -0.09510993957519531, -0.08702850341796875, -0.07894706726074219, -0.07086563110351562, -0.06278419494628906, -0.0547027587890625, -0.04662132263183594, -0.038539886474609375, -0.030458450317382812, -0.02237701416015625, -0.014295578002929688, -0.006214141845703125, 0.0018672943115234375, 0.00994873046875, 0.018030166625976562, 0.026111602783203125, 0.03419303894042969, 0.04227447509765625, 0.05035591125488281, 0.058437347412109375, 0.06651878356933594, 0.0746002197265625, 0.08268165588378906, 0.09076309204101562, 0.09884452819824219, 0.10692596435546875, 0.11500740051269531, 0.12308883666992188, 0.13117027282714844, 0.139251708984375, 0.14733314514160156, 0.15541458129882812, 0.1634960174560547, 0.17157745361328125, 0.1796588897705078, 0.18774032592773438, 0.19582176208496094, 0.2039031982421875, 0.21198463439941406, 0.22006607055664062, 0.2281475067138672, 0.23622894287109375, 0.2443103790283203, 0.2523918151855469, 0.26047325134277344, 0.2685546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 8.0, 6.0, 13.0, 23.0, 37.0, 67.0, 118.0, 147.0, 176.0, 141.0, 101.0, 64.0, 41.0, 25.0, 14.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5643577575683594e-05, -3.458000719547272e-05, -3.351643681526184e-05, -3.2452866435050964e-05, -3.138929605484009e-05, -3.032572567462921e-05, -2.9262155294418335e-05, -2.819858491420746e-05, -2.7135014533996582e-05, -2.6071444153785706e-05, -2.500787377357483e-05, -2.3944303393363953e-05, -2.2880733013153076e-05, -2.18171626329422e-05, -2.0753592252731323e-05, -1.9690021872520447e-05, -1.862645149230957e-05, -1.7562881112098694e-05, -1.6499310731887817e-05, -1.543574035167694e-05, -1.4372169971466064e-05, -1.3308599591255188e-05, -1.2245029211044312e-05, -1.1181458830833435e-05, -1.0117888450622559e-05, -9.054318070411682e-06, -7.990747690200806e-06, -6.927177309989929e-06, -5.863606929779053e-06, -4.800036549568176e-06, -3.7364661693573e-06, -2.6728957891464233e-06, -1.6093254089355469e-06, -5.457550287246704e-07, 5.178153514862061e-07, 1.5813857316970825e-06, 2.644956111907959e-06, 3.7085264921188354e-06, 4.772096872329712e-06, 5.835667252540588e-06, 6.899237632751465e-06, 7.962808012962341e-06, 9.026378393173218e-06, 1.0089948773384094e-05, 1.115351915359497e-05, 1.2217089533805847e-05, 1.3280659914016724e-05, 1.43442302942276e-05, 1.5407800674438477e-05, 1.6471371054649353e-05, 1.753494143486023e-05, 1.8598511815071106e-05, 1.9662082195281982e-05, 2.072565257549286e-05, 2.1789222955703735e-05, 2.2852793335914612e-05, 2.3916363716125488e-05, 2.4979934096336365e-05, 2.604350447654724e-05, 2.7107074856758118e-05, 2.8170645236968994e-05, 2.923421561717987e-05, 3.0297785997390747e-05, 3.1361356377601624e-05, 3.24249267578125e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 6.0, 4.0, 4.0, 11.0, 14.0, 17.0, 19.0, 38.0, 50.0, 80.0, 187.0, 278.0, 560.0, 1316.0, 3686.0, 17686.0, 321202.0, 669333.0, 26363.0, 4648.0, 1585.0, 697.0, 331.0, 168.0, 93.0, 65.0, 32.0, 23.0, 14.0, 17.0, 11.0, 5.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.275634765625, -0.2675495147705078, -0.2594642639160156, -0.25137901306152344, -0.24329376220703125, -0.23520851135253906, -0.22712326049804688, -0.2190380096435547, -0.2109527587890625, -0.2028675079345703, -0.19478225708007812, -0.18669700622558594, -0.17861175537109375, -0.17052650451660156, -0.16244125366210938, -0.1543560028076172, -0.146270751953125, -0.1381855010986328, -0.13010025024414062, -0.12201499938964844, -0.11392974853515625, -0.10584449768066406, -0.09775924682617188, -0.08967399597167969, -0.0815887451171875, -0.07350349426269531, -0.06541824340820312, -0.05733299255371094, -0.04924774169921875, -0.04116249084472656, -0.033077239990234375, -0.024991989135742188, -0.01690673828125, -0.008821487426757812, -0.000736236572265625, 0.0073490142822265625, 0.01543426513671875, 0.023519515991210938, 0.031604766845703125, 0.03969001770019531, 0.0477752685546875, 0.05586051940917969, 0.06394577026367188, 0.07203102111816406, 0.08011627197265625, 0.08820152282714844, 0.09628677368164062, 0.10437202453613281, 0.112457275390625, 0.12054252624511719, 0.12862777709960938, 0.13671302795410156, 0.14479827880859375, 0.15288352966308594, 0.16096878051757812, 0.1690540313720703, 0.1771392822265625, 0.1852245330810547, 0.19330978393554688, 0.20139503479003906, 0.20948028564453125, 0.21756553649902344, 0.22565078735351562, 0.2337360382080078, 0.2418212890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 6.0, 16.0, 17.0, 33.0, 45.0, 69.0, 86.0, 183.0, 203.0, 108.0, 64.0, 47.0, 41.0, 13.0, 19.0, 13.0, 11.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30517578125, -0.29471588134765625, -0.2842559814453125, -0.27379608154296875, -0.263336181640625, -0.25287628173828125, -0.2424163818359375, -0.23195648193359375, -0.22149658203125, -0.21103668212890625, -0.2005767822265625, -0.19011688232421875, -0.179656982421875, -0.16919708251953125, -0.1587371826171875, -0.14827728271484375, -0.1378173828125, -0.12735748291015625, -0.1168975830078125, -0.10643768310546875, -0.095977783203125, -0.08551788330078125, -0.0750579833984375, -0.06459808349609375, -0.05413818359375, -0.04367828369140625, -0.0332183837890625, -0.02275848388671875, -0.012298583984375, -0.00183868408203125, 0.0086212158203125, 0.01908111572265625, 0.029541015625, 0.04000091552734375, 0.0504608154296875, 0.06092071533203125, 0.071380615234375, 0.08184051513671875, 0.0923004150390625, 0.10276031494140625, 0.11322021484375, 0.12368011474609375, 0.1341400146484375, 0.14459991455078125, 0.155059814453125, 0.16551971435546875, 0.1759796142578125, 0.18643951416015625, 0.1968994140625, 0.20735931396484375, 0.2178192138671875, 0.22827911376953125, 0.238739013671875, 0.24919891357421875, 0.2596588134765625, 0.27011871337890625, 0.28057861328125, 0.29103851318359375, 0.3014984130859375, 0.31195831298828125, 0.322418212890625, 0.33287811279296875, 0.3433380126953125, 0.35379791259765625, 0.3642578125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 12.0, 17.0, 32.0, 80.0, 165.0, 284.0, 258.0, 101.0, 40.0, 10.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.075802803039551, -3.879946231842041, -3.6840896606445312, -3.4882330894470215, -3.2923765182495117, -3.096519947052002, -2.900663375854492, -2.7048068046569824, -2.5089502334594727, -2.313093662261963, -2.117237091064453, -1.9213805198669434, -1.7255239486694336, -1.5296673774719238, -1.3338106870651245, -1.1379541158676147, -0.9420974254608154, -0.7462408542633057, -0.5503842830657959, -0.35452765226364136, -0.1586710810661316, 0.037185490131378174, 0.23304212093353271, 0.4288986921310425, 0.6247552633285522, 0.820611834526062, 1.0164684057235718, 1.212325096130371, 1.4081816673278809, 1.6040382385253906, 1.7998948097229004, 1.9957513809204102, 2.19160795211792, 2.3874645233154297, 2.5833210945129395, 2.779177665710449, 2.975034236907959, 3.1708908081054688, 3.3667473793029785, 3.5626039505004883, 3.758460521697998, 3.954317092895508, 4.150173664093018, 4.346030235290527, 4.541886806488037, 4.737743377685547, 4.933599948883057, 5.129456520080566, 5.325313568115234, 5.521170139312744, 5.717026710510254, 5.912883281707764, 6.108739852905273, 6.304596424102783, 6.500452995300293, 6.696309566497803, 6.8921661376953125, 7.088022708892822, 7.283879280090332, 7.479735851287842, 7.675592422485352, 7.871448993682861, 8.067305564880371, 8.263162612915039, 8.45901870727539]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 4.0, 3.0, 4.0, 3.0, 6.0, 9.0, 6.0, 10.0, 17.0, 15.0, 29.0, 28.0, 48.0, 43.0, 59.0, 60.0, 66.0, 59.0, 71.0, 64.0, 67.0, 46.0, 46.0, 46.0, 44.0, 37.0, 32.0, 12.0, 16.0, 17.0, 8.0, 8.0, 7.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.5909507274627686, -3.4994592666625977, -3.407968044281006, -3.316476583480835, -3.224985122680664, -3.1334939002990723, -3.0420024394989014, -2.9505109786987305, -2.8590197563171387, -2.7675282955169678, -2.676037073135376, -2.584545612335205, -2.4930543899536133, -2.4015629291534424, -2.3100714683532715, -2.2185802459716797, -2.127088785171509, -2.035597324371338, -1.944106101989746, -1.8526146411895752, -1.7611232995986938, -1.6696319580078125, -1.5781404972076416, -1.4866491556167603, -1.395157814025879, -1.3036664724349976, -1.2121751308441162, -1.1206836700439453, -1.029192328453064, -0.9377009868621826, -0.8462095856666565, -0.7547181844711304, -0.663226842880249, -0.5717355012893677, -0.48024410009384155, -0.3887527287006378, -0.2972613573074341, -0.20576998591423035, -0.11427861452102661, -0.02278721332550049, 0.06870412826538086, 0.1601954996585846, 0.25168687105178833, 0.34317824244499207, 0.4346696138381958, 0.5261609554290771, 0.6176523566246033, 0.7091437578201294, 0.8006350994110107, 0.8921264410018921, 0.9836178421974182, 1.0751092433929443, 1.1666005849838257, 1.258091926574707, 1.349583387374878, 1.4410747289657593, 1.5325660705566406, 1.624057412147522, 1.7155487537384033, 1.8070402145385742, 1.8985315561294556, 1.990022897720337, 2.081514358520508, 2.1730055809020996, 2.2644970417022705]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 4.0, 0.0, 7.0, 8.0, 10.0, 13.0, 6.0, 22.0, 53.0, 71.0, 91.0, 160.0, 295.0, 485.0, 1064.0, 2735.0, 9712.0, 104656.0, 4046879.0, 20962.0, 4315.0, 1418.0, 592.0, 302.0, 161.0, 99.0, 56.0, 37.0, 24.0, 17.0, 14.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.638671875, -0.6200027465820312, -0.6013336181640625, -0.5826644897460938, -0.563995361328125, -0.5453262329101562, -0.5266571044921875, -0.5079879760742188, -0.48931884765625, -0.47064971923828125, -0.4519805908203125, -0.43331146240234375, -0.414642333984375, -0.39597320556640625, -0.3773040771484375, -0.35863494873046875, -0.3399658203125, -0.32129669189453125, -0.3026275634765625, -0.28395843505859375, -0.265289306640625, -0.24662017822265625, -0.2279510498046875, -0.20928192138671875, -0.19061279296875, -0.17194366455078125, -0.1532745361328125, -0.13460540771484375, -0.115936279296875, -0.09726715087890625, -0.0785980224609375, -0.05992889404296875, -0.041259765625, -0.02259063720703125, -0.0039215087890625, 0.01474761962890625, 0.033416748046875, 0.05208587646484375, 0.0707550048828125, 0.08942413330078125, 0.10809326171875, 0.12676239013671875, 0.1454315185546875, 0.16410064697265625, 0.182769775390625, 0.20143890380859375, 0.2201080322265625, 0.23877716064453125, 0.2574462890625, 0.27611541748046875, 0.2947845458984375, 0.31345367431640625, 0.332122802734375, 0.35079193115234375, 0.3694610595703125, 0.38813018798828125, 0.40679931640625, 0.42546844482421875, 0.4441375732421875, 0.46280670166015625, 0.481475830078125, 0.5001449584960938, 0.5188140869140625, 0.5374832153320312, 0.55615234375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 11.0, 12.0, 18.0, 33.0, 45.0, 50.0, 71.0, 91.0, 100.0, 107.0, 131.0, 90.0, 75.0, 46.0, 35.0, 20.0, 20.0, 5.0, 4.0, 11.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.16455078125, -0.16055679321289062, -0.15656280517578125, -0.15256881713867188, -0.1485748291015625, -0.14458084106445312, -0.14058685302734375, -0.13659286499023438, -0.132598876953125, -0.12860488891601562, -0.12461090087890625, -0.12061691284179688, -0.1166229248046875, -0.11262893676757812, -0.10863494873046875, -0.10464096069335938, -0.10064697265625, -0.09665298461914062, -0.09265899658203125, -0.08866500854492188, -0.0846710205078125, -0.08067703247070312, -0.07668304443359375, -0.07268905639648438, -0.068695068359375, -0.06470108032226562, -0.06070709228515625, -0.056713104248046875, -0.0527191162109375, -0.048725128173828125, -0.04473114013671875, -0.040737152099609375, -0.0367431640625, -0.032749176025390625, -0.02875518798828125, -0.024761199951171875, -0.0207672119140625, -0.016773223876953125, -0.01277923583984375, -0.008785247802734375, -0.004791259765625, -0.000797271728515625, 0.00319671630859375, 0.007190704345703125, 0.0111846923828125, 0.015178680419921875, 0.01917266845703125, 0.023166656494140625, 0.02716064453125, 0.031154632568359375, 0.03514862060546875, 0.039142608642578125, 0.0431365966796875, 0.047130584716796875, 0.05112457275390625, 0.055118560791015625, 0.059112548828125, 0.06310653686523438, 0.06710052490234375, 0.07109451293945312, 0.0750885009765625, 0.07908248901367188, 0.08307647705078125, 0.08707046508789062, 0.091064453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 4.0, 8.0, 17.0, 27.0, 31.0, 39.0, 67.0, 97.0, 152.0, 225.0, 326.0, 523.0, 828.0, 1460.0, 2465.0, 4575.0, 9490.0, 23878.0, 94933.0, 3909862.0, 100112.0, 24627.0, 9697.0, 4492.0, 2470.0, 1419.0, 867.0, 536.0, 352.0, 195.0, 173.0, 107.0, 67.0, 44.0, 30.0, 34.0, 11.0, 7.0, 10.0, 15.0, 8.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40380859375, -0.3905754089355469, -0.37734222412109375, -0.3641090393066406, -0.3508758544921875, -0.3376426696777344, -0.32440948486328125, -0.3111763000488281, -0.297943115234375, -0.2847099304199219, -0.27147674560546875, -0.2582435607910156, -0.2450103759765625, -0.23177719116210938, -0.21854400634765625, -0.20531082153320312, -0.19207763671875, -0.17884445190429688, -0.16561126708984375, -0.15237808227539062, -0.1391448974609375, -0.12591171264648438, -0.11267852783203125, -0.09944534301757812, -0.086212158203125, -0.07297897338867188, -0.05974578857421875, -0.046512603759765625, -0.0332794189453125, -0.020046234130859375, -0.00681304931640625, 0.006420135498046875, 0.0196533203125, 0.032886505126953125, 0.04611968994140625, 0.059352874755859375, 0.0725860595703125, 0.08581924438476562, 0.09905242919921875, 0.11228561401367188, 0.125518798828125, 0.13875198364257812, 0.15198516845703125, 0.16521835327148438, 0.1784515380859375, 0.19168472290039062, 0.20491790771484375, 0.21815109252929688, 0.23138427734375, 0.24461746215820312, 0.25785064697265625, 0.2710838317871094, 0.2843170166015625, 0.2975502014160156, 0.31078338623046875, 0.3240165710449219, 0.337249755859375, 0.3504829406738281, 0.36371612548828125, 0.3769493103027344, 0.3901824951171875, 0.4034156799316406, 0.41664886474609375, 0.4298820495605469, 0.443115234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 8.0, 14.0, 8.0, 11.0, 29.0, 30.0, 45.0, 114.0, 3029.0, 514.0, 102.0, 47.0, 29.0, 16.0, 18.0, 11.0, 9.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.142578125, -0.13882160186767578, -0.13506507873535156, -0.13130855560302734, -0.12755203247070312, -0.1237955093383789, -0.12003898620605469, -0.11628246307373047, -0.11252593994140625, -0.10876941680908203, -0.10501289367675781, -0.1012563705444336, -0.09749984741210938, -0.09374332427978516, -0.08998680114746094, -0.08623027801513672, -0.0824737548828125, -0.07871723175048828, -0.07496070861816406, -0.07120418548583984, -0.06744766235351562, -0.0636911392211914, -0.05993461608886719, -0.05617809295654297, -0.05242156982421875, -0.04866504669189453, -0.04490852355957031, -0.041152000427246094, -0.037395477294921875, -0.033638954162597656, -0.029882431030273438, -0.02612590789794922, -0.022369384765625, -0.01861286163330078, -0.014856338500976562, -0.011099815368652344, -0.007343292236328125, -0.0035867691040039062, 0.0001697540283203125, 0.003926277160644531, 0.00768280029296875, 0.011439323425292969, 0.015195846557617188, 0.018952369689941406, 0.022708892822265625, 0.026465415954589844, 0.030221939086914062, 0.03397846221923828, 0.0377349853515625, 0.04149150848388672, 0.04524803161621094, 0.049004554748535156, 0.052761077880859375, 0.056517601013183594, 0.06027412414550781, 0.06403064727783203, 0.06778717041015625, 0.07154369354248047, 0.07530021667480469, 0.0790567398071289, 0.08281326293945312, 0.08656978607177734, 0.09032630920410156, 0.09408283233642578, 0.09783935546875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 8.0, 7.0, 8.0, 5.0, 15.0, 11.0, 13.0, 22.0, 17.0, 28.0, 41.0, 34.0, 43.0, 65.0, 70.0, 60.0, 82.0, 78.0, 59.0, 74.0, 53.0, 46.0, 42.0, 27.0, 19.0, 14.0, 10.0, 8.0, 5.0, 11.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.30656808614730835, -0.2964431047439575, -0.2863180935382843, -0.2761930823326111, -0.26606810092926025, -0.2559431195259094, -0.2458181083202362, -0.23569311201572418, -0.22556811571121216, -0.21544311940670013, -0.2053181231021881, -0.1951931267976761, -0.18506813049316406, -0.17494313418865204, -0.16481813788414001, -0.154693141579628, -0.14456814527511597, -0.13444314897060394, -0.12431815266609192, -0.1141931563615799, -0.10406816005706787, -0.09394316375255585, -0.08381816744804382, -0.0736931711435318, -0.06356817483901978, -0.05344317853450775, -0.04331818222999573, -0.033193185925483704, -0.02306818962097168, -0.012943193316459656, -0.002818197011947632, 0.007306799292564392, 0.01743176579475403, 0.027556762099266052, 0.037681758403778076, 0.0478067547082901, 0.057931751012802124, 0.06805674731731415, 0.07818174362182617, 0.0883067399263382, 0.09843173623085022, 0.10855673253536224, 0.11868172883987427, 0.1288067251443863, 0.13893172144889832, 0.14905671775341034, 0.15918171405792236, 0.1693067103624344, 0.1794317066669464, 0.18955670297145844, 0.19968169927597046, 0.20980669558048248, 0.2199316918849945, 0.23005668818950653, 0.24018168449401855, 0.2503066658973694, 0.2604316771030426, 0.2705566883087158, 0.28068166971206665, 0.2908066511154175, 0.3009316623210907, 0.3110566735267639, 0.32118165493011475, 0.3313066363334656, 0.3414316475391388]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 4.0, 8.0, 6.0, 5.0, 6.0, 14.0, 14.0, 14.0, 11.0, 27.0, 15.0, 23.0, 27.0, 33.0, 31.0, 31.0, 40.0, 42.0, 33.0, 47.0, 50.0, 40.0, 43.0, 40.0, 43.0, 38.0, 34.0, 30.0, 32.0, 29.0, 31.0, 18.0, 21.0, 18.0, 16.0, 14.0, 12.0, 10.0, 8.0, 8.0, 11.0, 4.0, 3.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3044542074203491, -0.2945215404033661, -0.28458887338638306, -0.2746562361717224, -0.2647235691547394, -0.25479090213775635, -0.24485823512077332, -0.23492556810379028, -0.22499290108680725, -0.21506023406982422, -0.20512758195400238, -0.19519491493701935, -0.18526224792003632, -0.17532959580421448, -0.16539692878723145, -0.1554642617702484, -0.14553160965442657, -0.13559894263744354, -0.1256662905216217, -0.11573362350463867, -0.10580095648765564, -0.0958682969212532, -0.08593563735485077, -0.07600297033786774, -0.0660703107714653, -0.05613764747977257, -0.046204984188079834, -0.0362723246216774, -0.026339661329984665, -0.01640699803829193, -0.006474338471889496, 0.0034583285450935364, 0.013390988111495972, 0.023323651403188705, 0.03325631469488144, 0.043188974261283875, 0.05312163755297661, 0.06305430084466934, 0.07298696041107178, 0.08291962742805481, 0.09285228699445724, 0.10278494656085968, 0.11271761357784271, 0.12265027314424515, 0.13258293271064758, 0.14251559972763062, 0.15244826674461365, 0.16238093376159668, 0.17231358587741852, 0.18224625289440155, 0.1921789050102234, 0.20211157202720642, 0.21204423904418945, 0.22197690606117249, 0.23190955817699432, 0.24184222519397736, 0.2517748773097992, 0.2617075443267822, 0.27164021134376526, 0.2815728783607483, 0.29150551557540894, 0.30143818259239197, 0.311370849609375, 0.32130351662635803, 0.33123618364334106]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 9.0, 10.0, 15.0, 12.0, 18.0, 15.0, 35.0, 45.0, 72.0, 106.0, 176.0, 317.0, 599.0, 1235.0, 2903.0, 7261.0, 24216.0, 102286.0, 435167.0, 363833.0, 79544.0, 19563.0, 6222.0, 2446.0, 1077.0, 559.0, 292.0, 151.0, 118.0, 69.0, 57.0, 40.0, 22.0, 17.0, 14.0, 9.0, 3.0, 2.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.291015625, -0.28020477294921875, -0.2693939208984375, -0.25858306884765625, -0.247772216796875, -0.23696136474609375, -0.2261505126953125, -0.21533966064453125, -0.20452880859375, -0.19371795654296875, -0.1829071044921875, -0.17209625244140625, -0.161285400390625, -0.15047454833984375, -0.1396636962890625, -0.12885284423828125, -0.1180419921875, -0.10723114013671875, -0.0964202880859375, -0.08560943603515625, -0.074798583984375, -0.06398773193359375, -0.0531768798828125, -0.04236602783203125, -0.03155517578125, -0.02074432373046875, -0.0099334716796875, 0.00087738037109375, 0.011688232421875, 0.02249908447265625, 0.0333099365234375, 0.04412078857421875, 0.054931640625, 0.06574249267578125, 0.0765533447265625, 0.08736419677734375, 0.098175048828125, 0.10898590087890625, 0.1197967529296875, 0.13060760498046875, 0.14141845703125, 0.15222930908203125, 0.1630401611328125, 0.17385101318359375, 0.184661865234375, 0.19547271728515625, 0.2062835693359375, 0.21709442138671875, 0.2279052734375, 0.23871612548828125, 0.2495269775390625, 0.26033782958984375, 0.271148681640625, 0.28195953369140625, 0.2927703857421875, 0.30358123779296875, 0.31439208984375, 0.32520294189453125, 0.3360137939453125, 0.34682464599609375, 0.357635498046875, 0.36844635009765625, 0.3792572021484375, 0.39006805419921875, 0.40087890625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 6.0, 12.0, 13.0, 21.0, 38.0, 37.0, 50.0, 75.0, 72.0, 103.0, 97.0, 96.0, 91.0, 79.0, 59.0, 41.0, 33.0, 19.0, 10.0, 11.0, 13.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.16748046875, -0.1633434295654297, -0.15920639038085938, -0.15506935119628906, -0.15093231201171875, -0.14679527282714844, -0.14265823364257812, -0.1385211944580078, -0.1343841552734375, -0.1302471160888672, -0.12611007690429688, -0.12197303771972656, -0.11783599853515625, -0.11369895935058594, -0.10956192016601562, -0.10542488098144531, -0.101287841796875, -0.09715080261230469, -0.09301376342773438, -0.08887672424316406, -0.08473968505859375, -0.08060264587402344, -0.07646560668945312, -0.07232856750488281, -0.0681915283203125, -0.06405448913574219, -0.059917449951171875, -0.05578041076660156, -0.05164337158203125, -0.04750633239746094, -0.043369293212890625, -0.03923225402832031, -0.03509521484375, -0.030958175659179688, -0.026821136474609375, -0.022684097290039062, -0.01854705810546875, -0.014410018920898438, -0.010272979736328125, -0.0061359405517578125, -0.0019989013671875, 0.0021381378173828125, 0.006275177001953125, 0.010412216186523438, 0.01454925537109375, 0.018686294555664062, 0.022823333740234375, 0.026960372924804688, 0.031097412109375, 0.03523445129394531, 0.039371490478515625, 0.04350852966308594, 0.04764556884765625, 0.05178260803222656, 0.055919647216796875, 0.06005668640136719, 0.0641937255859375, 0.06833076477050781, 0.07246780395507812, 0.07660484313964844, 0.08074188232421875, 0.08487892150878906, 0.08901596069335938, 0.09315299987792969, 0.0972900390625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 10.0, 9.0, 15.0, 21.0, 28.0, 38.0, 50.0, 73.0, 129.0, 242.0, 447.0, 831.0, 1856.0, 4491.0, 15117.0, 80808.0, 633657.0, 264022.0, 32882.0, 8209.0, 2865.0, 1253.0, 656.0, 312.0, 182.0, 97.0, 73.0, 38.0, 46.0, 26.0, 13.0, 9.0, 11.0, 9.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55126953125, -0.5339126586914062, -0.5165557861328125, -0.49919891357421875, -0.481842041015625, -0.46448516845703125, -0.4471282958984375, -0.42977142333984375, -0.41241455078125, -0.39505767822265625, -0.3777008056640625, -0.36034393310546875, -0.342987060546875, -0.32563018798828125, -0.3082733154296875, -0.29091644287109375, -0.2735595703125, -0.25620269775390625, -0.2388458251953125, -0.22148895263671875, -0.204132080078125, -0.18677520751953125, -0.1694183349609375, -0.15206146240234375, -0.13470458984375, -0.11734771728515625, -0.0999908447265625, -0.08263397216796875, -0.065277099609375, -0.04792022705078125, -0.0305633544921875, -0.01320648193359375, 0.004150390625, 0.02150726318359375, 0.0388641357421875, 0.05622100830078125, 0.073577880859375, 0.09093475341796875, 0.1082916259765625, 0.12564849853515625, 0.14300537109375, 0.16036224365234375, 0.1777191162109375, 0.19507598876953125, 0.212432861328125, 0.22978973388671875, 0.2471466064453125, 0.26450347900390625, 0.2818603515625, 0.29921722412109375, 0.3165740966796875, 0.33393096923828125, 0.351287841796875, 0.36864471435546875, 0.3860015869140625, 0.40335845947265625, 0.42071533203125, 0.43807220458984375, 0.4554290771484375, 0.47278594970703125, 0.490142822265625, 0.5074996948242188, 0.5248565673828125, 0.5422134399414062, 0.5595703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 7.0, 8.0, 12.0, 16.0, 17.0, 20.0, 24.0, 22.0, 28.0, 43.0, 32.0, 50.0, 59.0, 66.0, 73.0, 69.0, 62.0, 63.0, 50.0, 48.0, 34.0, 46.0, 24.0, 16.0, 15.0, 19.0, 19.0, 8.0, 6.0, 8.0, 9.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5732421875, -0.5542755126953125, -0.535308837890625, -0.5163421630859375, -0.49737548828125, -0.4784088134765625, -0.459442138671875, -0.4404754638671875, -0.4215087890625, -0.4025421142578125, -0.383575439453125, -0.3646087646484375, -0.34564208984375, -0.3266754150390625, -0.307708740234375, -0.2887420654296875, -0.269775390625, -0.2508087158203125, -0.231842041015625, -0.2128753662109375, -0.19390869140625, -0.1749420166015625, -0.155975341796875, -0.1370086669921875, -0.1180419921875, -0.0990753173828125, -0.080108642578125, -0.0611419677734375, -0.04217529296875, -0.0232086181640625, -0.004241943359375, 0.0147247314453125, 0.03369140625, 0.0526580810546875, 0.071624755859375, 0.0905914306640625, 0.10955810546875, 0.1285247802734375, 0.147491455078125, 0.1664581298828125, 0.1854248046875, 0.2043914794921875, 0.223358154296875, 0.2423248291015625, 0.26129150390625, 0.2802581787109375, 0.299224853515625, 0.3181915283203125, 0.337158203125, 0.3561248779296875, 0.375091552734375, 0.3940582275390625, 0.41302490234375, 0.4319915771484375, 0.450958251953125, 0.4699249267578125, 0.4888916015625, 0.5078582763671875, 0.526824951171875, 0.5457916259765625, 0.56475830078125, 0.5837249755859375, 0.602691650390625, 0.6216583251953125, 0.640625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 15.0, 11.0, 17.0, 21.0, 52.0, 74.0, 142.0, 240.0, 569.0, 1948.0, 15095.0, 980685.0, 45115.0, 3011.0, 833.0, 307.0, 160.0, 102.0, 58.0, 24.0, 22.0, 15.0, 14.0, 8.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9825973510742188, -0.9524993896484375, -0.9224014282226562, -0.892303466796875, -0.8622055053710938, -0.8321075439453125, -0.8020095825195312, -0.77191162109375, -0.7418136596679688, -0.7117156982421875, -0.6816177368164062, -0.651519775390625, -0.6214218139648438, -0.5913238525390625, -0.5612258911132812, -0.5311279296875, -0.5010299682617188, -0.4709320068359375, -0.44083404541015625, -0.410736083984375, -0.38063812255859375, -0.3505401611328125, -0.32044219970703125, -0.29034423828125, -0.26024627685546875, -0.2301483154296875, -0.20005035400390625, -0.169952392578125, -0.13985443115234375, -0.1097564697265625, -0.07965850830078125, -0.049560546875, -0.01946258544921875, 0.0106353759765625, 0.04073333740234375, 0.070831298828125, 0.10092926025390625, 0.1310272216796875, 0.16112518310546875, 0.19122314453125, 0.22132110595703125, 0.2514190673828125, 0.28151702880859375, 0.311614990234375, 0.34171295166015625, 0.3718109130859375, 0.40190887451171875, 0.4320068359375, 0.46210479736328125, 0.4922027587890625, 0.5223007202148438, 0.552398681640625, 0.5824966430664062, 0.6125946044921875, 0.6426925659179688, 0.67279052734375, 0.7028884887695312, 0.7329864501953125, 0.7630844116210938, 0.793182373046875, 0.8232803344726562, 0.8533782958984375, 0.8834762573242188, 0.91357421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 7.0, 22.0, 19.0, 44.0, 105.0, 203.0, 208.0, 183.0, 116.0, 44.0, 26.0, 10.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.903575897216797e-05, -7.652211934328079e-05, -7.400847971439362e-05, -7.149484008550644e-05, -6.898120045661926e-05, -6.646756082773209e-05, -6.395392119884491e-05, -6.144028156995773e-05, -5.892664194107056e-05, -5.641300231218338e-05, -5.3899362683296204e-05, -5.138572305440903e-05, -4.887208342552185e-05, -4.6358443796634674e-05, -4.38448041677475e-05, -4.133116453886032e-05, -3.8817524909973145e-05, -3.630388528108597e-05, -3.379024565219879e-05, -3.1276606023311615e-05, -2.876296639442444e-05, -2.6249326765537262e-05, -2.3735687136650085e-05, -2.122204750776291e-05, -1.8708407878875732e-05, -1.6194768249988556e-05, -1.368112862110138e-05, -1.1167488992214203e-05, -8.653849363327026e-06, -6.14020973443985e-06, -3.6265701055526733e-06, -1.1129304766654968e-06, 1.4007091522216797e-06, 3.914348781108856e-06, 6.427988409996033e-06, 8.94162803888321e-06, 1.1455267667770386e-05, 1.3968907296657562e-05, 1.648254692554474e-05, 1.8996186554431915e-05, 2.1509826183319092e-05, 2.402346581220627e-05, 2.6537105441093445e-05, 2.905074506998062e-05, 3.15643846988678e-05, 3.4078024327754974e-05, 3.659166395664215e-05, 3.910530358552933e-05, 4.1618943214416504e-05, 4.413258284330368e-05, 4.664622247219086e-05, 4.9159862101078033e-05, 5.167350172996521e-05, 5.4187141358852386e-05, 5.670078098773956e-05, 5.921442061662674e-05, 6.172806024551392e-05, 6.424169987440109e-05, 6.675533950328827e-05, 6.926897913217545e-05, 7.178261876106262e-05, 7.42962583899498e-05, 7.680989801883698e-05, 7.932353764772415e-05, 8.183717727661133e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 17.0, 17.0, 33.0, 50.0, 110.0, 293.0, 780.0, 3371.0, 48826.0, 971107.0, 20648.0, 2199.0, 598.0, 224.0, 99.0, 73.0, 34.0, 22.0, 16.0, 10.0, 8.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.93896484375, -0.9151229858398438, -0.8912811279296875, -0.8674392700195312, -0.843597412109375, -0.8197555541992188, -0.7959136962890625, -0.7720718383789062, -0.74822998046875, -0.7243881225585938, -0.7005462646484375, -0.6767044067382812, -0.652862548828125, -0.6290206909179688, -0.6051788330078125, -0.5813369750976562, -0.5574951171875, -0.5336532592773438, -0.5098114013671875, -0.48596954345703125, -0.462127685546875, -0.43828582763671875, -0.4144439697265625, -0.39060211181640625, -0.36676025390625, -0.34291839599609375, -0.3190765380859375, -0.29523468017578125, -0.271392822265625, -0.24755096435546875, -0.2237091064453125, -0.19986724853515625, -0.176025390625, -0.15218353271484375, -0.1283416748046875, -0.10449981689453125, -0.080657958984375, -0.05681610107421875, -0.0329742431640625, -0.00913238525390625, 0.01470947265625, 0.03855133056640625, 0.0623931884765625, 0.08623504638671875, 0.110076904296875, 0.13391876220703125, 0.1577606201171875, 0.18160247802734375, 0.2054443359375, 0.22928619384765625, 0.2531280517578125, 0.27696990966796875, 0.300811767578125, 0.32465362548828125, 0.3484954833984375, 0.37233734130859375, 0.39617919921875, 0.42002105712890625, 0.4438629150390625, 0.46770477294921875, 0.491546630859375, 0.5153884887695312, 0.5392303466796875, 0.5630722045898438, 0.5869140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 6.0, 8.0, 11.0, 22.0, 58.0, 158.0, 325.0, 242.0, 97.0, 34.0, 19.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.426025390625, -0.4020347595214844, -0.37804412841796875, -0.3540534973144531, -0.3300628662109375, -0.3060722351074219, -0.28208160400390625, -0.2580909729003906, -0.234100341796875, -0.21010971069335938, -0.18611907958984375, -0.16212844848632812, -0.1381378173828125, -0.11414718627929688, -0.09015655517578125, -0.06616592407226562, -0.04217529296875, -0.018184661865234375, 0.00580596923828125, 0.029796600341796875, 0.0537872314453125, 0.07777786254882812, 0.10176849365234375, 0.12575912475585938, 0.149749755859375, 0.17374038696289062, 0.19773101806640625, 0.22172164916992188, 0.2457122802734375, 0.2697029113769531, 0.29369354248046875, 0.3176841735839844, 0.3416748046875, 0.3656654357910156, 0.38965606689453125, 0.4136466979980469, 0.4376373291015625, 0.4616279602050781, 0.48561859130859375, 0.5096092224121094, 0.533599853515625, 0.5575904846191406, 0.5815811157226562, 0.6055717468261719, 0.6295623779296875, 0.6535530090332031, 0.6775436401367188, 0.7015342712402344, 0.72552490234375, 0.7495155334472656, 0.7735061645507812, 0.7974967956542969, 0.8214874267578125, 0.8454780578613281, 0.8694686889648438, 0.8934593200683594, 0.917449951171875, 0.9414405822753906, 0.9654312133789062, 0.9894218444824219, 1.0134124755859375, 1.0374031066894531, 1.0613937377929688, 1.0853843688964844, 1.109375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 18.0, 34.0, 94.0, 210.0, 283.0, 221.0, 90.0, 37.0, 10.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.47678279876709, -12.183839797973633, -11.890897750854492, -11.597954750061035, -11.305012702941895, -11.012069702148438, -10.719127655029297, -10.42618465423584, -10.133241653442383, -9.840298652648926, -9.547356605529785, -9.254413604736328, -8.961471557617188, -8.66852855682373, -8.37558650970459, -8.082643508911133, -7.789701461791992, -7.496758937835693, -7.2038164138793945, -6.910873889923096, -6.617931365966797, -6.32498836517334, -6.032045841217041, -5.739103317260742, -5.446160793304443, -5.1532182693481445, -4.860275745391846, -4.567333221435547, -4.27439022064209, -3.98144793510437, -3.688505172729492, -3.3955626487731934, -3.1026201248168945, -2.8096776008605957, -2.516735076904297, -2.223792314529419, -1.9308497905731201, -1.6379072666168213, -1.344964623451233, -1.0520219802856445, -0.7590794563293457, -0.4661368727684021, -0.1731942892074585, 0.11974829435348511, 0.4126908779144287, 0.7056334018707275, 0.9985760450363159, 1.2915186882019043, 1.5844612121582031, 1.877403736114502, 2.170346260070801, 2.4632890224456787, 2.7562315464019775, 3.0491740703582764, 3.3421168327331543, 3.635059356689453, 3.928001880645752, 4.220944404602051, 4.51388692855835, 4.806829452514648, 5.0997724533081055, 5.392714500427246, 5.685657501220703, 5.978600025177002, 6.271542549133301]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 12.0, 3.0, 16.0, 15.0, 16.0, 20.0, 32.0, 28.0, 40.0, 51.0, 53.0, 55.0, 75.0, 57.0, 79.0, 60.0, 53.0, 50.0, 38.0, 39.0, 30.0, 36.0, 32.0, 27.0, 22.0, 12.0, 13.0, 5.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2674498558044434, -3.1652798652648926, -3.063110113143921, -2.960940361022949, -2.8587703704833984, -2.7566003799438477, -2.654430627822876, -2.5522608757019043, -2.4500908851623535, -2.3479208946228027, -2.245751142501831, -2.1435813903808594, -2.0414113998413086, -1.9392415285110474, -1.8370716571807861, -1.734901785850525, -1.6327319145202637, -1.5305620431900024, -1.4283921718597412, -1.32622230052948, -1.2240524291992188, -1.1218825578689575, -1.0197126865386963, -0.9175428152084351, -0.8153729438781738, -0.7132030725479126, -0.6110332012176514, -0.5088633298873901, -0.4066934585571289, -0.3045235872268677, -0.20235371589660645, -0.10018384456634521, 0.0019860267639160156, 0.10415589809417725, 0.20632576942443848, 0.3084956407546997, 0.41066551208496094, 0.5128353834152222, 0.6150052547454834, 0.7171751260757446, 0.8193449974060059, 0.9215148687362671, 1.0236847400665283, 1.1258546113967896, 1.2280244827270508, 1.330194354057312, 1.4323642253875732, 1.5345340967178345, 1.6367039680480957, 1.738873839378357, 1.8410437107086182, 1.9432135820388794, 2.0453834533691406, 2.1475534439086914, 2.249723196029663, 2.3518929481506348, 2.4540629386901855, 2.5562329292297363, 2.658402681350708, 2.7605724334716797, 2.8627424240112305, 2.9649124145507812, 3.067082166671753, 3.1692519187927246, 3.2714219093322754]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 12.0, 14.0, 22.0, 30.0, 32.0, 77.0, 104.0, 172.0, 323.0, 641.0, 1618.0, 5018.0, 30379.0, 4128944.0, 20494.0, 3929.0, 1269.0, 545.0, 290.0, 135.0, 82.0, 60.0, 19.0, 19.0, 12.0, 11.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89306640625, -0.8637008666992188, -0.8343353271484375, -0.8049697875976562, -0.775604248046875, -0.7462387084960938, -0.7168731689453125, -0.6875076293945312, -0.65814208984375, -0.6287765502929688, -0.5994110107421875, -0.5700454711914062, -0.540679931640625, -0.5113143920898438, -0.4819488525390625, -0.45258331298828125, -0.4232177734375, -0.39385223388671875, -0.3644866943359375, -0.33512115478515625, -0.305755615234375, -0.27639007568359375, -0.2470245361328125, -0.21765899658203125, -0.18829345703125, -0.15892791748046875, -0.1295623779296875, -0.10019683837890625, -0.070831298828125, -0.04146575927734375, -0.0121002197265625, 0.01726531982421875, 0.046630859375, 0.07599639892578125, 0.1053619384765625, 0.13472747802734375, 0.164093017578125, 0.19345855712890625, 0.2228240966796875, 0.25218963623046875, 0.28155517578125, 0.31092071533203125, 0.3402862548828125, 0.36965179443359375, 0.399017333984375, 0.42838287353515625, 0.4577484130859375, 0.48711395263671875, 0.5164794921875, 0.5458450317382812, 0.5752105712890625, 0.6045761108398438, 0.633941650390625, 0.6633071899414062, 0.6926727294921875, 0.7220382690429688, 0.75140380859375, 0.7807693481445312, 0.8101348876953125, 0.8395004272460938, 0.868865966796875, 0.8982315063476562, 0.9275970458984375, 0.9569625854492188, 0.986328125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 4.0, 6.0, 15.0, 21.0, 50.0, 69.0, 90.0, 131.0, 162.0, 157.0, 93.0, 78.0, 40.0, 18.0, 21.0, 13.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.277587890625, -0.2703685760498047, -0.2631492614746094, -0.25592994689941406, -0.24871063232421875, -0.24149131774902344, -0.23427200317382812, -0.2270526885986328, -0.2198333740234375, -0.2126140594482422, -0.20539474487304688, -0.19817543029785156, -0.19095611572265625, -0.18373680114746094, -0.17651748657226562, -0.1692981719970703, -0.162078857421875, -0.1548595428466797, -0.14764022827148438, -0.14042091369628906, -0.13320159912109375, -0.12598228454589844, -0.11876296997070312, -0.11154365539550781, -0.1043243408203125, -0.09710502624511719, -0.08988571166992188, -0.08266639709472656, -0.07544708251953125, -0.06822776794433594, -0.061008453369140625, -0.05378913879394531, -0.04656982421875, -0.03935050964355469, -0.032131195068359375, -0.024911880493164062, -0.01769256591796875, -0.010473251342773438, -0.003253936767578125, 0.0039653778076171875, 0.0111846923828125, 0.018404006958007812, 0.025623321533203125, 0.03284263610839844, 0.04006195068359375, 0.04728126525878906, 0.054500579833984375, 0.06171989440917969, 0.068939208984375, 0.07615852355957031, 0.08337783813476562, 0.09059715270996094, 0.09781646728515625, 0.10503578186035156, 0.11225509643554688, 0.11947441101074219, 0.1266937255859375, 0.1339130401611328, 0.14113235473632812, 0.14835166931152344, 0.15557098388671875, 0.16279029846191406, 0.17000961303710938, 0.1772289276123047, 0.1844482421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 12.0, 13.0, 22.0, 23.0, 43.0, 53.0, 74.0, 127.0, 165.0, 249.0, 328.0, 506.0, 865.0, 1450.0, 2526.0, 5308.0, 12483.0, 45427.0, 4035930.0, 60826.0, 15011.0, 5929.0, 2727.0, 1544.0, 934.0, 534.0, 355.0, 230.0, 170.0, 125.0, 94.0, 47.0, 55.0, 25.0, 18.0, 18.0, 12.0, 6.0, 4.0, 4.0, 1.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82568359375, -0.8010940551757812, -0.7765045166015625, -0.7519149780273438, -0.727325439453125, -0.7027359008789062, -0.6781463623046875, -0.6535568237304688, -0.62896728515625, -0.6043777465820312, -0.5797882080078125, -0.5551986694335938, -0.530609130859375, -0.5060195922851562, -0.4814300537109375, -0.45684051513671875, -0.4322509765625, -0.40766143798828125, -0.3830718994140625, -0.35848236083984375, -0.333892822265625, -0.30930328369140625, -0.2847137451171875, -0.26012420654296875, -0.23553466796875, -0.21094512939453125, -0.1863555908203125, -0.16176605224609375, -0.137176513671875, -0.11258697509765625, -0.0879974365234375, -0.06340789794921875, -0.038818359375, -0.01422882080078125, 0.0103607177734375, 0.03495025634765625, 0.059539794921875, 0.08412933349609375, 0.1087188720703125, 0.13330841064453125, 0.15789794921875, 0.18248748779296875, 0.2070770263671875, 0.23166656494140625, 0.256256103515625, 0.28084564208984375, 0.3054351806640625, 0.33002471923828125, 0.3546142578125, 0.37920379638671875, 0.4037933349609375, 0.42838287353515625, 0.452972412109375, 0.47756195068359375, 0.5021514892578125, 0.5267410278320312, 0.55133056640625, 0.5759201049804688, 0.6005096435546875, 0.6250991821289062, 0.649688720703125, 0.6742782592773438, 0.6988677978515625, 0.7234573364257812, 0.748046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 3.0, 5.0, 7.0, 10.0, 14.0, 22.0, 35.0, 57.0, 3576.0, 189.0, 45.0, 25.0, 17.0, 15.0, 12.0, 9.0, 3.0, 5.0, 7.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1846923828125, -0.17907333374023438, -0.17345428466796875, -0.16783523559570312, -0.1622161865234375, -0.15659713745117188, -0.15097808837890625, -0.14535903930664062, -0.139739990234375, -0.13412094116210938, -0.12850189208984375, -0.12288284301757812, -0.1172637939453125, -0.11164474487304688, -0.10602569580078125, -0.10040664672851562, -0.09478759765625, -0.08916854858398438, -0.08354949951171875, -0.07793045043945312, -0.0723114013671875, -0.06669235229492188, -0.06107330322265625, -0.055454254150390625, -0.049835205078125, -0.044216156005859375, -0.03859710693359375, -0.032978057861328125, -0.0273590087890625, -0.021739959716796875, -0.01612091064453125, -0.010501861572265625, -0.0048828125, 0.000736236572265625, 0.00635528564453125, 0.011974334716796875, 0.0175933837890625, 0.023212432861328125, 0.02883148193359375, 0.034450531005859375, 0.040069580078125, 0.045688629150390625, 0.05130767822265625, 0.056926727294921875, 0.0625457763671875, 0.06816482543945312, 0.07378387451171875, 0.07940292358398438, 0.08502197265625, 0.09064102172851562, 0.09626007080078125, 0.10187911987304688, 0.1074981689453125, 0.11311721801757812, 0.11873626708984375, 0.12435531616210938, 0.129974365234375, 0.13559341430664062, 0.14121246337890625, 0.14683151245117188, 0.1524505615234375, 0.15806961059570312, 0.16368865966796875, 0.16930770874023438, 0.1749267578125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 8.0, 18.0, 28.0, 62.0, 74.0, 122.0, 159.0, 163.0, 123.0, 102.0, 58.0, 30.0, 18.0, 11.0, 7.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2079918384552002, -1.1756067276000977, -1.1432214975357056, -1.110836386680603, -1.0784512758255005, -1.0460660457611084, -1.0136809349060059, -0.9812958240509033, -0.948910653591156, -0.9165254831314087, -0.8841403722763062, -0.8517552018165588, -0.8193700313568115, -0.786984920501709, -0.7545997500419617, -0.7222145795822144, -0.6898294687271118, -0.6574442982673645, -0.625059187412262, -0.5926740169525146, -0.5602889060974121, -0.5279037356376648, -0.4955185651779175, -0.46313342452049255, -0.4307482838630676, -0.3983631432056427, -0.3659780025482178, -0.33359283208847046, -0.30120769143104553, -0.2688225507736206, -0.23643739521503448, -0.20405223965644836, -0.171667218208313, -0.13928207755088806, -0.10689692199230194, -0.07451177388429642, -0.042126625776290894, -0.009741485118865967, 0.022643670439720154, 0.055028825998306274, 0.0874139666557312, 0.11979911476373672, 0.15218426287174225, 0.18456941843032837, 0.2169545590877533, 0.24933969974517822, 0.28172487020492554, 0.31411001086235046, 0.3464951515197754, 0.3788802921772003, 0.41126543283462524, 0.44365060329437256, 0.4760357439517975, 0.5084208846092224, 0.5408060550689697, 0.5731911659240723, 0.6055763363838196, 0.6379615068435669, 0.6703466176986694, 0.7027317881584167, 0.7351169586181641, 0.7675020694732666, 0.7998872399330139, 0.8322724103927612, 0.8646575212478638]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 7.0, 9.0, 13.0, 9.0, 6.0, 17.0, 19.0, 20.0, 28.0, 22.0, 29.0, 27.0, 19.0, 32.0, 37.0, 31.0, 42.0, 39.0, 37.0, 33.0, 39.0, 43.0, 41.0, 38.0, 32.0, 32.0, 32.0, 25.0, 32.0, 25.0, 21.0, 29.0, 18.0, 20.0, 16.0, 14.0, 14.0, 11.0, 11.0, 4.0, 7.0, 4.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0], "bins": [-0.3984965682029724, -0.3874187171459198, -0.3763408958911896, -0.36526304483413696, -0.35418519377708435, -0.34310734272003174, -0.3320295214653015, -0.3209516704082489, -0.3098738193511963, -0.2987959682941437, -0.28771814703941345, -0.27664029598236084, -0.2655624449253082, -0.2544845938682556, -0.2434067726135254, -0.23232892155647278, -0.22125110030174255, -0.21017326414585114, -0.19909541308879852, -0.1880175769329071, -0.1769397258758545, -0.16586188971996307, -0.15478405356407166, -0.14370620250701904, -0.13262836635112762, -0.12155052274465561, -0.1104726791381836, -0.09939484298229218, -0.08831699937582016, -0.07723915576934814, -0.06616131961345673, -0.05508347600698471, -0.044005632400512695, -0.03292778879404068, -0.021849948912858963, -0.010772109031677246, 0.0003057345747947693, 0.011383578181266785, 0.022461414337158203, 0.03353925794363022, 0.044617101550102234, 0.05569494515657425, 0.06677278876304626, 0.07785062491893768, 0.0889284685254097, 0.10000631213188171, 0.11108414828777313, 0.12216199189424515, 0.13323983550071716, 0.14431767165660858, 0.1553955227136612, 0.1664733588695526, 0.17755120992660522, 0.18862904608249664, 0.19970688223838806, 0.21078473329544067, 0.2218625694513321, 0.2329404056072235, 0.24401825666427612, 0.25509607791900635, 0.26617392897605896, 0.2772517800331116, 0.2883296012878418, 0.2994074523448944, 0.310485303401947]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 0.0, 7.0, 7.0, 7.0, 9.0, 15.0, 22.0, 23.0, 46.0, 42.0, 58.0, 99.0, 160.0, 214.0, 345.0, 542.0, 939.0, 1814.0, 4344.0, 11846.0, 42049.0, 197262.0, 551626.0, 179442.0, 37931.0, 11130.0, 4136.0, 1865.0, 959.0, 557.0, 320.0, 198.0, 128.0, 120.0, 68.0, 45.0, 42.0, 29.0, 17.0, 19.0, 16.0, 19.0, 6.0, 4.0, 8.0, 4.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.419677734375, -0.4054374694824219, -0.39119720458984375, -0.3769569396972656, -0.3627166748046875, -0.3484764099121094, -0.33423614501953125, -0.3199958801269531, -0.305755615234375, -0.2915153503417969, -0.27727508544921875, -0.2630348205566406, -0.2487945556640625, -0.23455429077148438, -0.22031402587890625, -0.20607376098632812, -0.19183349609375, -0.17759323120117188, -0.16335296630859375, -0.14911270141601562, -0.1348724365234375, -0.12063217163085938, -0.10639190673828125, -0.09215164184570312, -0.077911376953125, -0.06367111206054688, -0.04943084716796875, -0.035190582275390625, -0.0209503173828125, -0.006710052490234375, 0.00753021240234375, 0.021770477294921875, 0.0360107421875, 0.050251007080078125, 0.06449127197265625, 0.07873153686523438, 0.0929718017578125, 0.10721206665039062, 0.12145233154296875, 0.13569259643554688, 0.149932861328125, 0.16417312622070312, 0.17841339111328125, 0.19265365600585938, 0.2068939208984375, 0.22113418579101562, 0.23537445068359375, 0.24961471557617188, 0.26385498046875, 0.2780952453613281, 0.29233551025390625, 0.3065757751464844, 0.3208160400390625, 0.3350563049316406, 0.34929656982421875, 0.3635368347167969, 0.377777099609375, 0.3920173645019531, 0.40625762939453125, 0.4204978942871094, 0.4347381591796875, 0.4489784240722656, 0.46321868896484375, 0.4774589538574219, 0.49169921875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 5.0, 12.0, 16.0, 23.0, 36.0, 60.0, 59.0, 82.0, 107.0, 124.0, 117.0, 97.0, 81.0, 51.0, 30.0, 24.0, 23.0, 12.0, 8.0, 8.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.275634765625, -0.2689971923828125, -0.262359619140625, -0.2557220458984375, -0.24908447265625, -0.2424468994140625, -0.235809326171875, -0.2291717529296875, -0.2225341796875, -0.2158966064453125, -0.209259033203125, -0.2026214599609375, -0.19598388671875, -0.1893463134765625, -0.182708740234375, -0.1760711669921875, -0.16943359375, -0.1627960205078125, -0.156158447265625, -0.1495208740234375, -0.14288330078125, -0.1362457275390625, -0.129608154296875, -0.1229705810546875, -0.1163330078125, -0.1096954345703125, -0.103057861328125, -0.0964202880859375, -0.08978271484375, -0.0831451416015625, -0.076507568359375, -0.0698699951171875, -0.063232421875, -0.0565948486328125, -0.049957275390625, -0.0433197021484375, -0.03668212890625, -0.0300445556640625, -0.023406982421875, -0.0167694091796875, -0.0101318359375, -0.0034942626953125, 0.003143310546875, 0.0097808837890625, 0.01641845703125, 0.0230560302734375, 0.029693603515625, 0.0363311767578125, 0.04296875, 0.0496063232421875, 0.056243896484375, 0.0628814697265625, 0.06951904296875, 0.0761566162109375, 0.082794189453125, 0.0894317626953125, 0.0960693359375, 0.1027069091796875, 0.109344482421875, 0.1159820556640625, 0.12261962890625, 0.1292572021484375, 0.135894775390625, 0.1425323486328125, 0.149169921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 8.0, 4.0, 8.0, 21.0, 32.0, 45.0, 65.0, 136.0, 170.0, 309.0, 556.0, 1022.0, 2399.0, 7451.0, 35645.0, 313938.0, 602501.0, 66343.0, 11765.0, 3304.0, 1311.0, 650.0, 302.0, 207.0, 122.0, 82.0, 52.0, 27.0, 21.0, 9.0, 11.0, 12.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.73876953125, -0.7183380126953125, -0.697906494140625, -0.6774749755859375, -0.65704345703125, -0.6366119384765625, -0.616180419921875, -0.5957489013671875, -0.5753173828125, -0.5548858642578125, -0.534454345703125, -0.5140228271484375, -0.49359130859375, -0.4731597900390625, -0.452728271484375, -0.4322967529296875, -0.411865234375, -0.3914337158203125, -0.371002197265625, -0.3505706787109375, -0.33013916015625, -0.3097076416015625, -0.289276123046875, -0.2688446044921875, -0.2484130859375, -0.2279815673828125, -0.207550048828125, -0.1871185302734375, -0.16668701171875, -0.1462554931640625, -0.125823974609375, -0.1053924560546875, -0.0849609375, -0.0645294189453125, -0.044097900390625, -0.0236663818359375, -0.00323486328125, 0.0171966552734375, 0.037628173828125, 0.0580596923828125, 0.0784912109375, 0.0989227294921875, 0.119354248046875, 0.1397857666015625, 0.16021728515625, 0.1806488037109375, 0.201080322265625, 0.2215118408203125, 0.241943359375, 0.2623748779296875, 0.282806396484375, 0.3032379150390625, 0.32366943359375, 0.3441009521484375, 0.364532470703125, 0.3849639892578125, 0.4053955078125, 0.4258270263671875, 0.446258544921875, 0.4666900634765625, 0.48712158203125, 0.5075531005859375, 0.527984619140625, 0.5484161376953125, 0.56884765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 10.0, 8.0, 9.0, 10.0, 20.0, 28.0, 33.0, 44.0, 40.0, 51.0, 50.0, 74.0, 81.0, 73.0, 58.0, 61.0, 68.0, 54.0, 41.0, 35.0, 34.0, 26.0, 28.0, 21.0, 7.0, 7.0, 9.0, 6.0, 4.0, 4.0, 0.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58984375, -0.5638885498046875, -0.537933349609375, -0.5119781494140625, -0.48602294921875, -0.4600677490234375, -0.434112548828125, -0.4081573486328125, -0.3822021484375, -0.3562469482421875, -0.330291748046875, -0.3043365478515625, -0.27838134765625, -0.2524261474609375, -0.226470947265625, -0.2005157470703125, -0.174560546875, -0.1486053466796875, -0.122650146484375, -0.0966949462890625, -0.07073974609375, -0.0447845458984375, -0.018829345703125, 0.0071258544921875, 0.0330810546875, 0.0590362548828125, 0.084991455078125, 0.1109466552734375, 0.13690185546875, 0.1628570556640625, 0.188812255859375, 0.2147674560546875, 0.24072265625, 0.2666778564453125, 0.292633056640625, 0.3185882568359375, 0.34454345703125, 0.3704986572265625, 0.396453857421875, 0.4224090576171875, 0.4483642578125, 0.4743194580078125, 0.500274658203125, 0.5262298583984375, 0.55218505859375, 0.5781402587890625, 0.604095458984375, 0.6300506591796875, 0.656005859375, 0.6819610595703125, 0.707916259765625, 0.7338714599609375, 0.75982666015625, 0.7857818603515625, 0.811737060546875, 0.8376922607421875, 0.8636474609375, 0.8896026611328125, 0.915557861328125, 0.9415130615234375, 0.96746826171875, 0.9934234619140625, 1.019378662109375, 1.0453338623046875, 1.0712890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 9.0, 7.0, 23.0, 32.0, 42.0, 77.0, 108.0, 276.0, 723.0, 2653.0, 21083.0, 845294.0, 168763.0, 7110.0, 1378.0, 466.0, 210.0, 111.0, 51.0, 39.0, 24.0, 16.0, 12.0, 6.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.7177734375, -0.6958770751953125, -0.673980712890625, -0.6520843505859375, -0.63018798828125, -0.6082916259765625, -0.586395263671875, -0.5644989013671875, -0.5426025390625, -0.5207061767578125, -0.498809814453125, -0.4769134521484375, -0.45501708984375, -0.4331207275390625, -0.411224365234375, -0.3893280029296875, -0.367431640625, -0.3455352783203125, -0.323638916015625, -0.3017425537109375, -0.27984619140625, -0.2579498291015625, -0.236053466796875, -0.2141571044921875, -0.1922607421875, -0.1703643798828125, -0.148468017578125, -0.1265716552734375, -0.10467529296875, -0.0827789306640625, -0.060882568359375, -0.0389862060546875, -0.01708984375, 0.0048065185546875, 0.026702880859375, 0.0485992431640625, 0.07049560546875, 0.0923919677734375, 0.114288330078125, 0.1361846923828125, 0.1580810546875, 0.1799774169921875, 0.201873779296875, 0.2237701416015625, 0.24566650390625, 0.2675628662109375, 0.289459228515625, 0.3113555908203125, 0.333251953125, 0.3551483154296875, 0.377044677734375, 0.3989410400390625, 0.42083740234375, 0.4427337646484375, 0.464630126953125, 0.4865264892578125, 0.5084228515625, 0.5303192138671875, 0.552215576171875, 0.5741119384765625, 0.59600830078125, 0.6179046630859375, 0.639801025390625, 0.6616973876953125, 0.68359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 13.0, 12.0, 16.0, 30.0, 47.0, 71.0, 103.0, 132.0, 159.0, 137.0, 105.0, 60.0, 28.0, 24.0, 23.0, 11.0, 12.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.506111145019531e-05, -4.3122097849845886e-05, -4.118308424949646e-05, -3.9244070649147034e-05, -3.730505704879761e-05, -3.536604344844818e-05, -3.3427029848098755e-05, -3.148801624774933e-05, -2.9549002647399902e-05, -2.7609989047050476e-05, -2.567097544670105e-05, -2.3731961846351624e-05, -2.1792948246002197e-05, -1.985393464565277e-05, -1.7914921045303345e-05, -1.597590744495392e-05, -1.4036893844604492e-05, -1.2097880244255066e-05, -1.015886664390564e-05, -8.219853043556213e-06, -6.280839443206787e-06, -4.341825842857361e-06, -2.4028122425079346e-06, -4.637986421585083e-07, 1.475214958190918e-06, 3.4142285585403442e-06, 5.3532421588897705e-06, 7.292255759239197e-06, 9.231269359588623e-06, 1.117028295993805e-05, 1.3109296560287476e-05, 1.5048310160636902e-05, 1.6987323760986328e-05, 1.8926337361335754e-05, 2.086535096168518e-05, 2.2804364562034607e-05, 2.4743378162384033e-05, 2.668239176273346e-05, 2.8621405363082886e-05, 3.056041896343231e-05, 3.249943256378174e-05, 3.4438446164131165e-05, 3.637745976448059e-05, 3.831647336483002e-05, 4.025548696517944e-05, 4.219450056552887e-05, 4.4133514165878296e-05, 4.607252776622772e-05, 4.801154136657715e-05, 4.9950554966926575e-05, 5.1889568567276e-05, 5.382858216762543e-05, 5.5767595767974854e-05, 5.770660936832428e-05, 5.9645622968673706e-05, 6.158463656902313e-05, 6.352365016937256e-05, 6.546266376972198e-05, 6.740167737007141e-05, 6.934069097042084e-05, 7.127970457077026e-05, 7.321871817111969e-05, 7.515773177146912e-05, 7.709674537181854e-05, 7.903575897216797e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 14.0, 20.0, 23.0, 23.0, 60.0, 90.0, 181.0, 377.0, 905.0, 2832.0, 15340.0, 317671.0, 680294.0, 24828.0, 3806.0, 1102.0, 474.0, 216.0, 123.0, 66.0, 24.0, 24.0, 10.0, 11.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56201171875, -0.5450363159179688, -0.5280609130859375, -0.5110855102539062, -0.494110107421875, -0.47713470458984375, -0.4601593017578125, -0.44318389892578125, -0.42620849609375, -0.40923309326171875, -0.3922576904296875, -0.37528228759765625, -0.358306884765625, -0.34133148193359375, -0.3243560791015625, -0.30738067626953125, -0.2904052734375, -0.27342987060546875, -0.2564544677734375, -0.23947906494140625, -0.222503662109375, -0.20552825927734375, -0.1885528564453125, -0.17157745361328125, -0.15460205078125, -0.13762664794921875, -0.1206512451171875, -0.10367584228515625, -0.086700439453125, -0.06972503662109375, -0.0527496337890625, -0.03577423095703125, -0.018798828125, -0.00182342529296875, 0.0151519775390625, 0.03212738037109375, 0.049102783203125, 0.06607818603515625, 0.0830535888671875, 0.10002899169921875, 0.11700439453125, 0.13397979736328125, 0.1509552001953125, 0.16793060302734375, 0.184906005859375, 0.20188140869140625, 0.2188568115234375, 0.23583221435546875, 0.2528076171875, 0.26978302001953125, 0.2867584228515625, 0.30373382568359375, 0.320709228515625, 0.33768463134765625, 0.3546600341796875, 0.37163543701171875, 0.38861083984375, 0.40558624267578125, 0.4225616455078125, 0.43953704833984375, 0.456512451171875, 0.47348785400390625, 0.4904632568359375, 0.5074386596679688, 0.5244140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 8.0, 14.0, 26.0, 38.0, 60.0, 111.0, 147.0, 164.0, 174.0, 102.0, 59.0, 33.0, 25.0, 17.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69677734375, -0.6777496337890625, -0.658721923828125, -0.6396942138671875, -0.62066650390625, -0.6016387939453125, -0.582611083984375, -0.5635833740234375, -0.5445556640625, -0.5255279541015625, -0.506500244140625, -0.4874725341796875, -0.46844482421875, -0.4494171142578125, -0.430389404296875, -0.4113616943359375, -0.392333984375, -0.3733062744140625, -0.354278564453125, -0.3352508544921875, -0.31622314453125, -0.2971954345703125, -0.278167724609375, -0.2591400146484375, -0.2401123046875, -0.2210845947265625, -0.202056884765625, -0.1830291748046875, -0.16400146484375, -0.1449737548828125, -0.125946044921875, -0.1069183349609375, -0.087890625, -0.0688629150390625, -0.049835205078125, -0.0308074951171875, -0.01177978515625, 0.0072479248046875, 0.026275634765625, 0.0453033447265625, 0.0643310546875, 0.0833587646484375, 0.102386474609375, 0.1214141845703125, 0.14044189453125, 0.1594696044921875, 0.178497314453125, 0.1975250244140625, 0.216552734375, 0.2355804443359375, 0.254608154296875, 0.2736358642578125, 0.29266357421875, 0.3116912841796875, 0.330718994140625, 0.3497467041015625, 0.3687744140625, 0.3878021240234375, 0.406829833984375, 0.4258575439453125, 0.44488525390625, 0.4639129638671875, 0.482940673828125, 0.5019683837890625, 0.52099609375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 7.0, 13.0, 38.0, 110.0, 220.0, 268.0, 203.0, 94.0, 33.0, 14.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.797433853149414, -8.476529121398926, -8.155624389648438, -7.834719181060791, -7.5138139724731445, -7.192909240722656, -6.872004508972168, -6.55109977722168, -6.230194568634033, -5.909289836883545, -5.588384628295898, -5.26747989654541, -4.946575164794922, -4.625669956207275, -4.304765224456787, -3.9838602542877197, -3.6629552841186523, -3.342050313949585, -3.0211453437805176, -2.7002406120300293, -2.379335641860962, -2.0584306716918945, -1.7375258207321167, -1.4166209697723389, -1.0957159996032715, -0.7748110890388489, -0.45390617847442627, -0.13300126791000366, 0.18790364265441895, 0.5088086128234863, 0.8297134637832642, 1.150618314743042, 1.4715242385864258, 1.7924292087554932, 2.1133341789245605, 2.434238910675049, 2.755143880844116, 3.0760488510131836, 3.396953582763672, 3.7178585529327393, 4.038763523101807, 4.359668254852295, 4.680573463439941, 5.00147819519043, 5.322382926940918, 5.6432881355285645, 5.964192867279053, 6.285098075866699, 6.6060028076171875, 6.926907539367676, 7.247812747955322, 7.5687174797058105, 7.889622688293457, 8.210527420043945, 8.531432151794434, 8.852336883544922, 9.173242568969727, 9.494147300720215, 9.815052032470703, 10.135957717895508, 10.456862449645996, 10.777767181396484, 11.098671913146973, 11.419576644897461, 11.74048137664795]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 7.0, 3.0, 3.0, 4.0, 5.0, 9.0, 9.0, 14.0, 13.0, 12.0, 16.0, 13.0, 21.0, 20.0, 26.0, 24.0, 30.0, 29.0, 28.0, 34.0, 25.0, 37.0, 35.0, 54.0, 38.0, 44.0, 41.0, 44.0, 39.0, 43.0, 35.0, 38.0, 23.0, 36.0, 23.0, 22.0, 18.0, 13.0, 17.0, 9.0, 13.0, 8.0, 9.0, 3.0, 5.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.4409196376800537, -2.3617517948150635, -2.282583713531494, -2.203415870666504, -2.1242480278015137, -2.0450801849365234, -1.9659122228622437, -1.8867442607879639, -1.8075764179229736, -1.7284085750579834, -1.6492406129837036, -1.5700726509094238, -1.4909048080444336, -1.4117369651794434, -1.3325690031051636, -1.2534010410308838, -1.1742331981658936, -1.0950653553009033, -1.0158973932266235, -0.9367294907569885, -0.8575615882873535, -0.7783936858177185, -0.6992257833480835, -0.6200578808784485, -0.5408899784088135, -0.46172207593917847, -0.38255417346954346, -0.30338627099990845, -0.22421836853027344, -0.14505046606063843, -0.06588256359100342, 0.013285338878631592, 0.0924530029296875, 0.1716209053993225, 0.2507888078689575, 0.32995671033859253, 0.40912461280822754, 0.48829251527786255, 0.5674604177474976, 0.6466283202171326, 0.7257962226867676, 0.8049641251564026, 0.8841320276260376, 0.9632999300956726, 1.0424678325653076, 1.1216356754302979, 1.2008036375045776, 1.2799715995788574, 1.3591394424438477, 1.438307285308838, 1.5174752473831177, 1.5966432094573975, 1.6758110523223877, 1.754978895187378, 1.8341468572616577, 1.9133148193359375, 1.9924826622009277, 2.071650505065918, 2.150818347930908, 2.2299864292144775, 2.3091542720794678, 2.388322114944458, 2.4674901962280273, 2.5466580390930176, 2.625825881958008]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 9.0, 11.0, 21.0, 23.0, 48.0, 80.0, 148.0, 439.0, 1505.0, 10438.0, 4131290.0, 46281.0, 3021.0, 621.0, 181.0, 73.0, 29.0, 18.0, 10.0, 7.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.07421875, -2.0127105712890625, -1.951202392578125, -1.8896942138671875, -1.82818603515625, -1.7666778564453125, -1.705169677734375, -1.6436614990234375, -1.5821533203125, -1.5206451416015625, -1.459136962890625, -1.3976287841796875, -1.33612060546875, -1.2746124267578125, -1.213104248046875, -1.1515960693359375, -1.090087890625, -1.0285797119140625, -0.967071533203125, -0.9055633544921875, -0.84405517578125, -0.7825469970703125, -0.721038818359375, -0.6595306396484375, -0.5980224609375, -0.5365142822265625, -0.475006103515625, -0.4134979248046875, -0.35198974609375, -0.2904815673828125, -0.228973388671875, -0.1674652099609375, -0.10595703125, -0.0444488525390625, 0.017059326171875, 0.0785675048828125, 0.14007568359375, 0.2015838623046875, 0.263092041015625, 0.3246002197265625, 0.3861083984375, 0.4476165771484375, 0.509124755859375, 0.5706329345703125, 0.63214111328125, 0.6936492919921875, 0.755157470703125, 0.8166656494140625, 0.878173828125, 0.9396820068359375, 1.001190185546875, 1.0626983642578125, 1.12420654296875, 1.1857147216796875, 1.247222900390625, 1.3087310791015625, 1.3702392578125, 1.4317474365234375, 1.493255615234375, 1.5547637939453125, 1.61627197265625, 1.6777801513671875, 1.739288330078125, 1.8007965087890625, 1.8623046875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 8.0, 12.0, 19.0, 24.0, 56.0, 51.0, 58.0, 102.0, 109.0, 140.0, 98.0, 104.0, 56.0, 50.0, 28.0, 29.0, 10.0, 16.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2322998046875, -0.22586822509765625, -0.2194366455078125, -0.21300506591796875, -0.206573486328125, -0.20014190673828125, -0.1937103271484375, -0.18727874755859375, -0.18084716796875, -0.17441558837890625, -0.1679840087890625, -0.16155242919921875, -0.155120849609375, -0.14868927001953125, -0.1422576904296875, -0.13582611083984375, -0.12939453125, -0.12296295166015625, -0.1165313720703125, -0.11009979248046875, -0.103668212890625, -0.09723663330078125, -0.0908050537109375, -0.08437347412109375, -0.07794189453125, -0.07151031494140625, -0.0650787353515625, -0.05864715576171875, -0.052215576171875, -0.04578399658203125, -0.0393524169921875, -0.03292083740234375, -0.0264892578125, -0.02005767822265625, -0.0136260986328125, -0.00719451904296875, -0.000762939453125, 0.00566864013671875, 0.0121002197265625, 0.01853179931640625, 0.02496337890625, 0.03139495849609375, 0.0378265380859375, 0.04425811767578125, 0.050689697265625, 0.05712127685546875, 0.0635528564453125, 0.06998443603515625, 0.076416015625, 0.08284759521484375, 0.0892791748046875, 0.09571075439453125, 0.102142333984375, 0.10857391357421875, 0.1150054931640625, 0.12143707275390625, 0.12786865234375, 0.13430023193359375, 0.1407318115234375, 0.14716339111328125, 0.153594970703125, 0.16002655029296875, 0.1664581298828125, 0.17288970947265625, 0.1793212890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 19.0, 10.0, 19.0, 24.0, 46.0, 48.0, 83.0, 123.0, 235.0, 363.0, 665.0, 1195.0, 2349.0, 5085.0, 13387.0, 49476.0, 3850410.0, 226282.0, 27936.0, 8755.0, 3729.0, 1754.0, 884.0, 519.0, 295.0, 209.0, 147.0, 97.0, 49.0, 23.0, 21.0, 14.0, 11.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64990234375, -0.6237106323242188, -0.5975189208984375, -0.5713272094726562, -0.545135498046875, -0.5189437866210938, -0.4927520751953125, -0.46656036376953125, -0.44036865234375, -0.41417694091796875, -0.3879852294921875, -0.36179351806640625, -0.335601806640625, -0.30941009521484375, -0.2832183837890625, -0.25702667236328125, -0.2308349609375, -0.20464324951171875, -0.1784515380859375, -0.15225982666015625, -0.126068115234375, -0.09987640380859375, -0.0736846923828125, -0.04749298095703125, -0.02130126953125, 0.00489044189453125, 0.0310821533203125, 0.05727386474609375, 0.083465576171875, 0.10965728759765625, 0.1358489990234375, 0.16204071044921875, 0.188232421875, 0.21442413330078125, 0.2406158447265625, 0.26680755615234375, 0.292999267578125, 0.31919097900390625, 0.3453826904296875, 0.37157440185546875, 0.39776611328125, 0.42395782470703125, 0.4501495361328125, 0.47634124755859375, 0.502532958984375, 0.5287246704101562, 0.5549163818359375, 0.5811080932617188, 0.6072998046875, 0.6334915161132812, 0.6596832275390625, 0.6858749389648438, 0.712066650390625, 0.7382583618164062, 0.7644500732421875, 0.7906417846679688, 0.81683349609375, 0.8430252075195312, 0.8692169189453125, 0.8954086303710938, 0.921600341796875, 0.9477920532226562, 0.9739837646484375, 1.0001754760742188, 1.0263671875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 7.0, 7.0, 9.0, 11.0, 32.0, 41.0, 65.0, 126.0, 3110.0, 395.0, 102.0, 59.0, 31.0, 16.0, 12.0, 6.0, 9.0, 6.0, 8.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.378173828125, -0.3662681579589844, -0.35436248779296875, -0.3424568176269531, -0.3305511474609375, -0.3186454772949219, -0.30673980712890625, -0.2948341369628906, -0.282928466796875, -0.2710227966308594, -0.25911712646484375, -0.24721145629882812, -0.2353057861328125, -0.22340011596679688, -0.21149444580078125, -0.19958877563476562, -0.18768310546875, -0.17577743530273438, -0.16387176513671875, -0.15196609497070312, -0.1400604248046875, -0.12815475463867188, -0.11624908447265625, -0.10434341430664062, -0.092437744140625, -0.08053207397460938, -0.06862640380859375, -0.056720733642578125, -0.0448150634765625, -0.032909393310546875, -0.02100372314453125, -0.009098052978515625, 0.0028076171875, 0.014713287353515625, 0.02661895751953125, 0.038524627685546875, 0.0504302978515625, 0.062335968017578125, 0.07424163818359375, 0.08614730834960938, 0.098052978515625, 0.10995864868164062, 0.12186431884765625, 0.13376998901367188, 0.1456756591796875, 0.15758132934570312, 0.16948699951171875, 0.18139266967773438, 0.19329833984375, 0.20520401000976562, 0.21710968017578125, 0.22901535034179688, 0.2409210205078125, 0.2528266906738281, 0.26473236083984375, 0.2766380310058594, 0.288543701171875, 0.3004493713378906, 0.31235504150390625, 0.3242607116699219, 0.3361663818359375, 0.3480720520019531, 0.35997772216796875, 0.3718833923339844, 0.3837890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 20.0, 40.0, 79.0, 164.0, 216.0, 202.0, 130.0, 74.0, 42.0, 15.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8567283153533936, -1.7719531059265137, -1.6871777772903442, -1.6024024486541748, -1.517627239227295, -1.432852029800415, -1.3480767011642456, -1.2633013725280762, -1.1785261631011963, -1.0937509536743164, -1.008975625038147, -0.9242003560066223, -0.8394250869750977, -0.754649817943573, -0.6698745489120483, -0.5850992798805237, -0.500324010848999, -0.41554874181747437, -0.3307734727859497, -0.24599820375442505, -0.1612229347229004, -0.07644766569137573, 0.008327603340148926, 0.09310287237167358, 0.17787814140319824, 0.2626534104347229, 0.34742867946624756, 0.4322039484977722, 0.5169792175292969, 0.6017544865608215, 0.6865297555923462, 0.7713050246238708, 0.8560802936553955, 0.9408555626869202, 1.0256308317184448, 1.1104061603546143, 1.1951813697814941, 1.279956579208374, 1.3647319078445435, 1.449507236480713, 1.5342824459075928, 1.6190576553344727, 1.703832983970642, 1.7886083126068115, 1.8733835220336914, 1.9581587314605713, 2.042933940887451, 2.12770938873291, 2.21248459815979, 2.29725980758667, 2.382035255432129, 2.466810464859009, 2.5515856742858887, 2.6363608837127686, 2.7211360931396484, 2.8059115409851074, 2.8906867504119873, 2.975461959838867, 3.060237407684326, 3.145012617111206, 3.229787826538086, 3.314563035964966, 3.3993382453918457, 3.4841136932373047, 3.5688889026641846]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 10.0, 8.0, 7.0, 9.0, 7.0, 12.0, 18.0, 22.0, 12.0, 18.0, 25.0, 35.0, 18.0, 22.0, 34.0, 35.0, 37.0, 40.0, 30.0, 33.0, 46.0, 62.0, 30.0, 40.0, 37.0, 34.0, 29.0, 35.0, 31.0, 32.0, 20.0, 24.0, 14.0, 21.0, 14.0, 18.0, 12.0, 12.0, 9.0, 10.0, 5.0, 5.0, 4.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0], "bins": [-0.7917454242706299, -0.7680073976516724, -0.7442693114280701, -0.7205312252044678, -0.6967931985855103, -0.6730551719665527, -0.6493170857429504, -0.6255789995193481, -0.6018409729003906, -0.5781029462814331, -0.5543648600578308, -0.5306267738342285, -0.506888747215271, -0.4831506907939911, -0.4594126343727112, -0.4356745779514313, -0.41193652153015137, -0.38819846510887146, -0.36446040868759155, -0.34072235226631165, -0.31698429584503174, -0.29324623942375183, -0.2695081830024719, -0.24577012658119202, -0.2220320701599121, -0.1982940137386322, -0.1745559573173523, -0.1508179008960724, -0.12707984447479248, -0.10334178805351257, -0.07960373163223267, -0.05586567521095276, -0.03212767839431763, -0.00838962197303772, 0.015348434448242188, 0.039086490869522095, 0.062824547290802, 0.08656260371208191, 0.11030066013336182, 0.13403871655464172, 0.15777677297592163, 0.18151482939720154, 0.20525288581848145, 0.22899094223976135, 0.25272899866104126, 0.27646705508232117, 0.3002051115036011, 0.323943167924881, 0.3476812243461609, 0.3714192807674408, 0.3951573371887207, 0.4188953936100006, 0.4426334500312805, 0.4663715064525604, 0.49010956287384033, 0.5138475894927979, 0.5375856757164001, 0.5613237619400024, 0.58506178855896, 0.6087998151779175, 0.6325379014015198, 0.6562759876251221, 0.6800140142440796, 0.7037520408630371, 0.7274901270866394]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 5.0, 4.0, 5.0, 4.0, 7.0, 8.0, 18.0, 21.0, 25.0, 26.0, 56.0, 87.0, 167.0, 274.0, 572.0, 1258.0, 3708.0, 14494.0, 78477.0, 513055.0, 367165.0, 53472.0, 10623.0, 2911.0, 1082.0, 449.0, 230.0, 134.0, 68.0, 46.0, 31.0, 20.0, 14.0, 9.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.650390625, -0.6270751953125, -0.603759765625, -0.5804443359375, -0.55712890625, -0.5338134765625, -0.510498046875, -0.4871826171875, -0.4638671875, -0.4405517578125, -0.417236328125, -0.3939208984375, -0.37060546875, -0.3472900390625, -0.323974609375, -0.3006591796875, -0.27734375, -0.2540283203125, -0.230712890625, -0.2073974609375, -0.18408203125, -0.1607666015625, -0.137451171875, -0.1141357421875, -0.0908203125, -0.0675048828125, -0.044189453125, -0.0208740234375, 0.00244140625, 0.0257568359375, 0.049072265625, 0.0723876953125, 0.095703125, 0.1190185546875, 0.142333984375, 0.1656494140625, 0.18896484375, 0.2122802734375, 0.235595703125, 0.2589111328125, 0.2822265625, 0.3055419921875, 0.328857421875, 0.3521728515625, 0.37548828125, 0.3988037109375, 0.422119140625, 0.4454345703125, 0.46875, 0.4920654296875, 0.515380859375, 0.5386962890625, 0.56201171875, 0.5853271484375, 0.608642578125, 0.6319580078125, 0.6552734375, 0.6785888671875, 0.701904296875, 0.7252197265625, 0.74853515625, 0.7718505859375, 0.795166015625, 0.8184814453125, 0.841796875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 4.0, 7.0, 7.0, 7.0, 20.0, 18.0, 25.0, 36.0, 34.0, 39.0, 60.0, 55.0, 63.0, 72.0, 79.0, 88.0, 69.0, 72.0, 53.0, 42.0, 36.0, 30.0, 25.0, 8.0, 16.0, 9.0, 6.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1971435546875, -0.1918468475341797, -0.18655014038085938, -0.18125343322753906, -0.17595672607421875, -0.17066001892089844, -0.16536331176757812, -0.1600666046142578, -0.1547698974609375, -0.1494731903076172, -0.14417648315429688, -0.13887977600097656, -0.13358306884765625, -0.12828636169433594, -0.12298965454101562, -0.11769294738769531, -0.112396240234375, -0.10709953308105469, -0.10180282592773438, -0.09650611877441406, -0.09120941162109375, -0.08591270446777344, -0.08061599731445312, -0.07531929016113281, -0.0700225830078125, -0.06472587585449219, -0.059429168701171875, -0.05413246154785156, -0.04883575439453125, -0.04353904724121094, -0.038242340087890625, -0.03294563293457031, -0.02764892578125, -0.022352218627929688, -0.017055511474609375, -0.011758804321289062, -0.00646209716796875, -0.0011653900146484375, 0.004131317138671875, 0.009428024291992188, 0.0147247314453125, 0.020021438598632812, 0.025318145751953125, 0.030614852905273438, 0.03591156005859375, 0.04120826721191406, 0.046504974365234375, 0.05180168151855469, 0.057098388671875, 0.06239509582519531, 0.06769180297851562, 0.07298851013183594, 0.07828521728515625, 0.08358192443847656, 0.08887863159179688, 0.09417533874511719, 0.0994720458984375, 0.10476875305175781, 0.11006546020507812, 0.11536216735839844, 0.12065887451171875, 0.12595558166503906, 0.13125228881835938, 0.1365489959716797, 0.141845703125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 4.0, 17.0, 24.0, 36.0, 48.0, 97.0, 130.0, 237.0, 378.0, 666.0, 1403.0, 3276.0, 10735.0, 65699.0, 630315.0, 294199.0, 30146.0, 6370.0, 2337.0, 1054.0, 519.0, 327.0, 178.0, 122.0, 83.0, 44.0, 36.0, 28.0, 10.0, 6.0, 7.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72802734375, -0.7027587890625, -0.677490234375, -0.6522216796875, -0.626953125, -0.6016845703125, -0.576416015625, -0.5511474609375, -0.52587890625, -0.5006103515625, -0.475341796875, -0.4500732421875, -0.4248046875, -0.3995361328125, -0.374267578125, -0.3489990234375, -0.32373046875, -0.2984619140625, -0.273193359375, -0.2479248046875, -0.22265625, -0.1973876953125, -0.172119140625, -0.1468505859375, -0.12158203125, -0.0963134765625, -0.071044921875, -0.0457763671875, -0.0205078125, 0.0047607421875, 0.030029296875, 0.0552978515625, 0.08056640625, 0.1058349609375, 0.131103515625, 0.1563720703125, 0.181640625, 0.2069091796875, 0.232177734375, 0.2574462890625, 0.28271484375, 0.3079833984375, 0.333251953125, 0.3585205078125, 0.3837890625, 0.4090576171875, 0.434326171875, 0.4595947265625, 0.48486328125, 0.5101318359375, 0.535400390625, 0.5606689453125, 0.5859375, 0.6112060546875, 0.636474609375, 0.6617431640625, 0.68701171875, 0.7122802734375, 0.737548828125, 0.7628173828125, 0.7880859375, 0.8133544921875, 0.838623046875, 0.8638916015625, 0.88916015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 6.0, 9.0, 15.0, 19.0, 13.0, 23.0, 34.0, 39.0, 37.0, 42.0, 52.0, 73.0, 49.0, 46.0, 64.0, 75.0, 66.0, 64.0, 57.0, 45.0, 42.0, 35.0, 22.0, 16.0, 16.0, 8.0, 9.0, 9.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.88671875, -0.8615341186523438, -0.8363494873046875, -0.8111648559570312, -0.785980224609375, -0.7607955932617188, -0.7356109619140625, -0.7104263305664062, -0.68524169921875, -0.6600570678710938, -0.6348724365234375, -0.6096878051757812, -0.584503173828125, -0.5593185424804688, -0.5341339111328125, -0.5089492797851562, -0.4837646484375, -0.45858001708984375, -0.4333953857421875, -0.40821075439453125, -0.383026123046875, -0.35784149169921875, -0.3326568603515625, -0.30747222900390625, -0.28228759765625, -0.25710296630859375, -0.2319183349609375, -0.20673370361328125, -0.181549072265625, -0.15636444091796875, -0.1311798095703125, -0.10599517822265625, -0.080810546875, -0.05562591552734375, -0.0304412841796875, -0.00525665283203125, 0.019927978515625, 0.04511260986328125, 0.0702972412109375, 0.09548187255859375, 0.12066650390625, 0.14585113525390625, 0.1710357666015625, 0.19622039794921875, 0.221405029296875, 0.24658966064453125, 0.2717742919921875, 0.29695892333984375, 0.3221435546875, 0.34732818603515625, 0.3725128173828125, 0.39769744873046875, 0.422882080078125, 0.44806671142578125, 0.4732513427734375, 0.49843597412109375, 0.52362060546875, 0.5488052368164062, 0.5739898681640625, 0.5991744995117188, 0.624359130859375, 0.6495437622070312, 0.6747283935546875, 0.6999130249023438, 0.72509765625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 3.0, 10.0, 9.0, 22.0, 25.0, 36.0, 59.0, 101.0, 187.0, 365.0, 947.0, 4044.0, 69840.0, 942180.0, 26653.0, 2641.0, 764.0, 282.0, 165.0, 77.0, 48.0, 22.0, 31.0, 12.0, 6.0, 9.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66748046875, -0.6455078125, -0.62353515625, -0.6015625, -0.57958984375, -0.5576171875, -0.53564453125, -0.513671875, -0.49169921875, -0.4697265625, -0.44775390625, -0.42578125, -0.40380859375, -0.3818359375, -0.35986328125, -0.337890625, -0.31591796875, -0.2939453125, -0.27197265625, -0.25, -0.22802734375, -0.2060546875, -0.18408203125, -0.162109375, -0.14013671875, -0.1181640625, -0.09619140625, -0.07421875, -0.05224609375, -0.0302734375, -0.00830078125, 0.013671875, 0.03564453125, 0.0576171875, 0.07958984375, 0.1015625, 0.12353515625, 0.1455078125, 0.16748046875, 0.189453125, 0.21142578125, 0.2333984375, 0.25537109375, 0.27734375, 0.29931640625, 0.3212890625, 0.34326171875, 0.365234375, 0.38720703125, 0.4091796875, 0.43115234375, 0.453125, 0.47509765625, 0.4970703125, 0.51904296875, 0.541015625, 0.56298828125, 0.5849609375, 0.60693359375, 0.62890625, 0.65087890625, 0.6728515625, 0.69482421875, 0.716796875, 0.73876953125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 29.0, 65.0, 114.0, 255.0, 273.0, 164.0, 53.0, 31.0, 12.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015974044799804688, -0.00015505775809288025, -0.00015037506818771362, -0.000145692378282547, -0.00014100968837738037, -0.00013632699847221375, -0.00013164430856704712, -0.0001269616186618805, -0.00012227892875671387, -0.00011759623885154724, -0.00011291354894638062, -0.00010823085904121399, -0.00010354816913604736, -9.886547923088074e-05, -9.418278932571411e-05, -8.950009942054749e-05, -8.481740951538086e-05, -8.013471961021423e-05, -7.545202970504761e-05, -7.076933979988098e-05, -6.608664989471436e-05, -6.140395998954773e-05, -5.6721270084381104e-05, -5.203858017921448e-05, -4.735589027404785e-05, -4.2673200368881226e-05, -3.79905104637146e-05, -3.3307820558547974e-05, -2.8625130653381348e-05, -2.394244074821472e-05, -1.9259750843048096e-05, -1.457706093788147e-05, -9.894371032714844e-06, -5.211681127548218e-06, -5.289912223815918e-07, 4.153698682785034e-06, 8.83638858795166e-06, 1.3519078493118286e-05, 1.8201768398284912e-05, 2.2884458303451538e-05, 2.7567148208618164e-05, 3.224983811378479e-05, 3.6932528018951416e-05, 4.161521792411804e-05, 4.629790782928467e-05, 5.0980597734451294e-05, 5.566328763961792e-05, 6.0345977544784546e-05, 6.502866744995117e-05, 6.97113573551178e-05, 7.439404726028442e-05, 7.907673716545105e-05, 8.375942707061768e-05, 8.84421169757843e-05, 9.312480688095093e-05, 9.780749678611755e-05, 0.00010249018669128418, 0.0001071728765964508, 0.00011185556650161743, 0.00011653825640678406, 0.00012122094631195068, 0.0001259036362171173, 0.00013058632612228394, 0.00013526901602745056, 0.0001399517059326172]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 1.0, 5.0, 5.0, 4.0, 8.0, 10.0, 13.0, 35.0, 28.0, 52.0, 123.0, 261.0, 510.0, 1561.0, 7017.0, 143554.0, 868763.0, 21938.0, 3063.0, 864.0, 326.0, 170.0, 103.0, 39.0, 48.0, 17.0, 10.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51025390625, -0.490814208984375, -0.47137451171875, -0.451934814453125, -0.4324951171875, -0.413055419921875, -0.39361572265625, -0.374176025390625, -0.354736328125, -0.335296630859375, -0.31585693359375, -0.296417236328125, -0.2769775390625, -0.257537841796875, -0.23809814453125, -0.218658447265625, -0.19921875, -0.179779052734375, -0.16033935546875, -0.140899658203125, -0.1214599609375, -0.102020263671875, -0.08258056640625, -0.063140869140625, -0.043701171875, -0.024261474609375, -0.00482177734375, 0.014617919921875, 0.0340576171875, 0.053497314453125, 0.07293701171875, 0.092376708984375, 0.11181640625, 0.131256103515625, 0.15069580078125, 0.170135498046875, 0.1895751953125, 0.209014892578125, 0.22845458984375, 0.247894287109375, 0.267333984375, 0.286773681640625, 0.30621337890625, 0.325653076171875, 0.3450927734375, 0.364532470703125, 0.38397216796875, 0.403411865234375, 0.4228515625, 0.442291259765625, 0.46173095703125, 0.481170654296875, 0.5006103515625, 0.520050048828125, 0.53948974609375, 0.558929443359375, 0.578369140625, 0.597808837890625, 0.61724853515625, 0.636688232421875, 0.6561279296875, 0.675567626953125, 0.69500732421875, 0.714447021484375, 0.73388671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 9.0, 11.0, 9.0, 25.0, 44.0, 91.0, 163.0, 223.0, 181.0, 113.0, 58.0, 39.0, 13.0, 10.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5458984375, -0.5254440307617188, -0.5049896240234375, -0.48453521728515625, -0.464080810546875, -0.44362640380859375, -0.4231719970703125, -0.40271759033203125, -0.38226318359375, -0.36180877685546875, -0.3413543701171875, -0.32089996337890625, -0.300445556640625, -0.27999114990234375, -0.2595367431640625, -0.23908233642578125, -0.2186279296875, -0.19817352294921875, -0.1777191162109375, -0.15726470947265625, -0.136810302734375, -0.11635589599609375, -0.0959014892578125, -0.07544708251953125, -0.05499267578125, -0.03453826904296875, -0.0140838623046875, 0.00637054443359375, 0.026824951171875, 0.04727935791015625, 0.0677337646484375, 0.08818817138671875, 0.108642578125, 0.12909698486328125, 0.1495513916015625, 0.17000579833984375, 0.190460205078125, 0.21091461181640625, 0.2313690185546875, 0.25182342529296875, 0.27227783203125, 0.29273223876953125, 0.3131866455078125, 0.33364105224609375, 0.354095458984375, 0.37454986572265625, 0.3950042724609375, 0.41545867919921875, 0.4359130859375, 0.45636749267578125, 0.4768218994140625, 0.49727630615234375, 0.517730712890625, 0.5381851196289062, 0.5586395263671875, 0.5790939331054688, 0.59954833984375, 0.6200027465820312, 0.6404571533203125, 0.6609115600585938, 0.681365966796875, 0.7018203735351562, 0.7222747802734375, 0.7427291870117188, 0.76318359375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 13.0, 9.0, 6.0, 25.0, 66.0, 83.0, 130.0, 170.0, 184.0, 135.0, 72.0, 58.0, 26.0, 13.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.41426944732666, -9.200115203857422, -8.985960960388184, -8.771806716918945, -8.557652473449707, -8.343498229980469, -8.129343032836914, -7.915189266204834, -7.7010345458984375, -7.486880302429199, -7.272726058959961, -7.058571815490723, -6.844417095184326, -6.630262851715088, -6.41610860824585, -6.201954364776611, -5.987800121307373, -5.773645877838135, -5.5594916343688965, -5.3453369140625, -5.131182670593262, -4.917028427124023, -4.702874183654785, -4.488719940185547, -4.274565696716309, -4.06041145324707, -3.846256971359253, -3.6321027278900146, -3.4179482460021973, -3.203794002532959, -2.9896397590637207, -2.7754855155944824, -2.561330795288086, -2.3471765518188477, -2.1330220699310303, -1.918867826461792, -1.7047134637832642, -1.4905591011047363, -1.276404857635498, -1.0622504949569702, -0.8480961322784424, -0.6339417695999146, -0.4197874665260315, -0.20563316345214844, 0.008521199226379395, 0.22267556190490723, 0.4368298053741455, 0.6509841680526733, 0.8651385307312012, 1.079292893409729, 1.2934472560882568, 1.5076014995574951, 1.721755862236023, 1.9359102249145508, 2.150064468383789, 2.3642187118530273, 2.5783731937408447, 2.792527437210083, 3.0066819190979004, 3.2208361625671387, 3.434990406036377, 3.6491448879241943, 3.8632991313934326, 4.07745361328125, 4.291607856750488]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 4.0, 4.0, 11.0, 6.0, 18.0, 20.0, 20.0, 24.0, 15.0, 32.0, 33.0, 29.0, 35.0, 51.0, 34.0, 43.0, 40.0, 49.0, 52.0, 50.0, 49.0, 45.0, 48.0, 43.0, 29.0, 34.0, 25.0, 18.0, 20.0, 23.0, 16.0, 14.0, 12.0, 9.0, 10.0, 8.0, 7.0, 3.0, 4.0, 0.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5441877841949463, -2.4545912742614746, -2.364994525909424, -2.275397777557373, -2.1858012676239014, -2.0962047576904297, -2.006608009338379, -1.9170113801956177, -1.8274147510528564, -1.7378181219100952, -1.648221492767334, -1.5586248636245728, -1.4690282344818115, -1.3794316053390503, -1.289834976196289, -1.2002383470535278, -1.1106417179107666, -1.0210450887680054, -0.9314484596252441, -0.8418518304824829, -0.7522552013397217, -0.6626585721969604, -0.5730619430541992, -0.483465313911438, -0.39386868476867676, -0.3042720556259155, -0.2146754264831543, -0.12507879734039307, -0.035482168197631836, 0.054114460945129395, 0.14371109008789062, 0.23330771923065186, 0.3229045867919922, 0.4125012159347534, 0.5020978450775146, 0.5916944742202759, 0.6812911033630371, 0.7708877325057983, 0.8604843616485596, 0.9500809907913208, 1.039677619934082, 1.1292742490768433, 1.2188708782196045, 1.3084675073623657, 1.398064136505127, 1.4876607656478882, 1.5772573947906494, 1.6668540239334106, 1.7564506530761719, 1.846047282218933, 1.9356439113616943, 2.025240421295166, 2.114837169647217, 2.2044339179992676, 2.2940304279327393, 2.383626937866211, 2.4732236862182617, 2.5628204345703125, 2.652416944503784, 2.742013454437256, 2.8316102027893066, 2.9212069511413574, 3.010803461074829, 3.100399971008301, 3.1899967193603516]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 16.0, 19.0, 30.0, 81.0, 139.0, 305.0, 939.0, 4155.0, 36961.0, 3856217.0, 281310.0, 11444.0, 1731.0, 470.0, 191.0, 91.0, 49.0, 38.0, 21.0, 23.0, 8.0, 6.0, 9.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4501953125, -0.4233551025390625, -0.396514892578125, -0.3696746826171875, -0.34283447265625, -0.3159942626953125, -0.289154052734375, -0.2623138427734375, -0.2354736328125, -0.2086334228515625, -0.181793212890625, -0.1549530029296875, -0.12811279296875, -0.1012725830078125, -0.074432373046875, -0.0475921630859375, -0.020751953125, 0.0060882568359375, 0.032928466796875, 0.0597686767578125, 0.08660888671875, 0.1134490966796875, 0.140289306640625, 0.1671295166015625, 0.1939697265625, 0.2208099365234375, 0.247650146484375, 0.2744903564453125, 0.30133056640625, 0.3281707763671875, 0.355010986328125, 0.3818511962890625, 0.40869140625, 0.4355316162109375, 0.462371826171875, 0.4892120361328125, 0.51605224609375, 0.5428924560546875, 0.569732666015625, 0.5965728759765625, 0.6234130859375, 0.6502532958984375, 0.677093505859375, 0.7039337158203125, 0.73077392578125, 0.7576141357421875, 0.784454345703125, 0.8112945556640625, 0.838134765625, 0.8649749755859375, 0.891815185546875, 0.9186553955078125, 0.94549560546875, 0.9723358154296875, 0.999176025390625, 1.0260162353515625, 1.0528564453125, 1.0796966552734375, 1.106536865234375, 1.1333770751953125, 1.16021728515625, 1.1870574951171875, 1.213897705078125, 1.2407379150390625, 1.267578125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 9.0, 7.0, 12.0, 16.0, 17.0, 28.0, 30.0, 33.0, 42.0, 54.0, 59.0, 62.0, 64.0, 74.0, 75.0, 76.0, 69.0, 65.0, 46.0, 37.0, 24.0, 16.0, 23.0, 17.0, 9.0, 9.0, 10.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1868896484375, -0.18204021453857422, -0.17719078063964844, -0.17234134674072266, -0.16749191284179688, -0.1626424789428711, -0.1577930450439453, -0.15294361114501953, -0.14809417724609375, -0.14324474334716797, -0.1383953094482422, -0.1335458755493164, -0.12869644165039062, -0.12384700775146484, -0.11899757385253906, -0.11414813995361328, -0.1092987060546875, -0.10444927215576172, -0.09959983825683594, -0.09475040435791016, -0.08990097045898438, -0.0850515365600586, -0.08020210266113281, -0.07535266876220703, -0.07050323486328125, -0.06565380096435547, -0.06080436706542969, -0.055954933166503906, -0.051105499267578125, -0.046256065368652344, -0.04140663146972656, -0.03655719757080078, -0.031707763671875, -0.02685832977294922, -0.022008895874023438, -0.017159461975097656, -0.012310028076171875, -0.007460594177246094, -0.0026111602783203125, 0.0022382736206054688, 0.00708770751953125, 0.011937141418457031, 0.016786575317382812, 0.021636009216308594, 0.026485443115234375, 0.031334877014160156, 0.03618431091308594, 0.04103374481201172, 0.0458831787109375, 0.05073261260986328, 0.05558204650878906, 0.060431480407714844, 0.06528091430664062, 0.0701303482055664, 0.07497978210449219, 0.07982921600341797, 0.08467864990234375, 0.08952808380126953, 0.09437751770019531, 0.0992269515991211, 0.10407638549804688, 0.10892581939697266, 0.11377525329589844, 0.11862468719482422, 0.12347412109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 13.0, 15.0, 28.0, 20.0, 43.0, 51.0, 112.0, 178.0, 319.0, 625.0, 1175.0, 2634.0, 6658.0, 18999.0, 74722.0, 760945.0, 3134548.0, 144891.0, 30844.0, 10018.0, 3791.0, 1703.0, 812.0, 438.0, 258.0, 145.0, 89.0, 59.0, 44.0, 33.0, 18.0, 11.0, 10.0, 6.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.5546875, -0.5393600463867188, -0.5240325927734375, -0.5087051391601562, -0.493377685546875, -0.47805023193359375, -0.4627227783203125, -0.44739532470703125, -0.43206787109375, -0.41674041748046875, -0.4014129638671875, -0.38608551025390625, -0.370758056640625, -0.35543060302734375, -0.3401031494140625, -0.32477569580078125, -0.3094482421875, -0.29412078857421875, -0.2787933349609375, -0.26346588134765625, -0.248138427734375, -0.23281097412109375, -0.2174835205078125, -0.20215606689453125, -0.18682861328125, -0.17150115966796875, -0.1561737060546875, -0.14084625244140625, -0.125518798828125, -0.11019134521484375, -0.0948638916015625, -0.07953643798828125, -0.064208984375, -0.04888153076171875, -0.0335540771484375, -0.01822662353515625, -0.002899169921875, 0.01242828369140625, 0.0277557373046875, 0.04308319091796875, 0.05841064453125, 0.07373809814453125, 0.0890655517578125, 0.10439300537109375, 0.119720458984375, 0.13504791259765625, 0.1503753662109375, 0.16570281982421875, 0.1810302734375, 0.19635772705078125, 0.2116851806640625, 0.22701263427734375, 0.242340087890625, 0.25766754150390625, 0.2729949951171875, 0.28832244873046875, 0.30364990234375, 0.31897735595703125, 0.3343048095703125, 0.34963226318359375, 0.364959716796875, 0.38028717041015625, 0.3956146240234375, 0.41094207763671875, 0.42626953125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 8.0, 9.0, 19.0, 17.0, 18.0, 27.0, 25.0, 52.0, 73.0, 91.0, 134.0, 213.0, 400.0, 808.0, 966.0, 432.0, 227.0, 150.0, 115.0, 63.0, 59.0, 33.0, 22.0, 21.0, 12.0, 11.0, 11.0, 7.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.37353515625, -0.3602180480957031, -0.34690093994140625, -0.3335838317871094, -0.3202667236328125, -0.3069496154785156, -0.29363250732421875, -0.2803153991699219, -0.266998291015625, -0.2536811828613281, -0.24036407470703125, -0.22704696655273438, -0.2137298583984375, -0.20041275024414062, -0.18709564208984375, -0.17377853393554688, -0.16046142578125, -0.14714431762695312, -0.13382720947265625, -0.12051010131835938, -0.1071929931640625, -0.09387588500976562, -0.08055877685546875, -0.06724166870117188, -0.053924560546875, -0.040607452392578125, -0.02729034423828125, -0.013973236083984375, -0.0006561279296875, 0.012660980224609375, 0.02597808837890625, 0.039295196533203125, 0.0526123046875, 0.06592941284179688, 0.07924652099609375, 0.09256362915039062, 0.1058807373046875, 0.11919784545898438, 0.13251495361328125, 0.14583206176757812, 0.159149169921875, 0.17246627807617188, 0.18578338623046875, 0.19910049438476562, 0.2124176025390625, 0.22573471069335938, 0.23905181884765625, 0.2523689270019531, 0.26568603515625, 0.2790031433105469, 0.29232025146484375, 0.3056373596191406, 0.3189544677734375, 0.3322715759277344, 0.34558868408203125, 0.3589057922363281, 0.372222900390625, 0.3855400085449219, 0.39885711669921875, 0.4121742248535156, 0.4254913330078125, 0.4388084411621094, 0.45212554931640625, 0.4654426574707031, 0.478759765625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 7.0, 26.0, 88.0, 233.0, 329.0, 202.0, 76.0, 22.0, 11.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9684925079345703, -2.6815989017486572, -2.394705295562744, -2.107811450958252, -1.8209178447723389, -1.5340242385864258, -1.2471305131912231, -0.9602367877960205, -0.6733431816101074, -0.38644951581954956, -0.0995558500289917, 0.18733781576156616, 0.474231481552124, 0.7611250877380371, 1.0480188131332397, 1.3349125385284424, 1.6218061447143555, 1.9086997509002686, 2.1955933570861816, 2.482487201690674, 2.769380807876587, 3.0562744140625, 3.343168258666992, 3.6300618648529053, 3.9169554710388184, 4.2038493156433105, 4.4907426834106445, 4.777636528015137, 5.064530372619629, 5.351423740386963, 5.638317584991455, 5.925210952758789, 6.212103843688965, 6.498997688293457, 6.785891056060791, 7.072784900665283, 7.359678268432617, 7.646572113037109, 7.933465957641602, 8.220359802246094, 8.507253646850586, 8.794147491455078, 9.08104133605957, 9.367934226989746, 9.654828071594238, 9.94172191619873, 10.228615760803223, 10.515509605407715, 10.80240249633789, 11.089296340942383, 11.376190185546875, 11.66308307647705, 11.949976921081543, 12.236870765686035, 12.523764610290527, 12.81065845489502, 13.097551345825195, 13.384445190429688, 13.67133903503418, 13.958231925964355, 14.245125770568848, 14.53201961517334, 14.818913459777832, 15.105807304382324, 15.392701148986816]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 10.0, 9.0, 6.0, 14.0, 17.0, 20.0, 28.0, 19.0, 24.0, 27.0, 36.0, 21.0, 35.0, 37.0, 33.0, 43.0, 50.0, 38.0, 39.0, 55.0, 55.0, 29.0, 47.0, 28.0, 43.0, 32.0, 32.0, 33.0, 25.0, 19.0, 22.0, 16.0, 13.0, 10.0, 5.0, 5.0, 6.0, 7.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7780075073242188, -1.7137035131454468, -1.6493996381759644, -1.5850956439971924, -1.52079176902771, -1.456487774848938, -1.392183780670166, -1.3278799057006836, -1.2635759115219116, -1.1992719173431396, -1.1349680423736572, -1.0706640481948853, -1.0063600540161133, -0.9420561790466309, -0.8777521848678589, -0.8134482502937317, -0.7491443157196045, -0.6848403811454773, -0.6205364465713501, -0.5562324523925781, -0.4919285178184509, -0.42762458324432373, -0.36332061886787415, -0.29901665449142456, -0.23471271991729736, -0.17040877044200897, -0.10610482096672058, -0.04180087149143219, 0.0225030779838562, 0.0868070125579834, 0.15111097693443298, 0.21541494131088257, 0.27971863746643066, 0.34402257204055786, 0.40832653641700745, 0.47263050079345703, 0.5369344353675842, 0.6012383699417114, 0.6655423641204834, 0.7298462986946106, 0.7941502332687378, 0.858454167842865, 0.9227581024169922, 0.9870620965957642, 1.0513660907745361, 1.1156699657440186, 1.1799739599227905, 1.2442779541015625, 1.308581829071045, 1.372885823249817, 1.4371896982192993, 1.5014936923980713, 1.5657975673675537, 1.6301015615463257, 1.6944055557250977, 1.75870943069458, 1.823013424873352, 1.887317419052124, 1.9516212940216064, 2.015925168991089, 2.0802292823791504, 2.144533157348633, 2.2088370323181152, 2.2731411457061768, 2.337445020675659]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 7.0, 11.0, 5.0, 12.0, 26.0, 51.0, 82.0, 125.0, 254.0, 631.0, 1426.0, 4483.0, 18164.0, 122351.0, 687145.0, 180402.0, 24741.0, 5472.0, 1812.0, 690.0, 320.0, 133.0, 82.0, 48.0, 20.0, 22.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.62890625, -0.606109619140625, -0.58331298828125, -0.560516357421875, -0.5377197265625, -0.514923095703125, -0.49212646484375, -0.469329833984375, -0.446533203125, -0.423736572265625, -0.40093994140625, -0.378143310546875, -0.3553466796875, -0.332550048828125, -0.30975341796875, -0.286956787109375, -0.26416015625, -0.241363525390625, -0.21856689453125, -0.195770263671875, -0.1729736328125, -0.150177001953125, -0.12738037109375, -0.104583740234375, -0.081787109375, -0.058990478515625, -0.03619384765625, -0.013397216796875, 0.0093994140625, 0.032196044921875, 0.05499267578125, 0.077789306640625, 0.1005859375, 0.123382568359375, 0.14617919921875, 0.168975830078125, 0.1917724609375, 0.214569091796875, 0.23736572265625, 0.260162353515625, 0.282958984375, 0.305755615234375, 0.32855224609375, 0.351348876953125, 0.3741455078125, 0.396942138671875, 0.41973876953125, 0.442535400390625, 0.46533203125, 0.488128662109375, 0.51092529296875, 0.533721923828125, 0.5565185546875, 0.579315185546875, 0.60211181640625, 0.624908447265625, 0.647705078125, 0.670501708984375, 0.69329833984375, 0.716094970703125, 0.7388916015625, 0.761688232421875, 0.78448486328125, 0.807281494140625, 0.830078125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 8.0, 10.0, 8.0, 8.0, 12.0, 24.0, 21.0, 30.0, 31.0, 33.0, 41.0, 37.0, 37.0, 43.0, 53.0, 69.0, 51.0, 47.0, 57.0, 66.0, 50.0, 38.0, 56.0, 27.0, 26.0, 14.0, 27.0, 8.0, 13.0, 7.0, 8.0, 14.0, 12.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12237548828125, -0.1183481216430664, -0.11432075500488281, -0.11029338836669922, -0.10626602172851562, -0.10223865509033203, -0.09821128845214844, -0.09418392181396484, -0.09015655517578125, -0.08612918853759766, -0.08210182189941406, -0.07807445526123047, -0.07404708862304688, -0.07001972198486328, -0.06599235534667969, -0.061964988708496094, -0.0579376220703125, -0.053910255432128906, -0.04988288879394531, -0.04585552215576172, -0.041828155517578125, -0.03780078887939453, -0.03377342224121094, -0.029746055603027344, -0.02571868896484375, -0.021691322326660156, -0.017663955688476562, -0.013636589050292969, -0.009609222412109375, -0.005581855773925781, -0.0015544891357421875, 0.0024728775024414062, 0.006500244140625, 0.010527610778808594, 0.014554977416992188, 0.01858234405517578, 0.022609710693359375, 0.02663707733154297, 0.030664443969726562, 0.034691810607910156, 0.03871917724609375, 0.042746543884277344, 0.04677391052246094, 0.05080127716064453, 0.054828643798828125, 0.05885601043701172, 0.06288337707519531, 0.0669107437133789, 0.0709381103515625, 0.0749654769897461, 0.07899284362792969, 0.08302021026611328, 0.08704757690429688, 0.09107494354248047, 0.09510231018066406, 0.09912967681884766, 0.10315704345703125, 0.10718441009521484, 0.11121177673339844, 0.11523914337158203, 0.11926651000976562, 0.12329387664794922, 0.1273212432861328, 0.1313486099243164, 0.1353759765625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 2.0, 4.0, 5.0, 8.0, 10.0, 20.0, 26.0, 43.0, 52.0, 109.0, 159.0, 285.0, 415.0, 866.0, 1756.0, 5156.0, 22700.0, 221069.0, 720745.0, 59736.0, 9778.0, 2876.0, 1192.0, 649.0, 341.0, 198.0, 122.0, 75.0, 48.0, 29.0, 26.0, 17.0, 11.0, 4.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.849609375, -0.8240509033203125, -0.798492431640625, -0.7729339599609375, -0.74737548828125, -0.7218170166015625, -0.696258544921875, -0.6707000732421875, -0.6451416015625, -0.6195831298828125, -0.594024658203125, -0.5684661865234375, -0.54290771484375, -0.5173492431640625, -0.491790771484375, -0.4662322998046875, -0.440673828125, -0.4151153564453125, -0.389556884765625, -0.3639984130859375, -0.33843994140625, -0.3128814697265625, -0.287322998046875, -0.2617645263671875, -0.2362060546875, -0.2106475830078125, -0.185089111328125, -0.1595306396484375, -0.13397216796875, -0.1084136962890625, -0.082855224609375, -0.0572967529296875, -0.03173828125, -0.0061798095703125, 0.019378662109375, 0.0449371337890625, 0.07049560546875, 0.0960540771484375, 0.121612548828125, 0.1471710205078125, 0.1727294921875, 0.1982879638671875, 0.223846435546875, 0.2494049072265625, 0.27496337890625, 0.3005218505859375, 0.326080322265625, 0.3516387939453125, 0.377197265625, 0.4027557373046875, 0.428314208984375, 0.4538726806640625, 0.47943115234375, 0.5049896240234375, 0.530548095703125, 0.5561065673828125, 0.5816650390625, 0.6072235107421875, 0.632781982421875, 0.6583404541015625, 0.68389892578125, 0.7094573974609375, 0.735015869140625, 0.7605743408203125, 0.7861328125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 2.0, 5.0, 6.0, 3.0, 12.0, 19.0, 15.0, 20.0, 28.0, 29.0, 39.0, 38.0, 44.0, 48.0, 53.0, 54.0, 58.0, 60.0, 45.0, 77.0, 54.0, 44.0, 31.0, 48.0, 37.0, 35.0, 22.0, 12.0, 10.0, 13.0, 17.0, 6.0, 6.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55224609375, -0.5305328369140625, -0.508819580078125, -0.4871063232421875, -0.46539306640625, -0.4436798095703125, -0.421966552734375, -0.4002532958984375, -0.3785400390625, -0.3568267822265625, -0.335113525390625, -0.3134002685546875, -0.29168701171875, -0.2699737548828125, -0.248260498046875, -0.2265472412109375, -0.204833984375, -0.1831207275390625, -0.161407470703125, -0.1396942138671875, -0.11798095703125, -0.0962677001953125, -0.074554443359375, -0.0528411865234375, -0.0311279296875, -0.0094146728515625, 0.012298583984375, 0.0340118408203125, 0.05572509765625, 0.0774383544921875, 0.099151611328125, 0.1208648681640625, 0.142578125, 0.1642913818359375, 0.186004638671875, 0.2077178955078125, 0.22943115234375, 0.2511444091796875, 0.272857666015625, 0.2945709228515625, 0.3162841796875, 0.3379974365234375, 0.359710693359375, 0.3814239501953125, 0.40313720703125, 0.4248504638671875, 0.446563720703125, 0.4682769775390625, 0.489990234375, 0.5117034912109375, 0.533416748046875, 0.5551300048828125, 0.57684326171875, 0.5985565185546875, 0.620269775390625, 0.6419830322265625, 0.6636962890625, 0.6854095458984375, 0.707122802734375, 0.7288360595703125, 0.75054931640625, 0.7722625732421875, 0.793975830078125, 0.8156890869140625, 0.83740234375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 6.0, 8.0, 10.0, 14.0, 33.0, 29.0, 52.0, 78.0, 93.0, 193.0, 326.0, 622.0, 1323.0, 3514.0, 14276.0, 94738.0, 694743.0, 203725.0, 25589.0, 5510.0, 1851.0, 768.0, 401.0, 266.0, 126.0, 79.0, 53.0, 40.0, 22.0, 13.0, 16.0, 11.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.34765625, -0.3393135070800781, -0.33097076416015625, -0.3226280212402344, -0.3142852783203125, -0.3059425354003906, -0.29759979248046875, -0.2892570495605469, -0.280914306640625, -0.2725715637207031, -0.26422882080078125, -0.2558860778808594, -0.2475433349609375, -0.23920059204101562, -0.23085784912109375, -0.22251510620117188, -0.21417236328125, -0.20582962036132812, -0.19748687744140625, -0.18914413452148438, -0.1808013916015625, -0.17245864868164062, -0.16411590576171875, -0.15577316284179688, -0.147430419921875, -0.13908767700195312, -0.13074493408203125, -0.12240219116210938, -0.1140594482421875, -0.10571670532226562, -0.09737396240234375, -0.08903121948242188, -0.0806884765625, -0.07234573364257812, -0.06400299072265625, -0.055660247802734375, -0.0473175048828125, -0.038974761962890625, -0.03063201904296875, -0.022289276123046875, -0.013946533203125, -0.005603790283203125, 0.00273895263671875, 0.011081695556640625, 0.0194244384765625, 0.027767181396484375, 0.03610992431640625, 0.044452667236328125, 0.05279541015625, 0.061138153076171875, 0.06948089599609375, 0.07782363891601562, 0.0861663818359375, 0.09450912475585938, 0.10285186767578125, 0.11119461059570312, 0.119537353515625, 0.12788009643554688, 0.13622283935546875, 0.14456558227539062, 0.1529083251953125, 0.16125106811523438, 0.16959381103515625, 0.17793655395507812, 0.186279296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 7.0, 2.0, 4.0, 7.0, 18.0, 11.0, 16.0, 25.0, 30.0, 29.0, 44.0, 56.0, 68.0, 77.0, 97.0, 106.0, 93.0, 57.0, 55.0, 34.0, 37.0, 35.0, 23.0, 18.0, 10.0, 6.0, 5.0, 3.0, 7.0, 6.0, 3.0, 2.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.707408905029297e-05, -3.569014370441437e-05, -3.4306198358535767e-05, -3.2922253012657166e-05, -3.1538307666778564e-05, -3.0154362320899963e-05, -2.8770416975021362e-05, -2.738647162914276e-05, -2.600252628326416e-05, -2.461858093738556e-05, -2.3234635591506958e-05, -2.1850690245628357e-05, -2.0466744899749756e-05, -1.9082799553871155e-05, -1.7698854207992554e-05, -1.6314908862113953e-05, -1.4930963516235352e-05, -1.354701817035675e-05, -1.216307282447815e-05, -1.0779127478599548e-05, -9.395182132720947e-06, -8.011236786842346e-06, -6.627291440963745e-06, -5.243346095085144e-06, -3.859400749206543e-06, -2.475455403327942e-06, -1.0915100574493408e-06, 2.9243528842926025e-07, 1.6763806343078613e-06, 3.0603259801864624e-06, 4.4442713260650635e-06, 5.8282166719436646e-06, 7.212162017822266e-06, 8.596107363700867e-06, 9.980052709579468e-06, 1.1363998055458069e-05, 1.274794340133667e-05, 1.4131888747215271e-05, 1.5515834093093872e-05, 1.6899779438972473e-05, 1.8283724784851074e-05, 1.9667670130729675e-05, 2.1051615476608276e-05, 2.2435560822486877e-05, 2.381950616836548e-05, 2.520345151424408e-05, 2.658739686012268e-05, 2.7971342206001282e-05, 2.9355287551879883e-05, 3.0739232897758484e-05, 3.2123178243637085e-05, 3.3507123589515686e-05, 3.489106893539429e-05, 3.627501428127289e-05, 3.765895962715149e-05, 3.904290497303009e-05, 4.042685031890869e-05, 4.181079566478729e-05, 4.3194741010665894e-05, 4.4578686356544495e-05, 4.5962631702423096e-05, 4.73465770483017e-05, 4.87305223941803e-05, 5.01144677400589e-05, 5.14984130859375e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 3.0, 4.0, 2.0, 6.0, 12.0, 12.0, 19.0, 32.0, 51.0, 53.0, 99.0, 129.0, 235.0, 393.0, 689.0, 1440.0, 3174.0, 9325.0, 42039.0, 331522.0, 573754.0, 65199.0, 12587.0, 3995.0, 1715.0, 825.0, 423.0, 277.0, 181.0, 122.0, 63.0, 48.0, 44.0, 13.0, 21.0, 18.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.22412109375, -0.2169189453125, -0.209716796875, -0.2025146484375, -0.1953125, -0.1881103515625, -0.180908203125, -0.1737060546875, -0.16650390625, -0.1593017578125, -0.152099609375, -0.1448974609375, -0.1376953125, -0.1304931640625, -0.123291015625, -0.1160888671875, -0.10888671875, -0.1016845703125, -0.094482421875, -0.0872802734375, -0.080078125, -0.0728759765625, -0.065673828125, -0.0584716796875, -0.05126953125, -0.0440673828125, -0.036865234375, -0.0296630859375, -0.0224609375, -0.0152587890625, -0.008056640625, -0.0008544921875, 0.00634765625, 0.0135498046875, 0.020751953125, 0.0279541015625, 0.03515625, 0.0423583984375, 0.049560546875, 0.0567626953125, 0.06396484375, 0.0711669921875, 0.078369140625, 0.0855712890625, 0.0927734375, 0.0999755859375, 0.107177734375, 0.1143798828125, 0.12158203125, 0.1287841796875, 0.135986328125, 0.1431884765625, 0.150390625, 0.1575927734375, 0.164794921875, 0.1719970703125, 0.17919921875, 0.1864013671875, 0.193603515625, 0.2008056640625, 0.2080078125, 0.2152099609375, 0.222412109375, 0.2296142578125, 0.23681640625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 5.0, 8.0, 10.0, 11.0, 13.0, 15.0, 24.0, 31.0, 35.0, 36.0, 46.0, 41.0, 44.0, 44.0, 63.0, 65.0, 54.0, 62.0, 52.0, 50.0, 56.0, 36.0, 25.0, 32.0, 25.0, 20.0, 20.0, 18.0, 7.0, 5.0, 8.0, 6.0, 3.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.178466796875, -0.17304420471191406, -0.16762161254882812, -0.1621990203857422, -0.15677642822265625, -0.1513538360595703, -0.14593124389648438, -0.14050865173339844, -0.1350860595703125, -0.12966346740722656, -0.12424087524414062, -0.11881828308105469, -0.11339569091796875, -0.10797309875488281, -0.10255050659179688, -0.09712791442871094, -0.091705322265625, -0.08628273010253906, -0.08086013793945312, -0.07543754577636719, -0.07001495361328125, -0.06459236145019531, -0.059169769287109375, -0.05374717712402344, -0.0483245849609375, -0.04290199279785156, -0.037479400634765625, -0.03205680847167969, -0.02663421630859375, -0.021211624145507812, -0.015789031982421875, -0.010366439819335938, -0.00494384765625, 0.0004787445068359375, 0.005901336669921875, 0.011323928833007812, 0.01674652099609375, 0.022169113159179688, 0.027591705322265625, 0.03301429748535156, 0.0384368896484375, 0.04385948181152344, 0.049282073974609375, 0.05470466613769531, 0.06012725830078125, 0.06554985046386719, 0.07097244262695312, 0.07639503479003906, 0.081817626953125, 0.08724021911621094, 0.09266281127929688, 0.09808540344238281, 0.10350799560546875, 0.10893058776855469, 0.11435317993164062, 0.11977577209472656, 0.1251983642578125, 0.13062095642089844, 0.13604354858398438, 0.1414661407470703, 0.14688873291015625, 0.1523113250732422, 0.15773391723632812, 0.16315650939941406, 0.1685791015625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 4.0, 4.0, 8.0, 47.0, 106.0, 225.0, 292.0, 178.0, 89.0, 26.0, 12.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.987371444702148, -9.73983383178711, -9.492295265197754, -9.244757652282715, -8.99721908569336, -8.74968147277832, -8.502142906188965, -8.254605293273926, -8.00706672668457, -7.759528636932373, -7.511990547180176, -7.2644524574279785, -7.016914367675781, -6.769376277923584, -6.521838188171387, -6.2743000984191895, -6.026762008666992, -5.779223918914795, -5.531685829162598, -5.2841477394104, -5.036609649658203, -4.789071559906006, -4.541533470153809, -4.293995380401611, -4.046457767486572, -3.798919677734375, -3.5513815879821777, -3.3038434982299805, -3.056305408477783, -2.808767318725586, -2.5612292289733887, -2.3136911392211914, -2.066153049468994, -1.8186149597167969, -1.5710768699645996, -1.3235387802124023, -1.076000690460205, -0.8284627199172974, -0.5809246301651001, -0.33338654041290283, -0.08584845066070557, 0.1616896241903305, 0.4092276990413666, 0.6567657589912415, 0.9043038487434387, 1.1518418788909912, 1.3993799686431885, 1.6469180583953857, 1.894456148147583, 2.1419942378997803, 2.3895323276519775, 2.637070417404175, 2.884608507156372, 3.1321463584899902, 3.3796844482421875, 3.6272225379943848, 3.874760627746582, 4.122298717498779, 4.369836807250977, 4.617374897003174, 4.864912986755371, 5.112451076507568, 5.359989166259766, 5.607527256011963, 5.85506534576416]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 6.0, 8.0, 17.0, 25.0, 24.0, 23.0, 30.0, 27.0, 27.0, 43.0, 40.0, 41.0, 39.0, 71.0, 46.0, 65.0, 57.0, 51.0, 50.0, 38.0, 44.0, 27.0, 33.0, 28.0, 23.0, 17.0, 19.0, 16.0, 10.0, 13.0, 6.0, 9.0, 5.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9872527122497559, -1.9145749807357788, -1.8418972492218018, -1.7692193984985352, -1.696541666984558, -1.623863935470581, -1.551186203956604, -1.478508472442627, -1.4058306217193604, -1.3331528902053833, -1.2604751586914062, -1.1877973079681396, -1.1151195764541626, -1.0424418449401855, -0.9697641134262085, -0.8970863223075867, -0.8244086503982544, -0.7517309188842773, -0.6790531277656555, -0.6063753962516785, -0.5336976051330566, -0.4610198736190796, -0.38834214210510254, -0.3156643509864807, -0.24298661947250366, -0.17030885815620422, -0.09763111174106598, -0.024953365325927734, 0.047724395990371704, 0.12040215730667114, 0.1930798888206482, 0.26575767993927, 0.33843541145324707, 0.4111131727695465, 0.48379093408584595, 0.556468665599823, 0.6291464567184448, 0.7018241882324219, 0.7745019197463989, 0.8471797108650208, 0.9198574423789978, 0.9925351738929749, 1.0652129650115967, 1.1378906965255737, 1.2105684280395508, 1.2832462787628174, 1.3559238910675049, 1.4286017417907715, 1.5012794733047485, 1.5739572048187256, 1.6466349363327026, 1.7193126678466797, 1.7919905185699463, 1.8646682500839233, 1.9373459815979004, 2.010023832321167, 2.0827014446258545, 2.155379295349121, 2.2280569076538086, 2.300734758377075, 2.3734123706817627, 2.4460902214050293, 2.518767833709717, 2.5914456844329834, 2.66412353515625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 6.0, 3.0, 3.0, 3.0, 14.0, 22.0, 33.0, 60.0, 108.0, 218.0, 472.0, 975.0, 2346.0, 6184.0, 19754.0, 98580.0, 3238607.0, 754723.0, 52427.0, 12491.0, 4094.0, 1604.0, 681.0, 341.0, 186.0, 93.0, 75.0, 38.0, 25.0, 16.0, 28.0, 11.0, 9.0, 9.0, 12.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.244384765625, -0.23265457153320312, -0.22092437744140625, -0.20919418334960938, -0.1974639892578125, -0.18573379516601562, -0.17400360107421875, -0.16227340698242188, -0.150543212890625, -0.13881301879882812, -0.12708282470703125, -0.11535263061523438, -0.1036224365234375, -0.09189224243164062, -0.08016204833984375, -0.06843185424804688, -0.05670166015625, -0.044971466064453125, -0.03324127197265625, -0.021511077880859375, -0.0097808837890625, 0.001949310302734375, 0.01367950439453125, 0.025409698486328125, 0.037139892578125, 0.048870086669921875, 0.06060028076171875, 0.07233047485351562, 0.0840606689453125, 0.09579086303710938, 0.10752105712890625, 0.11925125122070312, 0.1309814453125, 0.14271163940429688, 0.15444183349609375, 0.16617202758789062, 0.1779022216796875, 0.18963241577148438, 0.20136260986328125, 0.21309280395507812, 0.224822998046875, 0.23655319213867188, 0.24828338623046875, 0.2600135803222656, 0.2717437744140625, 0.2834739685058594, 0.29520416259765625, 0.3069343566894531, 0.31866455078125, 0.3303947448730469, 0.34212493896484375, 0.3538551330566406, 0.3655853271484375, 0.3773155212402344, 0.38904571533203125, 0.4007759094238281, 0.412506103515625, 0.4242362976074219, 0.43596649169921875, 0.4476966857910156, 0.4594268798828125, 0.4711570739746094, 0.48288726806640625, 0.4946174621582031, 0.50634765625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 8.0, 9.0, 17.0, 18.0, 41.0, 55.0, 66.0, 86.0, 97.0, 130.0, 122.0, 97.0, 83.0, 67.0, 49.0, 27.0, 17.0, 14.0, 5.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10955810546875, -0.10167407989501953, -0.09379005432128906, -0.0859060287475586, -0.07802200317382812, -0.07013797760009766, -0.06225395202636719, -0.05436992645263672, -0.04648590087890625, -0.03860187530517578, -0.030717849731445312, -0.022833824157714844, -0.014949798583984375, -0.007065773010253906, 0.0008182525634765625, 0.008702278137207031, 0.0165863037109375, 0.02447032928466797, 0.03235435485839844, 0.040238380432128906, 0.048122406005859375, 0.056006431579589844, 0.06389045715332031, 0.07177448272705078, 0.07965850830078125, 0.08754253387451172, 0.09542655944824219, 0.10331058502197266, 0.11119461059570312, 0.1190786361694336, 0.12696266174316406, 0.13484668731689453, 0.142730712890625, 0.15061473846435547, 0.15849876403808594, 0.1663827896118164, 0.17426681518554688, 0.18215084075927734, 0.1900348663330078, 0.19791889190673828, 0.20580291748046875, 0.21368694305419922, 0.2215709686279297, 0.22945499420166016, 0.23733901977539062, 0.2452230453491211, 0.25310707092285156, 0.26099109649658203, 0.2688751220703125, 0.27675914764404297, 0.28464317321777344, 0.2925271987915039, 0.3004112243652344, 0.30829524993896484, 0.3161792755126953, 0.3240633010864258, 0.33194732666015625, 0.3398313522338867, 0.3477153778076172, 0.35559940338134766, 0.3634834289550781, 0.3713674545288086, 0.37925148010253906, 0.38713550567626953, 0.39501953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 4.0, 10.0, 18.0, 19.0, 30.0, 77.0, 116.0, 184.0, 287.0, 485.0, 967.0, 1932.0, 4475.0, 12118.0, 44693.0, 398143.0, 3516454.0, 169848.0, 28921.0, 8875.0, 3339.0, 1506.0, 777.0, 410.0, 227.0, 127.0, 102.0, 44.0, 33.0, 21.0, 12.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6435546875, -0.6263236999511719, -0.6090927124023438, -0.5918617248535156, -0.5746307373046875, -0.5573997497558594, -0.5401687622070312, -0.5229377746582031, -0.505706787109375, -0.4884757995605469, -0.47124481201171875, -0.4540138244628906, -0.4367828369140625, -0.4195518493652344, -0.40232086181640625, -0.3850898742675781, -0.36785888671875, -0.3506278991699219, -0.33339691162109375, -0.3161659240722656, -0.2989349365234375, -0.2817039489746094, -0.26447296142578125, -0.24724197387695312, -0.230010986328125, -0.21277999877929688, -0.19554901123046875, -0.17831802368164062, -0.1610870361328125, -0.14385604858398438, -0.12662506103515625, -0.10939407348632812, -0.0921630859375, -0.07493209838867188, -0.05770111083984375, -0.040470123291015625, -0.0232391357421875, -0.006008148193359375, 0.01122283935546875, 0.028453826904296875, 0.045684814453125, 0.06291580200195312, 0.08014678955078125, 0.09737777709960938, 0.1146087646484375, 0.13183975219726562, 0.14907073974609375, 0.16630172729492188, 0.18353271484375, 0.20076370239257812, 0.21799468994140625, 0.23522567749023438, 0.2524566650390625, 0.2696876525878906, 0.28691864013671875, 0.3041496276855469, 0.321380615234375, 0.3386116027832031, 0.35584259033203125, 0.3730735778808594, 0.3903045654296875, 0.4075355529785156, 0.42476654052734375, 0.4419975280761719, 0.459228515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 7.0, 5.0, 11.0, 12.0, 15.0, 26.0, 52.0, 71.0, 157.0, 315.0, 814.0, 1524.0, 549.0, 220.0, 92.0, 75.0, 40.0, 29.0, 18.0, 11.0, 8.0, 3.0, 2.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6777496337890625, -0.656768798828125, -0.6357879638671875, -0.61480712890625, -0.5938262939453125, -0.572845458984375, -0.5518646240234375, -0.5308837890625, -0.5099029541015625, -0.488922119140625, -0.4679412841796875, -0.44696044921875, -0.4259796142578125, -0.404998779296875, -0.3840179443359375, -0.363037109375, -0.3420562744140625, -0.321075439453125, -0.3000946044921875, -0.27911376953125, -0.2581329345703125, -0.237152099609375, -0.2161712646484375, -0.1951904296875, -0.1742095947265625, -0.153228759765625, -0.1322479248046875, -0.11126708984375, -0.0902862548828125, -0.069305419921875, -0.0483245849609375, -0.02734375, -0.0063629150390625, 0.014617919921875, 0.0355987548828125, 0.05657958984375, 0.0775604248046875, 0.098541259765625, 0.1195220947265625, 0.1405029296875, 0.1614837646484375, 0.182464599609375, 0.2034454345703125, 0.22442626953125, 0.2454071044921875, 0.266387939453125, 0.2873687744140625, 0.308349609375, 0.3293304443359375, 0.350311279296875, 0.3712921142578125, 0.39227294921875, 0.4132537841796875, 0.434234619140625, 0.4552154541015625, 0.4761962890625, 0.4971771240234375, 0.518157958984375, 0.5391387939453125, 0.56011962890625, 0.5811004638671875, 0.602081298828125, 0.6230621337890625, 0.64404296875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 34.0, 164.0, 471.0, 262.0, 36.0, 15.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.789292335510254, -9.408763885498047, -9.02823543548584, -8.647706985473633, -8.267179489135742, -7.886651039123535, -7.506122589111328, -7.125594139099121, -6.745066165924072, -6.364537715911865, -5.984009742736816, -5.603481292724609, -5.222952842712402, -4.8424248695373535, -4.4618964195251465, -4.081368446350098, -3.7008399963378906, -3.3203117847442627, -2.9397835731506348, -2.5592551231384277, -2.1787269115448, -1.7981986999511719, -1.4176702499389648, -1.037142038345337, -0.656613826751709, -0.2760855555534363, 0.10444271564483643, 0.4849710464477539, 0.8654992580413818, 1.2460274696350098, 1.6265559196472168, 2.0070841312408447, 2.387613296508789, 2.768141508102417, 3.148669719696045, 3.529198169708252, 3.90972638130188, 4.290254592895508, 4.670783042907715, 5.051311492919922, 5.431839466094971, 5.812367916107178, 6.192895889282227, 6.573424339294434, 6.953952789306641, 7.3344807624816895, 7.7150092124938965, 8.095537185668945, 8.476065635681152, 8.85659408569336, 9.237122535705566, 9.617650985717773, 9.998178482055664, 10.378706932067871, 10.759235382080078, 11.139763832092285, 11.520292282104492, 11.9008207321167, 12.281349182128906, 12.661876678466797, 13.042405128479004, 13.422933578491211, 13.803462028503418, 14.183990478515625, 14.564517974853516]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 9.0, 7.0, 4.0, 13.0, 23.0, 29.0, 20.0, 34.0, 41.0, 52.0, 66.0, 65.0, 53.0, 69.0, 66.0, 71.0, 46.0, 58.0, 54.0, 44.0, 43.0, 37.0, 15.0, 15.0, 18.0, 11.0, 18.0, 10.0, 2.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.178518295288086, -3.0744235515594482, -2.9703288078308105, -2.866234064102173, -2.762139320373535, -2.6580445766448975, -2.5539498329162598, -2.449855089187622, -2.3457603454589844, -2.2416656017303467, -2.137570858001709, -2.0334761142730713, -1.9293813705444336, -1.825286626815796, -1.7211918830871582, -1.6170971393585205, -1.5130023956298828, -1.4089076519012451, -1.3048129081726074, -1.2007181644439697, -1.096623420715332, -0.9925286769866943, -0.8884339332580566, -0.784339189529419, -0.6802444458007812, -0.5761497020721436, -0.47205495834350586, -0.36796021461486816, -0.26386547088623047, -0.15977072715759277, -0.05567598342895508, 0.04841876029968262, 0.1525135040283203, 0.256608247756958, 0.3607029914855957, 0.4647977352142334, 0.5688924789428711, 0.6729872226715088, 0.7770819664001465, 0.8811767101287842, 0.9852714538574219, 1.0893661975860596, 1.1934609413146973, 1.297555685043335, 1.4016504287719727, 1.5057451725006104, 1.609839916229248, 1.7139346599578857, 1.8180294036865234, 1.9221241474151611, 2.026218891143799, 2.1303136348724365, 2.234408378601074, 2.338503122329712, 2.4425978660583496, 2.5466926097869873, 2.650787353515625, 2.7548820972442627, 2.8589768409729004, 2.963071584701538, 3.067166328430176, 3.1712610721588135, 3.275355815887451, 3.379450559616089, 3.4835453033447266]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 5.0, 14.0, 10.0, 20.0, 28.0, 74.0, 156.0, 341.0, 709.0, 1821.0, 5794.0, 23256.0, 146831.0, 680391.0, 155493.0, 24297.0, 6009.0, 1894.0, 740.0, 323.0, 163.0, 80.0, 44.0, 25.0, 17.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.86328125, -0.8408660888671875, -0.818450927734375, -0.7960357666015625, -0.77362060546875, -0.7512054443359375, -0.728790283203125, -0.7063751220703125, -0.6839599609375, -0.6615447998046875, -0.639129638671875, -0.6167144775390625, -0.59429931640625, -0.5718841552734375, -0.549468994140625, -0.5270538330078125, -0.504638671875, -0.4822235107421875, -0.459808349609375, -0.4373931884765625, -0.41497802734375, -0.3925628662109375, -0.370147705078125, -0.3477325439453125, -0.3253173828125, -0.3029022216796875, -0.280487060546875, -0.2580718994140625, -0.23565673828125, -0.2132415771484375, -0.190826416015625, -0.1684112548828125, -0.14599609375, -0.1235809326171875, -0.101165771484375, -0.0787506103515625, -0.05633544921875, -0.0339202880859375, -0.011505126953125, 0.0109100341796875, 0.0333251953125, 0.0557403564453125, 0.078155517578125, 0.1005706787109375, 0.12298583984375, 0.1454010009765625, 0.167816162109375, 0.1902313232421875, 0.212646484375, 0.2350616455078125, 0.257476806640625, 0.2798919677734375, 0.30230712890625, 0.3247222900390625, 0.347137451171875, 0.3695526123046875, 0.3919677734375, 0.4143829345703125, 0.436798095703125, 0.4592132568359375, 0.48162841796875, 0.5040435791015625, 0.526458740234375, 0.5488739013671875, 0.5712890625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 9.0, 11.0, 9.0, 15.0, 26.0, 28.0, 44.0, 42.0, 37.0, 53.0, 69.0, 63.0, 78.0, 67.0, 73.0, 72.0, 69.0, 48.0, 41.0, 35.0, 23.0, 26.0, 19.0, 18.0, 8.0, 5.0, 9.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1527099609375, -0.14665603637695312, -0.14060211181640625, -0.13454818725585938, -0.1284942626953125, -0.12244033813476562, -0.11638641357421875, -0.11033248901367188, -0.104278564453125, -0.09822463989257812, -0.09217071533203125, -0.08611679077148438, -0.0800628662109375, -0.07400894165039062, -0.06795501708984375, -0.061901092529296875, -0.05584716796875, -0.049793243408203125, -0.04373931884765625, -0.037685394287109375, -0.0316314697265625, -0.025577545166015625, -0.01952362060546875, -0.013469696044921875, -0.007415771484375, -0.001361846923828125, 0.00469207763671875, 0.010746002197265625, 0.0167999267578125, 0.022853851318359375, 0.02890777587890625, 0.034961700439453125, 0.041015625, 0.047069549560546875, 0.05312347412109375, 0.059177398681640625, 0.0652313232421875, 0.07128524780273438, 0.07733917236328125, 0.08339309692382812, 0.089447021484375, 0.09550094604492188, 0.10155487060546875, 0.10760879516601562, 0.1136627197265625, 0.11971664428710938, 0.12577056884765625, 0.13182449340820312, 0.13787841796875, 0.14393234252929688, 0.14998626708984375, 0.15604019165039062, 0.1620941162109375, 0.16814804077148438, 0.17420196533203125, 0.18025588989257812, 0.186309814453125, 0.19236373901367188, 0.19841766357421875, 0.20447158813476562, 0.2105255126953125, 0.21657943725585938, 0.22263336181640625, 0.22868728637695312, 0.2347412109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 11.0, 13.0, 37.0, 36.0, 50.0, 84.0, 148.0, 266.0, 426.0, 903.0, 1959.0, 5621.0, 23261.0, 171317.0, 731280.0, 91078.0, 14785.0, 4009.0, 1515.0, 735.0, 367.0, 227.0, 144.0, 72.0, 56.0, 46.0, 21.0, 17.0, 11.0, 8.0, 8.0, 8.0, 4.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7666015625, -0.742156982421875, -0.71771240234375, -0.693267822265625, -0.6688232421875, -0.644378662109375, -0.61993408203125, -0.595489501953125, -0.571044921875, -0.546600341796875, -0.52215576171875, -0.497711181640625, -0.4732666015625, -0.448822021484375, -0.42437744140625, -0.399932861328125, -0.37548828125, -0.351043701171875, -0.32659912109375, -0.302154541015625, -0.2777099609375, -0.253265380859375, -0.22882080078125, -0.204376220703125, -0.179931640625, -0.155487060546875, -0.13104248046875, -0.106597900390625, -0.0821533203125, -0.057708740234375, -0.03326416015625, -0.008819580078125, 0.015625, 0.040069580078125, 0.06451416015625, 0.088958740234375, 0.1134033203125, 0.137847900390625, 0.16229248046875, 0.186737060546875, 0.211181640625, 0.235626220703125, 0.26007080078125, 0.284515380859375, 0.3089599609375, 0.333404541015625, 0.35784912109375, 0.382293701171875, 0.40673828125, 0.431182861328125, 0.45562744140625, 0.480072021484375, 0.5045166015625, 0.528961181640625, 0.55340576171875, 0.577850341796875, 0.602294921875, 0.626739501953125, 0.65118408203125, 0.675628662109375, 0.7000732421875, 0.724517822265625, 0.74896240234375, 0.773406982421875, 0.7978515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 5.0, 8.0, 7.0, 7.0, 8.0, 22.0, 20.0, 26.0, 26.0, 27.0, 17.0, 41.0, 42.0, 47.0, 46.0, 44.0, 59.0, 60.0, 46.0, 58.0, 54.0, 43.0, 45.0, 36.0, 36.0, 29.0, 29.0, 28.0, 18.0, 7.0, 13.0, 8.0, 9.0, 5.0, 8.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68603515625, -0.664642333984375, -0.64324951171875, -0.621856689453125, -0.6004638671875, -0.579071044921875, -0.55767822265625, -0.536285400390625, -0.514892578125, -0.493499755859375, -0.47210693359375, -0.450714111328125, -0.4293212890625, -0.407928466796875, -0.38653564453125, -0.365142822265625, -0.34375, -0.322357177734375, -0.30096435546875, -0.279571533203125, -0.2581787109375, -0.236785888671875, -0.21539306640625, -0.194000244140625, -0.172607421875, -0.151214599609375, -0.12982177734375, -0.108428955078125, -0.0870361328125, -0.065643310546875, -0.04425048828125, -0.022857666015625, -0.00146484375, 0.019927978515625, 0.04132080078125, 0.062713623046875, 0.0841064453125, 0.105499267578125, 0.12689208984375, 0.148284912109375, 0.169677734375, 0.191070556640625, 0.21246337890625, 0.233856201171875, 0.2552490234375, 0.276641845703125, 0.29803466796875, 0.319427490234375, 0.3408203125, 0.362213134765625, 0.38360595703125, 0.404998779296875, 0.4263916015625, 0.447784423828125, 0.46917724609375, 0.490570068359375, 0.511962890625, 0.533355712890625, 0.55474853515625, 0.576141357421875, 0.5975341796875, 0.618927001953125, 0.64031982421875, 0.661712646484375, 0.68310546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 6.0, 9.0, 21.0, 33.0, 56.0, 63.0, 125.0, 255.0, 464.0, 1149.0, 4087.0, 29375.0, 760724.0, 234542.0, 13423.0, 2587.0, 839.0, 333.0, 172.0, 100.0, 59.0, 34.0, 28.0, 17.0, 26.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.445556640625, -0.4301033020019531, -0.41464996337890625, -0.3991966247558594, -0.3837432861328125, -0.3682899475097656, -0.35283660888671875, -0.3373832702636719, -0.321929931640625, -0.3064765930175781, -0.29102325439453125, -0.2755699157714844, -0.2601165771484375, -0.24466323852539062, -0.22920989990234375, -0.21375656127929688, -0.19830322265625, -0.18284988403320312, -0.16739654541015625, -0.15194320678710938, -0.1364898681640625, -0.12103652954101562, -0.10558319091796875, -0.09012985229492188, -0.074676513671875, -0.059223175048828125, -0.04376983642578125, -0.028316497802734375, -0.0128631591796875, 0.002590179443359375, 0.01804351806640625, 0.033496856689453125, 0.0489501953125, 0.06440353393554688, 0.07985687255859375, 0.09531021118164062, 0.1107635498046875, 0.12621688842773438, 0.14167022705078125, 0.15712356567382812, 0.172576904296875, 0.18803024291992188, 0.20348358154296875, 0.21893692016601562, 0.2343902587890625, 0.24984359741210938, 0.26529693603515625, 0.2807502746582031, 0.29620361328125, 0.3116569519042969, 0.32711029052734375, 0.3425636291503906, 0.3580169677734375, 0.3734703063964844, 0.38892364501953125, 0.4043769836425781, 0.419830322265625, 0.4352836608886719, 0.45073699951171875, 0.4661903381347656, 0.4816436767578125, 0.4970970153808594, 0.5125503540039062, 0.5280036926269531, 0.54345703125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 11.0, 13.0, 20.0, 21.0, 33.0, 53.0, 63.0, 85.0, 101.0, 124.0, 131.0, 92.0, 70.0, 35.0, 40.0, 19.0, 17.0, 16.0, 11.0, 6.0, 7.0, 5.0, 3.0, 6.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.488229751586914e-05, -4.306808114051819e-05, -4.1253864765167236e-05, -3.9439648389816284e-05, -3.762543201446533e-05, -3.581121563911438e-05, -3.399699926376343e-05, -3.2182782888412476e-05, -3.0368566513061523e-05, -2.855435013771057e-05, -2.674013376235962e-05, -2.4925917387008667e-05, -2.3111701011657715e-05, -2.1297484636306763e-05, -1.948326826095581e-05, -1.766905188560486e-05, -1.5854835510253906e-05, -1.4040619134902954e-05, -1.2226402759552002e-05, -1.041218638420105e-05, -8.597970008850098e-06, -6.7837536334991455e-06, -4.969537258148193e-06, -3.155320882797241e-06, -1.341104507446289e-06, 4.731118679046631e-07, 2.2873282432556152e-06, 4.101544618606567e-06, 5.9157609939575195e-06, 7.729977369308472e-06, 9.544193744659424e-06, 1.1358410120010376e-05, 1.3172626495361328e-05, 1.498684287071228e-05, 1.6801059246063232e-05, 1.8615275621414185e-05, 2.0429491996765137e-05, 2.224370837211609e-05, 2.405792474746704e-05, 2.5872141122817993e-05, 2.7686357498168945e-05, 2.9500573873519897e-05, 3.131479024887085e-05, 3.31290066242218e-05, 3.4943222999572754e-05, 3.6757439374923706e-05, 3.857165575027466e-05, 4.038587212562561e-05, 4.220008850097656e-05, 4.4014304876327515e-05, 4.582852125167847e-05, 4.764273762702942e-05, 4.945695400238037e-05, 5.127117037773132e-05, 5.3085386753082275e-05, 5.489960312843323e-05, 5.671381950378418e-05, 5.852803587913513e-05, 6.0342252254486084e-05, 6.215646862983704e-05, 6.397068500518799e-05, 6.578490138053894e-05, 6.759911775588989e-05, 6.941333413124084e-05, 7.12275505065918e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 7.0, 4.0, 9.0, 9.0, 16.0, 25.0, 39.0, 44.0, 80.0, 112.0, 195.0, 351.0, 649.0, 1456.0, 3881.0, 14519.0, 121780.0, 811426.0, 76844.0, 11250.0, 3261.0, 1238.0, 549.0, 296.0, 161.0, 103.0, 86.0, 33.0, 28.0, 28.0, 16.0, 9.0, 12.0, 3.0, 8.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.373046875, -0.3615379333496094, -0.35002899169921875, -0.3385200500488281, -0.3270111083984375, -0.3155021667480469, -0.30399322509765625, -0.2924842834472656, -0.280975341796875, -0.2694664001464844, -0.25795745849609375, -0.24644851684570312, -0.2349395751953125, -0.22343063354492188, -0.21192169189453125, -0.20041275024414062, -0.18890380859375, -0.17739486694335938, -0.16588592529296875, -0.15437698364257812, -0.1428680419921875, -0.13135910034179688, -0.11985015869140625, -0.10834121704101562, -0.096832275390625, -0.08532333374023438, -0.07381439208984375, -0.062305450439453125, -0.0507965087890625, -0.039287567138671875, -0.02777862548828125, -0.016269683837890625, -0.0047607421875, 0.006748199462890625, 0.01825714111328125, 0.029766082763671875, 0.0412750244140625, 0.052783966064453125, 0.06429290771484375, 0.07580184936523438, 0.087310791015625, 0.09881973266601562, 0.11032867431640625, 0.12183761596679688, 0.1333465576171875, 0.14485549926757812, 0.15636444091796875, 0.16787338256835938, 0.17938232421875, 0.19089126586914062, 0.20240020751953125, 0.21390914916992188, 0.2254180908203125, 0.23692703247070312, 0.24843597412109375, 0.2599449157714844, 0.271453857421875, 0.2829627990722656, 0.29447174072265625, 0.3059806823730469, 0.3174896240234375, 0.3289985656738281, 0.34050750732421875, 0.3520164489746094, 0.363525390625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 5.0, 1.0, 7.0, 9.0, 6.0, 11.0, 16.0, 34.0, 34.0, 46.0, 63.0, 74.0, 92.0, 120.0, 108.0, 94.0, 68.0, 53.0, 45.0, 25.0, 28.0, 10.0, 16.0, 8.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.294189453125, -0.2846412658691406, -0.27509307861328125, -0.2655448913574219, -0.2559967041015625, -0.24644851684570312, -0.23690032958984375, -0.22735214233398438, -0.217803955078125, -0.20825576782226562, -0.19870758056640625, -0.18915939331054688, -0.1796112060546875, -0.17006301879882812, -0.16051483154296875, -0.15096664428710938, -0.14141845703125, -0.13187026977539062, -0.12232208251953125, -0.11277389526367188, -0.1032257080078125, -0.09367752075195312, -0.08412933349609375, -0.07458114624023438, -0.065032958984375, -0.055484771728515625, -0.04593658447265625, -0.036388397216796875, -0.0268402099609375, -0.017292022705078125, -0.00774383544921875, 0.001804351806640625, 0.0113525390625, 0.020900726318359375, 0.03044891357421875, 0.039997100830078125, 0.0495452880859375, 0.059093475341796875, 0.06864166259765625, 0.07818984985351562, 0.087738037109375, 0.09728622436523438, 0.10683441162109375, 0.11638259887695312, 0.1259307861328125, 0.13547897338867188, 0.14502716064453125, 0.15457534790039062, 0.16412353515625, 0.17367172241210938, 0.18321990966796875, 0.19276809692382812, 0.2023162841796875, 0.21186447143554688, 0.22141265869140625, 0.23096084594726562, 0.240509033203125, 0.2500572204589844, 0.25960540771484375, 0.2691535949707031, 0.2787017822265625, 0.2882499694824219, 0.29779815673828125, 0.3073463439941406, 0.31689453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 8.0, 9.0, 38.0, 85.0, 113.0, 150.0, 232.0, 155.0, 91.0, 39.0, 31.0, 11.0, 10.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.218542098999023, -5.046980381011963, -4.875418663024902, -4.703856945037842, -4.532295227050781, -4.360733985900879, -4.18917179107666, -4.017610549926758, -3.8460488319396973, -3.6744871139526367, -3.502925395965576, -3.3313636779785156, -3.159802198410034, -2.9882404804229736, -2.816678762435913, -2.6451172828674316, -2.473555326461792, -2.3019936084747314, -2.130431890487671, -1.9588702917099, -1.787308692932129, -1.6157469749450684, -1.4441852569580078, -1.2726236581802368, -1.1010619401931763, -0.9295002818107605, -0.7579386234283447, -0.5863769054412842, -0.4148152470588684, -0.24325358867645264, -0.07169187068939209, 0.0998697280883789, 0.27143144607543945, 0.4429931044578552, 0.614554762840271, 0.7861164808273315, 0.9576781392097473, 1.129239797592163, 1.3008015155792236, 1.4723631143569946, 1.6439248323440552, 1.8154865503311157, 1.9870481491088867, 2.1586098670959473, 2.330171585083008, 2.5017333030700684, 2.673295021057129, 2.8448565006256104, 3.016418218612671, 3.1879799365997314, 3.359541654586792, 3.5311031341552734, 3.702664852142334, 3.8742265701293945, 4.045788288116455, 4.217350006103516, 4.388911724090576, 4.560473442077637, 4.732035160064697, 4.903596878051758, 5.075158596038818, 5.246720314025879, 5.418281555175781, 5.589843273162842, 5.761404991149902]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 1.0, 5.0, 4.0, 2.0, 7.0, 8.0, 10.0, 15.0, 14.0, 20.0, 16.0, 29.0, 28.0, 42.0, 42.0, 48.0, 68.0, 58.0, 76.0, 82.0, 61.0, 49.0, 51.0, 40.0, 43.0, 28.0, 24.0, 30.0, 21.0, 13.0, 17.0, 12.0, 12.0, 6.0, 6.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.550157070159912, -2.4499804973602295, -2.349803924560547, -2.2496273517608643, -2.1494507789611816, -2.04927396774292, -1.9490973949432373, -1.8489208221435547, -1.748744249343872, -1.6485676765441895, -1.5483911037445068, -1.4482144117355347, -1.348037838935852, -1.2478612661361694, -1.1476845741271973, -1.0475080013275146, -0.947331428527832, -0.8471548557281494, -0.746978223323822, -0.6468015909194946, -0.546625018119812, -0.4464484453201294, -0.346271812915802, -0.2460951805114746, -0.145918607711792, -0.04574200510978699, 0.05443459749221802, 0.15461120009422302, 0.254787802696228, 0.35496437549591064, 0.45514100790023804, 0.5553176403045654, 0.655493974685669, 0.7556705474853516, 0.855847179889679, 0.9560238122940063, 1.056200385093689, 1.1563769578933716, 1.2565536499023438, 1.3567302227020264, 1.456906795501709, 1.5570833683013916, 1.6572599411010742, 1.7574366331100464, 1.857613205909729, 1.9577897787094116, 2.057966470718384, 2.1581430435180664, 2.258319616317749, 2.3584961891174316, 2.4586727619171143, 2.558849334716797, 2.6590261459350586, 2.759202480316162, 2.859379291534424, 2.9595558643341064, 3.059732437133789, 3.1599090099334717, 3.2600855827331543, 3.360262155532837, 3.4604387283325195, 3.5606155395507812, 3.660792112350464, 3.7609686851501465, 3.861145257949829]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 7.0, 15.0, 20.0, 36.0, 45.0, 80.0, 135.0, 267.0, 513.0, 967.0, 1930.0, 4276.0, 10498.0, 29198.0, 105966.0, 791529.0, 2836303.0, 318533.0, 61146.0, 19147.0, 7204.0, 3154.0, 1477.0, 767.0, 439.0, 254.0, 126.0, 82.0, 63.0, 30.0, 19.0, 21.0, 8.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2255859375, -0.21761703491210938, -0.20964813232421875, -0.20167922973632812, -0.1937103271484375, -0.18574142456054688, -0.17777252197265625, -0.16980361938476562, -0.161834716796875, -0.15386581420898438, -0.14589691162109375, -0.13792800903320312, -0.1299591064453125, -0.12199020385742188, -0.11402130126953125, -0.10605239868164062, -0.09808349609375, -0.09011459350585938, -0.08214569091796875, -0.07417678833007812, -0.0662078857421875, -0.058238983154296875, -0.05027008056640625, -0.042301177978515625, -0.034332275390625, -0.026363372802734375, -0.01839447021484375, -0.010425567626953125, -0.0024566650390625, 0.005512237548828125, 0.01348114013671875, 0.021450042724609375, 0.0294189453125, 0.037387847900390625, 0.04535675048828125, 0.053325653076171875, 0.0612945556640625, 0.06926345825195312, 0.07723236083984375, 0.08520126342773438, 0.093170166015625, 0.10113906860351562, 0.10910797119140625, 0.11707687377929688, 0.1250457763671875, 0.13301467895507812, 0.14098358154296875, 0.14895248413085938, 0.15692138671875, 0.16489028930664062, 0.17285919189453125, 0.18082809448242188, 0.1887969970703125, 0.19676589965820312, 0.20473480224609375, 0.21270370483398438, 0.220672607421875, 0.22864151000976562, 0.23661041259765625, 0.24457931518554688, 0.2525482177734375, 0.2605171203613281, 0.26848602294921875, 0.2764549255371094, 0.284423828125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 0.0, 2.0, 5.0, 5.0, 9.0, 17.0, 13.0, 18.0, 23.0, 20.0, 26.0, 36.0, 47.0, 58.0, 51.0, 50.0, 69.0, 65.0, 55.0, 55.0, 58.0, 53.0, 48.0, 41.0, 36.0, 31.0, 23.0, 18.0, 18.0, 8.0, 11.0, 10.0, 5.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1397705078125, -0.13523101806640625, -0.1306915283203125, -0.12615203857421875, -0.121612548828125, -0.11707305908203125, -0.1125335693359375, -0.10799407958984375, -0.10345458984375, -0.09891510009765625, -0.0943756103515625, -0.08983612060546875, -0.085296630859375, -0.08075714111328125, -0.0762176513671875, -0.07167816162109375, -0.067138671875, -0.06259918212890625, -0.0580596923828125, -0.05352020263671875, -0.048980712890625, -0.04444122314453125, -0.0399017333984375, -0.03536224365234375, -0.03082275390625, -0.02628326416015625, -0.0217437744140625, -0.01720428466796875, -0.012664794921875, -0.00812530517578125, -0.0035858154296875, 0.00095367431640625, 0.0054931640625, 0.01003265380859375, 0.0145721435546875, 0.01911163330078125, 0.023651123046875, 0.02819061279296875, 0.0327301025390625, 0.03726959228515625, 0.04180908203125, 0.04634857177734375, 0.0508880615234375, 0.05542755126953125, 0.059967041015625, 0.06450653076171875, 0.0690460205078125, 0.07358551025390625, 0.078125, 0.08266448974609375, 0.0872039794921875, 0.09174346923828125, 0.096282958984375, 0.10082244873046875, 0.1053619384765625, 0.10990142822265625, 0.11444091796875, 0.11898040771484375, 0.1235198974609375, 0.12805938720703125, 0.132598876953125, 0.13713836669921875, 0.1416778564453125, 0.14621734619140625, 0.1507568359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 8.0, 12.0, 12.0, 16.0, 29.0, 41.0, 92.0, 121.0, 292.0, 580.0, 1242.0, 3239.0, 10131.0, 41232.0, 318158.0, 3485689.0, 283261.0, 36229.0, 8738.0, 2855.0, 1157.0, 539.0, 251.0, 150.0, 81.0, 39.0, 33.0, 21.0, 12.0, 6.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45361328125, -0.437103271484375, -0.42059326171875, -0.404083251953125, -0.3875732421875, -0.371063232421875, -0.35455322265625, -0.338043212890625, -0.321533203125, -0.305023193359375, -0.28851318359375, -0.272003173828125, -0.2554931640625, -0.238983154296875, -0.22247314453125, -0.205963134765625, -0.189453125, -0.172943115234375, -0.15643310546875, -0.139923095703125, -0.1234130859375, -0.106903076171875, -0.09039306640625, -0.073883056640625, -0.057373046875, -0.040863037109375, -0.02435302734375, -0.007843017578125, 0.0086669921875, 0.025177001953125, 0.04168701171875, 0.058197021484375, 0.07470703125, 0.091217041015625, 0.10772705078125, 0.124237060546875, 0.1407470703125, 0.157257080078125, 0.17376708984375, 0.190277099609375, 0.206787109375, 0.223297119140625, 0.23980712890625, 0.256317138671875, 0.2728271484375, 0.289337158203125, 0.30584716796875, 0.322357177734375, 0.3388671875, 0.355377197265625, 0.37188720703125, 0.388397216796875, 0.4049072265625, 0.421417236328125, 0.43792724609375, 0.454437255859375, 0.470947265625, 0.487457275390625, 0.50396728515625, 0.520477294921875, 0.5369873046875, 0.553497314453125, 0.57000732421875, 0.586517333984375, 0.60302734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 3.0, 2.0, 4.0, 9.0, 5.0, 11.0, 7.0, 14.0, 18.0, 23.0, 37.0, 33.0, 41.0, 86.0, 78.0, 170.0, 269.0, 476.0, 792.0, 783.0, 425.0, 251.0, 152.0, 118.0, 74.0, 54.0, 35.0, 30.0, 22.0, 12.0, 10.0, 6.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429443359375, -0.4145927429199219, -0.39974212646484375, -0.3848915100097656, -0.3700408935546875, -0.3551902770996094, -0.34033966064453125, -0.3254890441894531, -0.310638427734375, -0.2957878112792969, -0.28093719482421875, -0.2660865783691406, -0.2512359619140625, -0.23638534545898438, -0.22153472900390625, -0.20668411254882812, -0.19183349609375, -0.17698287963867188, -0.16213226318359375, -0.14728164672851562, -0.1324310302734375, -0.11758041381835938, -0.10272979736328125, -0.08787918090820312, -0.073028564453125, -0.058177947998046875, -0.04332733154296875, -0.028476715087890625, -0.0136260986328125, 0.001224517822265625, 0.01607513427734375, 0.030925750732421875, 0.0457763671875, 0.060626983642578125, 0.07547760009765625, 0.09032821655273438, 0.1051788330078125, 0.12002944946289062, 0.13488006591796875, 0.14973068237304688, 0.164581298828125, 0.17943191528320312, 0.19428253173828125, 0.20913314819335938, 0.2239837646484375, 0.23883438110351562, 0.25368499755859375, 0.2685356140136719, 0.28338623046875, 0.2982368469238281, 0.31308746337890625, 0.3279380798339844, 0.3427886962890625, 0.3576393127441406, 0.37248992919921875, 0.3873405456542969, 0.402191162109375, 0.4170417785644531, 0.43189239501953125, 0.4467430114746094, 0.4615936279296875, 0.4764442443847656, 0.49129486083984375, 0.5061454772949219, 0.52099609375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 9.0, 18.0, 37.0, 99.0, 200.0, 261.0, 200.0, 83.0, 39.0, 19.0, 10.0, 0.0, 0.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.507318496704102, -5.313638687133789, -5.119959354400635, -4.926279544830322, -4.732600212097168, -4.5389204025268555, -4.345241069793701, -4.151561260223389, -3.9578819274902344, -3.764202356338501, -3.5705227851867676, -3.376843214035034, -3.183163642883301, -2.9894840717315674, -2.795804500579834, -2.6021246910095215, -2.408445119857788, -2.2147655487060547, -2.0210859775543213, -1.827406406402588, -1.6337268352508545, -1.440047264099121, -1.2463675737380981, -1.0526880025863647, -0.8590084314346313, -0.665328860282898, -0.47164925932884216, -0.2779696583747864, -0.08429008722305298, 0.10938948392868042, 0.3030691146850586, 0.496748685836792, 0.6904282569885254, 0.8841078281402588, 1.0777873992919922, 1.2714669704437256, 1.465146541595459, 1.6588261127471924, 1.8525058031082153, 2.0461854934692383, 2.2398648262023926, 2.433544397354126, 2.6272239685058594, 2.8209035396575928, 3.014583110809326, 3.2082626819610596, 3.401942253112793, 3.5956220626831055, 3.789301633834839, 3.9829812049865723, 4.176661014556885, 4.370340347290039, 4.564020156860352, 4.757699489593506, 4.951379299163818, 5.145058631896973, 5.338738441467285, 5.532418251037598, 5.726097583770752, 5.9197773933410645, 6.113456726074219, 6.307136535644531, 6.5008158683776855, 6.694495677947998, 6.888175010681152]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 2.0, 4.0, 4.0, 8.0, 8.0, 9.0, 12.0, 23.0, 22.0, 24.0, 25.0, 27.0, 35.0, 30.0, 35.0, 48.0, 39.0, 52.0, 50.0, 59.0, 58.0, 51.0, 44.0, 53.0, 43.0, 32.0, 28.0, 30.0, 15.0, 31.0, 23.0, 18.0, 10.0, 9.0, 9.0, 5.0, 3.0, 5.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.3649065494537354, -2.2884933948516846, -2.212080478668213, -2.135667324066162, -2.0592544078826904, -1.9828412532806396, -1.9064282178878784, -1.8300151824951172, -1.753602147102356, -1.6771891117095947, -1.6007760763168335, -1.5243630409240723, -1.4479498863220215, -1.3715369701385498, -1.295123815536499, -1.2187107801437378, -1.1422977447509766, -1.0658847093582153, -0.9894716739654541, -0.9130585789680481, -0.8366455435752869, -0.7602325081825256, -0.6838194131851196, -0.6074063777923584, -0.5309933423995972, -0.45458030700683594, -0.3781672418117523, -0.3017541766166687, -0.22534114122390747, -0.14892810583114624, -0.07251504063606262, 0.003898024559020996, 0.08031129837036133, 0.15672434866428375, 0.23313739895820618, 0.3095504641532898, 0.385963499546051, 0.46237653493881226, 0.5387896299362183, 0.6152026653289795, 0.6916157007217407, 0.768028736114502, 0.8444417715072632, 0.9208548665046692, 0.9972679018974304, 1.0736808776855469, 1.1500940322875977, 1.2265070676803589, 1.3029201030731201, 1.3793331384658813, 1.4557461738586426, 1.5321592092514038, 1.608572244644165, 1.6849853992462158, 1.761398434638977, 1.8378114700317383, 1.9142245054244995, 1.9906375408172607, 2.0670506954193115, 2.143463611602783, 2.219876766204834, 2.2962896823883057, 2.3727028369903564, 2.449115753173828, 2.525528907775879]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 6.0, 8.0, 17.0, 17.0, 21.0, 32.0, 59.0, 84.0, 139.0, 203.0, 274.0, 534.0, 771.0, 1214.0, 2089.0, 3597.0, 6469.0, 12035.0, 23965.0, 50311.0, 108405.0, 236776.0, 305206.0, 155183.0, 70908.0, 33500.0, 16435.0, 8623.0, 4735.0, 2736.0, 1557.0, 932.0, 614.0, 363.0, 222.0, 171.0, 105.0, 85.0, 46.0, 43.0, 20.0, 11.0, 14.0, 13.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2646484375, -0.2558937072753906, -0.24713897705078125, -0.23838424682617188, -0.2296295166015625, -0.22087478637695312, -0.21212005615234375, -0.20336532592773438, -0.194610595703125, -0.18585586547851562, -0.17710113525390625, -0.16834640502929688, -0.1595916748046875, -0.15083694458007812, -0.14208221435546875, -0.13332748413085938, -0.12457275390625, -0.11581802368164062, -0.10706329345703125, -0.09830856323242188, -0.0895538330078125, -0.08079910278320312, -0.07204437255859375, -0.06328964233398438, -0.054534912109375, -0.045780181884765625, -0.03702545166015625, -0.028270721435546875, -0.0195159912109375, -0.010761260986328125, -0.00200653076171875, 0.006748199462890625, 0.0155029296875, 0.024257659912109375, 0.03301239013671875, 0.041767120361328125, 0.0505218505859375, 0.059276580810546875, 0.06803131103515625, 0.07678604125976562, 0.085540771484375, 0.09429550170898438, 0.10305023193359375, 0.11180496215820312, 0.1205596923828125, 0.12931442260742188, 0.13806915283203125, 0.14682388305664062, 0.15557861328125, 0.16433334350585938, 0.17308807373046875, 0.18184280395507812, 0.1905975341796875, 0.19935226440429688, 0.20810699462890625, 0.21686172485351562, 0.225616455078125, 0.23437118530273438, 0.24312591552734375, 0.2518806457519531, 0.2606353759765625, 0.2693901062011719, 0.27814483642578125, 0.2868995666503906, 0.295654296875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 5.0, 3.0, 13.0, 13.0, 26.0, 14.0, 30.0, 25.0, 22.0, 35.0, 36.0, 44.0, 38.0, 45.0, 46.0, 58.0, 68.0, 44.0, 43.0, 51.0, 43.0, 51.0, 45.0, 32.0, 31.0, 24.0, 16.0, 14.0, 14.0, 14.0, 10.0, 12.0, 6.0, 5.0, 1.0, 7.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1368408203125, -0.13260841369628906, -0.12837600708007812, -0.12414360046386719, -0.11991119384765625, -0.11567878723144531, -0.11144638061523438, -0.10721397399902344, -0.1029815673828125, -0.09874916076660156, -0.09451675415039062, -0.09028434753417969, -0.08605194091796875, -0.08181953430175781, -0.07758712768554688, -0.07335472106933594, -0.069122314453125, -0.06488990783691406, -0.060657501220703125, -0.05642509460449219, -0.05219268798828125, -0.04796028137207031, -0.043727874755859375, -0.03949546813964844, -0.0352630615234375, -0.031030654907226562, -0.026798248291015625, -0.022565841674804688, -0.01833343505859375, -0.014101028442382812, -0.009868621826171875, -0.0056362152099609375, -0.00140380859375, 0.0028285980224609375, 0.007061004638671875, 0.011293411254882812, 0.01552581787109375, 0.019758224487304688, 0.023990631103515625, 0.028223037719726562, 0.0324554443359375, 0.03668785095214844, 0.040920257568359375, 0.04515266418457031, 0.04938507080078125, 0.05361747741699219, 0.057849884033203125, 0.06208229064941406, 0.066314697265625, 0.07054710388183594, 0.07477951049804688, 0.07901191711425781, 0.08324432373046875, 0.08747673034667969, 0.09170913696289062, 0.09594154357910156, 0.1001739501953125, 0.10440635681152344, 0.10863876342773438, 0.11287117004394531, 0.11710357666015625, 0.12133598327636719, 0.12556838989257812, 0.12980079650878906, 0.134033203125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 12.0, 19.0, 28.0, 56.0, 111.0, 209.0, 456.0, 1197.0, 3770.0, 24701.0, 821894.0, 182599.0, 9773.0, 2254.0, 756.0, 384.0, 151.0, 92.0, 36.0, 25.0, 9.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0331878662109375, -0.993133544921875, -0.9530792236328125, -0.91302490234375, -0.8729705810546875, -0.832916259765625, -0.7928619384765625, -0.7528076171875, -0.7127532958984375, -0.672698974609375, -0.6326446533203125, -0.59259033203125, -0.5525360107421875, -0.512481689453125, -0.4724273681640625, -0.432373046875, -0.3923187255859375, -0.352264404296875, -0.3122100830078125, -0.27215576171875, -0.2321014404296875, -0.192047119140625, -0.1519927978515625, -0.1119384765625, -0.0718841552734375, -0.031829833984375, 0.0082244873046875, 0.04827880859375, 0.0883331298828125, 0.128387451171875, 0.1684417724609375, 0.20849609375, 0.2485504150390625, 0.288604736328125, 0.3286590576171875, 0.36871337890625, 0.4087677001953125, 0.448822021484375, 0.4888763427734375, 0.5289306640625, 0.5689849853515625, 0.609039306640625, 0.6490936279296875, 0.68914794921875, 0.7292022705078125, 0.769256591796875, 0.8093109130859375, 0.849365234375, 0.8894195556640625, 0.929473876953125, 0.9695281982421875, 1.00958251953125, 1.0496368408203125, 1.089691162109375, 1.1297454833984375, 1.1697998046875, 1.2098541259765625, 1.249908447265625, 1.2899627685546875, 1.33001708984375, 1.3700714111328125, 1.410125732421875, 1.4501800537109375, 1.490234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 5.0, 8.0, 13.0, 16.0, 19.0, 30.0, 34.0, 41.0, 44.0, 62.0, 58.0, 73.0, 58.0, 67.0, 70.0, 56.0, 55.0, 58.0, 52.0, 45.0, 26.0, 18.0, 19.0, 15.0, 14.0, 10.0, 8.0, 9.0, 2.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80615234375, -0.7789840698242188, -0.7518157958984375, -0.7246475219726562, -0.697479248046875, -0.6703109741210938, -0.6431427001953125, -0.6159744262695312, -0.58880615234375, -0.5616378784179688, -0.5344696044921875, -0.5073013305664062, -0.480133056640625, -0.45296478271484375, -0.4257965087890625, -0.39862823486328125, -0.3714599609375, -0.34429168701171875, -0.3171234130859375, -0.28995513916015625, -0.262786865234375, -0.23561859130859375, -0.2084503173828125, -0.18128204345703125, -0.15411376953125, -0.12694549560546875, -0.0997772216796875, -0.07260894775390625, -0.045440673828125, -0.01827239990234375, 0.0088958740234375, 0.03606414794921875, 0.063232421875, 0.09040069580078125, 0.1175689697265625, 0.14473724365234375, 0.171905517578125, 0.19907379150390625, 0.2262420654296875, 0.25341033935546875, 0.28057861328125, 0.30774688720703125, 0.3349151611328125, 0.36208343505859375, 0.389251708984375, 0.41641998291015625, 0.4435882568359375, 0.47075653076171875, 0.4979248046875, 0.5250930786132812, 0.5522613525390625, 0.5794296264648438, 0.606597900390625, 0.6337661743164062, 0.6609344482421875, 0.6881027221679688, 0.71527099609375, 0.7424392700195312, 0.7696075439453125, 0.7967758178710938, 0.823944091796875, 0.8511123657226562, 0.8782806396484375, 0.9054489135742188, 0.9326171875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 7.0, 11.0, 13.0, 18.0, 33.0, 48.0, 58.0, 81.0, 138.0, 267.0, 410.0, 862.0, 1956.0, 6036.0, 31221.0, 325572.0, 625620.0, 44311.0, 7493.0, 2273.0, 926.0, 494.0, 261.0, 153.0, 112.0, 71.0, 38.0, 22.0, 17.0, 7.0, 9.0, 8.0, 4.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.188720703125, -0.18054580688476562, -0.17237091064453125, -0.16419601440429688, -0.1560211181640625, -0.14784622192382812, -0.13967132568359375, -0.13149642944335938, -0.123321533203125, -0.11514663696289062, -0.10697174072265625, -0.09879684448242188, -0.0906219482421875, -0.08244705200195312, -0.07427215576171875, -0.06609725952148438, -0.05792236328125, -0.049747467041015625, -0.04157257080078125, -0.033397674560546875, -0.0252227783203125, -0.017047882080078125, -0.00887298583984375, -0.000698089599609375, 0.007476806640625, 0.015651702880859375, 0.02382659912109375, 0.032001495361328125, 0.0401763916015625, 0.048351287841796875, 0.05652618408203125, 0.06470108032226562, 0.0728759765625, 0.08105087280273438, 0.08922576904296875, 0.09740066528320312, 0.1055755615234375, 0.11375045776367188, 0.12192535400390625, 0.13010025024414062, 0.138275146484375, 0.14645004272460938, 0.15462493896484375, 0.16279983520507812, 0.1709747314453125, 0.17914962768554688, 0.18732452392578125, 0.19549942016601562, 0.20367431640625, 0.21184921264648438, 0.22002410888671875, 0.22819900512695312, 0.2363739013671875, 0.24454879760742188, 0.25272369384765625, 0.2608985900878906, 0.269073486328125, 0.2772483825683594, 0.28542327880859375, 0.2935981750488281, 0.3017730712890625, 0.3099479675292969, 0.31812286376953125, 0.3262977600097656, 0.33447265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 9.0, 6.0, 12.0, 10.0, 9.0, 11.0, 24.0, 25.0, 23.0, 40.0, 51.0, 71.0, 74.0, 110.0, 117.0, 104.0, 65.0, 56.0, 47.0, 29.0, 26.0, 20.0, 16.0, 15.0, 6.0, 7.0, 6.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.369020462036133e-05, -4.2137689888477325e-05, -4.058517515659332e-05, -3.903266042470932e-05, -3.748014569282532e-05, -3.5927630960941315e-05, -3.437511622905731e-05, -3.282260149717331e-05, -3.127008676528931e-05, -2.9717572033405304e-05, -2.81650573015213e-05, -2.66125425696373e-05, -2.5060027837753296e-05, -2.3507513105869293e-05, -2.195499837398529e-05, -2.0402483642101288e-05, -1.8849968910217285e-05, -1.7297454178333282e-05, -1.574493944644928e-05, -1.4192424714565277e-05, -1.2639909982681274e-05, -1.1087395250797272e-05, -9.534880518913269e-06, -7.982365787029266e-06, -6.429851055145264e-06, -4.877336323261261e-06, -3.3248215913772583e-06, -1.7723068594932556e-06, -2.1979212760925293e-07, 1.3327226042747498e-06, 2.8852373361587524e-06, 4.437752068042755e-06, 5.990266799926758e-06, 7.5427815318107605e-06, 9.095296263694763e-06, 1.0647810995578766e-05, 1.2200325727462769e-05, 1.3752840459346771e-05, 1.5305355191230774e-05, 1.6857869923114777e-05, 1.841038465499878e-05, 1.9962899386882782e-05, 2.1515414118766785e-05, 2.3067928850650787e-05, 2.462044358253479e-05, 2.6172958314418793e-05, 2.7725473046302795e-05, 2.9277987778186798e-05, 3.08305025100708e-05, 3.2383017241954803e-05, 3.3935531973838806e-05, 3.548804670572281e-05, 3.704056143760681e-05, 3.8593076169490814e-05, 4.014559090137482e-05, 4.169810563325882e-05, 4.325062036514282e-05, 4.4803135097026825e-05, 4.635564982891083e-05, 4.790816456079483e-05, 4.946067929267883e-05, 5.1013194024562836e-05, 5.256570875644684e-05, 5.411822348833084e-05, 5.5670738220214844e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 4.0, 5.0, 1.0, 2.0, 11.0, 11.0, 12.0, 16.0, 24.0, 46.0, 45.0, 54.0, 76.0, 150.0, 163.0, 271.0, 405.0, 745.0, 1221.0, 2581.0, 6673.0, 24045.0, 163907.0, 734595.0, 87775.0, 15820.0, 5038.0, 2074.0, 1002.0, 606.0, 366.0, 224.0, 136.0, 131.0, 86.0, 54.0, 44.0, 26.0, 14.0, 23.0, 18.0, 20.0, 9.0, 6.0, 7.0, 2.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.215087890625, -0.20844078063964844, -0.20179367065429688, -0.1951465606689453, -0.18849945068359375, -0.1818523406982422, -0.17520523071289062, -0.16855812072753906, -0.1619110107421875, -0.15526390075683594, -0.14861679077148438, -0.1419696807861328, -0.13532257080078125, -0.1286754608154297, -0.12202835083007812, -0.11538124084472656, -0.108734130859375, -0.10208702087402344, -0.09543991088867188, -0.08879280090332031, -0.08214569091796875, -0.07549858093261719, -0.06885147094726562, -0.06220436096191406, -0.0555572509765625, -0.04891014099121094, -0.042263031005859375, -0.03561592102050781, -0.02896881103515625, -0.022321701049804688, -0.015674591064453125, -0.009027481079101562, -0.00238037109375, 0.0042667388916015625, 0.010913848876953125, 0.017560958862304688, 0.02420806884765625, 0.030855178833007812, 0.037502288818359375, 0.04414939880371094, 0.0507965087890625, 0.05744361877441406, 0.06409072875976562, 0.07073783874511719, 0.07738494873046875, 0.08403205871582031, 0.09067916870117188, 0.09732627868652344, 0.103973388671875, 0.11062049865722656, 0.11726760864257812, 0.12391471862792969, 0.13056182861328125, 0.1372089385986328, 0.14385604858398438, 0.15050315856933594, 0.1571502685546875, 0.16379737854003906, 0.17044448852539062, 0.1770915985107422, 0.18373870849609375, 0.1903858184814453, 0.19703292846679688, 0.20368003845214844, 0.2103271484375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 5.0, 5.0, 10.0, 7.0, 16.0, 16.0, 11.0, 22.0, 24.0, 35.0, 57.0, 56.0, 65.0, 87.0, 83.0, 90.0, 86.0, 49.0, 54.0, 43.0, 33.0, 31.0, 17.0, 17.0, 15.0, 10.0, 10.0, 11.0, 6.0, 4.0, 6.0, 3.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.222412109375, -0.21569061279296875, -0.2089691162109375, -0.20224761962890625, -0.195526123046875, -0.18880462646484375, -0.1820831298828125, -0.17536163330078125, -0.16864013671875, -0.16191864013671875, -0.1551971435546875, -0.14847564697265625, -0.141754150390625, -0.13503265380859375, -0.1283111572265625, -0.12158966064453125, -0.1148681640625, -0.10814666748046875, -0.1014251708984375, -0.09470367431640625, -0.087982177734375, -0.08126068115234375, -0.0745391845703125, -0.06781768798828125, -0.06109619140625, -0.05437469482421875, -0.0476531982421875, -0.04093170166015625, -0.034210205078125, -0.02748870849609375, -0.0207672119140625, -0.01404571533203125, -0.00732421875, -0.00060272216796875, 0.0061187744140625, 0.01284027099609375, 0.019561767578125, 0.02628326416015625, 0.0330047607421875, 0.03972625732421875, 0.04644775390625, 0.05316925048828125, 0.0598907470703125, 0.06661224365234375, 0.073333740234375, 0.08005523681640625, 0.0867767333984375, 0.09349822998046875, 0.1002197265625, 0.10694122314453125, 0.1136627197265625, 0.12038421630859375, 0.127105712890625, 0.13382720947265625, 0.1405487060546875, 0.14727020263671875, 0.15399169921875, 0.16071319580078125, 0.1674346923828125, 0.17415618896484375, 0.180877685546875, 0.18759918212890625, 0.1943206787109375, 0.20104217529296875, 0.207763671875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 17.0, 36.0, 81.0, 128.0, 233.0, 200.0, 129.0, 78.0, 35.0, 20.0, 7.0, 9.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2071380615234375, -4.0379958152771, -3.868853807449341, -3.699711561203003, -3.530569553375244, -3.3614273071289062, -3.1922850608825684, -3.0231428146362305, -2.8540008068084717, -2.684858560562134, -2.515716552734375, -2.346574306488037, -2.177432060241699, -2.0082900524139404, -1.8391478061676025, -1.6700056791305542, -1.5008635520935059, -1.3317214250564575, -1.1625792980194092, -0.9934370517730713, -0.824294924736023, -0.6551527976989746, -0.4860105514526367, -0.3168684244155884, -0.14772629737854004, 0.02141585946083069, 0.19055801630020142, 0.35970020294189453, 0.5288423299789429, 0.6979844570159912, 0.8671267032623291, 1.0362688302993774, 1.2054109573364258, 1.3745530843734741, 1.5436952114105225, 1.7128374576568604, 1.8819795846939087, 2.051121711730957, 2.220263957977295, 2.389406204223633, 2.5585482120513916, 2.7276904582977295, 2.8968324661254883, 3.065974712371826, 3.235116958618164, 3.404258966445923, 3.5734012126922607, 3.7425432205200195, 3.9116854667663574, 4.080827713012695, 4.249969959259033, 4.419112205505371, 4.588253974914551, 4.757396221160889, 4.926538467407227, 5.0956807136535645, 5.264822959899902, 5.43396520614624, 5.603107452392578, 5.772249221801758, 5.941391468048096, 6.110533714294434, 6.2796759605407715, 6.448818206787109, 6.617959976196289]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 1.0, 4.0, 4.0, 1.0, 6.0, 5.0, 10.0, 11.0, 18.0, 26.0, 20.0, 23.0, 26.0, 37.0, 31.0, 40.0, 43.0, 54.0, 46.0, 75.0, 73.0, 46.0, 56.0, 39.0, 38.0, 36.0, 34.0, 28.0, 27.0, 21.0, 24.0, 17.0, 17.0, 19.0, 9.0, 8.0, 6.0, 6.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3175606727600098, -2.2391176223754883, -2.160674571990967, -2.0822315216064453, -2.003788471221924, -1.9253454208374023, -1.8469023704528809, -1.7684593200683594, -1.690016269683838, -1.6115732192993164, -1.533130168914795, -1.4546871185302734, -1.376244068145752, -1.2978010177612305, -1.219357967376709, -1.1409149169921875, -1.0624719858169556, -0.9840289354324341, -0.9055858850479126, -0.8271428346633911, -0.7486997842788696, -0.6702567338943481, -0.5918137431144714, -0.51337069272995, -0.43492764234542847, -0.356484591960907, -0.2780415415763855, -0.1995985209941864, -0.12115547060966492, -0.04271242022514343, 0.035730600357055664, 0.11417365074157715, 0.19261670112609863, 0.2710597515106201, 0.3495028018951416, 0.4279458224773407, 0.5063889026641846, 0.584831953048706, 0.6632749438285828, 0.7417179942131042, 0.8201610445976257, 0.8986040949821472, 0.9770471453666687, 1.0554901361465454, 1.133933186531067, 1.2123762369155884, 1.2908192873001099, 1.3692623376846313, 1.4477053880691528, 1.5261484384536743, 1.6045914888381958, 1.6830345392227173, 1.7614775896072388, 1.8399206399917603, 1.9183635711669922, 1.9968066215515137, 2.075249671936035, 2.1536927223205566, 2.232135772705078, 2.3105788230895996, 2.389021873474121, 2.4674649238586426, 2.545907974243164, 2.6243510246276855, 2.702794075012207]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 13.0, 11.0, 20.0, 29.0, 33.0, 53.0, 82.0, 114.0, 176.0, 281.0, 386.0, 602.0, 997.0, 1630.0, 2977.0, 5441.0, 10876.0, 24084.0, 63090.0, 224237.0, 1252333.0, 2076199.0, 376070.0, 92369.0, 32493.0, 14220.0, 6858.0, 3554.0, 2046.0, 1133.0, 643.0, 445.0, 268.0, 160.0, 95.0, 83.0, 47.0, 36.0, 27.0, 19.0, 13.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1524658203125, -0.14757347106933594, -0.14268112182617188, -0.1377887725830078, -0.13289642333984375, -0.1280040740966797, -0.12311172485351562, -0.11821937561035156, -0.1133270263671875, -0.10843467712402344, -0.10354232788085938, -0.09864997863769531, -0.09375762939453125, -0.08886528015136719, -0.08397293090820312, -0.07908058166503906, -0.074188232421875, -0.06929588317871094, -0.06440353393554688, -0.05951118469238281, -0.05461883544921875, -0.04972648620605469, -0.044834136962890625, -0.03994178771972656, -0.0350494384765625, -0.030157089233398438, -0.025264739990234375, -0.020372390747070312, -0.01548004150390625, -0.010587692260742188, -0.005695343017578125, -0.0008029937744140625, 0.00408935546875, 0.008981704711914062, 0.013874053955078125, 0.018766403198242188, 0.02365875244140625, 0.028551101684570312, 0.033443450927734375, 0.03833580017089844, 0.0432281494140625, 0.04812049865722656, 0.053012847900390625, 0.05790519714355469, 0.06279754638671875, 0.06768989562988281, 0.07258224487304688, 0.07747459411621094, 0.082366943359375, 0.08725929260253906, 0.09215164184570312, 0.09704399108886719, 0.10193634033203125, 0.10682868957519531, 0.11172103881835938, 0.11661338806152344, 0.1215057373046875, 0.12639808654785156, 0.13129043579101562, 0.1361827850341797, 0.14107513427734375, 0.1459674835205078, 0.15085983276367188, 0.15575218200683594, 0.16064453125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 11.0, 4.0, 9.0, 4.0, 17.0, 13.0, 20.0, 23.0, 42.0, 42.0, 33.0, 49.0, 45.0, 55.0, 54.0, 62.0, 57.0, 57.0, 39.0, 48.0, 43.0, 46.0, 43.0, 28.0, 24.0, 33.0, 17.0, 20.0, 19.0, 9.0, 14.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12469482421875, -0.12030696868896484, -0.11591911315917969, -0.11153125762939453, -0.10714340209960938, -0.10275554656982422, -0.09836769104003906, -0.0939798355102539, -0.08959197998046875, -0.0852041244506836, -0.08081626892089844, -0.07642841339111328, -0.07204055786132812, -0.06765270233154297, -0.06326484680175781, -0.058876991271972656, -0.0544891357421875, -0.050101280212402344, -0.04571342468261719, -0.04132556915283203, -0.036937713623046875, -0.03254985809326172, -0.028162002563476562, -0.023774147033691406, -0.01938629150390625, -0.014998435974121094, -0.010610580444335938, -0.006222724914550781, -0.001834869384765625, 0.0025529861450195312, 0.0069408416748046875, 0.011328697204589844, 0.015716552734375, 0.020104408264160156, 0.024492263793945312, 0.02888011932373047, 0.033267974853515625, 0.03765583038330078, 0.04204368591308594, 0.046431541442871094, 0.05081939697265625, 0.055207252502441406, 0.05959510803222656, 0.06398296356201172, 0.06837081909179688, 0.07275867462158203, 0.07714653015136719, 0.08153438568115234, 0.0859222412109375, 0.09031009674072266, 0.09469795227050781, 0.09908580780029297, 0.10347366333007812, 0.10786151885986328, 0.11224937438964844, 0.1166372299194336, 0.12102508544921875, 0.1254129409790039, 0.12980079650878906, 0.13418865203857422, 0.13857650756835938, 0.14296436309814453, 0.1473522186279297, 0.15174007415771484, 0.1561279296875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 13.0, 14.0, 12.0, 19.0, 44.0, 84.0, 159.0, 313.0, 689.0, 1767.0, 5786.0, 25146.0, 178424.0, 3556631.0, 374266.0, 38685.0, 8363.0, 2339.0, 794.0, 351.0, 151.0, 92.0, 49.0, 29.0, 19.0, 12.0, 9.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59130859375, -0.575592041015625, -0.55987548828125, -0.544158935546875, -0.5284423828125, -0.512725830078125, -0.49700927734375, -0.481292724609375, -0.465576171875, -0.449859619140625, -0.43414306640625, -0.418426513671875, -0.4027099609375, -0.386993408203125, -0.37127685546875, -0.355560302734375, -0.33984375, -0.324127197265625, -0.30841064453125, -0.292694091796875, -0.2769775390625, -0.261260986328125, -0.24554443359375, -0.229827880859375, -0.214111328125, -0.198394775390625, -0.18267822265625, -0.166961669921875, -0.1512451171875, -0.135528564453125, -0.11981201171875, -0.104095458984375, -0.08837890625, -0.072662353515625, -0.05694580078125, -0.041229248046875, -0.0255126953125, -0.009796142578125, 0.00592041015625, 0.021636962890625, 0.037353515625, 0.053070068359375, 0.06878662109375, 0.084503173828125, 0.1002197265625, 0.115936279296875, 0.13165283203125, 0.147369384765625, 0.1630859375, 0.178802490234375, 0.19451904296875, 0.210235595703125, 0.2259521484375, 0.241668701171875, 0.25738525390625, 0.273101806640625, 0.288818359375, 0.304534912109375, 0.32025146484375, 0.335968017578125, 0.3516845703125, 0.367401123046875, 0.38311767578125, 0.398834228515625, 0.41455078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 7.0, 4.0, 7.0, 7.0, 11.0, 18.0, 24.0, 20.0, 29.0, 45.0, 60.0, 60.0, 113.0, 167.0, 313.0, 609.0, 943.0, 679.0, 314.0, 211.0, 116.0, 83.0, 57.0, 35.0, 25.0, 28.0, 23.0, 12.0, 17.0, 9.0, 6.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.424560546875, -0.4114990234375, -0.3984375, -0.3853759765625, -0.372314453125, -0.3592529296875, -0.34619140625, -0.3331298828125, -0.320068359375, -0.3070068359375, -0.2939453125, -0.2808837890625, -0.267822265625, -0.2547607421875, -0.24169921875, -0.2286376953125, -0.215576171875, -0.2025146484375, -0.189453125, -0.1763916015625, -0.163330078125, -0.1502685546875, -0.13720703125, -0.1241455078125, -0.111083984375, -0.0980224609375, -0.0849609375, -0.0718994140625, -0.058837890625, -0.0457763671875, -0.03271484375, -0.0196533203125, -0.006591796875, 0.0064697265625, 0.01953125, 0.0325927734375, 0.045654296875, 0.0587158203125, 0.07177734375, 0.0848388671875, 0.097900390625, 0.1109619140625, 0.1240234375, 0.1370849609375, 0.150146484375, 0.1632080078125, 0.17626953125, 0.1893310546875, 0.202392578125, 0.2154541015625, 0.228515625, 0.2415771484375, 0.254638671875, 0.2677001953125, 0.28076171875, 0.2938232421875, 0.306884765625, 0.3199462890625, 0.3330078125, 0.3460693359375, 0.359130859375, 0.3721923828125, 0.38525390625, 0.3983154296875, 0.411376953125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 20.0, 51.0, 208.0, 423.0, 214.0, 47.0, 15.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.605573654174805, -11.34486198425293, -11.084150314331055, -10.82343864440918, -10.562726974487305, -10.30201530456543, -10.041303634643555, -9.78059196472168, -9.519880294799805, -9.25916862487793, -8.998456954956055, -8.73774528503418, -8.477033615112305, -8.21632194519043, -7.9556097984313965, -7.6948981285095215, -7.434185981750488, -7.173474311828613, -6.912762641906738, -6.652050971984863, -6.391339302062988, -6.130627632141113, -5.86991548538208, -5.609203815460205, -5.34849214553833, -5.087780475616455, -4.82706880569458, -4.566357135772705, -4.305644989013672, -4.044933319091797, -3.784221649169922, -3.523509979248047, -3.2627992630004883, -3.0020875930786133, -2.7413759231567383, -2.480664014816284, -2.219952344894409, -1.9592406749725342, -1.6985288858413696, -1.437817096710205, -1.17710542678833, -0.9163936972618103, -0.6556819677352905, -0.39497023820877075, -0.13425850868225098, 0.12645316123962402, 0.3871649503707886, 0.6478767395019531, 0.9085884094238281, 1.1693000793457031, 1.4300118684768677, 1.6907236576080322, 1.9514353275299072, 2.2121469974517822, 2.4728589057922363, 2.7335705757141113, 2.9942822456359863, 3.2549939155578613, 3.5157055854797363, 3.7764174938201904, 4.0371294021606445, 4.2978410720825195, 4.5585527420043945, 4.8192644119262695, 5.0799760818481445]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 11.0, 7.0, 11.0, 12.0, 17.0, 30.0, 24.0, 26.0, 24.0, 35.0, 38.0, 55.0, 45.0, 53.0, 43.0, 54.0, 60.0, 59.0, 55.0, 39.0, 35.0, 41.0, 37.0, 39.0, 27.0, 24.0, 20.0, 9.0, 11.0, 10.0, 13.0, 4.0, 9.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8796813488006592, -1.8156640529632568, -1.751646876335144, -1.6876295804977417, -1.623612403869629, -1.5595951080322266, -1.4955778121948242, -1.4315605163574219, -1.367543339729309, -1.3035260438919067, -1.239508867263794, -1.1754915714263916, -1.1114742755889893, -1.0474570989608765, -0.9834398031234741, -0.9194225668907166, -0.855405330657959, -0.7913880944252014, -0.7273708581924438, -0.6633535623550415, -0.5993363261222839, -0.5353190898895264, -0.4713018238544464, -0.40728455781936646, -0.3432673215866089, -0.2792500853538513, -0.21523281931877136, -0.1512155681848526, -0.08719831705093384, -0.02318108081817627, 0.040836185216903687, 0.10485345125198364, 0.1688706874847412, 0.23288793861865997, 0.29690518975257874, 0.3609224557876587, 0.42493969202041626, 0.48895692825317383, 0.5529742240905762, 0.6169914603233337, 0.6810086965560913, 0.7450259327888489, 0.8090431690216064, 0.8730604648590088, 0.9370777010917664, 1.001094937324524, 1.0651122331619263, 1.129129409790039, 1.1931467056274414, 1.2571640014648438, 1.3211811780929565, 1.3851984739303589, 1.4492156505584717, 1.513232946395874, 1.5772502422332764, 1.6412675380706787, 1.7052847146987915, 1.7693020105361938, 1.8333191871643066, 1.897336483001709, 1.9613537788391113, 2.0253710746765137, 2.089388132095337, 2.1534054279327393, 2.2174227237701416]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 13.0, 14.0, 11.0, 18.0, 34.0, 57.0, 82.0, 121.0, 142.0, 226.0, 357.0, 571.0, 829.0, 1415.0, 2450.0, 4306.0, 8263.0, 17647.0, 40203.0, 100664.0, 264585.0, 347300.0, 151837.0, 58325.0, 24284.0, 11436.0, 5677.0, 2962.0, 1735.0, 1076.0, 709.0, 385.0, 243.0, 179.0, 133.0, 75.0, 39.0, 55.0, 29.0, 21.0, 11.0, 14.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.283447265625, -0.2743644714355469, -0.26528167724609375, -0.2561988830566406, -0.2471160888671875, -0.23803329467773438, -0.22895050048828125, -0.21986770629882812, -0.210784912109375, -0.20170211791992188, -0.19261932373046875, -0.18353652954101562, -0.1744537353515625, -0.16537094116210938, -0.15628814697265625, -0.14720535278320312, -0.13812255859375, -0.12903976440429688, -0.11995697021484375, -0.11087417602539062, -0.1017913818359375, -0.09270858764648438, -0.08362579345703125, -0.07454299926757812, -0.065460205078125, -0.056377410888671875, -0.04729461669921875, -0.038211822509765625, -0.0291290283203125, -0.020046234130859375, -0.01096343994140625, -0.001880645751953125, 0.0072021484375, 0.016284942626953125, 0.02536773681640625, 0.034450531005859375, 0.0435333251953125, 0.052616119384765625, 0.06169891357421875, 0.07078170776367188, 0.079864501953125, 0.08894729614257812, 0.09803009033203125, 0.10711288452148438, 0.1161956787109375, 0.12527847290039062, 0.13436126708984375, 0.14344406127929688, 0.15252685546875, 0.16160964965820312, 0.17069244384765625, 0.17977523803710938, 0.1888580322265625, 0.19794082641601562, 0.20702362060546875, 0.21610641479492188, 0.225189208984375, 0.23427200317382812, 0.24335479736328125, 0.2524375915527344, 0.2615203857421875, 0.2706031799316406, 0.27968597412109375, 0.2887687683105469, 0.2978515625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 11.0, 11.0, 12.0, 13.0, 22.0, 17.0, 19.0, 26.0, 33.0, 25.0, 29.0, 38.0, 45.0, 42.0, 46.0, 47.0, 43.0, 52.0, 39.0, 41.0, 42.0, 38.0, 33.0, 51.0, 36.0, 32.0, 29.0, 26.0, 22.0, 18.0, 11.0, 9.0, 9.0, 7.0, 6.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1368408203125, -0.1328134536743164, -0.1287860870361328, -0.12475872039794922, -0.12073135375976562, -0.11670398712158203, -0.11267662048339844, -0.10864925384521484, -0.10462188720703125, -0.10059452056884766, -0.09656715393066406, -0.09253978729248047, -0.08851242065429688, -0.08448505401611328, -0.08045768737792969, -0.0764303207397461, -0.0724029541015625, -0.0683755874633789, -0.06434822082519531, -0.06032085418701172, -0.056293487548828125, -0.05226612091064453, -0.04823875427246094, -0.044211387634277344, -0.04018402099609375, -0.036156654357910156, -0.03212928771972656, -0.02810192108154297, -0.024074554443359375, -0.02004718780517578, -0.016019821166992188, -0.011992454528808594, -0.007965087890625, -0.003937721252441406, 8.96453857421875e-05, 0.004117012023925781, 0.008144378662109375, 0.012171745300292969, 0.016199111938476562, 0.020226478576660156, 0.02425384521484375, 0.028281211853027344, 0.03230857849121094, 0.03633594512939453, 0.040363311767578125, 0.04439067840576172, 0.04841804504394531, 0.052445411682128906, 0.0564727783203125, 0.060500144958496094, 0.06452751159667969, 0.06855487823486328, 0.07258224487304688, 0.07660961151123047, 0.08063697814941406, 0.08466434478759766, 0.08869171142578125, 0.09271907806396484, 0.09674644470214844, 0.10077381134033203, 0.10480117797851562, 0.10882854461669922, 0.11285591125488281, 0.1168832778930664, 0.12091064453125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 4.0, 9.0, 3.0, 8.0, 19.0, 23.0, 30.0, 43.0, 47.0, 78.0, 118.0, 188.0, 278.0, 550.0, 980.0, 2209.0, 5876.0, 24491.0, 238760.0, 706604.0, 52722.0, 9403.0, 3074.0, 1368.0, 674.0, 353.0, 200.0, 151.0, 91.0, 61.0, 35.0, 26.0, 26.0, 18.0, 13.0, 13.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68994140625, -0.6685104370117188, -0.6470794677734375, -0.6256484985351562, -0.604217529296875, -0.5827865600585938, -0.5613555908203125, -0.5399246215820312, -0.51849365234375, -0.49706268310546875, -0.4756317138671875, -0.45420074462890625, -0.432769775390625, -0.41133880615234375, -0.3899078369140625, -0.36847686767578125, -0.3470458984375, -0.32561492919921875, -0.3041839599609375, -0.28275299072265625, -0.261322021484375, -0.23989105224609375, -0.2184600830078125, -0.19702911376953125, -0.17559814453125, -0.15416717529296875, -0.1327362060546875, -0.11130523681640625, -0.089874267578125, -0.06844329833984375, -0.0470123291015625, -0.02558135986328125, -0.004150390625, 0.01728057861328125, 0.0387115478515625, 0.06014251708984375, 0.081573486328125, 0.10300445556640625, 0.1244354248046875, 0.14586639404296875, 0.16729736328125, 0.18872833251953125, 0.2101593017578125, 0.23159027099609375, 0.253021240234375, 0.27445220947265625, 0.2958831787109375, 0.31731414794921875, 0.3387451171875, 0.36017608642578125, 0.3816070556640625, 0.40303802490234375, 0.424468994140625, 0.44589996337890625, 0.4673309326171875, 0.48876190185546875, 0.51019287109375, 0.5316238403320312, 0.5530548095703125, 0.5744857788085938, 0.595916748046875, 0.6173477172851562, 0.6387786865234375, 0.6602096557617188, 0.681640625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 16.0, 9.0, 17.0, 18.0, 28.0, 39.0, 43.0, 45.0, 57.0, 52.0, 69.0, 49.0, 62.0, 61.0, 72.0, 63.0, 39.0, 33.0, 39.0, 29.0, 31.0, 19.0, 21.0, 10.0, 18.0, 9.0, 5.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.74267578125, -0.7222366333007812, -0.7017974853515625, -0.6813583374023438, -0.660919189453125, -0.6404800415039062, -0.6200408935546875, -0.5996017456054688, -0.57916259765625, -0.5587234497070312, -0.5382843017578125, -0.5178451538085938, -0.497406005859375, -0.47696685791015625, -0.4565277099609375, -0.43608856201171875, -0.4156494140625, -0.39521026611328125, -0.3747711181640625, -0.35433197021484375, -0.333892822265625, -0.31345367431640625, -0.2930145263671875, -0.27257537841796875, -0.25213623046875, -0.23169708251953125, -0.2112579345703125, -0.19081878662109375, -0.170379638671875, -0.14994049072265625, -0.1295013427734375, -0.10906219482421875, -0.088623046875, -0.06818389892578125, -0.0477447509765625, -0.02730560302734375, -0.006866455078125, 0.01357269287109375, 0.0340118408203125, 0.05445098876953125, 0.07489013671875, 0.09532928466796875, 0.1157684326171875, 0.13620758056640625, 0.156646728515625, 0.17708587646484375, 0.1975250244140625, 0.21796417236328125, 0.2384033203125, 0.25884246826171875, 0.2792816162109375, 0.29972076416015625, 0.320159912109375, 0.34059906005859375, 0.3610382080078125, 0.38147735595703125, 0.40191650390625, 0.42235565185546875, 0.4427947998046875, 0.46323394775390625, 0.483673095703125, 0.5041122436523438, 0.5245513916015625, 0.5449905395507812, 0.5654296875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 0.0, 4.0, 2.0, 9.0, 6.0, 5.0, 13.0, 10.0, 21.0, 15.0, 22.0, 36.0, 68.0, 87.0, 140.0, 180.0, 282.0, 524.0, 980.0, 1936.0, 4968.0, 14853.0, 60980.0, 381419.0, 493779.0, 63633.0, 15239.0, 4960.0, 2044.0, 917.0, 525.0, 316.0, 180.0, 122.0, 84.0, 50.0, 33.0, 26.0, 25.0, 12.0, 14.0, 7.0, 10.0, 7.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1259765625, -0.12147903442382812, -0.11698150634765625, -0.11248397827148438, -0.1079864501953125, -0.10348892211914062, -0.09899139404296875, -0.09449386596679688, -0.089996337890625, -0.08549880981445312, -0.08100128173828125, -0.07650375366210938, -0.0720062255859375, -0.06750869750976562, -0.06301116943359375, -0.058513641357421875, -0.05401611328125, -0.049518585205078125, -0.04502105712890625, -0.040523529052734375, -0.0360260009765625, -0.031528472900390625, -0.02703094482421875, -0.022533416748046875, -0.018035888671875, -0.013538360595703125, -0.00904083251953125, -0.004543304443359375, -4.57763671875e-05, 0.004451751708984375, 0.00894927978515625, 0.013446807861328125, 0.0179443359375, 0.022441864013671875, 0.02693939208984375, 0.031436920166015625, 0.0359344482421875, 0.040431976318359375, 0.04492950439453125, 0.049427032470703125, 0.053924560546875, 0.058422088623046875, 0.06291961669921875, 0.06741714477539062, 0.0719146728515625, 0.07641220092773438, 0.08090972900390625, 0.08540725708007812, 0.08990478515625, 0.09440231323242188, 0.09889984130859375, 0.10339736938476562, 0.1078948974609375, 0.11239242553710938, 0.11688995361328125, 0.12138748168945312, 0.125885009765625, 0.13038253784179688, 0.13488006591796875, 0.13937759399414062, 0.1438751220703125, 0.14837265014648438, 0.15287017822265625, 0.15736770629882812, 0.161865234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 6.0, 7.0, 12.0, 6.0, 10.0, 16.0, 20.0, 21.0, 37.0, 40.0, 58.0, 59.0, 103.0, 83.0, 92.0, 85.0, 74.0, 55.0, 45.0, 46.0, 24.0, 22.0, 16.0, 14.0, 6.0, 4.0, 8.0, 7.0, 8.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.981590270996094e-05, -3.8615427911281586e-05, -3.7414953112602234e-05, -3.621447831392288e-05, -3.501400351524353e-05, -3.381352871656418e-05, -3.261305391788483e-05, -3.1412579119205475e-05, -3.0212104320526123e-05, -2.901162952184677e-05, -2.781115472316742e-05, -2.6610679924488068e-05, -2.5410205125808716e-05, -2.4209730327129364e-05, -2.3009255528450012e-05, -2.180878072977066e-05, -2.060830593109131e-05, -1.9407831132411957e-05, -1.8207356333732605e-05, -1.7006881535053253e-05, -1.58064067363739e-05, -1.460593193769455e-05, -1.3405457139015198e-05, -1.2204982340335846e-05, -1.1004507541656494e-05, -9.804032742977142e-06, -8.60355794429779e-06, -7.403083145618439e-06, -6.202608346939087e-06, -5.002133548259735e-06, -3.8016587495803833e-06, -2.6011839509010315e-06, -1.4007091522216797e-06, -2.0023435354232788e-07, 1.000240445137024e-06, 2.2007152438163757e-06, 3.4011900424957275e-06, 4.601664841175079e-06, 5.802139639854431e-06, 7.002614438533783e-06, 8.203089237213135e-06, 9.403564035892487e-06, 1.0604038834571838e-05, 1.180451363325119e-05, 1.3004988431930542e-05, 1.4205463230609894e-05, 1.5405938029289246e-05, 1.6606412827968597e-05, 1.780688762664795e-05, 1.90073624253273e-05, 2.0207837224006653e-05, 2.1408312022686005e-05, 2.2608786821365356e-05, 2.3809261620044708e-05, 2.500973641872406e-05, 2.6210211217403412e-05, 2.7410686016082764e-05, 2.8611160814762115e-05, 2.9811635613441467e-05, 3.101211041212082e-05, 3.221258521080017e-05, 3.341306000947952e-05, 3.4613534808158875e-05, 3.5814009606838226e-05, 3.701448440551758e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 4.0, 5.0, 7.0, 7.0, 6.0, 13.0, 22.0, 33.0, 69.0, 119.0, 203.0, 346.0, 687.0, 1704.0, 5541.0, 31658.0, 608863.0, 365653.0, 25777.0, 4825.0, 1580.0, 682.0, 309.0, 186.0, 93.0, 42.0, 40.0, 26.0, 19.0, 9.0, 3.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1953125, -0.18879127502441406, -0.18227005004882812, -0.1757488250732422, -0.16922760009765625, -0.1627063751220703, -0.15618515014648438, -0.14966392517089844, -0.1431427001953125, -0.13662147521972656, -0.13010025024414062, -0.12357902526855469, -0.11705780029296875, -0.11053657531738281, -0.10401535034179688, -0.09749412536621094, -0.090972900390625, -0.08445167541503906, -0.07793045043945312, -0.07140922546386719, -0.06488800048828125, -0.05836677551269531, -0.051845550537109375, -0.04532432556152344, -0.0388031005859375, -0.03228187561035156, -0.025760650634765625, -0.019239425659179688, -0.01271820068359375, -0.0061969757080078125, 0.000324249267578125, 0.0068454742431640625, 0.01336669921875, 0.019887924194335938, 0.026409149169921875, 0.03293037414550781, 0.03945159912109375, 0.04597282409667969, 0.052494049072265625, 0.05901527404785156, 0.0655364990234375, 0.07205772399902344, 0.07857894897460938, 0.08510017395019531, 0.09162139892578125, 0.09814262390136719, 0.10466384887695312, 0.11118507385253906, 0.117706298828125, 0.12422752380371094, 0.13074874877929688, 0.1372699737548828, 0.14379119873046875, 0.1503124237060547, 0.15683364868164062, 0.16335487365722656, 0.1698760986328125, 0.17639732360839844, 0.18291854858398438, 0.1894397735595703, 0.19596099853515625, 0.2024822235107422, 0.20900344848632812, 0.21552467346191406, 0.2220458984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 8.0, 17.0, 19.0, 13.0, 18.0, 29.0, 42.0, 35.0, 61.0, 47.0, 67.0, 68.0, 50.0, 90.0, 54.0, 52.0, 64.0, 49.0, 48.0, 36.0, 39.0, 16.0, 16.0, 12.0, 4.0, 3.0, 9.0, 2.0, 4.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1102294921875, -0.10625648498535156, -0.10228347778320312, -0.09831047058105469, -0.09433746337890625, -0.09036445617675781, -0.08639144897460938, -0.08241844177246094, -0.0784454345703125, -0.07447242736816406, -0.07049942016601562, -0.06652641296386719, -0.06255340576171875, -0.05858039855957031, -0.054607391357421875, -0.05063438415527344, -0.046661376953125, -0.04268836975097656, -0.038715362548828125, -0.03474235534667969, -0.03076934814453125, -0.026796340942382812, -0.022823333740234375, -0.018850326538085938, -0.0148773193359375, -0.010904312133789062, -0.006931304931640625, -0.0029582977294921875, 0.00101470947265625, 0.0049877166748046875, 0.008960723876953125, 0.012933731079101562, 0.01690673828125, 0.020879745483398438, 0.024852752685546875, 0.028825759887695312, 0.03279876708984375, 0.03677177429199219, 0.040744781494140625, 0.04471778869628906, 0.0486907958984375, 0.05266380310058594, 0.056636810302734375, 0.06060981750488281, 0.06458282470703125, 0.06855583190917969, 0.07252883911132812, 0.07650184631347656, 0.080474853515625, 0.08444786071777344, 0.08842086791992188, 0.09239387512207031, 0.09636688232421875, 0.10033988952636719, 0.10431289672851562, 0.10828590393066406, 0.1122589111328125, 0.11623191833496094, 0.12020492553710938, 0.12417793273925781, 0.12815093994140625, 0.1321239471435547, 0.13609695434570312, 0.14006996154785156, 0.14404296875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 21.0, 62.0, 197.0, 447.0, 195.0, 50.0, 18.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.500463485717773, -12.243213653564453, -11.98596477508545, -11.728714942932129, -11.471466064453125, -11.214216232299805, -10.956966400146484, -10.69971752166748, -10.44246768951416, -10.18521785736084, -9.927968978881836, -9.670719146728516, -9.413470268249512, -9.156220436096191, -8.898971557617188, -8.641721725463867, -8.384471893310547, -8.127222061157227, -7.869973182678223, -7.612723350524902, -7.35547399520874, -7.098224639892578, -6.840975284576416, -6.583725929260254, -6.32647705078125, -6.069227695465088, -5.811978340148926, -5.5547285079956055, -5.297479152679443, -5.040229797363281, -4.782980442047119, -4.525731086730957, -4.268481254577637, -4.011231899261475, -3.7539823055267334, -3.4967329502105713, -3.23948335647583, -2.982234001159668, -2.724984645843506, -2.4677352905273438, -2.2104854583740234, -1.9532359838485718, -1.6959865093231201, -1.438737154006958, -1.1814876794815063, -0.9242382049560547, -0.6669888496398926, -0.4097393751144409, -0.15248990058898926, 0.10475954413414001, 0.3620089888572693, 0.6192584037780762, 0.8765078783035278, 1.1337573528289795, 1.3910067081451416, 1.6482561826705933, 1.905505657196045, 2.162755012512207, 2.4200046062469482, 2.6772539615631104, 2.9345035552978516, 3.1917529106140137, 3.449002265930176, 3.706251621246338, 3.963501214981079]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 6.0, 11.0, 14.0, 8.0, 16.0, 13.0, 27.0, 21.0, 24.0, 42.0, 27.0, 44.0, 45.0, 55.0, 79.0, 81.0, 79.0, 53.0, 52.0, 51.0, 40.0, 35.0, 32.0, 32.0, 17.0, 18.0, 15.0, 13.0, 10.0, 8.0, 7.0, 6.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.246676445007324, -3.1662709712982178, -3.0858652591705322, -3.005459785461426, -2.9250543117523193, -2.844648599624634, -2.7642431259155273, -2.683837413787842, -2.6034319400787354, -2.523026466369629, -2.4426207542419434, -2.362215280532837, -2.2818098068237305, -2.201404094696045, -2.1209986209869385, -2.040593147277832, -1.960187554359436, -1.87978196144104, -1.7993764877319336, -1.7189708948135376, -1.6385653018951416, -1.5581598281860352, -1.4777542352676392, -1.3973486423492432, -1.3169431686401367, -1.2365375757217407, -1.1561321020126343, -1.0757265090942383, -0.9953209161758423, -0.9149153828620911, -0.8345098495483398, -0.7541042566299438, -0.6736987829208374, -0.5932932496070862, -0.5128876566886902, -0.43248212337493896, -0.35207656025886536, -0.27167099714279175, -0.19126546382904053, -0.11085987091064453, -0.03045433759689331, 0.0499512180685997, 0.1303567737340927, 0.21076232194900513, 0.29116788506507874, 0.37157344818115234, 0.45197898149490356, 0.5323845744132996, 0.6127901077270508, 0.693195641040802, 0.773601233959198, 0.8540067672729492, 0.9344123601913452, 1.0148179531097412, 1.0952234268188477, 1.1756290197372437, 1.2560346126556396, 1.3364402055740356, 1.416845679283142, 1.497251272201538, 1.577656865119934, 1.65806245803833, 1.7384679317474365, 1.8188735246658325, 1.899278998374939]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 10.0, 6.0, 15.0, 15.0, 17.0, 28.0, 34.0, 51.0, 77.0, 113.0, 171.0, 259.0, 433.0, 617.0, 946.0, 1498.0, 2468.0, 4214.0, 7385.0, 14466.0, 33578.0, 104472.0, 493187.0, 2296597.0, 958716.0, 182244.0, 50579.0, 19439.0, 9393.0, 5133.0, 3018.0, 1836.0, 1097.0, 720.0, 472.0, 323.0, 211.0, 120.0, 83.0, 63.0, 39.0, 21.0, 31.0, 22.0, 17.0, 9.0, 8.0, 10.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.130615234375, -0.1264934539794922, -0.12237167358398438, -0.11824989318847656, -0.11412811279296875, -0.11000633239746094, -0.10588455200195312, -0.10176277160644531, -0.0976409912109375, -0.09351921081542969, -0.08939743041992188, -0.08527565002441406, -0.08115386962890625, -0.07703208923339844, -0.07291030883789062, -0.06878852844238281, -0.064666748046875, -0.06054496765136719, -0.056423187255859375, -0.05230140686035156, -0.04817962646484375, -0.04405784606933594, -0.039936065673828125, -0.03581428527832031, -0.0316925048828125, -0.027570724487304688, -0.023448944091796875, -0.019327163696289062, -0.01520538330078125, -0.011083602905273438, -0.006961822509765625, -0.0028400421142578125, 0.00128173828125, 0.0054035186767578125, 0.009525299072265625, 0.013647079467773438, 0.01776885986328125, 0.021890640258789062, 0.026012420654296875, 0.030134201049804688, 0.0342559814453125, 0.03837776184082031, 0.042499542236328125, 0.04662132263183594, 0.05074310302734375, 0.05486488342285156, 0.058986663818359375, 0.06310844421386719, 0.067230224609375, 0.07135200500488281, 0.07547378540039062, 0.07959556579589844, 0.08371734619140625, 0.08783912658691406, 0.09196090698242188, 0.09608268737792969, 0.1002044677734375, 0.10432624816894531, 0.10844802856445312, 0.11256980895996094, 0.11669158935546875, 0.12081336975097656, 0.12493515014648438, 0.1290569305419922, 0.1331787109375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 8.0, 9.0, 7.0, 11.0, 8.0, 11.0, 11.0, 17.0, 14.0, 24.0, 28.0, 18.0, 29.0, 43.0, 33.0, 34.0, 45.0, 34.0, 68.0, 48.0, 44.0, 50.0, 32.0, 40.0, 43.0, 33.0, 41.0, 28.0, 38.0, 23.0, 36.0, 10.0, 10.0, 21.0, 10.0, 10.0, 10.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.122314453125, -0.11870384216308594, -0.11509323120117188, -0.11148262023925781, -0.10787200927734375, -0.10426139831542969, -0.10065078735351562, -0.09704017639160156, -0.0934295654296875, -0.08981895446777344, -0.08620834350585938, -0.08259773254394531, -0.07898712158203125, -0.07537651062011719, -0.07176589965820312, -0.06815528869628906, -0.064544677734375, -0.06093406677246094, -0.057323455810546875, -0.05371284484863281, -0.05010223388671875, -0.04649162292480469, -0.042881011962890625, -0.03927040100097656, -0.0356597900390625, -0.03204917907714844, -0.028438568115234375, -0.024827957153320312, -0.02121734619140625, -0.017606735229492188, -0.013996124267578125, -0.010385513305664062, -0.00677490234375, -0.0031642913818359375, 0.000446319580078125, 0.0040569305419921875, 0.00766754150390625, 0.011278152465820312, 0.014888763427734375, 0.018499374389648438, 0.0221099853515625, 0.025720596313476562, 0.029331207275390625, 0.03294181823730469, 0.03655242919921875, 0.04016304016113281, 0.043773651123046875, 0.04738426208496094, 0.050994873046875, 0.05460548400878906, 0.058216094970703125, 0.06182670593261719, 0.06543731689453125, 0.06904792785644531, 0.07265853881835938, 0.07626914978027344, 0.0798797607421875, 0.08349037170410156, 0.08710098266601562, 0.09071159362792969, 0.09432220458984375, 0.09793281555175781, 0.10154342651367188, 0.10515403747558594, 0.1087646484375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 3.0, 14.0, 18.0, 26.0, 38.0, 53.0, 129.0, 306.0, 672.0, 2029.0, 7443.0, 50219.0, 2829836.0, 1260367.0, 34455.0, 5830.0, 1636.0, 634.0, 277.0, 121.0, 70.0, 37.0, 16.0, 10.0, 13.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5032806396484375, -0.487518310546875, -0.4717559814453125, -0.45599365234375, -0.4402313232421875, -0.424468994140625, -0.4087066650390625, -0.3929443359375, -0.3771820068359375, -0.361419677734375, -0.3456573486328125, -0.32989501953125, -0.3141326904296875, -0.298370361328125, -0.2826080322265625, -0.266845703125, -0.2510833740234375, -0.235321044921875, -0.2195587158203125, -0.20379638671875, -0.1880340576171875, -0.172271728515625, -0.1565093994140625, -0.1407470703125, -0.1249847412109375, -0.109222412109375, -0.0934600830078125, -0.07769775390625, -0.0619354248046875, -0.046173095703125, -0.0304107666015625, -0.0146484375, 0.0011138916015625, 0.016876220703125, 0.0326385498046875, 0.04840087890625, 0.0641632080078125, 0.079925537109375, 0.0956878662109375, 0.1114501953125, 0.1272125244140625, 0.142974853515625, 0.1587371826171875, 0.17449951171875, 0.1902618408203125, 0.206024169921875, 0.2217864990234375, 0.237548828125, 0.2533111572265625, 0.269073486328125, 0.2848358154296875, 0.30059814453125, 0.3163604736328125, 0.332122802734375, 0.3478851318359375, 0.3636474609375, 0.3794097900390625, 0.395172119140625, 0.4109344482421875, 0.42669677734375, 0.4424591064453125, 0.458221435546875, 0.4739837646484375, 0.48974609375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 1.0, 7.0, 3.0, 12.0, 18.0, 19.0, 29.0, 39.0, 48.0, 84.0, 135.0, 258.0, 610.0, 1049.0, 869.0, 415.0, 187.0, 97.0, 59.0, 44.0, 20.0, 19.0, 11.0, 12.0, 6.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.3729438781738281, -0.36038970947265625, -0.3478355407714844, -0.3352813720703125, -0.3227272033691406, -0.31017303466796875, -0.2976188659667969, -0.285064697265625, -0.2725105285644531, -0.25995635986328125, -0.24740219116210938, -0.2348480224609375, -0.22229385375976562, -0.20973968505859375, -0.19718551635742188, -0.18463134765625, -0.17207717895507812, -0.15952301025390625, -0.14696884155273438, -0.1344146728515625, -0.12186050415039062, -0.10930633544921875, -0.09675216674804688, -0.084197998046875, -0.07164382934570312, -0.05908966064453125, -0.046535491943359375, -0.0339813232421875, -0.021427154541015625, -0.00887298583984375, 0.003681182861328125, 0.0162353515625, 0.028789520263671875, 0.04134368896484375, 0.053897857666015625, 0.0664520263671875, 0.07900619506835938, 0.09156036376953125, 0.10411453247070312, 0.116668701171875, 0.12922286987304688, 0.14177703857421875, 0.15433120727539062, 0.1668853759765625, 0.17943954467773438, 0.19199371337890625, 0.20454788208007812, 0.21710205078125, 0.22965621948242188, 0.24221038818359375, 0.2547645568847656, 0.2673187255859375, 0.2798728942871094, 0.29242706298828125, 0.3049812316894531, 0.317535400390625, 0.3300895690917969, 0.34264373779296875, 0.3551979064941406, 0.3677520751953125, 0.3803062438964844, 0.39286041259765625, 0.4054145812988281, 0.41796875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 9.0, 26.0, 68.0, 241.0, 369.0, 188.0, 58.0, 14.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.0794901847839355, -6.91627311706543, -6.753055572509766, -6.58983850479126, -6.426621437072754, -6.263404369354248, -6.100187301635742, -5.936969757080078, -5.773752689361572, -5.610535621643066, -5.447318077087402, -5.2841010093688965, -5.120883941650391, -4.957666873931885, -4.794449806213379, -4.631232261657715, -4.468015193939209, -4.304798126220703, -4.141580581665039, -3.978363513946533, -3.8151464462280273, -3.6519293785095215, -3.4887120723724365, -3.3254947662353516, -3.1622776985168457, -2.99906063079834, -2.835843324661255, -2.67262601852417, -2.509408950805664, -2.346191883087158, -2.1829745769500732, -2.0197572708129883, -1.8565397262573242, -1.6933225393295288, -1.5301053524017334, -1.366888165473938, -1.2036709785461426, -1.0404537916183472, -0.8772366046905518, -0.7140194177627563, -0.5508022308349609, -0.3875850439071655, -0.22436785697937012, -0.06115067005157471, 0.1020665168762207, 0.2652837038040161, 0.4285008907318115, 0.5917180776596069, 0.7549352645874023, 0.9181524515151978, 1.0813696384429932, 1.2445868253707886, 1.407804012298584, 1.5710211992263794, 1.7342383861541748, 1.8974555730819702, 2.0606727600097656, 2.2238898277282715, 2.3871071338653564, 2.5503244400024414, 2.7135415077209473, 2.876758575439453, 3.039975881576538, 3.203193187713623, 3.366410255432129]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 9.0, 12.0, 10.0, 13.0, 14.0, 12.0, 20.0, 30.0, 26.0, 35.0, 31.0, 43.0, 35.0, 60.0, 47.0, 57.0, 47.0, 54.0, 59.0, 54.0, 47.0, 62.0, 38.0, 34.0, 34.0, 22.0, 22.0, 12.0, 18.0, 9.0, 9.0, 14.0, 8.0, 2.0, 1.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3091931343078613, -1.26043701171875, -1.2116807699203491, -1.1629245281219482, -1.114168405532837, -1.0654122829437256, -1.0166560411453247, -0.9678998589515686, -0.9191436767578125, -0.8703874945640564, -0.8216313123703003, -0.7728751301765442, -0.7241189479827881, -0.675362765789032, -0.6266065835952759, -0.5778504014015198, -0.5290942192077637, -0.48033803701400757, -0.43158185482025146, -0.38282567262649536, -0.33406949043273926, -0.28531330823898315, -0.23655712604522705, -0.18780094385147095, -0.13904476165771484, -0.09028857946395874, -0.04153239727020264, 0.007223784923553467, 0.05597996711730957, 0.10473614931106567, 0.15349233150482178, 0.20224851369857788, 0.251004695892334, 0.2997608780860901, 0.3485170602798462, 0.3972732424736023, 0.4460294246673584, 0.4947856068611145, 0.5435417890548706, 0.5922979712486267, 0.6410541534423828, 0.6898103356361389, 0.738566517829895, 0.7873227000236511, 0.8360788822174072, 0.8848350644111633, 0.9335912466049194, 0.9823474287986755, 1.0311036109924316, 1.079859733581543, 1.1286159753799438, 1.1773722171783447, 1.226128339767456, 1.2748844623565674, 1.3236407041549683, 1.3723969459533691, 1.4211530685424805, 1.4699091911315918, 1.5186654329299927, 1.5674216747283936, 1.6161777973175049, 1.6649339199066162, 1.713690161705017, 1.762446403503418, 1.8112025260925293]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 18.0, 26.0, 27.0, 31.0, 47.0, 82.0, 109.0, 153.0, 245.0, 343.0, 540.0, 784.0, 1367.0, 2292.0, 4217.0, 8313.0, 18113.0, 43191.0, 109058.0, 250689.0, 315272.0, 170816.0, 69191.0, 27786.0, 12125.0, 5849.0, 3035.0, 1715.0, 1052.0, 680.0, 444.0, 292.0, 203.0, 135.0, 98.0, 61.0, 47.0, 35.0, 19.0, 13.0, 6.0, 10.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.18896484375, -0.18271827697753906, -0.17647171020507812, -0.1702251434326172, -0.16397857666015625, -0.1577320098876953, -0.15148544311523438, -0.14523887634277344, -0.1389923095703125, -0.13274574279785156, -0.12649917602539062, -0.12025260925292969, -0.11400604248046875, -0.10775947570800781, -0.10151290893554688, -0.09526634216308594, -0.089019775390625, -0.08277320861816406, -0.07652664184570312, -0.07028007507324219, -0.06403350830078125, -0.05778694152832031, -0.051540374755859375, -0.04529380798339844, -0.0390472412109375, -0.03280067443847656, -0.026554107666015625, -0.020307540893554688, -0.01406097412109375, -0.007814407348632812, -0.001567840576171875, 0.0046787261962890625, 0.01092529296875, 0.017171859741210938, 0.023418426513671875, 0.029664993286132812, 0.03591156005859375, 0.04215812683105469, 0.048404693603515625, 0.05465126037597656, 0.0608978271484375, 0.06714439392089844, 0.07339096069335938, 0.07963752746582031, 0.08588409423828125, 0.09213066101074219, 0.09837722778320312, 0.10462379455566406, 0.110870361328125, 0.11711692810058594, 0.12336349487304688, 0.1296100616455078, 0.13585662841796875, 0.1421031951904297, 0.14834976196289062, 0.15459632873535156, 0.1608428955078125, 0.16708946228027344, 0.17333602905273438, 0.1795825958251953, 0.18582916259765625, 0.1920757293701172, 0.19832229614257812, 0.20456886291503906, 0.2108154296875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 2.0, 5.0, 3.0, 5.0, 11.0, 15.0, 5.0, 7.0, 17.0, 8.0, 20.0, 21.0, 16.0, 19.0, 28.0, 27.0, 31.0, 21.0, 44.0, 32.0, 52.0, 46.0, 53.0, 37.0, 47.0, 45.0, 39.0, 39.0, 31.0, 30.0, 36.0, 27.0, 28.0, 26.0, 16.0, 24.0, 19.0, 9.0, 14.0, 13.0, 10.0, 2.0, 8.0, 3.0, 5.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.11712646484375, -0.11359882354736328, -0.11007118225097656, -0.10654354095458984, -0.10301589965820312, -0.0994882583618164, -0.09596061706542969, -0.09243297576904297, -0.08890533447265625, -0.08537769317626953, -0.08185005187988281, -0.0783224105834961, -0.07479476928710938, -0.07126712799072266, -0.06773948669433594, -0.06421184539794922, -0.0606842041015625, -0.05715656280517578, -0.05362892150878906, -0.050101280212402344, -0.046573638916015625, -0.043045997619628906, -0.03951835632324219, -0.03599071502685547, -0.03246307373046875, -0.02893543243408203, -0.025407791137695312, -0.021880149841308594, -0.018352508544921875, -0.014824867248535156, -0.011297225952148438, -0.007769584655761719, -0.004241943359375, -0.0007143020629882812, 0.0028133392333984375, 0.006340980529785156, 0.009868621826171875, 0.013396263122558594, 0.016923904418945312, 0.02045154571533203, 0.02397918701171875, 0.02750682830810547, 0.031034469604492188, 0.034562110900878906, 0.038089752197265625, 0.041617393493652344, 0.04514503479003906, 0.04867267608642578, 0.0522003173828125, 0.05572795867919922, 0.05925559997558594, 0.06278324127197266, 0.06631088256835938, 0.0698385238647461, 0.07336616516113281, 0.07689380645751953, 0.08042144775390625, 0.08394908905029297, 0.08747673034667969, 0.0910043716430664, 0.09453201293945312, 0.09805965423583984, 0.10158729553222656, 0.10511493682861328, 0.108642578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 15.0, 12.0, 14.0, 13.0, 24.0, 19.0, 47.0, 62.0, 73.0, 137.0, 210.0, 415.0, 942.0, 2638.0, 9866.0, 59577.0, 614663.0, 310774.0, 38220.0, 7088.0, 2078.0, 715.0, 335.0, 205.0, 122.0, 78.0, 43.0, 45.0, 31.0, 15.0, 16.0, 12.0, 12.0, 14.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.37841796875, -0.36531829833984375, -0.3522186279296875, -0.33911895751953125, -0.326019287109375, -0.31291961669921875, -0.2998199462890625, -0.28672027587890625, -0.27362060546875, -0.26052093505859375, -0.2474212646484375, -0.23432159423828125, -0.221221923828125, -0.20812225341796875, -0.1950225830078125, -0.18192291259765625, -0.1688232421875, -0.15572357177734375, -0.1426239013671875, -0.12952423095703125, -0.116424560546875, -0.10332489013671875, -0.0902252197265625, -0.07712554931640625, -0.06402587890625, -0.05092620849609375, -0.0378265380859375, -0.02472686767578125, -0.011627197265625, 0.00147247314453125, 0.0145721435546875, 0.02767181396484375, 0.040771484375, 0.05387115478515625, 0.0669708251953125, 0.08007049560546875, 0.093170166015625, 0.10626983642578125, 0.1193695068359375, 0.13246917724609375, 0.14556884765625, 0.15866851806640625, 0.1717681884765625, 0.18486785888671875, 0.197967529296875, 0.21106719970703125, 0.2241668701171875, 0.23726654052734375, 0.2503662109375, 0.26346588134765625, 0.2765655517578125, 0.28966522216796875, 0.302764892578125, 0.31586456298828125, 0.3289642333984375, 0.34206390380859375, 0.35516357421875, 0.36826324462890625, 0.3813629150390625, 0.39446258544921875, 0.407562255859375, 0.42066192626953125, 0.4337615966796875, 0.44686126708984375, 0.4599609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 4.0, 3.0, 15.0, 22.0, 15.0, 23.0, 22.0, 24.0, 30.0, 44.0, 53.0, 40.0, 66.0, 64.0, 58.0, 66.0, 77.0, 56.0, 49.0, 56.0, 39.0, 37.0, 23.0, 27.0, 15.0, 14.0, 14.0, 5.0, 10.0, 10.0, 1.0, 3.0, 2.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65185546875, -0.6346702575683594, -0.6174850463867188, -0.6002998352050781, -0.5831146240234375, -0.5659294128417969, -0.5487442016601562, -0.5315589904785156, -0.514373779296875, -0.4971885681152344, -0.48000335693359375, -0.4628181457519531, -0.4456329345703125, -0.4284477233886719, -0.41126251220703125, -0.3940773010253906, -0.37689208984375, -0.3597068786621094, -0.34252166748046875, -0.3253364562988281, -0.3081512451171875, -0.2909660339355469, -0.27378082275390625, -0.2565956115722656, -0.239410400390625, -0.22222518920898438, -0.20503997802734375, -0.18785476684570312, -0.1706695556640625, -0.15348434448242188, -0.13629913330078125, -0.11911392211914062, -0.1019287109375, -0.08474349975585938, -0.06755828857421875, -0.050373077392578125, -0.0331878662109375, -0.016002655029296875, 0.00118255615234375, 0.018367767333984375, 0.035552978515625, 0.052738189697265625, 0.06992340087890625, 0.08710861206054688, 0.1042938232421875, 0.12147903442382812, 0.13866424560546875, 0.15584945678710938, 0.17303466796875, 0.19021987915039062, 0.20740509033203125, 0.22459030151367188, 0.2417755126953125, 0.2589607238769531, 0.27614593505859375, 0.2933311462402344, 0.310516357421875, 0.3277015686035156, 0.34488677978515625, 0.3620719909667969, 0.3792572021484375, 0.3964424133300781, 0.41362762451171875, 0.4308128356933594, 0.447998046875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 5.0, 6.0, 14.0, 18.0, 26.0, 25.0, 60.0, 154.0, 310.0, 863.0, 3344.0, 22108.0, 308376.0, 671058.0, 35664.0, 4683.0, 1111.0, 370.0, 173.0, 63.0, 36.0, 24.0, 19.0, 8.0, 9.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1513671875, -0.1459808349609375, -0.140594482421875, -0.1352081298828125, -0.12982177734375, -0.1244354248046875, -0.119049072265625, -0.1136627197265625, -0.1082763671875, -0.1028900146484375, -0.097503662109375, -0.0921173095703125, -0.08673095703125, -0.0813446044921875, -0.075958251953125, -0.0705718994140625, -0.065185546875, -0.0597991943359375, -0.054412841796875, -0.0490264892578125, -0.04364013671875, -0.0382537841796875, -0.032867431640625, -0.0274810791015625, -0.0220947265625, -0.0167083740234375, -0.011322021484375, -0.0059356689453125, -0.00054931640625, 0.0048370361328125, 0.010223388671875, 0.0156097412109375, 0.02099609375, 0.0263824462890625, 0.031768798828125, 0.0371551513671875, 0.04254150390625, 0.0479278564453125, 0.053314208984375, 0.0587005615234375, 0.0640869140625, 0.0694732666015625, 0.074859619140625, 0.0802459716796875, 0.08563232421875, 0.0910186767578125, 0.096405029296875, 0.1017913818359375, 0.107177734375, 0.1125640869140625, 0.117950439453125, 0.1233367919921875, 0.12872314453125, 0.1341094970703125, 0.139495849609375, 0.1448822021484375, 0.1502685546875, 0.1556549072265625, 0.161041259765625, 0.1664276123046875, 0.17181396484375, 0.1772003173828125, 0.182586669921875, 0.1879730224609375, 0.193359375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 4.0, 5.0, 6.0, 7.0, 10.0, 18.0, 17.0, 21.0, 8.0, 32.0, 44.0, 37.0, 48.0, 64.0, 71.0, 64.0, 86.0, 76.0, 72.0, 54.0, 53.0, 40.0, 30.0, 24.0, 17.0, 22.0, 11.0, 15.0, 10.0, 9.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.2172927856445312e-05, -2.1414831280708313e-05, -2.0656734704971313e-05, -1.9898638129234314e-05, -1.9140541553497314e-05, -1.8382444977760315e-05, -1.7624348402023315e-05, -1.6866251826286316e-05, -1.6108155250549316e-05, -1.5350058674812317e-05, -1.4591962099075317e-05, -1.3833865523338318e-05, -1.3075768947601318e-05, -1.2317672371864319e-05, -1.155957579612732e-05, -1.080147922039032e-05, -1.004338264465332e-05, -9.28528606891632e-06, -8.527189493179321e-06, -7.769092917442322e-06, -7.010996341705322e-06, -6.252899765968323e-06, -5.494803190231323e-06, -4.736706614494324e-06, -3.978610038757324e-06, -3.2205134630203247e-06, -2.462416887283325e-06, -1.7043203115463257e-06, -9.462237358093262e-07, -1.8812716007232666e-07, 5.699694156646729e-07, 1.3280659914016724e-06, 2.086162567138672e-06, 2.8442591428756714e-06, 3.602355718612671e-06, 4.36045229434967e-06, 5.11854887008667e-06, 5.8766454458236694e-06, 6.634742021560669e-06, 7.3928385972976685e-06, 8.150935173034668e-06, 8.909031748771667e-06, 9.667128324508667e-06, 1.0425224900245667e-05, 1.1183321475982666e-05, 1.1941418051719666e-05, 1.2699514627456665e-05, 1.3457611203193665e-05, 1.4215707778930664e-05, 1.4973804354667664e-05, 1.5731900930404663e-05, 1.6489997506141663e-05, 1.7248094081878662e-05, 1.800619065761566e-05, 1.876428723335266e-05, 1.952238380908966e-05, 2.028048038482666e-05, 2.103857696056366e-05, 2.179667353630066e-05, 2.255477011203766e-05, 2.3312866687774658e-05, 2.4070963263511658e-05, 2.4829059839248657e-05, 2.5587156414985657e-05, 2.6345252990722656e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 4.0, 10.0, 17.0, 20.0, 38.0, 65.0, 94.0, 178.0, 368.0, 874.0, 2621.0, 12233.0, 88753.0, 754744.0, 163085.0, 19521.0, 3867.0, 1089.0, 430.0, 220.0, 116.0, 64.0, 47.0, 28.0, 21.0, 12.0, 9.0, 9.0, 4.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.183349609375, -0.17883682250976562, -0.17432403564453125, -0.16981124877929688, -0.1652984619140625, -0.16078567504882812, -0.15627288818359375, -0.15176010131835938, -0.147247314453125, -0.14273452758789062, -0.13822174072265625, -0.13370895385742188, -0.1291961669921875, -0.12468338012695312, -0.12017059326171875, -0.11565780639648438, -0.11114501953125, -0.10663223266601562, -0.10211944580078125, -0.09760665893554688, -0.0930938720703125, -0.08858108520507812, -0.08406829833984375, -0.07955551147460938, -0.075042724609375, -0.07052993774414062, -0.06601715087890625, -0.061504364013671875, -0.0569915771484375, -0.052478790283203125, -0.04796600341796875, -0.043453216552734375, -0.0389404296875, -0.034427642822265625, -0.02991485595703125, -0.025402069091796875, -0.0208892822265625, -0.016376495361328125, -0.01186370849609375, -0.007350921630859375, -0.002838134765625, 0.001674652099609375, 0.00618743896484375, 0.010700225830078125, 0.0152130126953125, 0.019725799560546875, 0.02423858642578125, 0.028751373291015625, 0.03326416015625, 0.037776947021484375, 0.04228973388671875, 0.046802520751953125, 0.0513153076171875, 0.055828094482421875, 0.06034088134765625, 0.06485366821289062, 0.069366455078125, 0.07387924194335938, 0.07839202880859375, 0.08290481567382812, 0.0874176025390625, 0.09193038940429688, 0.09644317626953125, 0.10095596313476562, 0.10546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 1.0, 9.0, 9.0, 15.0, 10.0, 15.0, 15.0, 17.0, 21.0, 27.0, 39.0, 57.0, 54.0, 46.0, 64.0, 56.0, 51.0, 67.0, 60.0, 62.0, 45.0, 46.0, 36.0, 36.0, 22.0, 23.0, 15.0, 13.0, 9.0, 6.0, 6.0, 4.0, 4.0, 3.0, 6.0, 7.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0], "bins": [-0.0892333984375, -0.08663368225097656, -0.08403396606445312, -0.08143424987792969, -0.07883453369140625, -0.07623481750488281, -0.07363510131835938, -0.07103538513183594, -0.0684356689453125, -0.06583595275878906, -0.06323623657226562, -0.06063652038574219, -0.05803680419921875, -0.05543708801269531, -0.052837371826171875, -0.05023765563964844, -0.047637939453125, -0.04503822326660156, -0.042438507080078125, -0.03983879089355469, -0.03723907470703125, -0.03463935852050781, -0.032039642333984375, -0.029439926147460938, -0.0268402099609375, -0.024240493774414062, -0.021640777587890625, -0.019041061401367188, -0.01644134521484375, -0.013841629028320312, -0.011241912841796875, -0.008642196655273438, -0.00604248046875, -0.0034427642822265625, -0.000843048095703125, 0.0017566680908203125, 0.00435638427734375, 0.0069561004638671875, 0.009555816650390625, 0.012155532836914062, 0.0147552490234375, 0.017354965209960938, 0.019954681396484375, 0.022554397583007812, 0.02515411376953125, 0.027753829956054688, 0.030353546142578125, 0.03295326232910156, 0.035552978515625, 0.03815269470214844, 0.040752410888671875, 0.04335212707519531, 0.04595184326171875, 0.04855155944824219, 0.051151275634765625, 0.05375099182128906, 0.0563507080078125, 0.05895042419433594, 0.061550140380859375, 0.06414985656738281, 0.06674957275390625, 0.06934928894042969, 0.07194900512695312, 0.07454872131347656, 0.0771484375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 8.0, 8.0, 21.0, 43.0, 92.0, 160.0, 303.0, 193.0, 100.0, 28.0, 16.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.93854284286499, -4.832653045654297, -4.726762771606445, -4.620872974395752, -4.5149827003479, -4.409092903137207, -4.3032026290893555, -4.197312831878662, -4.091423034667969, -3.9855329990386963, -3.879642963409424, -3.7737529277801514, -3.667862892150879, -3.5619730949401855, -3.456083059310913, -3.3501930236816406, -3.244302749633789, -3.1384127140045166, -3.032522678375244, -2.9266326427459717, -2.820742607116699, -2.714852809906006, -2.6089627742767334, -2.503072738647461, -2.3971827030181885, -2.291292667388916, -2.1854026317596436, -2.079512596130371, -1.9736226797103882, -1.8677326440811157, -1.7618427276611328, -1.6559526920318604, -1.550062656402588, -1.4441726207733154, -1.338282585144043, -1.23239266872406, -1.1265026330947876, -1.0206125974655151, -0.9147226214408875, -0.8088326454162598, -0.7029426097869873, -0.5970525741577148, -0.49116259813308716, -0.3852725923061371, -0.279382586479187, -0.17349255084991455, -0.06760257482528687, 0.03828740119934082, 0.14417743682861328, 0.25006744265556335, 0.3559574484825134, 0.4618474543094635, 0.5677374601364136, 0.673627495765686, 0.7795174717903137, 0.8854074478149414, 0.9912974834442139, 1.0971875190734863, 1.2030775547027588, 1.3089674711227417, 1.4148575067520142, 1.5207475423812866, 1.6266374588012695, 1.732527494430542, 1.8384175300598145]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 0.0, 1.0, 5.0, 6.0, 7.0, 10.0, 6.0, 20.0, 16.0, 15.0, 18.0, 20.0, 25.0, 33.0, 24.0, 26.0, 31.0, 39.0, 51.0, 73.0, 75.0, 82.0, 53.0, 39.0, 50.0, 33.0, 35.0, 23.0, 34.0, 22.0, 17.0, 18.0, 13.0, 13.0, 13.0, 11.0, 7.0, 16.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.682951807975769, -1.6318519115447998, -1.5807520151138306, -1.5296521186828613, -1.4785523414611816, -1.4274523258209229, -1.3763525485992432, -1.325252652168274, -1.2741527557373047, -1.2230528593063354, -1.1719529628753662, -1.120853066444397, -1.0697531700134277, -1.018653392791748, -0.9675534963607788, -0.9164535999298096, -0.8653537034988403, -0.8142538070678711, -0.7631539106369019, -0.7120540738105774, -0.6609541773796082, -0.6098542809486389, -0.5587544441223145, -0.5076545476913452, -0.456554651260376, -0.40545475482940674, -0.3543548882007599, -0.30325502157211304, -0.2521551251411438, -0.20105522871017456, -0.1499553620815277, -0.09885549545288086, -0.04775547981262207, 0.003344401717185974, 0.05444428324699402, 0.10554416477680206, 0.1566440463066101, 0.20774394273757935, 0.2588438093662262, 0.30994367599487305, 0.3610435724258423, 0.4121434688568115, 0.4632433354854584, 0.5143432021141052, 0.5654430985450745, 0.6165429949760437, 0.6676428318023682, 0.7187427282333374, 0.7698426246643066, 0.8209425210952759, 0.8720424175262451, 0.9231422543525696, 0.9742421507835388, 1.0253419876098633, 1.0764418840408325, 1.1275417804718018, 1.178641676902771, 1.2297415733337402, 1.2808414697647095, 1.3319413661956787, 1.3830411434173584, 1.4341411590576172, 1.4852409362792969, 1.5363408327102661, 1.5874407291412354]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 2.0, 3.0, 5.0, 10.0, 10.0, 10.0, 11.0, 16.0, 23.0, 23.0, 34.0, 55.0, 51.0, 107.0, 194.0, 319.0, 488.0, 825.0, 1610.0, 3250.0, 7546.0, 21290.0, 96369.0, 871123.0, 2797727.0, 320834.0, 48210.0, 13244.0, 5387.0, 2475.0, 1218.0, 737.0, 372.0, 244.0, 137.0, 89.0, 57.0, 44.0, 34.0, 31.0, 16.0, 18.0, 12.0, 5.0, 5.0, 7.0, 2.0, 5.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.197265625, -0.1915130615234375, -0.185760498046875, -0.1800079345703125, -0.17425537109375, -0.1685028076171875, -0.162750244140625, -0.1569976806640625, -0.1512451171875, -0.1454925537109375, -0.139739990234375, -0.1339874267578125, -0.12823486328125, -0.1224822998046875, -0.116729736328125, -0.1109771728515625, -0.105224609375, -0.0994720458984375, -0.093719482421875, -0.0879669189453125, -0.08221435546875, -0.0764617919921875, -0.070709228515625, -0.0649566650390625, -0.0592041015625, -0.0534515380859375, -0.047698974609375, -0.0419464111328125, -0.03619384765625, -0.0304412841796875, -0.024688720703125, -0.0189361572265625, -0.01318359375, -0.0074310302734375, -0.001678466796875, 0.0040740966796875, 0.00982666015625, 0.0155792236328125, 0.021331787109375, 0.0270843505859375, 0.0328369140625, 0.0385894775390625, 0.044342041015625, 0.0500946044921875, 0.05584716796875, 0.0615997314453125, 0.067352294921875, 0.0731048583984375, 0.078857421875, 0.0846099853515625, 0.090362548828125, 0.0961151123046875, 0.10186767578125, 0.1076202392578125, 0.113372802734375, 0.1191253662109375, 0.1248779296875, 0.1306304931640625, 0.136383056640625, 0.1421356201171875, 0.14788818359375, 0.1536407470703125, 0.159393310546875, 0.1651458740234375, 0.1708984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 6.0, 13.0, 3.0, 5.0, 10.0, 7.0, 14.0, 16.0, 15.0, 18.0, 20.0, 24.0, 25.0, 30.0, 24.0, 27.0, 40.0, 35.0, 33.0, 60.0, 40.0, 33.0, 37.0, 41.0, 46.0, 33.0, 33.0, 37.0, 31.0, 20.0, 24.0, 27.0, 25.0, 20.0, 18.0, 23.0, 16.0, 13.0, 7.0, 8.0, 9.0, 3.0, 9.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.10565185546875, -0.10251235961914062, -0.09937286376953125, -0.09623336791992188, -0.0930938720703125, -0.08995437622070312, -0.08681488037109375, -0.08367538452148438, -0.080535888671875, -0.07739639282226562, -0.07425689697265625, -0.07111740112304688, -0.0679779052734375, -0.06483840942382812, -0.06169891357421875, -0.058559417724609375, -0.055419921875, -0.052280426025390625, -0.04914093017578125, -0.046001434326171875, -0.0428619384765625, -0.039722442626953125, -0.03658294677734375, -0.033443450927734375, -0.030303955078125, -0.027164459228515625, -0.02402496337890625, -0.020885467529296875, -0.0177459716796875, -0.014606475830078125, -0.01146697998046875, -0.008327484130859375, -0.00518798828125, -0.002048492431640625, 0.00109100341796875, 0.004230499267578125, 0.0073699951171875, 0.010509490966796875, 0.01364898681640625, 0.016788482666015625, 0.019927978515625, 0.023067474365234375, 0.02620697021484375, 0.029346466064453125, 0.0324859619140625, 0.035625457763671875, 0.03876495361328125, 0.041904449462890625, 0.0450439453125, 0.048183441162109375, 0.05132293701171875, 0.054462432861328125, 0.0576019287109375, 0.060741424560546875, 0.06388092041015625, 0.06702041625976562, 0.070159912109375, 0.07329940795898438, 0.07643890380859375, 0.07957839965820312, 0.0827178955078125, 0.08585739135742188, 0.08899688720703125, 0.09213638305664062, 0.09527587890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 8.0, 11.0, 10.0, 19.0, 25.0, 48.0, 65.0, 168.0, 301.0, 820.0, 2326.0, 9711.0, 91942.0, 3760931.0, 304042.0, 18070.0, 3670.0, 1158.0, 477.0, 179.0, 119.0, 59.0, 38.0, 23.0, 11.0, 8.0, 6.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.370361328125, -0.3574409484863281, -0.34452056884765625, -0.3316001892089844, -0.3186798095703125, -0.3057594299316406, -0.29283905029296875, -0.2799186706542969, -0.266998291015625, -0.2540779113769531, -0.24115753173828125, -0.22823715209960938, -0.2153167724609375, -0.20239639282226562, -0.18947601318359375, -0.17655563354492188, -0.16363525390625, -0.15071487426757812, -0.13779449462890625, -0.12487411499023438, -0.1119537353515625, -0.09903335571289062, -0.08611297607421875, -0.07319259643554688, -0.060272216796875, -0.047351837158203125, -0.03443145751953125, -0.021511077880859375, -0.0085906982421875, 0.004329681396484375, 0.01725006103515625, 0.030170440673828125, 0.0430908203125, 0.056011199951171875, 0.06893157958984375, 0.08185195922851562, 0.0947723388671875, 0.10769271850585938, 0.12061309814453125, 0.13353347778320312, 0.146453857421875, 0.15937423706054688, 0.17229461669921875, 0.18521499633789062, 0.1981353759765625, 0.21105575561523438, 0.22397613525390625, 0.23689651489257812, 0.24981689453125, 0.2627372741699219, 0.27565765380859375, 0.2885780334472656, 0.3014984130859375, 0.3144187927246094, 0.32733917236328125, 0.3402595520019531, 0.353179931640625, 0.3661003112792969, 0.37902069091796875, 0.3919410705566406, 0.4048614501953125, 0.4177818298339844, 0.43070220947265625, 0.4436225891113281, 0.45654296875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 6.0, 10.0, 8.0, 10.0, 25.0, 42.0, 61.0, 113.0, 221.0, 463.0, 962.0, 1082.0, 536.0, 244.0, 103.0, 70.0, 40.0, 24.0, 15.0, 8.0, 15.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279296875, -0.2676582336425781, -0.25601959228515625, -0.24438095092773438, -0.2327423095703125, -0.22110366821289062, -0.20946502685546875, -0.19782638549804688, -0.186187744140625, -0.17454910278320312, -0.16291046142578125, -0.15127182006835938, -0.1396331787109375, -0.12799453735351562, -0.11635589599609375, -0.10471725463867188, -0.09307861328125, -0.08143997192382812, -0.06980133056640625, -0.058162689208984375, -0.0465240478515625, -0.034885406494140625, -0.02324676513671875, -0.011608123779296875, 3.0517578125e-05, 0.011669158935546875, 0.02330780029296875, 0.034946441650390625, 0.0465850830078125, 0.058223724365234375, 0.06986236572265625, 0.08150100708007812, 0.0931396484375, 0.10477828979492188, 0.11641693115234375, 0.12805557250976562, 0.1396942138671875, 0.15133285522460938, 0.16297149658203125, 0.17461013793945312, 0.186248779296875, 0.19788742065429688, 0.20952606201171875, 0.22116470336914062, 0.2328033447265625, 0.24444198608398438, 0.25608062744140625, 0.2677192687988281, 0.27935791015625, 0.2909965515136719, 0.30263519287109375, 0.3142738342285156, 0.3259124755859375, 0.3375511169433594, 0.34918975830078125, 0.3608283996582031, 0.372467041015625, 0.3841056823730469, 0.39574432373046875, 0.4073829650878906, 0.4190216064453125, 0.4306602478027344, 0.44229888916015625, 0.4539375305175781, 0.465576171875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 14.0, 20.0, 51.0, 174.0, 333.0, 260.0, 91.0, 37.0, 13.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.620966911315918, -4.491460800170898, -4.361954212188721, -4.232448101043701, -4.102941513061523, -3.973435401916504, -3.8439290523529053, -3.7144227027893066, -3.584916353225708, -3.4554100036621094, -3.3259036540985107, -3.196397304534912, -3.0668911933898926, -2.937384605407715, -2.8078784942626953, -2.6783721446990967, -2.548865795135498, -2.4193594455718994, -2.289853096008301, -2.160346746444702, -2.0308403968811035, -1.9013341665267944, -1.7718279361724854, -1.6423215866088867, -1.512815237045288, -1.3833088874816895, -1.2538025379180908, -1.1242963075637817, -0.9947899580001831, -0.8652836084365845, -0.7357773184776306, -0.6062710285186768, -0.476764440536499, -0.3472581207752228, -0.21775180101394653, -0.08824548125267029, 0.04126083850860596, 0.1707671880722046, 0.30027347803115845, 0.4297797679901123, 0.5592861175537109, 0.6887924671173096, 0.8182987570762634, 0.9478050470352173, 1.077311396598816, 1.2068177461624146, 1.3363239765167236, 1.4658303260803223, 1.595336675643921, 1.7248430252075195, 1.8543493747711182, 1.9838556051254272, 2.1133618354797363, 2.242868423461914, 2.3723745346069336, 2.5018808841705322, 2.631387233734131, 2.7608935832977295, 2.890399932861328, 3.0199062824249268, 3.1494126319885254, 3.278918743133545, 3.4084250926971436, 3.537931442260742, 3.667437791824341]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 7.0, 7.0, 11.0, 9.0, 17.0, 15.0, 20.0, 19.0, 18.0, 24.0, 29.0, 23.0, 28.0, 34.0, 38.0, 44.0, 48.0, 42.0, 38.0, 45.0, 29.0, 36.0, 53.0, 40.0, 31.0, 33.0, 22.0, 37.0, 18.0, 26.0, 20.0, 25.0, 19.0, 18.0, 15.0, 3.0, 19.0, 6.0, 5.0, 3.0, 4.0, 3.0, 0.0, 5.0, 1.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.9687450528144836, -0.9358394742012024, -0.9029338955879211, -0.8700283169746399, -0.8371227383613586, -0.8042171597480774, -0.7713115215301514, -0.7384059429168701, -0.7055003643035889, -0.6725947856903076, -0.6396892070770264, -0.6067836284637451, -0.5738780498504639, -0.5409724712371826, -0.5080668926239014, -0.47516128420829773, -0.44225573539733887, -0.4093501567840576, -0.37644457817077637, -0.3435389995574951, -0.31063342094421387, -0.2777278423309326, -0.24482223391532898, -0.21191665530204773, -0.17901107668876648, -0.14610549807548523, -0.11319991201162338, -0.08029432594776154, -0.047388747334480286, -0.014483168721199036, 0.018422424793243408, 0.05132800340652466, 0.08423364162445068, 0.11713922023773193, 0.15004479885101318, 0.18295039236545563, 0.21585597097873688, 0.24876154959201813, 0.28166714310646057, 0.3145727217197418, 0.34747830033302307, 0.3803838789463043, 0.41328945755958557, 0.4461950659751892, 0.47910064458847046, 0.5120062232017517, 0.544911801815033, 0.5778173804283142, 0.6107229590415955, 0.6436285376548767, 0.676534116268158, 0.7094396948814392, 0.7423452734947205, 0.7752508521080017, 0.8081564903259277, 0.841062068939209, 0.8739676475524902, 0.9068732261657715, 0.9397788047790527, 0.972684383392334, 1.0055899620056152, 1.0384955406188965, 1.0714011192321777, 1.104306697845459, 1.1372122764587402]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 6.0, 9.0, 7.0, 9.0, 21.0, 21.0, 30.0, 34.0, 68.0, 105.0, 165.0, 206.0, 326.0, 543.0, 954.0, 1726.0, 3457.0, 7618.0, 18147.0, 50563.0, 150602.0, 369366.0, 285483.0, 100161.0, 34013.0, 13050.0, 5661.0, 2662.0, 1446.0, 831.0, 449.0, 256.0, 184.0, 129.0, 57.0, 49.0, 38.0, 27.0, 19.0, 21.0, 11.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.237060546875, -0.23025131225585938, -0.22344207763671875, -0.21663284301757812, -0.2098236083984375, -0.20301437377929688, -0.19620513916015625, -0.18939590454101562, -0.182586669921875, -0.17577743530273438, -0.16896820068359375, -0.16215896606445312, -0.1553497314453125, -0.14854049682617188, -0.14173126220703125, -0.13492202758789062, -0.12811279296875, -0.12130355834960938, -0.11449432373046875, -0.10768508911132812, -0.1008758544921875, -0.09406661987304688, -0.08725738525390625, -0.08044815063476562, -0.073638916015625, -0.06682968139648438, -0.06002044677734375, -0.053211212158203125, -0.0464019775390625, -0.039592742919921875, -0.03278350830078125, -0.025974273681640625, -0.0191650390625, -0.012355804443359375, -0.00554656982421875, 0.001262664794921875, 0.0080718994140625, 0.014881134033203125, 0.02169036865234375, 0.028499603271484375, 0.035308837890625, 0.042118072509765625, 0.04892730712890625, 0.055736541748046875, 0.0625457763671875, 0.06935501098632812, 0.07616424560546875, 0.08297348022460938, 0.08978271484375, 0.09659194946289062, 0.10340118408203125, 0.11021041870117188, 0.1170196533203125, 0.12382888793945312, 0.13063812255859375, 0.13744735717773438, 0.144256591796875, 0.15106582641601562, 0.15787506103515625, 0.16468429565429688, 0.1714935302734375, 0.17830276489257812, 0.18511199951171875, 0.19192123413085938, 0.19873046875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 4.0, 6.0, 8.0, 6.0, 3.0, 9.0, 7.0, 14.0, 16.0, 19.0, 13.0, 23.0, 21.0, 18.0, 30.0, 28.0, 34.0, 35.0, 43.0, 43.0, 40.0, 51.0, 58.0, 48.0, 47.0, 31.0, 38.0, 36.0, 34.0, 35.0, 20.0, 28.0, 23.0, 19.0, 22.0, 18.0, 19.0, 11.0, 9.0, 6.0, 5.0, 7.0, 6.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1090087890625, -0.10563182830810547, -0.10225486755371094, -0.0988779067993164, -0.09550094604492188, -0.09212398529052734, -0.08874702453613281, -0.08537006378173828, -0.08199310302734375, -0.07861614227294922, -0.07523918151855469, -0.07186222076416016, -0.06848526000976562, -0.0651082992553711, -0.06173133850097656, -0.05835437774658203, -0.0549774169921875, -0.05160045623779297, -0.04822349548339844, -0.044846534729003906, -0.041469573974609375, -0.038092613220214844, -0.03471565246582031, -0.03133869171142578, -0.02796173095703125, -0.02458477020263672, -0.021207809448242188, -0.017830848693847656, -0.014453887939453125, -0.011076927185058594, -0.0076999664306640625, -0.004323005676269531, -0.000946044921875, 0.0024309158325195312, 0.0058078765869140625, 0.009184837341308594, 0.012561798095703125, 0.015938758850097656, 0.019315719604492188, 0.02269268035888672, 0.02606964111328125, 0.02944660186767578, 0.03282356262207031, 0.036200523376464844, 0.039577484130859375, 0.042954444885253906, 0.04633140563964844, 0.04970836639404297, 0.0530853271484375, 0.05646228790283203, 0.05983924865722656, 0.0632162094116211, 0.06659317016601562, 0.06997013092041016, 0.07334709167480469, 0.07672405242919922, 0.08010101318359375, 0.08347797393798828, 0.08685493469238281, 0.09023189544677734, 0.09360885620117188, 0.0969858169555664, 0.10036277770996094, 0.10373973846435547, 0.10711669921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 8.0, 8.0, 11.0, 14.0, 31.0, 37.0, 48.0, 104.0, 169.0, 271.0, 521.0, 1099.0, 3090.0, 13620.0, 123386.0, 800454.0, 89870.0, 11064.0, 2655.0, 926.0, 485.0, 244.0, 142.0, 96.0, 59.0, 44.0, 27.0, 18.0, 13.0, 13.0, 9.0, 0.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.52880859375, -0.5153999328613281, -0.5019912719726562, -0.4885826110839844, -0.4751739501953125, -0.4617652893066406, -0.44835662841796875, -0.4349479675292969, -0.421539306640625, -0.4081306457519531, -0.39472198486328125, -0.3813133239746094, -0.3679046630859375, -0.3544960021972656, -0.34108734130859375, -0.3276786804199219, -0.31427001953125, -0.3008613586425781, -0.28745269775390625, -0.2740440368652344, -0.2606353759765625, -0.24722671508789062, -0.23381805419921875, -0.22040939331054688, -0.207000732421875, -0.19359207153320312, -0.18018341064453125, -0.16677474975585938, -0.1533660888671875, -0.13995742797851562, -0.12654876708984375, -0.11314010620117188, -0.0997314453125, -0.08632278442382812, -0.07291412353515625, -0.059505462646484375, -0.0460968017578125, -0.032688140869140625, -0.01927947998046875, -0.005870819091796875, 0.007537841796875, 0.020946502685546875, 0.03435516357421875, 0.047763824462890625, 0.0611724853515625, 0.07458114624023438, 0.08798980712890625, 0.10139846801757812, 0.11480712890625, 0.12821578979492188, 0.14162445068359375, 0.15503311157226562, 0.1684417724609375, 0.18185043334960938, 0.19525909423828125, 0.20866775512695312, 0.222076416015625, 0.23548507690429688, 0.24889373779296875, 0.2623023986816406, 0.2757110595703125, 0.2891197204589844, 0.30252838134765625, 0.3159370422363281, 0.329345703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 7.0, 3.0, 3.0, 2.0, 4.0, 3.0, 11.0, 4.0, 7.0, 8.0, 12.0, 11.0, 18.0, 19.0, 27.0, 23.0, 32.0, 45.0, 46.0, 53.0, 60.0, 57.0, 62.0, 43.0, 59.0, 47.0, 52.0, 57.0, 30.0, 46.0, 30.0, 24.0, 18.0, 14.0, 13.0, 16.0, 8.0, 5.0, 5.0, 7.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353271484375, -0.3397254943847656, -0.32617950439453125, -0.3126335144042969, -0.2990875244140625, -0.2855415344238281, -0.27199554443359375, -0.2584495544433594, -0.244903564453125, -0.23135757446289062, -0.21781158447265625, -0.20426559448242188, -0.1907196044921875, -0.17717361450195312, -0.16362762451171875, -0.15008163452148438, -0.13653564453125, -0.12298965454101562, -0.10944366455078125, -0.09589767456054688, -0.0823516845703125, -0.06880569458007812, -0.05525970458984375, -0.041713714599609375, -0.028167724609375, -0.014621734619140625, -0.00107574462890625, 0.012470245361328125, 0.0260162353515625, 0.039562225341796875, 0.05310821533203125, 0.06665420532226562, 0.0802001953125, 0.09374618530273438, 0.10729217529296875, 0.12083816528320312, 0.1343841552734375, 0.14793014526367188, 0.16147613525390625, 0.17502212524414062, 0.188568115234375, 0.20211410522460938, 0.21566009521484375, 0.22920608520507812, 0.2427520751953125, 0.2562980651855469, 0.26984405517578125, 0.2833900451660156, 0.29693603515625, 0.3104820251464844, 0.32402801513671875, 0.3375740051269531, 0.3511199951171875, 0.3646659851074219, 0.37821197509765625, 0.3917579650878906, 0.405303955078125, 0.4188499450683594, 0.43239593505859375, 0.4459419250488281, 0.4594879150390625, 0.4730339050292969, 0.48657989501953125, 0.5001258850097656, 0.513671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 7.0, 6.0, 3.0, 6.0, 8.0, 14.0, 28.0, 27.0, 36.0, 58.0, 88.0, 129.0, 229.0, 388.0, 706.0, 1345.0, 2906.0, 7297.0, 23759.0, 138705.0, 757641.0, 86423.0, 17705.0, 5956.0, 2452.0, 1073.0, 611.0, 325.0, 225.0, 128.0, 83.0, 63.0, 31.0, 27.0, 17.0, 18.0, 6.0, 7.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1124267578125, -0.10915756225585938, -0.10588836669921875, -0.10261917114257812, -0.0993499755859375, -0.09608078002929688, -0.09281158447265625, -0.08954238891601562, -0.086273193359375, -0.08300399780273438, -0.07973480224609375, -0.07646560668945312, -0.0731964111328125, -0.06992721557617188, -0.06665802001953125, -0.06338882446289062, -0.06011962890625, -0.056850433349609375, -0.05358123779296875, -0.050312042236328125, -0.0470428466796875, -0.043773651123046875, -0.04050445556640625, -0.037235260009765625, -0.033966064453125, -0.030696868896484375, -0.02742767333984375, -0.024158477783203125, -0.0208892822265625, -0.017620086669921875, -0.01435089111328125, -0.011081695556640625, -0.0078125, -0.004543304443359375, -0.00127410888671875, 0.001995086669921875, 0.0052642822265625, 0.008533477783203125, 0.01180267333984375, 0.015071868896484375, 0.018341064453125, 0.021610260009765625, 0.02487945556640625, 0.028148651123046875, 0.0314178466796875, 0.034687042236328125, 0.03795623779296875, 0.041225433349609375, 0.04449462890625, 0.047763824462890625, 0.05103302001953125, 0.054302215576171875, 0.0575714111328125, 0.060840606689453125, 0.06410980224609375, 0.06737899780273438, 0.070648193359375, 0.07391738891601562, 0.07718658447265625, 0.08045578002929688, 0.0837249755859375, 0.08699417114257812, 0.09026336669921875, 0.09353256225585938, 0.0968017578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 9.0, 6.0, 10.0, 13.0, 18.0, 26.0, 43.0, 72.0, 94.0, 127.0, 127.0, 116.0, 86.0, 73.0, 41.0, 35.0, 23.0, 27.0, 15.0, 3.0, 3.0, 9.0, 2.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0100345611572266e-05, -2.917274832725525e-05, -2.8245151042938232e-05, -2.7317553758621216e-05, -2.63899564743042e-05, -2.5462359189987183e-05, -2.4534761905670166e-05, -2.360716462135315e-05, -2.2679567337036133e-05, -2.1751970052719116e-05, -2.08243727684021e-05, -1.9896775484085083e-05, -1.8969178199768066e-05, -1.804158091545105e-05, -1.7113983631134033e-05, -1.6186386346817017e-05, -1.52587890625e-05, -1.4331191778182983e-05, -1.3403594493865967e-05, -1.247599720954895e-05, -1.1548399925231934e-05, -1.0620802640914917e-05, -9.6932053565979e-06, -8.765608072280884e-06, -7.838010787963867e-06, -6.910413503646851e-06, -5.982816219329834e-06, -5.055218935012817e-06, -4.127621650695801e-06, -3.200024366378784e-06, -2.2724270820617676e-06, -1.344829797744751e-06, -4.172325134277344e-07, 5.103647708892822e-07, 1.4379620552062988e-06, 2.3655593395233154e-06, 3.293156623840332e-06, 4.220753908157349e-06, 5.148351192474365e-06, 6.075948476791382e-06, 7.0035457611083984e-06, 7.931143045425415e-06, 8.858740329742432e-06, 9.786337614059448e-06, 1.0713934898376465e-05, 1.1641532182693481e-05, 1.2569129467010498e-05, 1.3496726751327515e-05, 1.4424324035644531e-05, 1.5351921319961548e-05, 1.6279518604278564e-05, 1.720711588859558e-05, 1.8134713172912598e-05, 1.9062310457229614e-05, 1.998990774154663e-05, 2.0917505025863647e-05, 2.1845102310180664e-05, 2.277269959449768e-05, 2.3700296878814697e-05, 2.4627894163131714e-05, 2.555549144744873e-05, 2.6483088731765747e-05, 2.7410686016082764e-05, 2.833828330039978e-05, 2.9265880584716797e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 8.0, 14.0, 15.0, 14.0, 19.0, 32.0, 41.0, 59.0, 106.0, 160.0, 310.0, 531.0, 1310.0, 3787.0, 14389.0, 83829.0, 801759.0, 117330.0, 17367.0, 4453.0, 1559.0, 610.0, 333.0, 183.0, 110.0, 69.0, 59.0, 30.0, 21.0, 15.0, 19.0, 3.0, 11.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09844970703125, -0.09474468231201172, -0.09103965759277344, -0.08733463287353516, -0.08362960815429688, -0.0799245834350586, -0.07621955871582031, -0.07251453399658203, -0.06880950927734375, -0.06510448455810547, -0.06139945983886719, -0.057694435119628906, -0.053989410400390625, -0.050284385681152344, -0.04657936096191406, -0.04287433624267578, -0.0391693115234375, -0.03546428680419922, -0.03175926208496094, -0.028054237365722656, -0.024349212646484375, -0.020644187927246094, -0.016939163208007812, -0.013234138488769531, -0.00952911376953125, -0.005824089050292969, -0.0021190643310546875, 0.0015859603881835938, 0.005290985107421875, 0.008996009826660156, 0.012701034545898438, 0.01640605926513672, 0.020111083984375, 0.02381610870361328, 0.027521133422851562, 0.031226158142089844, 0.034931182861328125, 0.038636207580566406, 0.04234123229980469, 0.04604625701904297, 0.04975128173828125, 0.05345630645751953, 0.05716133117675781, 0.060866355895996094, 0.06457138061523438, 0.06827640533447266, 0.07198143005371094, 0.07568645477294922, 0.0793914794921875, 0.08309650421142578, 0.08680152893066406, 0.09050655364990234, 0.09421157836914062, 0.0979166030883789, 0.10162162780761719, 0.10532665252685547, 0.10903167724609375, 0.11273670196533203, 0.11644172668457031, 0.1201467514038086, 0.12385177612304688, 0.12755680084228516, 0.13126182556152344, 0.13496685028076172, 0.138671875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 11.0, 7.0, 12.0, 8.0, 8.0, 18.0, 23.0, 15.0, 36.0, 49.0, 65.0, 76.0, 107.0, 106.0, 92.0, 92.0, 57.0, 41.0, 32.0, 27.0, 34.0, 16.0, 17.0, 14.0, 10.0, 5.0, 5.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08734130859375, -0.08433246612548828, -0.08132362365722656, -0.07831478118896484, -0.07530593872070312, -0.0722970962524414, -0.06928825378417969, -0.06627941131591797, -0.06327056884765625, -0.06026172637939453, -0.05725288391113281, -0.054244041442871094, -0.051235198974609375, -0.048226356506347656, -0.04521751403808594, -0.04220867156982422, -0.0391998291015625, -0.03619098663330078, -0.03318214416503906, -0.030173301696777344, -0.027164459228515625, -0.024155616760253906, -0.021146774291992188, -0.01813793182373047, -0.01512908935546875, -0.012120246887207031, -0.009111404418945312, -0.006102561950683594, -0.003093719482421875, -8.487701416015625e-05, 0.0029239654541015625, 0.005932807922363281, 0.008941650390625, 0.011950492858886719, 0.014959335327148438, 0.017968177795410156, 0.020977020263671875, 0.023985862731933594, 0.026994705200195312, 0.03000354766845703, 0.03301239013671875, 0.03602123260498047, 0.03903007507324219, 0.042038917541503906, 0.045047760009765625, 0.048056602478027344, 0.05106544494628906, 0.05407428741455078, 0.0570831298828125, 0.06009197235107422, 0.06310081481933594, 0.06610965728759766, 0.06911849975585938, 0.0721273422241211, 0.07513618469238281, 0.07814502716064453, 0.08115386962890625, 0.08416271209716797, 0.08717155456542969, 0.0901803970336914, 0.09318923950195312, 0.09619808197021484, 0.09920692443847656, 0.10221576690673828, 0.105224609375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 12.0, 22.0, 51.0, 91.0, 175.0, 323.0, 139.0, 88.0, 35.0, 26.0, 7.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.404208183288574, -2.319385051727295, -2.2345621585845947, -2.1497392654418945, -2.0649161338806152, -1.9800931215286255, -1.8952701091766357, -1.810447096824646, -1.7256240844726562, -1.6408010721206665, -1.5559780597686768, -1.471155047416687, -1.3863320350646973, -1.3015090227127075, -1.2166860103607178, -1.131862998008728, -1.0470399856567383, -0.9622169733047485, -0.8773939609527588, -0.792570948600769, -0.7077479362487793, -0.6229249238967896, -0.5381019115447998, -0.45327889919281006, -0.3684558868408203, -0.28363287448883057, -0.19880986213684082, -0.11398684978485107, -0.029163837432861328, 0.05565917491912842, 0.14048218727111816, 0.2253051996231079, 0.31012821197509766, 0.3949512243270874, 0.47977423667907715, 0.5645972490310669, 0.6494202613830566, 0.7342432737350464, 0.8190662860870361, 0.9038892984390259, 0.9887123107910156, 1.0735353231430054, 1.1583583354949951, 1.2431813478469849, 1.3280043601989746, 1.4128273725509644, 1.497650384902954, 1.5824733972549438, 1.6672964096069336, 1.7521194219589233, 1.836942434310913, 1.9217654466629028, 2.0065884590148926, 2.091411590576172, 2.176234483718872, 2.2610573768615723, 2.3458805084228516, 2.430703639984131, 2.515526533126831, 2.6003494262695312, 2.6851725578308105, 2.76999568939209, 2.85481858253479, 2.9396414756774902, 3.0244646072387695]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 7.0, 4.0, 6.0, 4.0, 9.0, 10.0, 6.0, 18.0, 16.0, 22.0, 29.0, 22.0, 14.0, 29.0, 39.0, 39.0, 51.0, 74.0, 123.0, 87.0, 50.0, 37.0, 33.0, 41.0, 24.0, 32.0, 27.0, 19.0, 18.0, 21.0, 17.0, 13.0, 9.0, 8.0, 9.0, 8.0, 3.0, 4.0, 2.0, 3.0, 9.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7743232250213623, -1.7247140407562256, -1.6751049757003784, -1.6254957914352417, -1.5758867263793945, -1.5262775421142578, -1.4766684770584106, -1.427059292793274, -1.3774502277374268, -1.32784104347229, -1.2782319784164429, -1.2286227941513062, -1.179013729095459, -1.1294045448303223, -1.079795479774475, -1.0301862955093384, -0.9805771708488464, -0.9309680461883545, -0.8813589215278625, -0.8317497968673706, -0.7821406722068787, -0.7325315475463867, -0.68292236328125, -0.6333132982254028, -0.5837041139602661, -0.5340949892997742, -0.4844858646392822, -0.4348767399787903, -0.38526761531829834, -0.3356584906578064, -0.28604933619499207, -0.23644021153450012, -0.18683111667633057, -0.13722199201583862, -0.08761285990476608, -0.03800372779369354, 0.011605396866798401, 0.061214521527290344, 0.11082366108894348, 0.16043278574943542, 0.21004191040992737, 0.2596510350704193, 0.30926015973091125, 0.3588693141937256, 0.40847843885421753, 0.4580875635147095, 0.5076966881752014, 0.5573058128356934, 0.6069149374961853, 0.6565240621566772, 0.7061331868171692, 0.7557423114776611, 0.8053514361381531, 0.854960560798645, 0.9045697450637817, 0.9541788101196289, 1.0037879943847656, 1.0533971786499023, 1.1030062437057495, 1.1526154279708862, 1.2022244930267334, 1.2518336772918701, 1.3014427423477173, 1.351051926612854, 1.4006609916687012]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 5.0, 6.0, 6.0, 13.0, 18.0, 22.0, 35.0, 47.0, 66.0, 101.0, 170.0, 239.0, 412.0, 719.0, 1114.0, 2065.0, 4015.0, 8478.0, 22646.0, 88834.0, 610541.0, 2670328.0, 645584.0, 97425.0, 23344.0, 8809.0, 4086.0, 2133.0, 1153.0, 715.0, 427.0, 280.0, 146.0, 97.0, 61.0, 46.0, 33.0, 21.0, 11.0, 8.0, 9.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1646728515625, -0.159759521484375, -0.15484619140625, -0.149932861328125, -0.14501953125, -0.140106201171875, -0.13519287109375, -0.130279541015625, -0.1253662109375, -0.120452880859375, -0.11553955078125, -0.110626220703125, -0.105712890625, -0.100799560546875, -0.09588623046875, -0.090972900390625, -0.0860595703125, -0.081146240234375, -0.07623291015625, -0.071319580078125, -0.06640625, -0.061492919921875, -0.05657958984375, -0.051666259765625, -0.0467529296875, -0.041839599609375, -0.03692626953125, -0.032012939453125, -0.027099609375, -0.022186279296875, -0.01727294921875, -0.012359619140625, -0.0074462890625, -0.002532958984375, 0.00238037109375, 0.007293701171875, 0.01220703125, 0.017120361328125, 0.02203369140625, 0.026947021484375, 0.0318603515625, 0.036773681640625, 0.04168701171875, 0.046600341796875, 0.051513671875, 0.056427001953125, 0.06134033203125, 0.066253662109375, 0.0711669921875, 0.076080322265625, 0.08099365234375, 0.085906982421875, 0.0908203125, 0.095733642578125, 0.10064697265625, 0.105560302734375, 0.1104736328125, 0.115386962890625, 0.12030029296875, 0.125213623046875, 0.130126953125, 0.135040283203125, 0.13995361328125, 0.144866943359375, 0.1497802734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 8.0, 3.0, 3.0, 6.0, 5.0, 10.0, 13.0, 12.0, 10.0, 8.0, 15.0, 24.0, 14.0, 28.0, 26.0, 34.0, 31.0, 37.0, 37.0, 45.0, 53.0, 48.0, 45.0, 45.0, 41.0, 39.0, 33.0, 36.0, 35.0, 31.0, 28.0, 20.0, 36.0, 28.0, 24.0, 14.0, 15.0, 7.0, 11.0, 8.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.10540771484375, -0.10235023498535156, -0.09929275512695312, -0.09623527526855469, -0.09317779541015625, -0.09012031555175781, -0.08706283569335938, -0.08400535583496094, -0.0809478759765625, -0.07789039611816406, -0.07483291625976562, -0.07177543640136719, -0.06871795654296875, -0.06566047668457031, -0.06260299682617188, -0.05954551696777344, -0.056488037109375, -0.05343055725097656, -0.050373077392578125, -0.04731559753417969, -0.04425811767578125, -0.04120063781738281, -0.038143157958984375, -0.03508567810058594, -0.0320281982421875, -0.028970718383789062, -0.025913238525390625, -0.022855758666992188, -0.01979827880859375, -0.016740798950195312, -0.013683319091796875, -0.010625839233398438, -0.007568359375, -0.0045108795166015625, -0.001453399658203125, 0.0016040802001953125, 0.00466156005859375, 0.0077190399169921875, 0.010776519775390625, 0.013833999633789062, 0.0168914794921875, 0.019948959350585938, 0.023006439208984375, 0.026063919067382812, 0.02912139892578125, 0.03217887878417969, 0.035236358642578125, 0.03829383850097656, 0.041351318359375, 0.04440879821777344, 0.047466278076171875, 0.05052375793457031, 0.05358123779296875, 0.05663871765136719, 0.059696197509765625, 0.06275367736816406, 0.0658111572265625, 0.06886863708496094, 0.07192611694335938, 0.07498359680175781, 0.07804107666015625, 0.08109855651855469, 0.08415603637695312, 0.08721351623535156, 0.09027099609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 4.0, 8.0, 11.0, 19.0, 20.0, 25.0, 41.0, 48.0, 90.0, 165.0, 346.0, 828.0, 2805.0, 13430.0, 127950.0, 3676762.0, 342168.0, 23179.0, 4187.0, 1263.0, 420.0, 193.0, 112.0, 57.0, 41.0, 28.0, 22.0, 13.0, 15.0, 11.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.294677734375, -0.2843894958496094, -0.27410125732421875, -0.2638130187988281, -0.2535247802734375, -0.24323654174804688, -0.23294830322265625, -0.22266006469726562, -0.212371826171875, -0.20208358764648438, -0.19179534912109375, -0.18150711059570312, -0.1712188720703125, -0.16093063354492188, -0.15064239501953125, -0.14035415649414062, -0.13006591796875, -0.11977767944335938, -0.10948944091796875, -0.09920120239257812, -0.0889129638671875, -0.07862472534179688, -0.06833648681640625, -0.058048248291015625, -0.047760009765625, -0.037471771240234375, -0.02718353271484375, -0.016895294189453125, -0.0066070556640625, 0.003681182861328125, 0.01396942138671875, 0.024257659912109375, 0.0345458984375, 0.044834136962890625, 0.05512237548828125, 0.06541061401367188, 0.0756988525390625, 0.08598709106445312, 0.09627532958984375, 0.10656356811523438, 0.116851806640625, 0.12714004516601562, 0.13742828369140625, 0.14771652221679688, 0.1580047607421875, 0.16829299926757812, 0.17858123779296875, 0.18886947631835938, 0.19915771484375, 0.20944595336914062, 0.21973419189453125, 0.23002243041992188, 0.2403106689453125, 0.2505989074707031, 0.26088714599609375, 0.2711753845214844, 0.281463623046875, 0.2917518615722656, 0.30204010009765625, 0.3123283386230469, 0.3226165771484375, 0.3329048156738281, 0.34319305419921875, 0.3534812927246094, 0.36376953125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 9.0, 5.0, 12.0, 13.0, 19.0, 16.0, 37.0, 50.0, 55.0, 93.0, 116.0, 186.0, 346.0, 475.0, 705.0, 648.0, 450.0, 276.0, 158.0, 102.0, 81.0, 59.0, 38.0, 27.0, 20.0, 16.0, 12.0, 10.0, 8.0, 9.0, 6.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.222412109375, -0.215423583984375, -0.20843505859375, -0.201446533203125, -0.1944580078125, -0.187469482421875, -0.18048095703125, -0.173492431640625, -0.16650390625, -0.159515380859375, -0.15252685546875, -0.145538330078125, -0.1385498046875, -0.131561279296875, -0.12457275390625, -0.117584228515625, -0.110595703125, -0.103607177734375, -0.09661865234375, -0.089630126953125, -0.0826416015625, -0.075653076171875, -0.06866455078125, -0.061676025390625, -0.0546875, -0.047698974609375, -0.04071044921875, -0.033721923828125, -0.0267333984375, -0.019744873046875, -0.01275634765625, -0.005767822265625, 0.001220703125, 0.008209228515625, 0.01519775390625, 0.022186279296875, 0.0291748046875, 0.036163330078125, 0.04315185546875, 0.050140380859375, 0.05712890625, 0.064117431640625, 0.07110595703125, 0.078094482421875, 0.0850830078125, 0.092071533203125, 0.09906005859375, 0.106048583984375, 0.113037109375, 0.120025634765625, 0.12701416015625, 0.134002685546875, 0.1409912109375, 0.147979736328125, 0.15496826171875, 0.161956787109375, 0.1689453125, 0.175933837890625, 0.18292236328125, 0.189910888671875, 0.1968994140625, 0.203887939453125, 0.21087646484375, 0.217864990234375, 0.224853515625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 9.0, 16.0, 14.0, 28.0, 44.0, 57.0, 115.0, 114.0, 134.0, 124.0, 105.0, 67.0, 65.0, 35.0, 18.0, 10.0, 12.0, 5.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5559303760528564, -1.5110000371932983, -1.4660696983337402, -1.4211394786834717, -1.3762091398239136, -1.3312788009643555, -1.2863484621047974, -1.2414181232452393, -1.1964879035949707, -1.1515575647354126, -1.1066272258758545, -1.061697006225586, -1.0167666673660278, -0.9718363285064697, -0.9269059896469116, -0.8819756507873535, -0.8370453119277954, -0.7921149730682373, -0.747184693813324, -0.7022543549537659, -0.6573240756988525, -0.6123937368392944, -0.5674633979797363, -0.5225330591201782, -0.4776027798652649, -0.4326724708080292, -0.38774216175079346, -0.34281182289123535, -0.29788151383399963, -0.2529512047767639, -0.2080208659172058, -0.1630905568599701, -0.11816024780273438, -0.07322993129491806, -0.028299614787101746, 0.016630709171295166, 0.061561018228530884, 0.1064913272857666, 0.1514216661453247, 0.19635197520256042, 0.24128228425979614, 0.28621259331703186, 0.3311429023742676, 0.3760732412338257, 0.4210035502910614, 0.4659338593482971, 0.5108641982078552, 0.5557944774627686, 0.6007248163223267, 0.6456551551818848, 0.6905854344367981, 0.7355157732963562, 0.7804460525512695, 0.8253763914108276, 0.8703067302703857, 0.9152370691299438, 0.9601673483848572, 1.0050976276397705, 1.0500279664993286, 1.0949583053588867, 1.1398886442184448, 1.184818983078003, 1.2297492027282715, 1.2746795415878296, 1.3196098804473877]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 9.0, 2.0, 5.0, 12.0, 8.0, 14.0, 21.0, 16.0, 20.0, 29.0, 22.0, 19.0, 29.0, 24.0, 34.0, 29.0, 43.0, 47.0, 44.0, 38.0, 48.0, 49.0, 46.0, 43.0, 33.0, 32.0, 29.0, 23.0, 37.0, 15.0, 29.0, 15.0, 19.0, 16.0, 15.0, 15.0, 8.0, 7.0, 4.0, 5.0, 7.0, 8.0, 4.0, 6.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.727314293384552, -0.7006673812866211, -0.674020528793335, -0.647373616695404, -0.6207267642021179, -0.594079852104187, -0.5674329996109009, -0.54078608751297, -0.5141391754150391, -0.48749229311943054, -0.460845410823822, -0.4341984987258911, -0.407551646232605, -0.3809047341346741, -0.35425785183906555, -0.32761096954345703, -0.3009641170501709, -0.2743172347545624, -0.24767035245895386, -0.22102345526218414, -0.19437657296657562, -0.1677296906709671, -0.1410827934741974, -0.11443591117858887, -0.08778902888298035, -0.06114214286208153, -0.03449525684118271, -0.007848367094993591, 0.01879851520061493, 0.04544539749622345, 0.07209229469299316, 0.09873917698860168, 0.12538599967956543, 0.15203288197517395, 0.17867976427078247, 0.20532666146755219, 0.2319735437631607, 0.2586204409599304, 0.28526732325553894, 0.31191420555114746, 0.338561087846756, 0.3652079701423645, 0.391854852437973, 0.41850173473358154, 0.44514864683151245, 0.4717954993247986, 0.4984424114227295, 0.5250892639160156, 0.5517361760139465, 0.5783830881118774, 0.6050299406051636, 0.6316768527030945, 0.6583237051963806, 0.6849706172943115, 0.7116174697875977, 0.7382643818855286, 0.7649112939834595, 0.7915582060813904, 0.8182050585746765, 0.8448519706726074, 0.8714988231658936, 0.8981457352638245, 0.9247926473617554, 0.9514394998550415, 0.9780863523483276]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 12.0, 14.0, 10.0, 37.0, 27.0, 47.0, 70.0, 71.0, 135.0, 207.0, 318.0, 553.0, 879.0, 1659.0, 3081.0, 6041.0, 12808.0, 30055.0, 78874.0, 230095.0, 397857.0, 177448.0, 61946.0, 24366.0, 10574.0, 5061.0, 2714.0, 1467.0, 811.0, 448.0, 300.0, 199.0, 122.0, 72.0, 54.0, 36.0, 32.0, 13.0, 21.0, 8.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.224365234375, -0.21764373779296875, -0.2109222412109375, -0.20420074462890625, -0.197479248046875, -0.19075775146484375, -0.1840362548828125, -0.17731475830078125, -0.17059326171875, -0.16387176513671875, -0.1571502685546875, -0.15042877197265625, -0.143707275390625, -0.13698577880859375, -0.1302642822265625, -0.12354278564453125, -0.1168212890625, -0.11009979248046875, -0.1033782958984375, -0.09665679931640625, -0.089935302734375, -0.08321380615234375, -0.0764923095703125, -0.06977081298828125, -0.06304931640625, -0.05632781982421875, -0.0496063232421875, -0.04288482666015625, -0.036163330078125, -0.02944183349609375, -0.0227203369140625, -0.01599884033203125, -0.00927734375, -0.00255584716796875, 0.0041656494140625, 0.01088714599609375, 0.017608642578125, 0.02433013916015625, 0.0310516357421875, 0.03777313232421875, 0.04449462890625, 0.05121612548828125, 0.0579376220703125, 0.06465911865234375, 0.071380615234375, 0.07810211181640625, 0.0848236083984375, 0.09154510498046875, 0.0982666015625, 0.10498809814453125, 0.1117095947265625, 0.11843109130859375, 0.125152587890625, 0.13187408447265625, 0.1385955810546875, 0.14531707763671875, 0.15203857421875, 0.15876007080078125, 0.1654815673828125, 0.17220306396484375, 0.178924560546875, 0.18564605712890625, 0.1923675537109375, 0.19908905029296875, 0.205810546875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 9.0, 6.0, 6.0, 7.0, 10.0, 11.0, 9.0, 13.0, 17.0, 19.0, 16.0, 21.0, 29.0, 26.0, 30.0, 39.0, 27.0, 41.0, 57.0, 45.0, 40.0, 46.0, 47.0, 49.0, 34.0, 39.0, 28.0, 27.0, 35.0, 35.0, 28.0, 21.0, 17.0, 18.0, 14.0, 16.0, 11.0, 20.0, 11.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.10406494140625, -0.10093879699707031, -0.09781265258789062, -0.09468650817871094, -0.09156036376953125, -0.08843421936035156, -0.08530807495117188, -0.08218193054199219, -0.0790557861328125, -0.07592964172363281, -0.07280349731445312, -0.06967735290527344, -0.06655120849609375, -0.06342506408691406, -0.060298919677734375, -0.05717277526855469, -0.054046630859375, -0.05092048645019531, -0.047794342041015625, -0.04466819763183594, -0.04154205322265625, -0.03841590881347656, -0.035289764404296875, -0.03216361999511719, -0.0290374755859375, -0.025911331176757812, -0.022785186767578125, -0.019659042358398438, -0.01653289794921875, -0.013406753540039062, -0.010280609130859375, -0.0071544647216796875, -0.0040283203125, -0.0009021759033203125, 0.002223968505859375, 0.0053501129150390625, 0.00847625732421875, 0.011602401733398438, 0.014728546142578125, 0.017854690551757812, 0.0209808349609375, 0.024106979370117188, 0.027233123779296875, 0.030359268188476562, 0.03348541259765625, 0.03661155700683594, 0.039737701416015625, 0.04286384582519531, 0.045989990234375, 0.04911613464355469, 0.052242279052734375, 0.05536842346191406, 0.05849456787109375, 0.06162071228027344, 0.06474685668945312, 0.06787300109863281, 0.0709991455078125, 0.07412528991699219, 0.07725143432617188, 0.08037757873535156, 0.08350372314453125, 0.08662986755371094, 0.08975601196289062, 0.09288215637207031, 0.09600830078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 10.0, 15.0, 13.0, 21.0, 28.0, 51.0, 60.0, 93.0, 113.0, 163.0, 224.0, 359.0, 622.0, 1067.0, 2264.0, 5684.0, 19115.0, 104963.0, 747878.0, 131395.0, 22734.0, 6261.0, 2476.0, 1131.0, 625.0, 395.0, 231.0, 157.0, 114.0, 72.0, 55.0, 49.0, 24.0, 24.0, 17.0, 13.0, 8.0, 8.0, 2.0, 0.0, 3.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.250732421875, -0.2409210205078125, -0.231109619140625, -0.2212982177734375, -0.21148681640625, -0.2016754150390625, -0.191864013671875, -0.1820526123046875, -0.1722412109375, -0.1624298095703125, -0.152618408203125, -0.1428070068359375, -0.13299560546875, -0.1231842041015625, -0.113372802734375, -0.1035614013671875, -0.09375, -0.0839385986328125, -0.074127197265625, -0.0643157958984375, -0.05450439453125, -0.0446929931640625, -0.034881591796875, -0.0250701904296875, -0.0152587890625, -0.0054473876953125, 0.004364013671875, 0.0141754150390625, 0.02398681640625, 0.0337982177734375, 0.043609619140625, 0.0534210205078125, 0.063232421875, 0.0730438232421875, 0.082855224609375, 0.0926666259765625, 0.10247802734375, 0.1122894287109375, 0.122100830078125, 0.1319122314453125, 0.1417236328125, 0.1515350341796875, 0.161346435546875, 0.1711578369140625, 0.18096923828125, 0.1907806396484375, 0.200592041015625, 0.2104034423828125, 0.22021484375, 0.2300262451171875, 0.239837646484375, 0.2496490478515625, 0.25946044921875, 0.2692718505859375, 0.279083251953125, 0.2888946533203125, 0.2987060546875, 0.3085174560546875, 0.318328857421875, 0.3281402587890625, 0.33795166015625, 0.3477630615234375, 0.357574462890625, 0.3673858642578125, 0.377197265625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 6.0, 1.0, 2.0, 2.0, 9.0, 9.0, 7.0, 10.0, 10.0, 18.0, 15.0, 19.0, 31.0, 23.0, 23.0, 27.0, 41.0, 41.0, 43.0, 48.0, 53.0, 54.0, 47.0, 48.0, 54.0, 47.0, 50.0, 41.0, 39.0, 33.0, 23.0, 28.0, 21.0, 13.0, 13.0, 7.0, 13.0, 7.0, 8.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.35546875, -0.34333038330078125, -0.3311920166015625, -0.31905364990234375, -0.306915283203125, -0.29477691650390625, -0.2826385498046875, -0.27050018310546875, -0.25836181640625, -0.24622344970703125, -0.2340850830078125, -0.22194671630859375, -0.209808349609375, -0.19766998291015625, -0.1855316162109375, -0.17339324951171875, -0.1612548828125, -0.14911651611328125, -0.1369781494140625, -0.12483978271484375, -0.112701416015625, -0.10056304931640625, -0.0884246826171875, -0.07628631591796875, -0.06414794921875, -0.05200958251953125, -0.0398712158203125, -0.02773284912109375, -0.015594482421875, -0.00345611572265625, 0.0086822509765625, 0.02082061767578125, 0.032958984375, 0.04509735107421875, 0.0572357177734375, 0.06937408447265625, 0.081512451171875, 0.09365081787109375, 0.1057891845703125, 0.11792755126953125, 0.13006591796875, 0.14220428466796875, 0.1543426513671875, 0.16648101806640625, 0.178619384765625, 0.19075775146484375, 0.2028961181640625, 0.21503448486328125, 0.2271728515625, 0.23931121826171875, 0.2514495849609375, 0.26358795166015625, 0.275726318359375, 0.28786468505859375, 0.3000030517578125, 0.31214141845703125, 0.32427978515625, 0.33641815185546875, 0.3485565185546875, 0.36069488525390625, 0.372833251953125, 0.38497161865234375, 0.3971099853515625, 0.40924835205078125, 0.42138671875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 5.0, 5.0, 11.0, 20.0, 19.0, 32.0, 32.0, 58.0, 98.0, 140.0, 268.0, 465.0, 899.0, 1935.0, 4791.0, 15363.0, 68641.0, 699158.0, 207060.0, 34316.0, 9065.0, 3291.0, 1302.0, 669.0, 369.0, 204.0, 96.0, 78.0, 55.0, 30.0, 23.0, 14.0, 9.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07208251953125, -0.06974124908447266, -0.06739997863769531, -0.06505870819091797, -0.06271743774414062, -0.06037616729736328, -0.05803489685058594, -0.055693626403808594, -0.05335235595703125, -0.051011085510253906, -0.04866981506347656, -0.04632854461669922, -0.043987274169921875, -0.04164600372314453, -0.03930473327636719, -0.036963462829589844, -0.0346221923828125, -0.032280921936035156, -0.029939651489257812, -0.02759838104248047, -0.025257110595703125, -0.02291584014892578, -0.020574569702148438, -0.018233299255371094, -0.01589202880859375, -0.013550758361816406, -0.011209487915039062, -0.008868217468261719, -0.006526947021484375, -0.004185676574707031, -0.0018444061279296875, 0.0004968643188476562, 0.002838134765625, 0.005179405212402344, 0.0075206756591796875, 0.009861946105957031, 0.012203216552734375, 0.014544486999511719, 0.016885757446289062, 0.019227027893066406, 0.02156829833984375, 0.023909568786621094, 0.026250839233398438, 0.02859210968017578, 0.030933380126953125, 0.03327465057373047, 0.03561592102050781, 0.037957191467285156, 0.0402984619140625, 0.042639732360839844, 0.04498100280761719, 0.04732227325439453, 0.049663543701171875, 0.05200481414794922, 0.05434608459472656, 0.056687355041503906, 0.05902862548828125, 0.061369895935058594, 0.06371116638183594, 0.06605243682861328, 0.06839370727539062, 0.07073497772216797, 0.07307624816894531, 0.07541751861572266, 0.0777587890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 10.0, 12.0, 13.0, 16.0, 24.0, 33.0, 35.0, 51.0, 58.0, 95.0, 105.0, 159.0, 95.0, 77.0, 56.0, 34.0, 34.0, 20.0, 23.0, 8.0, 6.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.0338764190673828e-05, -2.9481016099452972e-05, -2.8623268008232117e-05, -2.776551991701126e-05, -2.6907771825790405e-05, -2.605002373456955e-05, -2.5192275643348694e-05, -2.4334527552127838e-05, -2.3476779460906982e-05, -2.2619031369686127e-05, -2.176128327846527e-05, -2.0903535187244415e-05, -2.004578709602356e-05, -1.9188039004802704e-05, -1.8330290913581848e-05, -1.7472542822360992e-05, -1.6614794731140137e-05, -1.575704663991928e-05, -1.4899298548698425e-05, -1.404155045747757e-05, -1.3183802366256714e-05, -1.2326054275035858e-05, -1.1468306183815002e-05, -1.0610558092594147e-05, -9.752810001373291e-06, -8.895061910152435e-06, -8.03731381893158e-06, -7.179565727710724e-06, -6.321817636489868e-06, -5.4640695452690125e-06, -4.606321454048157e-06, -3.748573362827301e-06, -2.8908252716064453e-06, -2.0330771803855896e-06, -1.1753290891647339e-06, -3.175809979438782e-07, 5.401670932769775e-07, 1.3979151844978333e-06, 2.255663275718689e-06, 3.1134113669395447e-06, 3.9711594581604e-06, 4.828907549381256e-06, 5.686655640602112e-06, 6.5444037318229675e-06, 7.402151823043823e-06, 8.259899914264679e-06, 9.117648005485535e-06, 9.97539609670639e-06, 1.0833144187927246e-05, 1.1690892279148102e-05, 1.2548640370368958e-05, 1.3406388461589813e-05, 1.4264136552810669e-05, 1.5121884644031525e-05, 1.597963273525238e-05, 1.6837380826473236e-05, 1.7695128917694092e-05, 1.8552877008914948e-05, 1.9410625100135803e-05, 2.026837319135666e-05, 2.1126121282577515e-05, 2.198386937379837e-05, 2.2841617465019226e-05, 2.3699365556240082e-05, 2.4557113647460938e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 1.0, 2.0, 11.0, 9.0, 13.0, 15.0, 17.0, 25.0, 47.0, 66.0, 81.0, 118.0, 184.0, 293.0, 509.0, 853.0, 1683.0, 3875.0, 10454.0, 35721.0, 168745.0, 689841.0, 98573.0, 23732.0, 7451.0, 3007.0, 1298.0, 773.0, 388.0, 234.0, 161.0, 99.0, 94.0, 57.0, 34.0, 21.0, 21.0, 14.0, 8.0, 5.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.06939697265625, -0.06737613677978516, -0.06535530090332031, -0.06333446502685547, -0.061313629150390625, -0.05929279327392578, -0.05727195739746094, -0.055251121520996094, -0.05323028564453125, -0.051209449768066406, -0.04918861389160156, -0.04716777801513672, -0.045146942138671875, -0.04312610626220703, -0.04110527038574219, -0.039084434509277344, -0.0370635986328125, -0.035042762756347656, -0.03302192687988281, -0.03100109100341797, -0.028980255126953125, -0.02695941925048828, -0.024938583374023438, -0.022917747497558594, -0.02089691162109375, -0.018876075744628906, -0.016855239868164062, -0.014834403991699219, -0.012813568115234375, -0.010792732238769531, -0.008771896362304688, -0.006751060485839844, -0.004730224609375, -0.0027093887329101562, -0.0006885528564453125, 0.0013322830200195312, 0.003353118896484375, 0.005373954772949219, 0.0073947906494140625, 0.009415626525878906, 0.01143646240234375, 0.013457298278808594, 0.015478134155273438, 0.01749897003173828, 0.019519805908203125, 0.02154064178466797, 0.023561477661132812, 0.025582313537597656, 0.0276031494140625, 0.029623985290527344, 0.03164482116699219, 0.03366565704345703, 0.035686492919921875, 0.03770732879638672, 0.03972816467285156, 0.041749000549316406, 0.04376983642578125, 0.045790672302246094, 0.04781150817871094, 0.04983234405517578, 0.051853179931640625, 0.05387401580810547, 0.05589485168457031, 0.057915687561035156, 0.0599365234375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 15.0, 10.0, 14.0, 14.0, 12.0, 17.0, 30.0, 38.0, 43.0, 70.0, 80.0, 85.0, 93.0, 92.0, 68.0, 70.0, 51.0, 46.0, 22.0, 20.0, 25.0, 15.0, 12.0, 4.0, 13.0, 7.0, 4.0, 8.0, 6.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.07818603515625, -0.07571887969970703, -0.07325172424316406, -0.0707845687866211, -0.06831741333007812, -0.06585025787353516, -0.06338310241699219, -0.06091594696044922, -0.05844879150390625, -0.05598163604736328, -0.05351448059082031, -0.051047325134277344, -0.048580169677734375, -0.046113014221191406, -0.04364585876464844, -0.04117870330810547, -0.0387115478515625, -0.03624439239501953, -0.03377723693847656, -0.031310081481933594, -0.028842926025390625, -0.026375770568847656, -0.023908615112304688, -0.02144145965576172, -0.01897430419921875, -0.01650714874267578, -0.014039993286132812, -0.011572837829589844, -0.009105682373046875, -0.006638526916503906, -0.0041713714599609375, -0.0017042160034179688, 0.000762939453125, 0.0032300949096679688, 0.0056972503662109375, 0.008164405822753906, 0.010631561279296875, 0.013098716735839844, 0.015565872192382812, 0.01803302764892578, 0.02050018310546875, 0.02296733856201172, 0.025434494018554688, 0.027901649475097656, 0.030368804931640625, 0.032835960388183594, 0.03530311584472656, 0.03777027130126953, 0.0402374267578125, 0.04270458221435547, 0.04517173767089844, 0.047638893127441406, 0.050106048583984375, 0.052573204040527344, 0.05504035949707031, 0.05750751495361328, 0.05997467041015625, 0.06244182586669922, 0.06490898132324219, 0.06737613677978516, 0.06984329223632812, 0.0723104476928711, 0.07477760314941406, 0.07724475860595703, 0.0797119140625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 11.0, 30.0, 66.0, 133.0, 381.0, 189.0, 98.0, 46.0, 19.0, 11.0, 3.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.464256763458252, -2.368776798248291, -2.27329683303833, -2.177816867828369, -2.082336902618408, -1.9868569374084473, -1.8913769721984863, -1.7958970069885254, -1.7004170417785645, -1.6049370765686035, -1.5094571113586426, -1.4139771461486816, -1.3184971809387207, -1.2230172157287598, -1.1275372505187988, -1.032057285308838, -0.936577320098877, -0.841097354888916, -0.7456173896789551, -0.6501374244689941, -0.5546574592590332, -0.45917749404907227, -0.36369752883911133, -0.2682175636291504, -0.17273759841918945, -0.07725763320922852, 0.018222332000732422, 0.11370229721069336, 0.2091822624206543, 0.30466222763061523, 0.40014219284057617, 0.4956221580505371, 0.591101884841919, 0.6865818500518799, 0.7820618152618408, 0.8775417804718018, 0.9730217456817627, 1.0685017108917236, 1.1639816761016846, 1.2594616413116455, 1.3549416065216064, 1.4504215717315674, 1.5459015369415283, 1.6413815021514893, 1.7368614673614502, 1.8323414325714111, 1.927821397781372, 2.023301362991333, 2.118781328201294, 2.214261293411255, 2.309741258621216, 2.4052212238311768, 2.5007011890411377, 2.5961811542510986, 2.6916611194610596, 2.7871410846710205, 2.8826210498809814, 2.9781010150909424, 3.0735809803009033, 3.1690609455108643, 3.264540910720825, 3.360020875930786, 3.455500841140747, 3.550980806350708, 3.646460771560669]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 3.0, 4.0, 5.0, 6.0, 9.0, 10.0, 10.0, 18.0, 18.0, 17.0, 20.0, 24.0, 21.0, 27.0, 31.0, 31.0, 43.0, 57.0, 126.0, 133.0, 65.0, 45.0, 27.0, 25.0, 41.0, 23.0, 23.0, 17.0, 13.0, 16.0, 14.0, 20.0, 12.0, 7.0, 14.0, 14.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3714683055877686, -1.3274106979370117, -1.2833532094955444, -1.2392956018447876, -1.1952381134033203, -1.1511805057525635, -1.1071230173110962, -1.0630654096603394, -1.019007921218872, -0.97495037317276, -0.930892825126648, -0.8868352770805359, -0.8427777290344238, -0.7987201809883118, -0.7546626329421997, -0.7106050252914429, -0.6665474772453308, -0.6224899291992188, -0.5784323811531067, -0.5343748331069946, -0.49031728506088257, -0.4462597370147705, -0.40220215916633606, -0.358144611120224, -0.31408706307411194, -0.2700295150279999, -0.22597196698188782, -0.18191440403461456, -0.1378568559885025, -0.09379930794239044, -0.04974174499511719, -0.005684196949005127, 0.038373351097106934, 0.082430899143219, 0.12648844718933105, 0.1705460101366043, 0.21460355818271637, 0.25866109132766724, 0.3027186691761017, 0.34677621722221375, 0.3908337652683258, 0.43489131331443787, 0.4789488613605499, 0.5230064392089844, 0.5670639872550964, 0.6111215353012085, 0.6551790833473206, 0.6992366313934326, 0.7432941794395447, 0.7873517274856567, 0.8314092755317688, 0.8754668235778809, 0.9195243716239929, 0.963581919670105, 1.0076395273208618, 1.051697015762329, 1.095754623413086, 1.1398122310638428, 1.18386971950531, 1.227927327156067, 1.2719848155975342, 1.316042423248291, 1.3600999116897583, 1.4041575193405151, 1.4482150077819824]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 0.0, 5.0, 3.0, 7.0, 15.0, 22.0, 21.0, 34.0, 48.0, 62.0, 95.0, 125.0, 183.0, 274.0, 430.0, 596.0, 951.0, 1600.0, 2815.0, 5171.0, 10345.0, 22717.0, 58254.0, 191155.0, 745956.0, 1900873.0, 901583.0, 231712.0, 67968.0, 25851.0, 11724.0, 5745.0, 3056.0, 1779.0, 1082.0, 649.0, 442.0, 282.0, 206.0, 134.0, 83.0, 73.0, 51.0, 27.0, 25.0, 21.0, 9.0, 9.0, 7.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.15771484375, -0.15238189697265625, -0.1470489501953125, -0.14171600341796875, -0.136383056640625, -0.13105010986328125, -0.1257171630859375, -0.12038421630859375, -0.11505126953125, -0.10971832275390625, -0.1043853759765625, -0.09905242919921875, -0.093719482421875, -0.08838653564453125, -0.0830535888671875, -0.07772064208984375, -0.0723876953125, -0.06705474853515625, -0.0617218017578125, -0.05638885498046875, -0.051055908203125, -0.04572296142578125, -0.0403900146484375, -0.03505706787109375, -0.02972412109375, -0.02439117431640625, -0.0190582275390625, -0.01372528076171875, -0.008392333984375, -0.00305938720703125, 0.0022735595703125, 0.00760650634765625, 0.012939453125, 0.01827239990234375, 0.0236053466796875, 0.02893829345703125, 0.034271240234375, 0.03960418701171875, 0.0449371337890625, 0.05027008056640625, 0.05560302734375, 0.06093597412109375, 0.0662689208984375, 0.07160186767578125, 0.076934814453125, 0.08226776123046875, 0.0876007080078125, 0.09293365478515625, 0.0982666015625, 0.10359954833984375, 0.1089324951171875, 0.11426544189453125, 0.119598388671875, 0.12493133544921875, 0.1302642822265625, 0.13559722900390625, 0.14093017578125, 0.14626312255859375, 0.1515960693359375, 0.15692901611328125, 0.162261962890625, 0.16759490966796875, 0.1729278564453125, 0.17826080322265625, 0.18359375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 6.0, 6.0, 9.0, 14.0, 14.0, 9.0, 21.0, 13.0, 19.0, 28.0, 31.0, 26.0, 29.0, 41.0, 48.0, 54.0, 46.0, 41.0, 45.0, 41.0, 51.0, 48.0, 34.0, 22.0, 33.0, 37.0, 28.0, 31.0, 31.0, 18.0, 17.0, 14.0, 19.0, 15.0, 11.0, 12.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.104736328125, -0.1016397476196289, -0.09854316711425781, -0.09544658660888672, -0.09235000610351562, -0.08925342559814453, -0.08615684509277344, -0.08306026458740234, -0.07996368408203125, -0.07686710357666016, -0.07377052307128906, -0.07067394256591797, -0.06757736206054688, -0.06448078155517578, -0.06138420104980469, -0.058287620544433594, -0.0551910400390625, -0.052094459533691406, -0.04899787902832031, -0.04590129852294922, -0.042804718017578125, -0.03970813751220703, -0.03661155700683594, -0.033514976501464844, -0.03041839599609375, -0.027321815490722656, -0.024225234985351562, -0.02112865447998047, -0.018032073974609375, -0.014935493469238281, -0.011838912963867188, -0.008742332458496094, -0.005645751953125, -0.0025491714477539062, 0.0005474090576171875, 0.0036439895629882812, 0.006740570068359375, 0.009837150573730469, 0.012933731079101562, 0.016030311584472656, 0.01912689208984375, 0.022223472595214844, 0.025320053100585938, 0.02841663360595703, 0.031513214111328125, 0.03460979461669922, 0.03770637512207031, 0.040802955627441406, 0.0438995361328125, 0.046996116638183594, 0.05009269714355469, 0.05318927764892578, 0.056285858154296875, 0.05938243865966797, 0.06247901916503906, 0.06557559967041016, 0.06867218017578125, 0.07176876068115234, 0.07486534118652344, 0.07796192169189453, 0.08105850219726562, 0.08415508270263672, 0.08725166320800781, 0.0903482437133789, 0.09344482421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 12.0, 16.0, 20.0, 13.0, 33.0, 50.0, 50.0, 87.0, 139.0, 192.0, 307.0, 599.0, 1444.0, 4435.0, 30695.0, 2744881.0, 1379851.0, 24498.0, 4108.0, 1341.0, 619.0, 302.0, 186.0, 119.0, 79.0, 62.0, 34.0, 27.0, 23.0, 12.0, 9.0, 9.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.62060546875, -0.6011810302734375, -0.581756591796875, -0.5623321533203125, -0.54290771484375, -0.5234832763671875, -0.504058837890625, -0.4846343994140625, -0.4652099609375, -0.4457855224609375, -0.426361083984375, -0.4069366455078125, -0.38751220703125, -0.3680877685546875, -0.348663330078125, -0.3292388916015625, -0.309814453125, -0.2903900146484375, -0.270965576171875, -0.2515411376953125, -0.23211669921875, -0.2126922607421875, -0.193267822265625, -0.1738433837890625, -0.1544189453125, -0.1349945068359375, -0.115570068359375, -0.0961456298828125, -0.07672119140625, -0.0572967529296875, -0.037872314453125, -0.0184478759765625, 0.0009765625, 0.0204010009765625, 0.039825439453125, 0.0592498779296875, 0.07867431640625, 0.0980987548828125, 0.117523193359375, 0.1369476318359375, 0.1563720703125, 0.1757965087890625, 0.195220947265625, 0.2146453857421875, 0.23406982421875, 0.2534942626953125, 0.272918701171875, 0.2923431396484375, 0.311767578125, 0.3311920166015625, 0.350616455078125, 0.3700408935546875, 0.38946533203125, 0.4088897705078125, 0.428314208984375, 0.4477386474609375, 0.4671630859375, 0.4865875244140625, 0.506011962890625, 0.5254364013671875, 0.54486083984375, 0.5642852783203125, 0.583709716796875, 0.6031341552734375, 0.62255859375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 9.0, 25.0, 14.0, 31.0, 34.0, 48.0, 79.0, 130.0, 153.0, 223.0, 322.0, 447.0, 641.0, 579.0, 388.0, 209.0, 181.0, 144.0, 85.0, 86.0, 63.0, 42.0, 38.0, 18.0, 14.0, 15.0, 12.0, 6.0, 11.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.363525390625, -0.35237884521484375, -0.3412322998046875, -0.33008575439453125, -0.318939208984375, -0.30779266357421875, -0.2966461181640625, -0.28549957275390625, -0.27435302734375, -0.26320648193359375, -0.2520599365234375, -0.24091339111328125, -0.229766845703125, -0.21862030029296875, -0.2074737548828125, -0.19632720947265625, -0.1851806640625, -0.17403411865234375, -0.1628875732421875, -0.15174102783203125, -0.140594482421875, -0.12944793701171875, -0.1183013916015625, -0.10715484619140625, -0.09600830078125, -0.08486175537109375, -0.0737152099609375, -0.06256866455078125, -0.051422119140625, -0.04027557373046875, -0.0291290283203125, -0.01798248291015625, -0.0068359375, 0.00431060791015625, 0.0154571533203125, 0.02660369873046875, 0.037750244140625, 0.04889678955078125, 0.0600433349609375, 0.07118988037109375, 0.08233642578125, 0.09348297119140625, 0.1046295166015625, 0.11577606201171875, 0.126922607421875, 0.13806915283203125, 0.1492156982421875, 0.16036224365234375, 0.1715087890625, 0.18265533447265625, 0.1938018798828125, 0.20494842529296875, 0.216094970703125, 0.22724151611328125, 0.2383880615234375, 0.24953460693359375, 0.26068115234375, 0.27182769775390625, 0.2829742431640625, 0.29412078857421875, 0.305267333984375, 0.31641387939453125, 0.3275604248046875, 0.33870697021484375, 0.349853515625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 13.0, 10.0, 10.0, 36.0, 48.0, 120.0, 178.0, 223.0, 148.0, 82.0, 55.0, 30.0, 14.0, 12.0, 3.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.677733898162842, -4.527527809143066, -4.377321720123291, -4.227116107940674, -4.076910018920898, -3.926703929901123, -3.7764978408813477, -3.6262917518615723, -3.476085901260376, -3.3258798122406006, -3.1756739616394043, -3.025467872619629, -2.8752617835998535, -2.7250559329986572, -2.574849843978882, -2.4246439933776855, -2.27443790435791, -2.1242318153381348, -1.9740259647369385, -1.823819875717163, -1.6736139059066772, -1.5234079360961914, -1.373201847076416, -1.2229958772659302, -1.0727899074554443, -0.9225839376449585, -0.7723779082298279, -0.6221718788146973, -0.4719659090042114, -0.3217599391937256, -0.17155390977859497, -0.021347880363464355, 0.12885808944702148, 0.2790640890598297, 0.42927008867263794, 0.5794761180877686, 0.7296820878982544, 0.8798880577087402, 1.0300941467285156, 1.1803001165390015, 1.3305060863494873, 1.4807120561599731, 1.630918025970459, 1.7811241149902344, 1.9313300848007202, 2.081536054611206, 2.2317421436309814, 2.3819479942321777, 2.532154083251953, 2.6823601722717285, 2.832566022872925, 2.9827721118927, 3.1329779624938965, 3.283184051513672, 3.4333901405334473, 3.5835962295532227, 3.733802080154419, 3.8840081691741943, 4.034214019775391, 4.184420108795166, 4.334626197814941, 4.484831809997559, 4.635037899017334, 4.785243988037109, 4.935450077056885]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 4.0, 2.0, 7.0, 13.0, 11.0, 12.0, 13.0, 15.0, 16.0, 18.0, 19.0, 18.0, 31.0, 23.0, 31.0, 27.0, 47.0, 42.0, 31.0, 41.0, 46.0, 68.0, 49.0, 57.0, 53.0, 39.0, 34.0, 25.0, 37.0, 27.0, 20.0, 23.0, 13.0, 22.0, 12.0, 9.0, 8.0, 9.0, 8.0, 5.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.937659740447998, -1.8766385316848755, -1.8156172037124634, -1.7545959949493408, -1.6935746669769287, -1.6325534582138062, -1.5715322494506836, -1.5105109214782715, -1.4494895935058594, -1.3884683847427368, -1.3274470567703247, -1.2664258480072021, -1.20540452003479, -1.1443833112716675, -1.083362102508545, -1.0223407745361328, -0.9613195657730103, -0.9002982974052429, -0.8392770290374756, -0.778255820274353, -0.7172344923019409, -0.6562132835388184, -0.595192015171051, -0.5341707468032837, -0.47314947843551636, -0.412128210067749, -0.3511069416999817, -0.29008570313453674, -0.2290644347667694, -0.16804316639900208, -0.10702192783355713, -0.046000659465789795, 0.015020608901977539, 0.07604186981916428, 0.137063130736351, 0.19808438420295715, 0.2591056525707245, 0.3201269209384918, 0.38114815950393677, 0.4421694278717041, 0.5031906962394714, 0.5642119646072388, 0.6252332329750061, 0.6862545013427734, 0.747275710105896, 0.8082970380783081, 0.8693182468414307, 0.930339515209198, 0.9913607835769653, 1.052381992340088, 1.1134033203125, 1.1744245290756226, 1.2354458570480347, 1.2964670658111572, 1.3574883937835693, 1.418509602546692, 1.4795308113098145, 1.540552020072937, 1.6015733480453491, 1.6625945568084717, 1.7236158847808838, 1.7846370935440063, 1.845658302307129, 1.906679630279541, 1.9677009582519531]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 12.0, 14.0, 20.0, 22.0, 42.0, 70.0, 109.0, 152.0, 279.0, 432.0, 928.0, 1821.0, 3667.0, 8627.0, 22631.0, 70905.0, 291947.0, 487806.0, 105882.0, 31951.0, 11654.0, 4788.0, 2278.0, 1126.0, 595.0, 290.0, 191.0, 126.0, 61.0, 45.0, 26.0, 19.0, 12.0, 6.0, 9.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1961669921875, -0.1894397735595703, -0.18271255493164062, -0.17598533630371094, -0.16925811767578125, -0.16253089904785156, -0.15580368041992188, -0.1490764617919922, -0.1423492431640625, -0.1356220245361328, -0.12889480590820312, -0.12216758728027344, -0.11544036865234375, -0.10871315002441406, -0.10198593139648438, -0.09525871276855469, -0.088531494140625, -0.08180427551269531, -0.07507705688476562, -0.06834983825683594, -0.06162261962890625, -0.05489540100097656, -0.048168182373046875, -0.04144096374511719, -0.0347137451171875, -0.027986526489257812, -0.021259307861328125, -0.014532089233398438, -0.00780487060546875, -0.0010776519775390625, 0.005649566650390625, 0.012376785278320312, 0.01910400390625, 0.025831222534179688, 0.032558441162109375, 0.03928565979003906, 0.04601287841796875, 0.05274009704589844, 0.059467315673828125, 0.06619453430175781, 0.0729217529296875, 0.07964897155761719, 0.08637619018554688, 0.09310340881347656, 0.09983062744140625, 0.10655784606933594, 0.11328506469726562, 0.12001228332519531, 0.126739501953125, 0.1334667205810547, 0.14019393920898438, 0.14692115783691406, 0.15364837646484375, 0.16037559509277344, 0.16710281372070312, 0.1738300323486328, 0.1805572509765625, 0.1872844696044922, 0.19401168823242188, 0.20073890686035156, 0.20746612548828125, 0.21419334411621094, 0.22092056274414062, 0.2276477813720703, 0.234375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 9.0, 6.0, 8.0, 22.0, 16.0, 18.0, 29.0, 28.0, 37.0, 47.0, 50.0, 58.0, 57.0, 70.0, 68.0, 70.0, 64.0, 62.0, 48.0, 45.0, 42.0, 44.0, 31.0, 18.0, 10.0, 11.0, 10.0, 4.0, 12.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17919921875, -0.17367172241210938, -0.16814422607421875, -0.16261672973632812, -0.1570892333984375, -0.15156173706054688, -0.14603424072265625, -0.14050674438476562, -0.134979248046875, -0.12945175170898438, -0.12392425537109375, -0.11839675903320312, -0.1128692626953125, -0.10734176635742188, -0.10181427001953125, -0.09628677368164062, -0.09075927734375, -0.08523178100585938, -0.07970428466796875, -0.07417678833007812, -0.0686492919921875, -0.06312179565429688, -0.05759429931640625, -0.052066802978515625, -0.046539306640625, -0.041011810302734375, -0.03548431396484375, -0.029956817626953125, -0.0244293212890625, -0.018901824951171875, -0.01337432861328125, -0.007846832275390625, -0.0023193359375, 0.003208160400390625, 0.00873565673828125, 0.014263153076171875, 0.0197906494140625, 0.025318145751953125, 0.03084564208984375, 0.036373138427734375, 0.041900634765625, 0.047428131103515625, 0.05295562744140625, 0.058483123779296875, 0.0640106201171875, 0.06953811645507812, 0.07506561279296875, 0.08059310913085938, 0.08612060546875, 0.09164810180664062, 0.09717559814453125, 0.10270309448242188, 0.1082305908203125, 0.11375808715820312, 0.11928558349609375, 0.12481307983398438, 0.130340576171875, 0.13586807250976562, 0.14139556884765625, 0.14692306518554688, 0.1524505615234375, 0.15797805786132812, 0.16350555419921875, 0.16903305053710938, 0.174560546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 13.0, 18.0, 18.0, 36.0, 56.0, 101.0, 168.0, 332.0, 738.0, 2055.0, 8032.0, 66978.0, 908751.0, 51287.0, 6747.0, 1716.0, 713.0, 345.0, 158.0, 113.0, 49.0, 44.0, 25.0, 15.0, 18.0, 9.0, 8.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48291015625, -0.4706687927246094, -0.45842742919921875, -0.4461860656738281, -0.4339447021484375, -0.4217033386230469, -0.40946197509765625, -0.3972206115722656, -0.384979248046875, -0.3727378845214844, -0.36049652099609375, -0.3482551574707031, -0.3360137939453125, -0.3237724304199219, -0.31153106689453125, -0.2992897033691406, -0.28704833984375, -0.2748069763183594, -0.26256561279296875, -0.2503242492675781, -0.2380828857421875, -0.22584152221679688, -0.21360015869140625, -0.20135879516601562, -0.189117431640625, -0.17687606811523438, -0.16463470458984375, -0.15239334106445312, -0.1401519775390625, -0.12791061401367188, -0.11566925048828125, -0.10342788696289062, -0.0911865234375, -0.07894515991210938, -0.06670379638671875, -0.054462432861328125, -0.0422210693359375, -0.029979705810546875, -0.01773834228515625, -0.005496978759765625, 0.006744384765625, 0.018985748291015625, 0.03122711181640625, 0.043468475341796875, 0.0557098388671875, 0.06795120239257812, 0.08019256591796875, 0.09243392944335938, 0.10467529296875, 0.11691665649414062, 0.12915802001953125, 0.14139938354492188, 0.1536407470703125, 0.16588211059570312, 0.17812347412109375, 0.19036483764648438, 0.202606201171875, 0.21484756469726562, 0.22708892822265625, 0.23933029174804688, 0.2515716552734375, 0.2638130187988281, 0.27605438232421875, 0.2882957458496094, 0.300537109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 6.0, 4.0, 7.0, 10.0, 13.0, 23.0, 23.0, 17.0, 22.0, 32.0, 41.0, 34.0, 67.0, 77.0, 92.0, 88.0, 73.0, 71.0, 55.0, 34.0, 34.0, 23.0, 21.0, 29.0, 13.0, 16.0, 8.0, 15.0, 10.0, 10.0, 7.0, 6.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59716796875, -0.5786285400390625, -0.560089111328125, -0.5415496826171875, -0.52301025390625, -0.5044708251953125, -0.485931396484375, -0.4673919677734375, -0.4488525390625, -0.4303131103515625, -0.411773681640625, -0.3932342529296875, -0.37469482421875, -0.3561553955078125, -0.337615966796875, -0.3190765380859375, -0.300537109375, -0.2819976806640625, -0.263458251953125, -0.2449188232421875, -0.22637939453125, -0.2078399658203125, -0.189300537109375, -0.1707611083984375, -0.1522216796875, -0.1336822509765625, -0.115142822265625, -0.0966033935546875, -0.07806396484375, -0.0595245361328125, -0.040985107421875, -0.0224456787109375, -0.00390625, 0.0146331787109375, 0.033172607421875, 0.0517120361328125, 0.07025146484375, 0.0887908935546875, 0.107330322265625, 0.1258697509765625, 0.1444091796875, 0.1629486083984375, 0.181488037109375, 0.2000274658203125, 0.21856689453125, 0.2371063232421875, 0.255645751953125, 0.2741851806640625, 0.292724609375, 0.3112640380859375, 0.329803466796875, 0.3483428955078125, 0.36688232421875, 0.3854217529296875, 0.403961181640625, 0.4225006103515625, 0.4410400390625, 0.4595794677734375, 0.478118896484375, 0.4966583251953125, 0.51519775390625, 0.5337371826171875, 0.552276611328125, 0.5708160400390625, 0.58935546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 7.0, 6.0, 7.0, 13.0, 20.0, 28.0, 22.0, 43.0, 67.0, 111.0, 249.0, 395.0, 1070.0, 2901.0, 9804.0, 48465.0, 850241.0, 110605.0, 17304.0, 4428.0, 1459.0, 634.0, 288.0, 139.0, 69.0, 49.0, 38.0, 39.0, 20.0, 12.0, 5.0, 10.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060516357421875, -0.05866527557373047, -0.05681419372558594, -0.054963111877441406, -0.053112030029296875, -0.051260948181152344, -0.04940986633300781, -0.04755878448486328, -0.04570770263671875, -0.04385662078857422, -0.04200553894042969, -0.040154457092285156, -0.038303375244140625, -0.036452293395996094, -0.03460121154785156, -0.03275012969970703, -0.0308990478515625, -0.02904796600341797, -0.027196884155273438, -0.025345802307128906, -0.023494720458984375, -0.021643638610839844, -0.019792556762695312, -0.01794147491455078, -0.01609039306640625, -0.014239311218261719, -0.012388229370117188, -0.010537147521972656, -0.008686065673828125, -0.006834983825683594, -0.0049839019775390625, -0.0031328201293945312, -0.00128173828125, 0.0005693435668945312, 0.0024204254150390625, 0.004271507263183594, 0.006122589111328125, 0.007973670959472656, 0.009824752807617188, 0.011675834655761719, 0.01352691650390625, 0.015377998352050781, 0.017229080200195312, 0.019080162048339844, 0.020931243896484375, 0.022782325744628906, 0.024633407592773438, 0.02648448944091797, 0.0283355712890625, 0.03018665313720703, 0.03203773498535156, 0.033888816833496094, 0.035739898681640625, 0.037590980529785156, 0.03944206237792969, 0.04129314422607422, 0.04314422607421875, 0.04499530792236328, 0.04684638977050781, 0.048697471618652344, 0.050548553466796875, 0.052399635314941406, 0.05425071716308594, 0.05610179901123047, 0.057952880859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 3.0, 5.0, 8.0, 17.0, 6.0, 13.0, 12.0, 19.0, 23.0, 33.0, 37.0, 57.0, 73.0, 84.0, 99.0, 94.0, 86.0, 75.0, 48.0, 45.0, 24.0, 25.0, 19.0, 13.0, 10.0, 8.0, 12.0, 6.0, 5.0, 4.0, 5.0, 4.0, 4.0, 3.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4781951904296875e-05, -1.4320947229862213e-05, -1.3859942555427551e-05, -1.339893788099289e-05, -1.2937933206558228e-05, -1.2476928532123566e-05, -1.2015923857688904e-05, -1.1554919183254242e-05, -1.109391450881958e-05, -1.0632909834384918e-05, -1.0171905159950256e-05, -9.710900485515594e-06, -9.249895811080933e-06, -8.78889113664627e-06, -8.327886462211609e-06, -7.866881787776947e-06, -7.405877113342285e-06, -6.944872438907623e-06, -6.4838677644729614e-06, -6.0228630900382996e-06, -5.561858415603638e-06, -5.100853741168976e-06, -4.639849066734314e-06, -4.178844392299652e-06, -3.7178397178649902e-06, -3.2568350434303284e-06, -2.7958303689956665e-06, -2.3348256945610046e-06, -1.8738210201263428e-06, -1.412816345691681e-06, -9.51811671257019e-07, -4.908069968223572e-07, -2.9802322387695312e-08, 4.3120235204696655e-07, 8.922070264816284e-07, 1.3532117009162903e-06, 1.8142163753509521e-06, 2.275221049785614e-06, 2.736225724220276e-06, 3.1972303986549377e-06, 3.6582350730895996e-06, 4.1192397475242615e-06, 4.580244421958923e-06, 5.041249096393585e-06, 5.502253770828247e-06, 5.963258445262909e-06, 6.424263119697571e-06, 6.885267794132233e-06, 7.3462724685668945e-06, 7.807277143001556e-06, 8.268281817436218e-06, 8.72928649187088e-06, 9.190291166305542e-06, 9.651295840740204e-06, 1.0112300515174866e-05, 1.0573305189609528e-05, 1.103430986404419e-05, 1.1495314538478851e-05, 1.1956319212913513e-05, 1.2417323887348175e-05, 1.2878328561782837e-05, 1.3339333236217499e-05, 1.380033791065216e-05, 1.4261342585086823e-05, 1.4722347259521484e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 8.0, 13.0, 12.0, 14.0, 18.0, 23.0, 24.0, 42.0, 52.0, 76.0, 88.0, 171.0, 257.0, 422.0, 701.0, 1138.0, 2029.0, 3924.0, 7986.0, 18829.0, 54596.0, 612822.0, 265615.0, 47297.0, 16758.0, 7179.0, 3549.0, 1892.0, 1100.0, 625.0, 421.0, 276.0, 161.0, 122.0, 81.0, 60.0, 37.0, 33.0, 21.0, 19.0, 19.0, 8.0, 15.0, 9.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0286407470703125, -0.027651071548461914, -0.026661396026611328, -0.025671720504760742, -0.024682044982910156, -0.02369236946105957, -0.022702693939208984, -0.0217130184173584, -0.020723342895507812, -0.019733667373657227, -0.01874399185180664, -0.017754316329956055, -0.01676464080810547, -0.015774965286254883, -0.014785289764404297, -0.013795614242553711, -0.012805938720703125, -0.011816263198852539, -0.010826587677001953, -0.009836912155151367, -0.008847236633300781, -0.007857561111450195, -0.006867885589599609, -0.0058782100677490234, -0.0048885345458984375, -0.0038988590240478516, -0.0029091835021972656, -0.0019195079803466797, -0.0009298324584960938, 5.984306335449219e-05, 0.0010495185852050781, 0.002039194107055664, 0.00302886962890625, 0.004018545150756836, 0.005008220672607422, 0.005997896194458008, 0.006987571716308594, 0.00797724723815918, 0.008966922760009766, 0.009956598281860352, 0.010946273803710938, 0.011935949325561523, 0.01292562484741211, 0.013915300369262695, 0.014904975891113281, 0.015894651412963867, 0.016884326934814453, 0.01787400245666504, 0.018863677978515625, 0.01985335350036621, 0.020843029022216797, 0.021832704544067383, 0.02282238006591797, 0.023812055587768555, 0.02480173110961914, 0.025791406631469727, 0.026781082153320312, 0.0277707576751709, 0.028760433197021484, 0.02975010871887207, 0.030739784240722656, 0.03172945976257324, 0.03271913528442383, 0.033708810806274414, 0.034698486328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 2.0, 9.0, 11.0, 9.0, 15.0, 22.0, 23.0, 55.0, 61.0, 64.0, 108.0, 113.0, 113.0, 107.0, 81.0, 51.0, 35.0, 25.0, 32.0, 19.0, 12.0, 11.0, 4.0, 8.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.067626953125, -0.06545639038085938, -0.06328582763671875, -0.061115264892578125, -0.0589447021484375, -0.056774139404296875, -0.05460357666015625, -0.052433013916015625, -0.050262451171875, -0.048091888427734375, -0.04592132568359375, -0.043750762939453125, -0.0415802001953125, -0.039409637451171875, -0.03723907470703125, -0.035068511962890625, -0.03289794921875, -0.030727386474609375, -0.02855682373046875, -0.026386260986328125, -0.0242156982421875, -0.022045135498046875, -0.01987457275390625, -0.017704010009765625, -0.015533447265625, -0.013362884521484375, -0.01119232177734375, -0.009021759033203125, -0.0068511962890625, -0.004680633544921875, -0.00251007080078125, -0.000339508056640625, 0.0018310546875, 0.004001617431640625, 0.00617218017578125, 0.008342742919921875, 0.0105133056640625, 0.012683868408203125, 0.01485443115234375, 0.017024993896484375, 0.019195556640625, 0.021366119384765625, 0.02353668212890625, 0.025707244873046875, 0.0278778076171875, 0.030048370361328125, 0.03221893310546875, 0.034389495849609375, 0.03656005859375, 0.038730621337890625, 0.04090118408203125, 0.043071746826171875, 0.0452423095703125, 0.047412872314453125, 0.04958343505859375, 0.051753997802734375, 0.053924560546875, 0.056095123291015625, 0.05826568603515625, 0.060436248779296875, 0.0626068115234375, 0.06477737426757812, 0.06694793701171875, 0.06911849975585938, 0.0712890625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 16.0, 40.0, 111.0, 560.0, 167.0, 52.0, 25.0, 7.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.295884132385254, -4.1818695068359375, -4.067854881286621, -3.9538402557373047, -3.8398256301879883, -3.725811004638672, -3.6117963790893555, -3.497781753540039, -3.3837671279907227, -3.2697525024414062, -3.15573787689209, -3.0417232513427734, -2.927708625793457, -2.8136940002441406, -2.699679374694824, -2.585664749145508, -2.4716501235961914, -2.357635498046875, -2.2436208724975586, -2.129606246948242, -2.015591621398926, -1.9015769958496094, -1.787562370300293, -1.6735477447509766, -1.559532880783081, -1.4455182552337646, -1.3315036296844482, -1.2174890041351318, -1.1034743785858154, -0.9894596934318542, -0.8754450678825378, -0.7614304423332214, -0.6474158763885498, -0.5334012508392334, -0.419386625289917, -0.3053719699382782, -0.1913573443889618, -0.077342689037323, 0.03667193651199341, 0.15068656206130981, 0.2647011876106262, 0.3787158131599426, 0.49273043870925903, 0.6067451238632202, 0.7207597494125366, 0.834774374961853, 0.9487890005111694, 1.0628036260604858, 1.1768182516098022, 1.2908328771591187, 1.404847502708435, 1.5188621282577515, 1.6328767538070679, 1.7468914985656738, 1.8609061241149902, 1.9749207496643066, 2.088935375213623, 2.2029500007629395, 2.316964626312256, 2.4309792518615723, 2.5449938774108887, 2.659008502960205, 2.7730231285095215, 2.887037754058838, 3.0010523796081543]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 8.0, 8.0, 8.0, 11.0, 22.0, 15.0, 21.0, 20.0, 28.0, 31.0, 62.0, 187.0, 249.0, 87.0, 38.0, 21.0, 31.0, 18.0, 21.0, 21.0, 18.0, 16.0, 8.0, 12.0, 6.0, 5.0, 8.0, 2.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.3782219886779785, -2.3190507888793945, -2.2598795890808105, -2.2007083892822266, -2.1415371894836426, -2.0823659896850586, -2.0231947898864746, -1.9640235900878906, -1.9048523902893066, -1.8456811904907227, -1.7865099906921387, -1.7273387908935547, -1.6681675910949707, -1.6089963912963867, -1.5498251914978027, -1.4906539916992188, -1.4314827919006348, -1.3723115921020508, -1.3131403923034668, -1.2539691925048828, -1.1947979927062988, -1.1356267929077148, -1.0764555931091309, -1.0172843933105469, -0.9581131935119629, -0.8989419937133789, -0.8397707939147949, -0.7805995941162109, -0.721428394317627, -0.662257194519043, -0.603085994720459, -0.543914794921875, -0.484743595123291, -0.42557239532470703, -0.36640119552612305, -0.30722999572753906, -0.24805879592895508, -0.1888875961303711, -0.1297163963317871, -0.07054519653320312, -0.01137399673461914, 0.047797203063964844, 0.10696840286254883, 0.1661396026611328, 0.2253108024597168, 0.2844820022583008, 0.34365320205688477, 0.40282440185546875, 0.46199560165405273, 0.5211668014526367, 0.5803380012512207, 0.6395092010498047, 0.6986804008483887, 0.7578516006469727, 0.8170228004455566, 0.8761940002441406, 0.9353652000427246, 0.9945363998413086, 1.0537075996398926, 1.1128787994384766, 1.1720499992370605, 1.2312211990356445, 1.2903923988342285, 1.3495635986328125, 1.4087347984313965]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 5.0, 8.0, 7.0, 12.0, 8.0, 16.0, 21.0, 20.0, 20.0, 17.0, 24.0, 28.0, 35.0, 61.0, 161.0, 190.0, 65.0, 36.0, 35.0, 29.0, 31.0, 21.0, 17.0, 23.0, 13.0, 15.0, 13.0, 11.0, 5.0, 6.0, 9.0, 7.0, 2.0, 3.0, 1.0, 7.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.12359619140625, -0.11985111236572266, -0.11610603332519531, -0.11236095428466797, -0.10861587524414062, -0.10487079620361328, -0.10112571716308594, -0.0973806381225586, -0.09363555908203125, -0.0898904800415039, -0.08614540100097656, -0.08240032196044922, -0.07865524291992188, -0.07491016387939453, -0.07116508483886719, -0.06742000579833984, -0.0636749267578125, -0.059929847717285156, -0.05618476867675781, -0.05243968963623047, -0.048694610595703125, -0.04494953155517578, -0.04120445251464844, -0.037459373474121094, -0.03371429443359375, -0.029969215393066406, -0.026224136352539062, -0.02247905731201172, -0.018733978271484375, -0.014988899230957031, -0.011243820190429688, -0.007498741149902344, -0.003753662109375, -8.58306884765625e-06, 0.0037364959716796875, 0.007481575012207031, 0.011226654052734375, 0.014971733093261719, 0.018716812133789062, 0.022461891174316406, 0.02620697021484375, 0.029952049255371094, 0.03369712829589844, 0.03744220733642578, 0.041187286376953125, 0.04493236541748047, 0.04867744445800781, 0.052422523498535156, 0.0561676025390625, 0.059912681579589844, 0.06365776062011719, 0.06740283966064453, 0.07114791870117188, 0.07489299774169922, 0.07863807678222656, 0.0823831558227539, 0.08612823486328125, 0.0898733139038086, 0.09361839294433594, 0.09736347198486328, 0.10110855102539062, 0.10485363006591797, 0.10859870910644531, 0.11234378814697266, 0.1160888671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 4.0, 4.0, 9.0, 9.0, 12.0, 27.0, 35.0, 60.0, 159.0, 350.0, 1103.0, 5729.0, 8316968.0, 59084.0, 3649.0, 820.0, 251.0, 118.0, 63.0, 33.0, 26.0, 13.0, 7.0, 10.0, 11.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0], "bins": [-1.5188714265823364, -1.4643621444702148, -1.4098529815673828, -1.3553436994552612, -1.3008344173431396, -1.246325135231018, -1.1918158531188965, -1.1373066902160645, -1.0827974081039429, -1.0282881259918213, -0.9737789034843445, -0.9192696809768677, -0.8647603988647461, -0.8102511167526245, -0.7557418942451477, -0.7012326717376709, -0.6467233896255493, -0.5922141075134277, -0.5377048850059509, -0.48319563269615173, -0.42868638038635254, -0.37417712807655334, -0.31966787576675415, -0.26515862345695496, -0.21064937114715576, -0.15614011883735657, -0.10163086652755737, -0.04712161421775818, 0.007387638092041016, 0.06189689040184021, 0.1164061427116394, 0.1709153950214386, 0.22542476654052734, 0.27993401885032654, 0.33444327116012573, 0.3889525234699249, 0.4434617757797241, 0.4979710280895233, 0.5524802803993225, 0.6069895029067993, 0.6614987850189209, 0.7160080671310425, 0.7705172896385193, 0.8250265121459961, 0.8795357942581177, 0.9340450763702393, 0.9885542988777161, 1.0430635213851929, 1.0975728034973145, 1.152082085609436, 1.2065913677215576, 1.2611005306243896, 1.3156098127365112, 1.3701190948486328, 1.4246282577514648, 1.4791375398635864, 1.533646821975708, 1.5881561040878296, 1.6426653861999512, 1.6971745491027832, 1.7516838312149048, 1.8061931133270264, 1.8607022762298584, 1.91521155834198, 1.9697208404541016]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 3.0, 1.0, 7.0, 2.0, 2.0, 6.0, 4.0, 3.0, 5.0, 5.0, 7.0, 3.0, 6.0, 3.0, 6.0, 7.0, 3.0, 3.0, 4.0, 5.0, 3.0, 8.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7271131873130798, -0.6771088242530823, -0.6271044611930847, -0.5771000385284424, -0.5270956754684448, -0.47709134221076965, -0.4270869493484497, -0.37708258628845215, -0.3270782232284546, -0.27707386016845703, -0.22706948220729828, -0.17706510424613953, -0.12706074118614197, -0.07705637812614441, -0.027051985263824463, 0.022952377796173096, 0.07295674085617065, 0.12296111136674881, 0.17296548187732697, 0.22296985983848572, 0.2729742228984833, 0.32297858595848083, 0.3729829788208008, 0.42298734188079834, 0.4729917049407959, 0.5229960680007935, 0.573000431060791, 0.6230047941207886, 0.6730091571807861, 0.7230135202407837, 0.773017942905426, 0.8230223059654236, 0.8730266094207764, 0.9230309724807739, 0.9730353355407715, 1.023039698600769, 1.0730440616607666, 1.1230484247207642, 1.1730527877807617, 1.2230572700500488, 1.2730615139007568, 1.3230658769607544, 1.373070240020752, 1.4230746030807495, 1.473078966140747, 1.5230833292007446, 1.5730876922607422, 1.6230921745300293, 1.6730965375900269, 1.7231009006500244, 1.773105263710022, 1.8231096267700195, 1.873113989830017, 1.9231183528900146, 1.9731228351593018, 2.0231270790100098, 2.073131561279297, 2.123136043548584, 2.173140287399292, 2.223144769668579, 2.273149013519287, 2.323153495788574, 2.3731577396392822, 2.4231622219085693, 2.4731664657592773]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 3.0, 3.0, 6.0, 10.0, 11.0, 14.0, 16.0, 15.0, 24.0, 31.0, 50.0, 62.0, 102.0, 163.0, 262.0, 563.0, 1238.0, 3245.0, 11061.0, 42097.0, 175405.0, 215055.0, 54298.0, 13742.0, 4003.0, 1405.0, 597.0, 256.0, 179.0, 99.0, 58.0, 54.0, 39.0, 18.0, 15.0, 18.0, 14.0, 11.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.4697265625, -1.4278564453125, -1.385986328125, -1.3441162109375, -1.30224609375, -1.2603759765625, -1.218505859375, -1.1766357421875, -1.134765625, -1.0928955078125, -1.051025390625, -1.0091552734375, -0.96728515625, -0.9254150390625, -0.883544921875, -0.8416748046875, -0.7998046875, -0.7579345703125, -0.716064453125, -0.6741943359375, -0.63232421875, -0.5904541015625, -0.548583984375, -0.5067138671875, -0.46484375, -0.4229736328125, -0.381103515625, -0.3392333984375, -0.29736328125, -0.2554931640625, -0.213623046875, -0.1717529296875, -0.1298828125, -0.0880126953125, -0.046142578125, -0.0042724609375, 0.03759765625, 0.0794677734375, 0.121337890625, 0.1632080078125, 0.205078125, 0.2469482421875, 0.288818359375, 0.3306884765625, 0.37255859375, 0.4144287109375, 0.456298828125, 0.4981689453125, 0.5400390625, 0.5819091796875, 0.623779296875, 0.6656494140625, 0.70751953125, 0.7493896484375, 0.791259765625, 0.8331298828125, 0.875, 0.9168701171875, 0.958740234375, 1.0006103515625, 1.04248046875, 1.0843505859375, 1.126220703125, 1.1680908203125, 1.2099609375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 8.0, 10.0, 15.0, 13.0, 15.0, 24.0, 35.0, 46.0, 40.0, 42.0, 64.0, 63.0, 64.0, 53.0, 67.0, 78.0, 50.0, 51.0, 52.0, 52.0, 35.0, 32.0, 20.0, 20.0, 12.0, 7.0, 9.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16796875, -0.162811279296875, -0.15765380859375, -0.152496337890625, -0.1473388671875, -0.142181396484375, -0.13702392578125, -0.131866455078125, -0.126708984375, -0.121551513671875, -0.11639404296875, -0.111236572265625, -0.1060791015625, -0.100921630859375, -0.09576416015625, -0.090606689453125, -0.08544921875, -0.080291748046875, -0.07513427734375, -0.069976806640625, -0.0648193359375, -0.059661865234375, -0.05450439453125, -0.049346923828125, -0.044189453125, -0.039031982421875, -0.03387451171875, -0.028717041015625, -0.0235595703125, -0.018402099609375, -0.01324462890625, -0.008087158203125, -0.0029296875, 0.002227783203125, 0.00738525390625, 0.012542724609375, 0.0177001953125, 0.022857666015625, 0.02801513671875, 0.033172607421875, 0.038330078125, 0.043487548828125, 0.04864501953125, 0.053802490234375, 0.0589599609375, 0.064117431640625, 0.06927490234375, 0.074432373046875, 0.07958984375, 0.084747314453125, 0.08990478515625, 0.095062255859375, 0.1002197265625, 0.105377197265625, 0.11053466796875, 0.115692138671875, 0.120849609375, 0.126007080078125, 0.13116455078125, 0.136322021484375, 0.1414794921875, 0.146636962890625, 0.15179443359375, 0.156951904296875, 0.162109375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 8.0, 15.0, 57.0, 58.0, 77.0, 89.0, 60.0, 31.0, 17.0, 18.0, 10.0, 7.0, 4.0, 9.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408031463623047, -1.3034625053405762, -1.2661219835281372, -1.2287813425064087, -1.1914408206939697, -1.1541001796722412, -1.1167596578598022, -1.0794190168380737, -1.0420784950256348, -1.0047378540039062, -0.9673973321914673, -0.9300567507743835, -0.8927161693572998, -0.8553755283355713, -0.8180349469184875, -0.7806943655014038, -0.7433537244796753, -0.7060131430625916, -0.6686725616455078, -0.6313319802284241, -0.5939913988113403, -0.5566507577896118, -0.5193101763725281, -0.48196959495544434, -0.4446290135383606, -0.40728843212127686, -0.3699478507041931, -0.332607239484787, -0.29526665806770325, -0.2579260766506195, -0.22058548033237457, -0.18324488401412964, -0.1459043025970459, -0.10856371372938156, -0.07122312486171722, -0.03388253599405289, 0.00345805287361145, 0.04079863429069519, 0.07813923060894012, 0.11547982692718506, 0.1528204083442688, 0.19016098976135254, 0.22750158607959747, 0.2648421823978424, 0.30218276381492615, 0.3395233452320099, 0.376863956451416, 0.41420453786849976, 0.4515451192855835, 0.48888570070266724, 0.526226282119751, 0.5635668635368347, 0.6009074449539185, 0.638248085975647, 0.6755886673927307, 0.7129292488098145, 0.7502698302268982, 0.7876104116439819, 0.8249509930610657, 0.8622915744781494, 0.8996322154998779, 0.9369727373123169, 0.9743133783340454, 1.0116539001464844, 1.048994541168213]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 0.0, 3.0, 1.0, 8.0, 9.0, 8.0, 7.0, 31.0, 78.0, 103.0, 92.0, 58.0, 26.0, 12.0, 9.0, 6.0, 9.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9133681654930115, -0.8843495845794678, -0.8553310036659241, -0.8263124227523804, -0.7972938418388367, -0.768275260925293, -0.739256739616394, -0.7102380990982056, -0.6812195777893066, -0.6522009968757629, -0.6231824159622192, -0.5941638350486755, -0.5651452541351318, -0.5361266732215881, -0.5071080923080444, -0.4780895411968231, -0.44907093048095703, -0.42005234956741333, -0.39103376865386963, -0.3620151877403259, -0.3329966068267822, -0.3039780259132385, -0.2749594748020172, -0.2459408938884735, -0.2169223129749298, -0.1879037320613861, -0.1588851511478424, -0.1298665851354599, -0.1008480042219162, -0.0718294233083725, -0.04281085729598999, -0.013792276382446289, 0.015226364135742188, 0.04424494132399559, 0.07326351851224899, 0.1022820919752121, 0.1313006728887558, 0.1603192538022995, 0.189337819814682, 0.2183564007282257, 0.2473749816417694, 0.2763935625553131, 0.3054121434688568, 0.3344306945800781, 0.3634492754936218, 0.3924678564071655, 0.42148643732070923, 0.45050501823425293, 0.47952359914779663, 0.5085421800613403, 0.537560760974884, 0.5665793418884277, 0.5955979228019714, 0.6246165037155151, 0.6536350250244141, 0.6826536655426025, 0.7116721868515015, 0.7406907677650452, 0.7697093486785889, 0.7987279295921326, 0.8277465105056763, 0.85676509141922, 0.8857836723327637, 0.9148021936416626, 0.9438208341598511]}, "eval/loss": 4.745861530303955, "eval/wer": 1.976279254264181, "eval/runtime": 966.758, "eval/samples_per_second": 2.733, "eval/steps_per_second": 0.342} \ No newline at end of file +{"train/loss": 3.9784, "train/learning_rate": 9.345794392523364e-07, "train/epoch": 1.0, "train/global_step": 1784, "_runtime": 8574, "_timestamp": 1646219749, "_step": 1787, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 13.0, 17.0, 52.0, 415.0, 420.0, 70.0, 16.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-925.3422241210938, -902.2313232421875, -879.120361328125, -856.0094604492188, -832.8985595703125, -809.78759765625, -786.6766967773438, -763.5657958984375, -740.454833984375, -717.3439331054688, -694.2329711914062, -671.1220703125, -648.0111083984375, -624.9002075195312, -601.789306640625, -578.6783447265625, -555.5674438476562, -532.45654296875, -509.3455810546875, -486.23468017578125, -463.1237487792969, -440.0128173828125, -416.90191650390625, -393.7909851074219, -370.6800537109375, -347.5691223144531, -324.45819091796875, -301.3472900390625, -278.2363586425781, -255.12542724609375, -232.01451110839844, -208.90359497070312, -185.79266357421875, -162.68173217773438, -139.57081604003906, -116.45989227294922, -93.34896850585938, -70.23804473876953, -47.12712097167969, -24.016204833984375, -0.9052734375, 22.205650329589844, 45.31657409667969, 68.42749786376953, 91.53842163085938, 114.64934539794922, 137.76026916503906, 160.87118530273438, 183.98211669921875, 207.09304809570312, 230.20396423339844, 253.31488037109375, 276.4258117675781, 299.5367431640625, 322.64764404296875, 345.7585754394531, 368.8695068359375, 391.9804382324219, 415.09136962890625, 438.2022705078125, 461.3132019042969, 484.42413330078125, 507.5350341796875, 530.64599609375, 553.7568969726562]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 8.0, 13.0, 11.0, 7.0, 8.0, 15.0, 18.0, 21.0, 20.0, 18.0, 25.0, 30.0, 34.0, 27.0, 70.0, 176.0, 140.0, 82.0, 30.0, 23.0, 28.0, 28.0, 23.0, 23.0, 17.0, 17.0, 14.0, 13.0, 5.0, 7.0, 10.0, 6.0, 8.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-667.4768676757812, -646.577392578125, -625.6779174804688, -604.7784423828125, -583.8789672851562, -562.9794921875, -542.0800170898438, -521.1805419921875, -500.2810974121094, -479.3816223144531, -458.4821472167969, -437.5826721191406, -416.6832275390625, -395.78375244140625, -374.88427734375, -353.98480224609375, -333.0853271484375, -312.18585205078125, -291.286376953125, -270.38690185546875, -249.48744201660156, -228.5879669189453, -207.68850708007812, -186.78903198242188, -165.88955688476562, -144.99008178710938, -124.09061431884766, -103.19114685058594, -82.29167175292969, -61.39219665527344, -40.49272918701172, -19.59326171875, 1.30621337890625, 22.205684661865234, 43.10515594482422, 64.00462341308594, 84.90409851074219, 105.80357360839844, 126.70304107666016, 147.60250854492188, 168.50198364257812, 189.40145874023438, 210.30093383789062, 231.2003936767578, 252.09986877441406, 272.99932861328125, 293.8988037109375, 314.79827880859375, 335.69775390625, 356.59722900390625, 377.4967041015625, 398.39617919921875, 419.295654296875, 440.19512939453125, 461.0945739746094, 481.9940490722656, 502.8935241699219, 523.79296875, 544.6924438476562, 565.5919189453125, 586.4913940429688, 607.390869140625, 628.2903442382812, 649.1898193359375, 670.0892944335938]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 10.0, 11.0, 9.0, 5.0, 10.0, 14.0, 11.0, 24.0, 20.0, 21.0, 19.0, 28.0, 39.0, 25.0, 67.0, 113.0, 133.0, 109.0, 60.0, 33.0, 24.0, 25.0, 24.0, 23.0, 21.0, 16.0, 22.0, 8.0, 11.0, 9.0, 5.0, 6.0, 9.0, 1.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.859375, -10.5013427734375, -10.143310546875, -9.7852783203125, -9.42724609375, -9.0692138671875, -8.711181640625, -8.3531494140625, -7.9951171875, -7.6370849609375, -7.279052734375, -6.9210205078125, -6.56298828125, -6.2049560546875, -5.846923828125, -5.4888916015625, -5.130859375, -4.7728271484375, -4.414794921875, -4.0567626953125, -3.69873046875, -3.3406982421875, -2.982666015625, -2.6246337890625, -2.2666015625, -1.9085693359375, -1.550537109375, -1.1925048828125, -0.83447265625, -0.4764404296875, -0.118408203125, 0.2396240234375, 0.59765625, 0.9556884765625, 1.313720703125, 1.6717529296875, 2.02978515625, 2.3878173828125, 2.745849609375, 3.1038818359375, 3.4619140625, 3.8199462890625, 4.177978515625, 4.5360107421875, 4.89404296875, 5.2520751953125, 5.610107421875, 5.9681396484375, 6.326171875, 6.6842041015625, 7.042236328125, 7.4002685546875, 7.75830078125, 8.1163330078125, 8.474365234375, 8.8323974609375, 9.1904296875, 9.5484619140625, 9.906494140625, 10.2645263671875, 10.62255859375, 10.9805908203125, 11.338623046875, 11.6966552734375, 12.0546875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 10.0, 9.0, 14.0, 21.0, 33.0, 36.0, 59.0, 58.0, 72.0, 88.0, 145.0, 197.0, 306.0, 383.0, 600.0, 1027.0, 1953.0, 3929.0, 10399.0, 43091.0, 4044670.0, 65124.0, 12372.0, 4412.0, 2005.0, 1166.0, 640.0, 383.0, 269.0, 216.0, 166.0, 105.0, 78.0, 52.0, 40.0, 26.0, 31.0, 22.0, 17.0, 20.0, 7.0, 8.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-107.3125, -103.802734375, -100.29296875, -96.783203125, -93.2734375, -89.763671875, -86.25390625, -82.744140625, -79.234375, -75.724609375, -72.21484375, -68.705078125, -65.1953125, -61.685546875, -58.17578125, -54.666015625, -51.15625, -47.646484375, -44.13671875, -40.626953125, -37.1171875, -33.607421875, -30.09765625, -26.587890625, -23.078125, -19.568359375, -16.05859375, -12.548828125, -9.0390625, -5.529296875, -2.01953125, 1.490234375, 5.0, 8.509765625, 12.01953125, 15.529296875, 19.0390625, 22.548828125, 26.05859375, 29.568359375, 33.078125, 36.587890625, 40.09765625, 43.607421875, 47.1171875, 50.626953125, 54.13671875, 57.646484375, 61.15625, 64.666015625, 68.17578125, 71.685546875, 75.1953125, 78.705078125, 82.21484375, 85.724609375, 89.234375, 92.744140625, 96.25390625, 99.763671875, 103.2734375, 106.783203125, 110.29296875, 113.802734375, 117.3125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 4.0, 12.0, 10.0, 13.0, 22.0, 19.0, 20.0, 29.0, 35.0, 32.0, 57.0, 56.0, 87.0, 189.0, 439.0, 1039.0, 927.0, 489.0, 192.0, 102.0, 66.0, 42.0, 30.0, 28.0, 23.0, 11.0, 26.0, 13.0, 7.0, 13.0, 6.0, 2.0, 7.0, 2.0, 3.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.0, -36.77294921875, -35.5458984375, -34.31884765625, -33.091796875, -31.86474609375, -30.6376953125, -29.41064453125, -28.18359375, -26.95654296875, -25.7294921875, -24.50244140625, -23.275390625, -22.04833984375, -20.8212890625, -19.59423828125, -18.3671875, -17.14013671875, -15.9130859375, -14.68603515625, -13.458984375, -12.23193359375, -11.0048828125, -9.77783203125, -8.55078125, -7.32373046875, -6.0966796875, -4.86962890625, -3.642578125, -2.41552734375, -1.1884765625, 0.03857421875, 1.265625, 2.49267578125, 3.7197265625, 4.94677734375, 6.173828125, 7.40087890625, 8.6279296875, 9.85498046875, 11.08203125, 12.30908203125, 13.5361328125, 14.76318359375, 15.990234375, 17.21728515625, 18.4443359375, 19.67138671875, 20.8984375, 22.12548828125, 23.3525390625, 24.57958984375, 25.806640625, 27.03369140625, 28.2607421875, 29.48779296875, 30.71484375, 31.94189453125, 33.1689453125, 34.39599609375, 35.623046875, 36.85009765625, 38.0771484375, 39.30419921875, 40.53125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 6.0, 10.0, 8.0, 18.0, 14.0, 23.0, 28.0, 37.0, 53.0, 71.0, 76.0, 82.0, 129.0, 175.0, 280.0, 496.0, 1232.0, 5414.0, 40811.0, 3830796.0, 292463.0, 17032.0, 2993.0, 821.0, 371.0, 210.0, 128.0, 105.0, 82.0, 67.0, 48.0, 45.0, 31.0, 22.0, 24.0, 10.0, 14.0, 10.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-108.3125, -105.0107421875, -101.708984375, -98.4072265625, -95.10546875, -91.8037109375, -88.501953125, -85.2001953125, -81.8984375, -78.5966796875, -75.294921875, -71.9931640625, -68.69140625, -65.3896484375, -62.087890625, -58.7861328125, -55.484375, -52.1826171875, -48.880859375, -45.5791015625, -42.27734375, -38.9755859375, -35.673828125, -32.3720703125, -29.0703125, -25.7685546875, -22.466796875, -19.1650390625, -15.86328125, -12.5615234375, -9.259765625, -5.9580078125, -2.65625, 0.6455078125, 3.947265625, 7.2490234375, 10.55078125, 13.8525390625, 17.154296875, 20.4560546875, 23.7578125, 27.0595703125, 30.361328125, 33.6630859375, 36.96484375, 40.2666015625, 43.568359375, 46.8701171875, 50.171875, 53.4736328125, 56.775390625, 60.0771484375, 63.37890625, 66.6806640625, 69.982421875, 73.2841796875, 76.5859375, 79.8876953125, 83.189453125, 86.4912109375, 89.79296875, 93.0947265625, 96.396484375, 99.6982421875, 103.0]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 8.0, 4.0, 32.0, 28.0, 87.0, 247.0, 436.0, 126.0, 27.0, 10.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-182.33505249023438, -174.4733428955078, -166.61163330078125, -158.74990844726562, -150.88819885253906, -143.0264892578125, -135.16477966308594, -127.30306243896484, -119.44134521484375, -111.57963562011719, -103.7179183959961, -95.85620880126953, -87.99449157714844, -80.13278198242188, -72.27107238769531, -64.40935516357422, -56.547645568847656, -48.68593215942383, -40.82421875, -32.96250915527344, -25.100793838500977, -17.23908233642578, -9.377368927001953, -1.515655517578125, 6.346057891845703, 14.207771301269531, 22.06948471069336, 29.931196212768555, 37.79290771484375, 45.65462112426758, 53.516334533691406, 61.378047943115234, 69.23976135253906, 77.10147094726562, 84.96318817138672, 92.82489776611328, 100.68661499023438, 108.54832458496094, 116.4100341796875, 124.2717514038086, 132.1334686279297, 139.99517822265625, 147.8568878173828, 155.71861267089844, 163.580322265625, 171.44203186035156, 179.30374145507812, 187.16546630859375, 195.02716064453125, 202.8888702392578, 210.75057983398438, 218.6123046875, 226.47401428222656, 234.33572387695312, 242.1974334716797, 250.05914306640625, 257.9208679199219, 265.7825927734375, 273.644287109375, 281.5060119628906, 289.3677062988281, 297.22943115234375, 305.0911560058594, 312.9528503417969, 320.8145751953125]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 8.0, 5.0, 10.0, 13.0, 9.0, 15.0, 17.0, 19.0, 35.0, 24.0, 34.0, 32.0, 41.0, 29.0, 41.0, 39.0, 47.0, 45.0, 45.0, 40.0, 41.0, 40.0, 35.0, 36.0, 45.0, 33.0, 26.0, 21.0, 38.0, 20.0, 20.0, 17.0, 8.0, 11.0, 10.0, 8.0, 3.0, 11.0, 6.0, 0.0, 3.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.60552978515625, -139.92665100097656, -135.24777221679688, -130.5688934326172, -125.89002227783203, -121.21114349365234, -116.53227233886719, -111.8533935546875, -107.17451477050781, -102.49563598632812, -97.81675720214844, -93.13788604736328, -88.4590072631836, -83.7801284790039, -79.10125732421875, -74.42237854003906, -69.74349975585938, -65.06462097167969, -60.385746002197266, -55.706871032714844, -51.027992248535156, -46.34911346435547, -41.67023849487305, -36.991363525390625, -32.31248474121094, -27.633607864379883, -22.954730987548828, -18.275854110717773, -13.596977233886719, -8.918100357055664, -4.239223480224609, 0.4396514892578125, 5.1185302734375, 9.797407150268555, 14.47628402709961, 19.155160903930664, 23.83403778076172, 28.512914657592773, 33.19179153442383, 37.87066650390625, 42.54954528808594, 47.228424072265625, 51.90729904174805, 56.58617401123047, 61.265052795410156, 65.94393157958984, 70.622802734375, 75.30168151855469, 79.98056030273438, 84.65943908691406, 89.33831787109375, 94.0171890258789, 98.6960678100586, 103.37494659423828, 108.05381774902344, 112.73269653320312, 117.41157531738281, 122.0904541015625, 126.76933288574219, 131.44821166992188, 136.1270751953125, 140.8059539794922, 145.48483276367188, 150.16371154785156, 154.84259033203125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 12.0, 9.0, 7.0, 10.0, 8.0, 9.0, 17.0, 18.0, 25.0, 16.0, 28.0, 30.0, 42.0, 58.0, 62.0, 94.0, 92.0, 99.0, 62.0, 49.0, 31.0, 28.0, 22.0, 20.0, 27.0, 12.0, 20.0, 10.0, 12.0, 8.0, 6.0, 7.0, 8.0, 7.0, 3.0, 3.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.666259765625, -8.34814453125, -8.030029296875, -7.7119140625, -7.393798828125, -7.07568359375, -6.757568359375, -6.439453125, -6.121337890625, -5.80322265625, -5.485107421875, -5.1669921875, -4.848876953125, -4.53076171875, -4.212646484375, -3.89453125, -3.576416015625, -3.25830078125, -2.940185546875, -2.6220703125, -2.303955078125, -1.98583984375, -1.667724609375, -1.349609375, -1.031494140625, -0.71337890625, -0.395263671875, -0.0771484375, 0.240966796875, 0.55908203125, 0.877197265625, 1.1953125, 1.513427734375, 1.83154296875, 2.149658203125, 2.4677734375, 2.785888671875, 3.10400390625, 3.422119140625, 3.740234375, 4.058349609375, 4.37646484375, 4.694580078125, 5.0126953125, 5.330810546875, 5.64892578125, 5.967041015625, 6.28515625, 6.603271484375, 6.92138671875, 7.239501953125, 7.5576171875, 7.875732421875, 8.19384765625, 8.511962890625, 8.830078125, 9.148193359375, 9.46630859375, 9.784423828125, 10.1025390625, 10.420654296875, 10.73876953125, 11.056884765625, 11.375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 2.0, 4.0, 5.0, 12.0, 7.0, 14.0, 27.0, 34.0, 32.0, 72.0, 101.0, 167.0, 251.0, 349.0, 549.0, 899.0, 1281.0, 2107.0, 3302.0, 5285.0, 8595.0, 14270.0, 24499.0, 45156.0, 91610.0, 220269.0, 345453.0, 139140.0, 63874.0, 33210.0, 18630.0, 11075.0, 6694.0, 4237.0, 2608.0, 1642.0, 1056.0, 724.0, 435.0, 307.0, 176.0, 145.0, 83.0, 59.0, 34.0, 23.0, 15.0, 18.0, 7.0, 8.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2169189453125, -0.2097492218017578, -0.20257949829101562, -0.19540977478027344, -0.18824005126953125, -0.18107032775878906, -0.17390060424804688, -0.1667308807373047, -0.1595611572265625, -0.1523914337158203, -0.14522171020507812, -0.13805198669433594, -0.13088226318359375, -0.12371253967285156, -0.11654281616210938, -0.10937309265136719, -0.102203369140625, -0.09503364562988281, -0.08786392211914062, -0.08069419860839844, -0.07352447509765625, -0.06635475158691406, -0.059185028076171875, -0.05201530456542969, -0.0448455810546875, -0.03767585754394531, -0.030506134033203125, -0.023336410522460938, -0.01616668701171875, -0.008996963500976562, -0.001827239990234375, 0.0053424835205078125, 0.01251220703125, 0.019681930541992188, 0.026851654052734375, 0.03402137756347656, 0.04119110107421875, 0.04836082458496094, 0.055530548095703125, 0.06270027160644531, 0.0698699951171875, 0.07703971862792969, 0.08420944213867188, 0.09137916564941406, 0.09854888916015625, 0.10571861267089844, 0.11288833618164062, 0.12005805969238281, 0.127227783203125, 0.1343975067138672, 0.14156723022460938, 0.14873695373535156, 0.15590667724609375, 0.16307640075683594, 0.17024612426757812, 0.1774158477783203, 0.1845855712890625, 0.1917552947998047, 0.19892501831054688, 0.20609474182128906, 0.21326446533203125, 0.22043418884277344, 0.22760391235351562, 0.2347736358642578, 0.241943359375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 8.0, 5.0, 11.0, 9.0, 11.0, 10.0, 17.0, 15.0, 17.0, 39.0, 33.0, 32.0, 27.0, 39.0, 32.0, 42.0, 39.0, 41.0, 1076.0, 44.0, 38.0, 35.0, 56.0, 32.0, 27.0, 36.0, 36.0, 36.0, 30.0, 24.0, 20.0, 18.0, 15.0, 5.0, 13.0, 10.0, 9.0, 12.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.83203125, -3.71209716796875, -3.5921630859375, -3.47222900390625, -3.352294921875, -3.23236083984375, -3.1124267578125, -2.99249267578125, -2.87255859375, -2.75262451171875, -2.6326904296875, -2.51275634765625, -2.392822265625, -2.27288818359375, -2.1529541015625, -2.03302001953125, -1.9130859375, -1.79315185546875, -1.6732177734375, -1.55328369140625, -1.433349609375, -1.31341552734375, -1.1934814453125, -1.07354736328125, -0.95361328125, -0.83367919921875, -0.7137451171875, -0.59381103515625, -0.473876953125, -0.35394287109375, -0.2340087890625, -0.11407470703125, 0.005859375, 0.12579345703125, 0.2457275390625, 0.36566162109375, 0.485595703125, 0.60552978515625, 0.7254638671875, 0.84539794921875, 0.96533203125, 1.08526611328125, 1.2052001953125, 1.32513427734375, 1.445068359375, 1.56500244140625, 1.6849365234375, 1.80487060546875, 1.9248046875, 2.04473876953125, 2.1646728515625, 2.28460693359375, 2.404541015625, 2.52447509765625, 2.6444091796875, 2.76434326171875, 2.88427734375, 3.00421142578125, 3.1241455078125, 3.24407958984375, 3.364013671875, 3.48394775390625, 3.6038818359375, 3.72381591796875, 3.84375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 7.0, 8.0, 6.0, 20.0, 23.0, 19.0, 32.0, 61.0, 103.0, 202.0, 247.0, 416.0, 651.0, 1078.0, 1692.0, 2530.0, 3929.0, 6618.0, 10139.0, 16359.0, 26951.0, 43944.0, 73001.0, 123554.0, 295003.0, 1173434.0, 125691.0, 74704.0, 44797.0, 27022.0, 16652.0, 10456.0, 6455.0, 4041.0, 2647.0, 1655.0, 1177.0, 669.0, 407.0, 248.0, 177.0, 96.0, 63.0, 56.0, 33.0, 18.0, 15.0, 16.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.07220458984375, -0.07001781463623047, -0.06783103942871094, -0.0656442642211914, -0.06345748901367188, -0.061270713806152344, -0.05908393859863281, -0.05689716339111328, -0.05471038818359375, -0.05252361297607422, -0.05033683776855469, -0.048150062561035156, -0.045963287353515625, -0.043776512145996094, -0.04158973693847656, -0.03940296173095703, -0.0372161865234375, -0.03502941131591797, -0.03284263610839844, -0.030655860900878906, -0.028469085693359375, -0.026282310485839844, -0.024095535278320312, -0.02190876007080078, -0.01972198486328125, -0.01753520965576172, -0.015348434448242188, -0.013161659240722656, -0.010974884033203125, -0.008788108825683594, -0.0066013336181640625, -0.004414558410644531, -0.002227783203125, -4.100799560546875e-05, 0.0021457672119140625, 0.004332542419433594, 0.006519317626953125, 0.008706092834472656, 0.010892868041992188, 0.013079643249511719, 0.01526641845703125, 0.01745319366455078, 0.019639968872070312, 0.021826744079589844, 0.024013519287109375, 0.026200294494628906, 0.028387069702148438, 0.03057384490966797, 0.0327606201171875, 0.03494739532470703, 0.03713417053222656, 0.039320945739746094, 0.041507720947265625, 0.043694496154785156, 0.04588127136230469, 0.04806804656982422, 0.05025482177734375, 0.05244159698486328, 0.05462837219238281, 0.056815147399902344, 0.059001922607421875, 0.061188697814941406, 0.06337547302246094, 0.06556224822998047, 0.0677490234375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 6.0, 8.0, 8.0, 8.0, 15.0, 22.0, 28.0, 20.0, 20.0, 39.0, 54.0, 57.0, 48.0, 71.0, 92.0, 79.0, 69.0, 71.0, 44.0, 47.0, 42.0, 32.0, 16.0, 20.0, 12.0, 20.0, 8.0, 9.0, 11.0, 4.0, 9.0, 6.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015306472778320312, -0.00014693289995193481, -0.0001408010721206665, -0.0001346692442893982, -0.00012853741645812988, -0.00012240558862686157, -0.00011627376079559326, -0.00011014193296432495, -0.00010401010513305664, -9.787827730178833e-05, -9.174644947052002e-05, -8.561462163925171e-05, -7.94827938079834e-05, -7.335096597671509e-05, -6.721913814544678e-05, -6.108731031417847e-05, -5.4955482482910156e-05, -4.8823654651641846e-05, -4.2691826820373535e-05, -3.6559998989105225e-05, -3.0428171157836914e-05, -2.4296343326568604e-05, -1.8164515495300293e-05, -1.2032687664031982e-05, -5.900859832763672e-06, 2.3096799850463867e-07, 6.362795829772949e-06, 1.249462366104126e-05, 1.862645149230957e-05, 2.475827932357788e-05, 3.089010715484619e-05, 3.70219349861145e-05, 4.315376281738281e-05, 4.928559064865112e-05, 5.5417418479919434e-05, 6.154924631118774e-05, 6.768107414245605e-05, 7.381290197372437e-05, 7.994472980499268e-05, 8.607655763626099e-05, 9.22083854675293e-05, 9.834021329879761e-05, 0.00010447204113006592, 0.00011060386896133423, 0.00011673569679260254, 0.00012286752462387085, 0.00012899935245513916, 0.00013513118028640747, 0.00014126300811767578, 0.0001473948359489441, 0.0001535266637802124, 0.0001596584916114807, 0.00016579031944274902, 0.00017192214727401733, 0.00017805397510528564, 0.00018418580293655396, 0.00019031763076782227, 0.00019644945859909058, 0.0002025812864303589, 0.0002087131142616272, 0.0002148449420928955, 0.00022097676992416382, 0.00022710859775543213, 0.00023324042558670044, 0.00023937225341796875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 9.0, 11.0, 15.0, 16.0, 28.0, 33.0, 37.0, 68.0, 77.0, 91.0, 108.0, 180.0, 256.0, 399.0, 1135.0, 1041621.0, 2885.0, 497.0, 285.0, 224.0, 157.0, 75.0, 82.0, 64.0, 54.0, 28.0, 39.0, 29.0, 15.0, 15.0, 5.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004215240478515625, -0.004086136817932129, -0.003957033157348633, -0.0038279294967651367, -0.0036988258361816406, -0.0035697221755981445, -0.0034406185150146484, -0.0033115148544311523, -0.0031824111938476562, -0.00305330753326416, -0.002924203872680664, -0.002795100212097168, -0.002665996551513672, -0.0025368928909301758, -0.0024077892303466797, -0.0022786855697631836, -0.0021495819091796875, -0.0020204782485961914, -0.0018913745880126953, -0.0017622709274291992, -0.0016331672668457031, -0.001504063606262207, -0.001374959945678711, -0.0012458562850952148, -0.0011167526245117188, -0.0009876489639282227, -0.0008585453033447266, -0.0007294416427612305, -0.0006003379821777344, -0.0004712343215942383, -0.0003421306610107422, -0.0002130270004272461, -8.392333984375e-05, 4.5180320739746094e-05, 0.0001742839813232422, 0.0003033876419067383, 0.0004324913024902344, 0.0005615949630737305, 0.0006906986236572266, 0.0008198022842407227, 0.0009489059448242188, 0.0010780096054077148, 0.001207113265991211, 0.001336216926574707, 0.0014653205871582031, 0.0015944242477416992, 0.0017235279083251953, 0.0018526315689086914, 0.0019817352294921875, 0.0021108388900756836, 0.0022399425506591797, 0.0023690462112426758, 0.002498149871826172, 0.002627253532409668, 0.002756357192993164, 0.00288546085357666, 0.0030145645141601562, 0.0031436681747436523, 0.0032727718353271484, 0.0034018754959106445, 0.0035309791564941406, 0.0036600828170776367, 0.003789186477661133, 0.003918290138244629, 0.004047393798828125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1008.0, 8.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.665895928861573e-05, 2.276245504617691e-05, 8.218386938096955e-05, 0.00014160529826767743, 0.00020102670532651246, 0.0002604481123853475, 0.00031986954854801297, 0.000379290955606848, 0.00043871236266568303, 0.0004981337697245181, 0.0005575551767833531, 0.000616976642049849, 0.0006763980491086841, 0.0007358194561675191, 0.0007952408632263541, 0.0008546622702851892, 0.0009140836773440242, 0.0009735050844028592, 0.0010329264914616942, 0.0010923478985205293, 0.0011517693055793643, 0.0012111907126381993, 0.0012706122361123562, 0.0013300336431711912, 0.0013894549338147044, 0.0014488763408735394, 0.0015082977479323745, 0.0015677191549912095, 0.0016271405620500445, 0.0016865619691088796, 0.0017459834925830364, 0.0018054048996418715, 0.0018648263067007065, 0.0019242477137595415, 0.0019836691208183765, 0.0020430905278772116, 0.0021025119349360466, 0.0021619333419948816, 0.0022213547490537167, 0.0022807761561125517, 0.0023401975631713867, 0.0023996189702302217, 0.0024590403772890568, 0.002518461784347892, 0.002577883191406727, 0.002637304598465562, 0.002696726005524397, 0.002756147412583232, 0.002815568819642067, 0.002874990226700902, 0.002934411633759737, 0.002993833040818572, 0.003053254447877407, 0.003112675854936242, 0.003172097261995077, 0.003231518669053912, 0.003290940308943391, 0.003350361716002226, 0.003409783123061061, 0.003469204530119896, 0.003528625937178731, 0.003588047344237566, 0.003647468751296401, 0.003706890158355236, 0.003766311565414071]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 15.0, 11.0, 22.0, 27.0, 40.0, 53.0, 48.0, 77.0, 82.0, 97.0, 58.0, 94.0, 76.0, 69.0, 56.0, 47.0, 35.0, 30.0, 18.0, 9.0, 12.0, 15.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001519322395324707, -0.00014598481357097626, -0.0001400373876094818, -0.00013408996164798737, -0.00012814253568649292, -0.00012219510972499847, -0.00011624768376350403, -0.00011030025780200958, -0.00010435283184051514, -9.840540587902069e-05, -9.245797991752625e-05, -8.65105539560318e-05, -8.056312799453735e-05, -7.461570203304291e-05, -6.866827607154846e-05, -6.272085011005402e-05, -5.677342414855957e-05, -5.0825998187065125e-05, -4.487857222557068e-05, -3.893114626407623e-05, -3.298372030258179e-05, -2.703629434108734e-05, -2.1088868379592896e-05, -1.514144241809845e-05, -9.194016456604004e-06, -3.246590495109558e-06, 2.7008354663848877e-06, 8.648261427879333e-06, 1.459568738937378e-05, 2.0543113350868225e-05, 2.649053931236267e-05, 3.243796527385712e-05, 3.838539123535156e-05, 4.433281719684601e-05, 5.0280243158340454e-05, 5.62276691198349e-05, 6.217509508132935e-05, 6.812252104282379e-05, 7.406994700431824e-05, 8.001737296581268e-05, 8.596479892730713e-05, 9.191222488880157e-05, 9.785965085029602e-05, 0.00010380707681179047, 0.00010975450277328491, 0.00011570192873477936, 0.0001216493546962738, 0.00012759678065776825, 0.0001335442066192627, 0.00013949163258075714, 0.0001454390585422516, 0.00015138648450374603, 0.00015733391046524048, 0.00016328133642673492, 0.00016922876238822937, 0.00017517618834972382, 0.00018112361431121826, 0.0001870710402727127, 0.00019301846623420715, 0.0001989658921957016, 0.00020491331815719604, 0.0002108607441186905, 0.00021680817008018494, 0.00022275559604167938, 0.00022870302200317383]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 12.0, 9.0, 7.0, 10.0, 8.0, 9.0, 17.0, 18.0, 25.0, 16.0, 28.0, 30.0, 42.0, 58.0, 62.0, 94.0, 92.0, 99.0, 62.0, 49.0, 31.0, 28.0, 22.0, 20.0, 27.0, 12.0, 20.0, 10.0, 12.0, 8.0, 6.0, 7.0, 8.0, 7.0, 3.0, 3.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.666259765625, -8.34814453125, -8.030029296875, -7.7119140625, -7.393798828125, -7.07568359375, -6.757568359375, -6.439453125, -6.121337890625, -5.80322265625, -5.485107421875, -5.1669921875, -4.848876953125, -4.53076171875, -4.212646484375, -3.89453125, -3.576416015625, -3.25830078125, -2.940185546875, -2.6220703125, -2.303955078125, -1.98583984375, -1.667724609375, -1.349609375, -1.031494140625, -0.71337890625, -0.395263671875, -0.0771484375, 0.240966796875, 0.55908203125, 0.877197265625, 1.1953125, 1.513427734375, 1.83154296875, 2.149658203125, 2.4677734375, 2.785888671875, 3.10400390625, 3.422119140625, 3.740234375, 4.058349609375, 4.37646484375, 4.694580078125, 5.0126953125, 5.330810546875, 5.64892578125, 5.967041015625, 6.28515625, 6.603271484375, 6.92138671875, 7.239501953125, 7.5576171875, 7.875732421875, 8.19384765625, 8.511962890625, 8.830078125, 9.148193359375, 9.46630859375, 9.784423828125, 10.1025390625, 10.420654296875, 10.73876953125, 11.056884765625, 11.375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 11.0, 17.0, 15.0, 33.0, 41.0, 53.0, 87.0, 105.0, 157.0, 181.0, 264.0, 365.0, 500.0, 749.0, 1109.0, 1650.0, 2760.0, 4670.0, 8910.0, 20372.0, 65274.0, 728714.0, 152277.0, 31795.0, 12404.0, 6218.0, 3351.0, 2094.0, 1351.0, 917.0, 573.0, 436.0, 290.0, 207.0, 177.0, 110.0, 87.0, 70.0, 42.0, 37.0, 27.0, 16.0, 8.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-38.625, -37.36767578125, -36.1103515625, -34.85302734375, -33.595703125, -32.33837890625, -31.0810546875, -29.82373046875, -28.56640625, -27.30908203125, -26.0517578125, -24.79443359375, -23.537109375, -22.27978515625, -21.0224609375, -19.76513671875, -18.5078125, -17.25048828125, -15.9931640625, -14.73583984375, -13.478515625, -12.22119140625, -10.9638671875, -9.70654296875, -8.44921875, -7.19189453125, -5.9345703125, -4.67724609375, -3.419921875, -2.16259765625, -0.9052734375, 0.35205078125, 1.609375, 2.86669921875, 4.1240234375, 5.38134765625, 6.638671875, 7.89599609375, 9.1533203125, 10.41064453125, 11.66796875, 12.92529296875, 14.1826171875, 15.43994140625, 16.697265625, 17.95458984375, 19.2119140625, 20.46923828125, 21.7265625, 22.98388671875, 24.2412109375, 25.49853515625, 26.755859375, 28.01318359375, 29.2705078125, 30.52783203125, 31.78515625, 33.04248046875, 34.2998046875, 35.55712890625, 36.814453125, 38.07177734375, 39.3291015625, 40.58642578125, 41.84375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 4.0, 7.0, 7.0, 6.0, 8.0, 9.0, 11.0, 27.0, 24.0, 21.0, 26.0, 20.0, 29.0, 28.0, 36.0, 44.0, 46.0, 44.0, 59.0, 105.0, 281.0, 1538.0, 154.0, 86.0, 57.0, 32.0, 49.0, 31.0, 27.0, 35.0, 31.0, 27.0, 19.0, 21.0, 19.0, 11.0, 12.0, 10.0, 4.0, 5.0, 7.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.21875, -25.40380859375, -24.5888671875, -23.77392578125, -22.958984375, -22.14404296875, -21.3291015625, -20.51416015625, -19.69921875, -18.88427734375, -18.0693359375, -17.25439453125, -16.439453125, -15.62451171875, -14.8095703125, -13.99462890625, -13.1796875, -12.36474609375, -11.5498046875, -10.73486328125, -9.919921875, -9.10498046875, -8.2900390625, -7.47509765625, -6.66015625, -5.84521484375, -5.0302734375, -4.21533203125, -3.400390625, -2.58544921875, -1.7705078125, -0.95556640625, -0.140625, 0.67431640625, 1.4892578125, 2.30419921875, 3.119140625, 3.93408203125, 4.7490234375, 5.56396484375, 6.37890625, 7.19384765625, 8.0087890625, 8.82373046875, 9.638671875, 10.45361328125, 11.2685546875, 12.08349609375, 12.8984375, 13.71337890625, 14.5283203125, 15.34326171875, 16.158203125, 16.97314453125, 17.7880859375, 18.60302734375, 19.41796875, 20.23291015625, 21.0478515625, 21.86279296875, 22.677734375, 23.49267578125, 24.3076171875, 25.12255859375, 25.9375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 17.0, 11.0, 13.0, 18.0, 18.0, 22.0, 35.0, 32.0, 45.0, 87.0, 114.0, 203.0, 562.0, 4534.0, 2598080.0, 537207.0, 3519.0, 475.0, 201.0, 118.0, 77.0, 56.0, 33.0, 34.0, 25.0, 23.0, 21.0, 20.0, 16.0, 11.0, 11.0, 9.0, 5.0, 8.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.6875, -103.0029296875, -99.318359375, -95.6337890625, -91.94921875, -88.2646484375, -84.580078125, -80.8955078125, -77.2109375, -73.5263671875, -69.841796875, -66.1572265625, -62.47265625, -58.7880859375, -55.103515625, -51.4189453125, -47.734375, -44.0498046875, -40.365234375, -36.6806640625, -32.99609375, -29.3115234375, -25.626953125, -21.9423828125, -18.2578125, -14.5732421875, -10.888671875, -7.2041015625, -3.51953125, 0.1650390625, 3.849609375, 7.5341796875, 11.21875, 14.9033203125, 18.587890625, 22.2724609375, 25.95703125, 29.6416015625, 33.326171875, 37.0107421875, 40.6953125, 44.3798828125, 48.064453125, 51.7490234375, 55.43359375, 59.1181640625, 62.802734375, 66.4873046875, 70.171875, 73.8564453125, 77.541015625, 81.2255859375, 84.91015625, 88.5947265625, 92.279296875, 95.9638671875, 99.6484375, 103.3330078125, 107.017578125, 110.7021484375, 114.38671875, 118.0712890625, 121.755859375, 125.4404296875, 129.125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 42.0, 305.0, 468.0, 138.0, 32.0, 17.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-177.86587524414062, -172.7935791015625, -167.7212677001953, -162.64895629882812, -157.57666015625, -152.50436401367188, -147.4320526123047, -142.3597412109375, -137.28744506835938, -132.21514892578125, -127.14283752441406, -122.0705337524414, -116.99822998046875, -111.9259262084961, -106.85362243652344, -101.78131866455078, -96.70901489257812, -91.63671112060547, -86.56440734863281, -81.49210357666016, -76.4197998046875, -71.34749603271484, -66.27519226074219, -61.20288848876953, -56.130584716796875, -51.05828094482422, -45.98597717285156, -40.913673400878906, -35.84136962890625, -30.769065856933594, -25.696762084960938, -20.62445831298828, -15.552154541015625, -10.479850769042969, -5.4075469970703125, -0.33524322509765625, 4.737060546875, 9.809364318847656, 14.881668090820312, 19.95397186279297, 25.026275634765625, 30.09857940673828, 35.17088317871094, 40.243186950683594, 45.31549072265625, 50.387794494628906, 55.46009826660156, 60.53240203857422, 65.60470581054688, 70.67700958251953, 75.74931335449219, 80.82161712646484, 85.8939208984375, 90.96622467041016, 96.03852844238281, 101.11083221435547, 106.18313598632812, 111.25543975830078, 116.32774353027344, 121.4000473022461, 126.47235107421875, 131.54464721679688, 136.61695861816406, 141.68927001953125, 146.76156616210938]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 12.0, 9.0, 11.0, 12.0, 18.0, 17.0, 28.0, 32.0, 31.0, 37.0, 45.0, 52.0, 49.0, 46.0, 61.0, 54.0, 65.0, 51.0, 52.0, 49.0, 55.0, 35.0, 30.0, 42.0, 28.0, 23.0, 14.0, 17.0, 9.0, 6.0, 3.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.12557983398438, -114.09078216552734, -110.05598449707031, -106.02118682861328, -101.98638916015625, -97.95159149169922, -93.91679382324219, -89.88199615478516, -85.84719848632812, -81.8124008178711, -77.77760314941406, -73.74280548095703, -69.7080078125, -65.67321014404297, -61.63841247558594, -57.603614807128906, -53.568817138671875, -49.534019470214844, -45.49922180175781, -41.46442413330078, -37.42962646484375, -33.39482879638672, -29.360031127929688, -25.325233459472656, -21.290435791015625, -17.255638122558594, -13.220840454101562, -9.186042785644531, -5.1512451171875, -1.1164474487304688, 2.9183502197265625, 6.953147888183594, 10.987945556640625, 15.022743225097656, 19.057540893554688, 23.09233856201172, 27.12713623046875, 31.16193389892578, 35.19673156738281, 39.231529235839844, 43.266326904296875, 47.301124572753906, 51.33592224121094, 55.37071990966797, 59.405517578125, 63.44031524658203, 67.47511291503906, 71.5099105834961, 75.54470825195312, 79.57950592041016, 83.61430358886719, 87.64910125732422, 91.68389892578125, 95.71869659423828, 99.75349426269531, 103.78829193115234, 107.82308959960938, 111.8578872680664, 115.89268493652344, 119.92748260498047, 123.9622802734375, 127.99707794189453, 132.03187561035156, 136.06668090820312, 140.10147094726562]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 5.0, 17.0, 7.0, 12.0, 7.0, 6.0, 11.0, 16.0, 21.0, 18.0, 14.0, 26.0, 35.0, 39.0, 57.0, 76.0, 85.0, 66.0, 83.0, 73.0, 51.0, 43.0, 27.0, 36.0, 22.0, 13.0, 23.0, 17.0, 15.0, 7.0, 10.0, 7.0, 9.0, 8.0, 4.0, 7.0, 7.0, 6.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7265625, -8.409912109375, -8.09326171875, -7.776611328125, -7.4599609375, -7.143310546875, -6.82666015625, -6.510009765625, -6.193359375, -5.876708984375, -5.56005859375, -5.243408203125, -4.9267578125, -4.610107421875, -4.29345703125, -3.976806640625, -3.66015625, -3.343505859375, -3.02685546875, -2.710205078125, -2.3935546875, -2.076904296875, -1.76025390625, -1.443603515625, -1.126953125, -0.810302734375, -0.49365234375, -0.177001953125, 0.1396484375, 0.456298828125, 0.77294921875, 1.089599609375, 1.40625, 1.722900390625, 2.03955078125, 2.356201171875, 2.6728515625, 2.989501953125, 3.30615234375, 3.622802734375, 3.939453125, 4.256103515625, 4.57275390625, 4.889404296875, 5.2060546875, 5.522705078125, 5.83935546875, 6.156005859375, 6.47265625, 6.789306640625, 7.10595703125, 7.422607421875, 7.7392578125, 8.055908203125, 8.37255859375, 8.689208984375, 9.005859375, 9.322509765625, 9.63916015625, 9.955810546875, 10.2724609375, 10.589111328125, 10.90576171875, 11.222412109375, 11.5390625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 7.0, 14.0, 9.0, 9.0, 22.0, 13.0, 22.0, 46.0, 44.0, 88.0, 110.0, 220.0, 316.0, 607.0, 1356.0, 3679.0, 17056.0, 3957117.0, 201234.0, 7942.0, 2257.0, 905.0, 415.0, 273.0, 170.0, 103.0, 50.0, 51.0, 25.0, 27.0, 20.0, 10.0, 9.0, 13.0, 7.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.5625, -76.6982421875, -73.833984375, -70.9697265625, -68.10546875, -65.2412109375, -62.376953125, -59.5126953125, -56.6484375, -53.7841796875, -50.919921875, -48.0556640625, -45.19140625, -42.3271484375, -39.462890625, -36.5986328125, -33.734375, -30.8701171875, -28.005859375, -25.1416015625, -22.27734375, -19.4130859375, -16.548828125, -13.6845703125, -10.8203125, -7.9560546875, -5.091796875, -2.2275390625, 0.63671875, 3.5009765625, 6.365234375, 9.2294921875, 12.09375, 14.9580078125, 17.822265625, 20.6865234375, 23.55078125, 26.4150390625, 29.279296875, 32.1435546875, 35.0078125, 37.8720703125, 40.736328125, 43.6005859375, 46.46484375, 49.3291015625, 52.193359375, 55.0576171875, 57.921875, 60.7861328125, 63.650390625, 66.5146484375, 69.37890625, 72.2431640625, 75.107421875, 77.9716796875, 80.8359375, 83.7001953125, 86.564453125, 89.4287109375, 92.29296875, 95.1572265625, 98.021484375, 100.8857421875, 103.75]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 8.0, 2.0, 5.0, 6.0, 11.0, 9.0, 9.0, 13.0, 17.0, 33.0, 25.0, 38.0, 74.0, 125.0, 283.0, 601.0, 1021.0, 816.0, 403.0, 200.0, 95.0, 58.0, 41.0, 35.0, 20.0, 19.0, 16.0, 13.0, 11.0, 9.0, 8.0, 3.0, 4.0, 6.0, 8.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.4375, -28.537353515625, -27.63720703125, -26.737060546875, -25.8369140625, -24.936767578125, -24.03662109375, -23.136474609375, -22.236328125, -21.336181640625, -20.43603515625, -19.535888671875, -18.6357421875, -17.735595703125, -16.83544921875, -15.935302734375, -15.03515625, -14.135009765625, -13.23486328125, -12.334716796875, -11.4345703125, -10.534423828125, -9.63427734375, -8.734130859375, -7.833984375, -6.933837890625, -6.03369140625, -5.133544921875, -4.2333984375, -3.333251953125, -2.43310546875, -1.532958984375, -0.6328125, 0.267333984375, 1.16748046875, 2.067626953125, 2.9677734375, 3.867919921875, 4.76806640625, 5.668212890625, 6.568359375, 7.468505859375, 8.36865234375, 9.268798828125, 10.1689453125, 11.069091796875, 11.96923828125, 12.869384765625, 13.76953125, 14.669677734375, 15.56982421875, 16.469970703125, 17.3701171875, 18.270263671875, 19.17041015625, 20.070556640625, 20.970703125, 21.870849609375, 22.77099609375, 23.671142578125, 24.5712890625, 25.471435546875, 26.37158203125, 27.271728515625, 28.171875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 10.0, 6.0, 6.0, 11.0, 18.0, 21.0, 47.0, 46.0, 88.0, 136.0, 243.0, 485.0, 1025.0, 2727.0, 8026.0, 27596.0, 244579.0, 3791552.0, 91075.0, 17483.0, 5495.0, 1907.0, 751.0, 365.0, 199.0, 117.0, 69.0, 56.0, 34.0, 23.0, 18.0, 8.0, 7.0, 7.0, 7.0, 10.0, 3.0, 5.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-62.75, -60.86767578125, -58.9853515625, -57.10302734375, -55.220703125, -53.33837890625, -51.4560546875, -49.57373046875, -47.69140625, -45.80908203125, -43.9267578125, -42.04443359375, -40.162109375, -38.27978515625, -36.3974609375, -34.51513671875, -32.6328125, -30.75048828125, -28.8681640625, -26.98583984375, -25.103515625, -23.22119140625, -21.3388671875, -19.45654296875, -17.57421875, -15.69189453125, -13.8095703125, -11.92724609375, -10.044921875, -8.16259765625, -6.2802734375, -4.39794921875, -2.515625, -0.63330078125, 1.2490234375, 3.13134765625, 5.013671875, 6.89599609375, 8.7783203125, 10.66064453125, 12.54296875, 14.42529296875, 16.3076171875, 18.18994140625, 20.072265625, 21.95458984375, 23.8369140625, 25.71923828125, 27.6015625, 29.48388671875, 31.3662109375, 33.24853515625, 35.130859375, 37.01318359375, 38.8955078125, 40.77783203125, 42.66015625, 44.54248046875, 46.4248046875, 48.30712890625, 50.189453125, 52.07177734375, 53.9541015625, 55.83642578125, 57.71875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 12.0, 41.0, 203.0, 579.0, 122.0, 37.0, 11.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-296.17376708984375, -286.0932312011719, -276.0126953125, -265.93212890625, -255.85159301757812, -245.77105712890625, -235.6905059814453, -225.60995483398438, -215.5294189453125, -205.44888305664062, -195.3683319091797, -185.28778076171875, -175.20724487304688, -165.126708984375, -155.04615783691406, -144.96560668945312, -134.88507080078125, -124.80452728271484, -114.72398376464844, -104.64344024658203, -94.56289672851562, -84.48235321044922, -74.40180969238281, -64.3212661743164, -54.24072265625, -44.160179138183594, -34.07963562011719, -23.99909210205078, -13.918548583984375, -3.8380050659179688, 6.2425384521484375, 16.323081970214844, 26.403656005859375, 36.48419952392578, 46.56474304199219, 56.645286560058594, 66.725830078125, 76.8063735961914, 86.88691711425781, 96.96746063232422, 107.04800415039062, 117.12854766845703, 127.20909118652344, 137.28964233398438, 147.37017822265625, 157.45071411132812, 167.53126525878906, 177.61181640625, 187.69235229492188, 197.77288818359375, 207.8534393310547, 217.93399047851562, 228.0145263671875, 238.09506225585938, 248.1756134033203, 258.25616455078125, 268.3367004394531, 278.417236328125, 288.497802734375, 298.5783386230469, 308.65887451171875, 318.7394104003906, 328.8199462890625, 338.9005126953125, 348.9810485839844]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 10.0, 12.0, 11.0, 13.0, 16.0, 12.0, 19.0, 16.0, 24.0, 23.0, 26.0, 30.0, 39.0, 38.0, 41.0, 50.0, 48.0, 44.0, 44.0, 48.0, 40.0, 35.0, 38.0, 42.0, 41.0, 34.0, 23.0, 16.0, 20.0, 18.0, 20.0, 19.0, 23.0, 8.0, 10.0, 13.0, 8.0, 3.0, 5.0, 6.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-89.58663940429688, -86.78866577148438, -83.99069213867188, -81.19271850585938, -78.39474487304688, -75.59677124023438, -72.79879760742188, -70.00081634521484, -67.20284271240234, -64.40486907958984, -61.606895446777344, -58.808921813964844, -56.01094436645508, -53.21297073364258, -50.41499710083008, -47.61701965332031, -44.81904983520508, -42.02107620239258, -39.22310256958008, -36.42512512207031, -33.62715148925781, -30.829177856445312, -28.031204223632812, -25.23322868347168, -22.43525505065918, -19.63728141784668, -16.839305877685547, -14.041332244873047, -11.24335765838623, -8.445383071899414, -5.647409439086914, -2.8494338989257812, -0.05146026611328125, 2.746514081954956, 5.544488430023193, 8.342462539672852, 11.140437126159668, 13.938411712646484, 16.736385345458984, 19.534360885620117, 22.332334518432617, 25.130308151245117, 27.92828369140625, 30.72625732421875, 33.52423095703125, 36.32220458984375, 39.12017822265625, 41.918155670166016, 44.716129302978516, 47.514102935791016, 50.312076568603516, 53.11005401611328, 55.90802764892578, 58.70600128173828, 61.50397491455078, 64.30194854736328, 67.09992218017578, 69.89789581298828, 72.69586944580078, 75.49384307861328, 78.29181671142578, 81.08979797363281, 83.88777160644531, 86.68574523925781, 89.48371887207031]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 1.0, 8.0, 5.0, 7.0, 8.0, 8.0, 13.0, 5.0, 5.0, 18.0, 5.0, 20.0, 21.0, 18.0, 27.0, 26.0, 34.0, 51.0, 63.0, 62.0, 66.0, 69.0, 75.0, 59.0, 59.0, 39.0, 28.0, 30.0, 25.0, 20.0, 22.0, 19.0, 16.0, 11.0, 7.0, 10.0, 5.0, 4.0, 7.0, 8.0, 10.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.95947265625, -7.6689453125, -7.37841796875, -7.087890625, -6.79736328125, -6.5068359375, -6.21630859375, -5.92578125, -5.63525390625, -5.3447265625, -5.05419921875, -4.763671875, -4.47314453125, -4.1826171875, -3.89208984375, -3.6015625, -3.31103515625, -3.0205078125, -2.72998046875, -2.439453125, -2.14892578125, -1.8583984375, -1.56787109375, -1.27734375, -0.98681640625, -0.6962890625, -0.40576171875, -0.115234375, 0.17529296875, 0.4658203125, 0.75634765625, 1.046875, 1.33740234375, 1.6279296875, 1.91845703125, 2.208984375, 2.49951171875, 2.7900390625, 3.08056640625, 3.37109375, 3.66162109375, 3.9521484375, 4.24267578125, 4.533203125, 4.82373046875, 5.1142578125, 5.40478515625, 5.6953125, 5.98583984375, 6.2763671875, 6.56689453125, 6.857421875, 7.14794921875, 7.4384765625, 7.72900390625, 8.01953125, 8.31005859375, 8.6005859375, 8.89111328125, 9.181640625, 9.47216796875, 9.7626953125, 10.05322265625, 10.34375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 7.0, 9.0, 13.0, 22.0, 30.0, 36.0, 85.0, 112.0, 156.0, 267.0, 395.0, 610.0, 876.0, 1339.0, 2044.0, 3128.0, 4862.0, 7496.0, 11716.0, 19894.0, 34611.0, 64622.0, 130183.0, 278723.0, 240410.0, 111806.0, 56263.0, 30677.0, 17713.0, 10845.0, 6669.0, 4486.0, 2906.0, 1884.0, 1254.0, 816.0, 544.0, 344.0, 235.0, 179.0, 109.0, 58.0, 40.0, 33.0, 18.0, 9.0, 8.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.18359375, -0.17801284790039062, -0.17243194580078125, -0.16685104370117188, -0.1612701416015625, -0.15568923950195312, -0.15010833740234375, -0.14452743530273438, -0.138946533203125, -0.13336563110351562, -0.12778472900390625, -0.12220382690429688, -0.1166229248046875, -0.11104202270507812, -0.10546112060546875, -0.09988021850585938, -0.09429931640625, -0.08871841430664062, -0.08313751220703125, -0.07755661010742188, -0.0719757080078125, -0.06639480590820312, -0.06081390380859375, -0.055233001708984375, -0.049652099609375, -0.044071197509765625, -0.03849029541015625, -0.032909393310546875, -0.0273284912109375, -0.021747589111328125, -0.01616668701171875, -0.010585784912109375, -0.0050048828125, 0.000576019287109375, 0.00615692138671875, 0.011737823486328125, 0.0173187255859375, 0.022899627685546875, 0.02848052978515625, 0.034061431884765625, 0.039642333984375, 0.045223236083984375, 0.05080413818359375, 0.056385040283203125, 0.0619659423828125, 0.06754684448242188, 0.07312774658203125, 0.07870864868164062, 0.08428955078125, 0.08987045288085938, 0.09545135498046875, 0.10103225708007812, 0.1066131591796875, 0.11219406127929688, 0.11777496337890625, 0.12335586547851562, 0.128936767578125, 0.13451766967773438, 0.14009857177734375, 0.14567947387695312, 0.1512603759765625, 0.15684127807617188, 0.16242218017578125, 0.16800308227539062, 0.173583984375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 8.0, 8.0, 11.0, 21.0, 13.0, 19.0, 21.0, 38.0, 25.0, 32.0, 28.0, 42.0, 39.0, 35.0, 30.0, 48.0, 52.0, 1068.0, 47.0, 41.0, 38.0, 43.0, 33.0, 32.0, 36.0, 30.0, 28.0, 30.0, 22.0, 20.0, 13.0, 20.0, 11.0, 7.0, 12.0, 7.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.17578125, -4.043212890625, -3.91064453125, -3.778076171875, -3.6455078125, -3.512939453125, -3.38037109375, -3.247802734375, -3.115234375, -2.982666015625, -2.85009765625, -2.717529296875, -2.5849609375, -2.452392578125, -2.31982421875, -2.187255859375, -2.0546875, -1.922119140625, -1.78955078125, -1.656982421875, -1.5244140625, -1.391845703125, -1.25927734375, -1.126708984375, -0.994140625, -0.861572265625, -0.72900390625, -0.596435546875, -0.4638671875, -0.331298828125, -0.19873046875, -0.066162109375, 0.06640625, 0.198974609375, 0.33154296875, 0.464111328125, 0.5966796875, 0.729248046875, 0.86181640625, 0.994384765625, 1.126953125, 1.259521484375, 1.39208984375, 1.524658203125, 1.6572265625, 1.789794921875, 1.92236328125, 2.054931640625, 2.1875, 2.320068359375, 2.45263671875, 2.585205078125, 2.7177734375, 2.850341796875, 2.98291015625, 3.115478515625, 3.248046875, 3.380615234375, 3.51318359375, 3.645751953125, 3.7783203125, 3.910888671875, 4.04345703125, 4.176025390625, 4.30859375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 7.0, 3.0, 9.0, 10.0, 16.0, 32.0, 42.0, 55.0, 97.0, 124.0, 172.0, 258.0, 349.0, 519.0, 743.0, 1168.0, 1601.0, 2336.0, 3505.0, 4964.0, 7378.0, 10645.0, 15421.0, 23526.0, 34072.0, 49646.0, 73216.0, 112082.0, 177446.0, 1219606.0, 117368.0, 77149.0, 51968.0, 35445.0, 24223.0, 16378.0, 11198.0, 7675.0, 5247.0, 3501.0, 2421.0, 1684.0, 1191.0, 876.0, 524.0, 400.0, 262.0, 193.0, 109.0, 88.0, 78.0, 51.0, 24.0, 9.0, 10.0, 11.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.0557861328125, -0.05398988723754883, -0.052193641662597656, -0.050397396087646484, -0.04860115051269531, -0.04680490493774414, -0.04500865936279297, -0.0432124137878418, -0.041416168212890625, -0.03961992263793945, -0.03782367706298828, -0.03602743148803711, -0.03423118591308594, -0.032434940338134766, -0.030638694763183594, -0.028842449188232422, -0.02704620361328125, -0.025249958038330078, -0.023453712463378906, -0.021657466888427734, -0.019861221313476562, -0.01806497573852539, -0.01626873016357422, -0.014472484588623047, -0.012676239013671875, -0.010879993438720703, -0.009083747863769531, -0.007287502288818359, -0.0054912567138671875, -0.0036950111389160156, -0.0018987655639648438, -0.00010251998901367188, 0.0016937255859375, 0.003489971160888672, 0.005286216735839844, 0.007082462310791016, 0.008878707885742188, 0.01067495346069336, 0.012471199035644531, 0.014267444610595703, 0.016063690185546875, 0.017859935760498047, 0.01965618133544922, 0.02145242691040039, 0.023248672485351562, 0.025044918060302734, 0.026841163635253906, 0.028637409210205078, 0.03043365478515625, 0.03222990036010742, 0.034026145935058594, 0.035822391510009766, 0.03761863708496094, 0.03941488265991211, 0.04121112823486328, 0.04300737380981445, 0.044803619384765625, 0.0465998649597168, 0.04839611053466797, 0.05019235610961914, 0.05198860168457031, 0.053784847259521484, 0.055581092834472656, 0.05737733840942383, 0.059173583984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 6.0, 5.0, 17.0, 19.0, 26.0, 25.0, 34.0, 35.0, 57.0, 57.0, 85.0, 67.0, 80.0, 72.0, 61.0, 63.0, 66.0, 59.0, 38.0, 30.0, 15.0, 15.0, 13.0, 9.0, 8.0, 6.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001628398895263672, -0.00015756674110889435, -0.0001522935926914215, -0.00014702044427394867, -0.00014174729585647583, -0.000136474147439003, -0.00013120099902153015, -0.0001259278506040573, -0.00012065470218658447, -0.00011538155376911163, -0.0001101084053516388, -0.00010483525693416595, -9.956210851669312e-05, -9.428896009922028e-05, -8.901581168174744e-05, -8.37426632642746e-05, -7.846951484680176e-05, -7.319636642932892e-05, -6.792321801185608e-05, -6.265006959438324e-05, -5.73769211769104e-05, -5.210377275943756e-05, -4.683062434196472e-05, -4.155747592449188e-05, -3.628432750701904e-05, -3.1011179089546204e-05, -2.5738030672073364e-05, -2.0464882254600525e-05, -1.5191733837127686e-05, -9.918585419654846e-06, -4.645437002182007e-06, 6.277114152908325e-07, 5.900859832763672e-06, 1.1174008250236511e-05, 1.644715666770935e-05, 2.172030508518219e-05, 2.699345350265503e-05, 3.226660192012787e-05, 3.753975033760071e-05, 4.281289875507355e-05, 4.808604717254639e-05, 5.3359195590019226e-05, 5.8632344007492065e-05, 6.39054924249649e-05, 6.917864084243774e-05, 7.445178925991058e-05, 7.972493767738342e-05, 8.499808609485626e-05, 9.02712345123291e-05, 9.554438292980194e-05, 0.00010081753134727478, 0.00010609067976474762, 0.00011136382818222046, 0.0001166369765996933, 0.00012191012501716614, 0.00012718327343463898, 0.00013245642185211182, 0.00013772957026958466, 0.0001430027186870575, 0.00014827586710453033, 0.00015354901552200317, 0.000158822163939476, 0.00016409531235694885, 0.0001693684607744217, 0.00017464160919189453]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 14.0, 12.0, 10.0, 18.0, 20.0, 22.0, 42.0, 56.0, 70.0, 80.0, 94.0, 149.0, 227.0, 283.0, 490.0, 4432.0, 1033649.0, 7239.0, 528.0, 272.0, 221.0, 157.0, 140.0, 65.0, 49.0, 53.0, 28.0, 31.0, 18.0, 16.0, 15.0, 9.0, 10.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0027408599853515625, -0.002651125192642212, -0.0025613903999328613, -0.0024716556072235107, -0.00238192081451416, -0.0022921860218048096, -0.002202451229095459, -0.0021127164363861084, -0.002022981643676758, -0.0019332468509674072, -0.0018435120582580566, -0.001753777265548706, -0.0016640424728393555, -0.0015743076801300049, -0.0014845728874206543, -0.0013948380947113037, -0.0013051033020019531, -0.0012153685092926025, -0.001125633716583252, -0.0010358989238739014, -0.0009461641311645508, -0.0008564293384552002, -0.0007666945457458496, -0.000676959753036499, -0.0005872249603271484, -0.0004974901676177979, -0.00040775537490844727, -0.0003180205821990967, -0.0002282857894897461, -0.0001385509967803955, -4.881620407104492e-05, 4.0918588638305664e-05, 0.00013065338134765625, 0.00022038817405700684, 0.0003101229667663574, 0.000399857759475708, 0.0004895925521850586, 0.0005793273448944092, 0.0006690621376037598, 0.0007587969303131104, 0.0008485317230224609, 0.0009382665157318115, 0.0010280013084411621, 0.0011177361011505127, 0.0012074708938598633, 0.0012972056865692139, 0.0013869404792785645, 0.001476675271987915, 0.0015664100646972656, 0.0016561448574066162, 0.0017458796501159668, 0.0018356144428253174, 0.001925349235534668, 0.0020150840282440186, 0.002104818820953369, 0.0021945536136627197, 0.0022842884063720703, 0.002374023199081421, 0.0024637579917907715, 0.002553492784500122, 0.0026432275772094727, 0.0027329623699188232, 0.002822697162628174, 0.0029124319553375244, 0.003002166748046875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [75.0, 925.0, 16.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.584178921300918e-05, -8.314827937283553e-06, 1.9212133338442072e-05, 4.6739092795178294e-05, 7.426605588989332e-05, 0.00010179301898460835, 0.00012931997480336577, 0.0001568469451740384, 0.00018437390099279583, 0.00021190085681155324, 0.00023942782718222588, 0.00026695476844906807, 0.00029448175337165594, 0.00032200870919041336, 0.00034953566500917077, 0.00037706264993175864, 0.0004045895766466856, 0.000432116532465443, 0.00045964348828420043, 0.0004871704732067883, 0.0005146973999217153, 0.0005422243848443031, 0.000569751369766891, 0.000597278296481818, 0.0006248052814044058, 0.0006523322663269937, 0.0006798591930419207, 0.0007073861779645085, 0.0007349131046794355, 0.0007624400896020234, 0.0007899670163169503, 0.0008174940012395382, 0.0008450209279544652, 0.000872547912877053, 0.00090007483959198, 0.0009276018245145679, 0.0009551287512294948, 0.0009826556779444218, 0.0010101826628670096, 0.0010377096477895975, 0.0010652366327121854, 0.0010927636176347733, 0.0011202906025573611, 0.0011478174710646272, 0.001175344455987215, 0.001202871440909803, 0.0012303984258323908, 0.0012579254107549787, 0.0012854522792622447, 0.0013129792641848326, 0.0013405062491074204, 0.0013680331176146865, 0.0013955601025372744, 0.0014230870874598622, 0.00145061407238245, 0.001478141057305038, 0.0015056680422276258, 0.0015331950271502137, 0.0015607220120728016, 0.0015882488805800676, 0.0016157758655026555, 0.0016433028504252434, 0.0016708298353478312, 0.0016983568202704191, 0.0017258836887776852]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 12.0, 11.0, 10.0, 11.0, 18.0, 25.0, 18.0, 35.0, 35.0, 41.0, 62.0, 44.0, 34.0, 37.0, 43.0, 53.0, 45.0, 52.0, 46.0, 48.0, 60.0, 42.0, 26.0, 47.0, 33.0, 19.0, 14.0, 13.0, 13.0, 13.0, 8.0, 7.0, 6.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.495019912719727e-05, -9.189825505018234e-05, -8.884631097316742e-05, -8.57943668961525e-05, -8.274242281913757e-05, -7.969047874212265e-05, -7.663853466510773e-05, -7.35865905880928e-05, -7.053464651107788e-05, -6.748270243406296e-05, -6.443075835704803e-05, -6.137881428003311e-05, -5.832687020301819e-05, -5.5274926126003265e-05, -5.222298204898834e-05, -4.917103797197342e-05, -4.6119093894958496e-05, -4.306714981794357e-05, -4.001520574092865e-05, -3.696326166391373e-05, -3.3911317586898804e-05, -3.085937350988388e-05, -2.7807429432868958e-05, -2.4755485355854034e-05, -2.170354127883911e-05, -1.8651597201824188e-05, -1.5599653124809265e-05, -1.2547709047794342e-05, -9.495764970779419e-06, -6.443820893764496e-06, -3.3918768167495728e-06, -3.3993273973464966e-07, 2.7120113372802734e-06, 5.7639554142951965e-06, 8.81589949131012e-06, 1.1867843568325043e-05, 1.4919787645339966e-05, 1.797173172235489e-05, 2.1023675799369812e-05, 2.4075619876384735e-05, 2.7127563953399658e-05, 3.017950803041458e-05, 3.3231452107429504e-05, 3.628339618444443e-05, 3.933534026145935e-05, 4.2387284338474274e-05, 4.54392284154892e-05, 4.849117249250412e-05, 5.154311656951904e-05, 5.4595060646533966e-05, 5.764700472354889e-05, 6.069894880056381e-05, 6.375089287757874e-05, 6.680283695459366e-05, 6.985478103160858e-05, 7.29067251086235e-05, 7.595866918563843e-05, 7.901061326265335e-05, 8.206255733966827e-05, 8.51145014166832e-05, 8.816644549369812e-05, 9.121838957071304e-05, 9.427033364772797e-05, 9.732227772474289e-05, 0.00010037422180175781]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 1.0, 8.0, 5.0, 7.0, 8.0, 8.0, 13.0, 5.0, 5.0, 18.0, 5.0, 20.0, 21.0, 18.0, 27.0, 26.0, 34.0, 51.0, 63.0, 62.0, 66.0, 69.0, 75.0, 59.0, 59.0, 39.0, 28.0, 30.0, 25.0, 20.0, 22.0, 19.0, 16.0, 11.0, 7.0, 10.0, 5.0, 4.0, 7.0, 8.0, 10.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.95947265625, -7.6689453125, -7.37841796875, -7.087890625, -6.79736328125, -6.5068359375, -6.21630859375, -5.92578125, -5.63525390625, -5.3447265625, -5.05419921875, -4.763671875, -4.47314453125, -4.1826171875, -3.89208984375, -3.6015625, -3.31103515625, -3.0205078125, -2.72998046875, -2.439453125, -2.14892578125, -1.8583984375, -1.56787109375, -1.27734375, -0.98681640625, -0.6962890625, -0.40576171875, -0.115234375, 0.17529296875, 0.4658203125, 0.75634765625, 1.046875, 1.33740234375, 1.6279296875, 1.91845703125, 2.208984375, 2.49951171875, 2.7900390625, 3.08056640625, 3.37109375, 3.66162109375, 3.9521484375, 4.24267578125, 4.533203125, 4.82373046875, 5.1142578125, 5.40478515625, 5.6953125, 5.98583984375, 6.2763671875, 6.56689453125, 6.857421875, 7.14794921875, 7.4384765625, 7.72900390625, 8.01953125, 8.31005859375, 8.6005859375, 8.89111328125, 9.181640625, 9.47216796875, 9.7626953125, 10.05322265625, 10.34375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 6.0, 6.0, 6.0, 19.0, 14.0, 27.0, 38.0, 42.0, 67.0, 85.0, 94.0, 139.0, 198.0, 270.0, 379.0, 508.0, 726.0, 1032.0, 1499.0, 2386.0, 3828.0, 7613.0, 20219.0, 111530.0, 801116.0, 64904.0, 15314.0, 6268.0, 3444.0, 2097.0, 1254.0, 973.0, 672.0, 498.0, 362.0, 242.0, 175.0, 128.0, 99.0, 87.0, 56.0, 52.0, 26.0, 29.0, 18.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-18.515625, -17.925537109375, -17.33544921875, -16.745361328125, -16.1552734375, -15.565185546875, -14.97509765625, -14.385009765625, -13.794921875, -13.204833984375, -12.61474609375, -12.024658203125, -11.4345703125, -10.844482421875, -10.25439453125, -9.664306640625, -9.07421875, -8.484130859375, -7.89404296875, -7.303955078125, -6.7138671875, -6.123779296875, -5.53369140625, -4.943603515625, -4.353515625, -3.763427734375, -3.17333984375, -2.583251953125, -1.9931640625, -1.403076171875, -0.81298828125, -0.222900390625, 0.3671875, 0.957275390625, 1.54736328125, 2.137451171875, 2.7275390625, 3.317626953125, 3.90771484375, 4.497802734375, 5.087890625, 5.677978515625, 6.26806640625, 6.858154296875, 7.4482421875, 8.038330078125, 8.62841796875, 9.218505859375, 9.80859375, 10.398681640625, 10.98876953125, 11.578857421875, 12.1689453125, 12.759033203125, 13.34912109375, 13.939208984375, 14.529296875, 15.119384765625, 15.70947265625, 16.299560546875, 16.8896484375, 17.479736328125, 18.06982421875, 18.659912109375, 19.25]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 1.0, 5.0, 2.0, 7.0, 11.0, 17.0, 11.0, 11.0, 16.0, 18.0, 12.0, 20.0, 31.0, 33.0, 36.0, 32.0, 37.0, 49.0, 38.0, 56.0, 80.0, 417.0, 1563.0, 79.0, 59.0, 34.0, 37.0, 45.0, 42.0, 35.0, 39.0, 17.0, 21.0, 25.0, 24.0, 12.0, 15.0, 11.0, 15.0, 4.0, 6.0, 7.0, 9.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.375, -31.42431640625, -30.4736328125, -29.52294921875, -28.572265625, -27.62158203125, -26.6708984375, -25.72021484375, -24.76953125, -23.81884765625, -22.8681640625, -21.91748046875, -20.966796875, -20.01611328125, -19.0654296875, -18.11474609375, -17.1640625, -16.21337890625, -15.2626953125, -14.31201171875, -13.361328125, -12.41064453125, -11.4599609375, -10.50927734375, -9.55859375, -8.60791015625, -7.6572265625, -6.70654296875, -5.755859375, -4.80517578125, -3.8544921875, -2.90380859375, -1.953125, -1.00244140625, -0.0517578125, 0.89892578125, 1.849609375, 2.80029296875, 3.7509765625, 4.70166015625, 5.65234375, 6.60302734375, 7.5537109375, 8.50439453125, 9.455078125, 10.40576171875, 11.3564453125, 12.30712890625, 13.2578125, 14.20849609375, 15.1591796875, 16.10986328125, 17.060546875, 18.01123046875, 18.9619140625, 19.91259765625, 20.86328125, 21.81396484375, 22.7646484375, 23.71533203125, 24.666015625, 25.61669921875, 26.5673828125, 27.51806640625, 28.46875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 5.0, 3.0, 10.0, 2.0, 4.0, 6.0, 9.0, 4.0, 13.0, 14.0, 19.0, 26.0, 29.0, 26.0, 35.0, 72.0, 90.0, 116.0, 206.0, 415.0, 833.0, 2446.0, 10272.0, 106567.0, 2984270.0, 31730.0, 5473.0, 1561.0, 592.0, 287.0, 168.0, 106.0, 69.0, 50.0, 41.0, 23.0, 21.0, 13.0, 22.0, 12.0, 11.0, 12.0, 10.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.15625, -49.28173828125, -47.4072265625, -45.53271484375, -43.658203125, -41.78369140625, -39.9091796875, -38.03466796875, -36.16015625, -34.28564453125, -32.4111328125, -30.53662109375, -28.662109375, -26.78759765625, -24.9130859375, -23.03857421875, -21.1640625, -19.28955078125, -17.4150390625, -15.54052734375, -13.666015625, -11.79150390625, -9.9169921875, -8.04248046875, -6.16796875, -4.29345703125, -2.4189453125, -0.54443359375, 1.330078125, 3.20458984375, 5.0791015625, 6.95361328125, 8.828125, 10.70263671875, 12.5771484375, 14.45166015625, 16.326171875, 18.20068359375, 20.0751953125, 21.94970703125, 23.82421875, 25.69873046875, 27.5732421875, 29.44775390625, 31.322265625, 33.19677734375, 35.0712890625, 36.94580078125, 38.8203125, 40.69482421875, 42.5693359375, 44.44384765625, 46.318359375, 48.19287109375, 50.0673828125, 51.94189453125, 53.81640625, 55.69091796875, 57.5654296875, 59.43994140625, 61.314453125, 63.18896484375, 65.0634765625, 66.93798828125, 68.8125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [2.0, 961.0, 57.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.7734260559082, -24.038291931152344, 7.696842193603516, 39.43197250366211, 71.1671142578125, 102.90225219726562, 134.6373748779297, 166.3725128173828, 198.10765075683594, 229.84278869628906, 261.5779113769531, 293.31304931640625, 325.0481872558594, 356.7833251953125, 388.5184326171875, 420.25360107421875, 451.98870849609375, 483.7238464355469, 515.458984375, 547.194091796875, 578.9292602539062, 610.6643676757812, 642.3995361328125, 674.1346435546875, 705.8698120117188, 737.6049194335938, 769.340087890625, 801.0751953125, 832.8103637695312, 864.5454711914062, 896.2806396484375, 928.0157470703125, 959.7508544921875, 991.4859619140625, 1023.2211303710938, 1054.956298828125, 1086.69140625, 1118.426513671875, 1150.16162109375, 1181.896728515625, 1213.6319580078125, 1245.3670654296875, 1277.1021728515625, 1308.83740234375, 1340.572509765625, 1372.3076171875, 1404.042724609375, 1435.77783203125, 1467.512939453125, 1499.248046875, 1530.983154296875, 1562.7183837890625, 1594.4534912109375, 1626.1885986328125, 1657.9237060546875, 1689.658935546875, 1721.39404296875, 1753.129150390625, 1784.8642578125, 1816.5994873046875, 1848.3345947265625, 1880.0697021484375, 1911.8048095703125, 1943.5400390625, 1975.275146484375]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 9.0, 6.0, 8.0, 11.0, 12.0, 17.0, 19.0, 16.0, 18.0, 12.0, 24.0, 25.0, 37.0, 34.0, 49.0, 33.0, 49.0, 37.0, 29.0, 36.0, 36.0, 37.0, 43.0, 49.0, 36.0, 40.0, 42.0, 38.0, 34.0, 26.0, 19.0, 17.0, 19.0, 11.0, 14.0, 7.0, 13.0, 8.0, 6.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.44548034667969, -90.22933959960938, -87.01319885253906, -83.79705810546875, -80.5809097290039, -77.3647689819336, -74.14862823486328, -70.93248748779297, -67.71634674072266, -64.50020599365234, -61.284061431884766, -58.06792068481445, -54.85177993774414, -51.63563537597656, -48.41949462890625, -45.20335388183594, -41.98720932006836, -38.77106857299805, -35.55492401123047, -32.338783264160156, -29.122642517089844, -25.9064998626709, -22.690357208251953, -19.47421646118164, -16.258073806762695, -13.041932106018066, -9.825790405273438, -6.609647750854492, -3.3935060501098633, -0.17736434936523438, 3.038778305053711, 6.254919052124023, 9.471061706542969, 12.687203407287598, 15.903345108032227, 19.119487762451172, 22.335628509521484, 25.55177116394043, 28.767913818359375, 31.984054565429688, 35.2001953125, 38.41633605957031, 41.63248062133789, 44.8486213684082, 48.064762115478516, 51.280906677246094, 54.497047424316406, 57.71318817138672, 60.9293327331543, 64.14547729492188, 67.36161804199219, 70.5777587890625, 73.79389953613281, 77.01004028320312, 80.22618103027344, 83.44232177734375, 86.6584701538086, 89.8746109008789, 93.09075164794922, 96.30690002441406, 99.52304077148438, 102.73918151855469, 105.955322265625, 109.17146301269531, 112.38760375976562]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 5.0, 6.0, 10.0, 9.0, 11.0, 6.0, 9.0, 11.0, 12.0, 16.0, 13.0, 18.0, 30.0, 30.0, 31.0, 42.0, 51.0, 71.0, 44.0, 82.0, 66.0, 66.0, 55.0, 54.0, 33.0, 29.0, 26.0, 26.0, 19.0, 21.0, 20.0, 8.0, 12.0, 5.0, 7.0, 6.0, 6.0, 6.0, 8.0, 7.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.403076171875, -8.11083984375, -7.818603515625, -7.5263671875, -7.234130859375, -6.94189453125, -6.649658203125, -6.357421875, -6.065185546875, -5.77294921875, -5.480712890625, -5.1884765625, -4.896240234375, -4.60400390625, -4.311767578125, -4.01953125, -3.727294921875, -3.43505859375, -3.142822265625, -2.8505859375, -2.558349609375, -2.26611328125, -1.973876953125, -1.681640625, -1.389404296875, -1.09716796875, -0.804931640625, -0.5126953125, -0.220458984375, 0.07177734375, 0.364013671875, 0.65625, 0.948486328125, 1.24072265625, 1.532958984375, 1.8251953125, 2.117431640625, 2.40966796875, 2.701904296875, 2.994140625, 3.286376953125, 3.57861328125, 3.870849609375, 4.1630859375, 4.455322265625, 4.74755859375, 5.039794921875, 5.33203125, 5.624267578125, 5.91650390625, 6.208740234375, 6.5009765625, 6.793212890625, 7.08544921875, 7.377685546875, 7.669921875, 7.962158203125, 8.25439453125, 8.546630859375, 8.8388671875, 9.131103515625, 9.42333984375, 9.715576171875, 10.0078125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 11.0, 7.0, 13.0, 14.0, 18.0, 27.0, 36.0, 45.0, 60.0, 73.0, 94.0, 154.0, 229.0, 364.0, 573.0, 992.0, 1903.0, 3919.0, 9249.0, 35531.0, 3168565.0, 935198.0, 22642.0, 7290.0, 3291.0, 1595.0, 851.0, 510.0, 314.0, 218.0, 130.0, 92.0, 67.0, 42.0, 35.0, 27.0, 24.0, 19.0, 16.0, 14.0, 11.0, 0.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.9375, -42.5146484375, -41.091796875, -39.6689453125, -38.24609375, -36.8232421875, -35.400390625, -33.9775390625, -32.5546875, -31.1318359375, -29.708984375, -28.2861328125, -26.86328125, -25.4404296875, -24.017578125, -22.5947265625, -21.171875, -19.7490234375, -18.326171875, -16.9033203125, -15.48046875, -14.0576171875, -12.634765625, -11.2119140625, -9.7890625, -8.3662109375, -6.943359375, -5.5205078125, -4.09765625, -2.6748046875, -1.251953125, 0.1708984375, 1.59375, 3.0166015625, 4.439453125, 5.8623046875, 7.28515625, 8.7080078125, 10.130859375, 11.5537109375, 12.9765625, 14.3994140625, 15.822265625, 17.2451171875, 18.66796875, 20.0908203125, 21.513671875, 22.9365234375, 24.359375, 25.7822265625, 27.205078125, 28.6279296875, 30.05078125, 31.4736328125, 32.896484375, 34.3193359375, 35.7421875, 37.1650390625, 38.587890625, 40.0107421875, 41.43359375, 42.8564453125, 44.279296875, 45.7021484375, 47.125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 7.0, 7.0, 6.0, 12.0, 9.0, 12.0, 21.0, 21.0, 15.0, 37.0, 38.0, 78.0, 130.0, 284.0, 641.0, 1100.0, 812.0, 375.0, 151.0, 96.0, 39.0, 38.0, 19.0, 22.0, 19.0, 21.0, 15.0, 15.0, 4.0, 10.0, 1.0, 4.0, 4.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.390625, -24.438720703125, -23.48681640625, -22.534912109375, -21.5830078125, -20.631103515625, -19.67919921875, -18.727294921875, -17.775390625, -16.823486328125, -15.87158203125, -14.919677734375, -13.9677734375, -13.015869140625, -12.06396484375, -11.112060546875, -10.16015625, -9.208251953125, -8.25634765625, -7.304443359375, -6.3525390625, -5.400634765625, -4.44873046875, -3.496826171875, -2.544921875, -1.593017578125, -0.64111328125, 0.310791015625, 1.2626953125, 2.214599609375, 3.16650390625, 4.118408203125, 5.0703125, 6.022216796875, 6.97412109375, 7.926025390625, 8.8779296875, 9.829833984375, 10.78173828125, 11.733642578125, 12.685546875, 13.637451171875, 14.58935546875, 15.541259765625, 16.4931640625, 17.445068359375, 18.39697265625, 19.348876953125, 20.30078125, 21.252685546875, 22.20458984375, 23.156494140625, 24.1083984375, 25.060302734375, 26.01220703125, 26.964111328125, 27.916015625, 28.867919921875, 29.81982421875, 30.771728515625, 31.7236328125, 32.675537109375, 33.62744140625, 34.579345703125, 35.53125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 15.0, 17.0, 28.0, 25.0, 63.0, 86.0, 125.0, 218.0, 438.0, 837.0, 1869.0, 4775.0, 14118.0, 52428.0, 1022673.0, 2992603.0, 75702.0, 17965.0, 5885.0, 2293.0, 985.0, 436.0, 263.0, 138.0, 101.0, 66.0, 31.0, 23.0, 17.0, 16.0, 5.0, 11.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.40625, -40.841796875, -39.27734375, -37.712890625, -36.1484375, -34.583984375, -33.01953125, -31.455078125, -29.890625, -28.326171875, -26.76171875, -25.197265625, -23.6328125, -22.068359375, -20.50390625, -18.939453125, -17.375, -15.810546875, -14.24609375, -12.681640625, -11.1171875, -9.552734375, -7.98828125, -6.423828125, -4.859375, -3.294921875, -1.73046875, -0.166015625, 1.3984375, 2.962890625, 4.52734375, 6.091796875, 7.65625, 9.220703125, 10.78515625, 12.349609375, 13.9140625, 15.478515625, 17.04296875, 18.607421875, 20.171875, 21.736328125, 23.30078125, 24.865234375, 26.4296875, 27.994140625, 29.55859375, 31.123046875, 32.6875, 34.251953125, 35.81640625, 37.380859375, 38.9453125, 40.509765625, 42.07421875, 43.638671875, 45.203125, 46.767578125, 48.33203125, 49.896484375, 51.4609375, 53.025390625, 54.58984375, 56.154296875, 57.71875]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 9.0, 16.0, 39.0, 99.0, 177.0, 309.0, 223.0, 68.0, 36.0, 16.0, 8.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.44499206542969, -43.59242248535156, -37.73985290527344, -31.887279510498047, -26.034709930419922, -20.182140350341797, -14.329566955566406, -8.476997375488281, -2.6244277954101562, 3.228142738342285, 9.080713272094727, 14.933284759521484, 20.78585433959961, 26.638423919677734, 32.490997314453125, 38.34356689453125, 44.196136474609375, 50.0487060546875, 55.901275634765625, 61.753849029541016, 67.60641479492188, 73.458984375, 79.31156158447266, 85.16413116455078, 91.0167007446289, 96.86927032470703, 102.72183990478516, 108.57441711425781, 114.42698669433594, 120.27955627441406, 126.13212585449219, 131.9846954345703, 137.83724975585938, 143.6898193359375, 149.54238891601562, 155.39495849609375, 161.24752807617188, 167.10009765625, 172.95266723632812, 178.80523681640625, 184.65780639648438, 190.5103759765625, 196.36294555664062, 202.21551513671875, 208.06808471679688, 213.920654296875, 219.77322387695312, 225.62579345703125, 231.47837829589844, 237.33094787597656, 243.1835174560547, 249.0360870361328, 254.88865661621094, 260.7412414550781, 266.59381103515625, 272.4463806152344, 278.2989501953125, 284.1515197753906, 290.00408935546875, 295.8566589355469, 301.709228515625, 307.5617980957031, 313.41436767578125, 319.2669372558594, 325.1195068359375]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 10.0, 6.0, 13.0, 14.0, 12.0, 14.0, 25.0, 20.0, 23.0, 21.0, 28.0, 28.0, 30.0, 32.0, 24.0, 30.0, 35.0, 37.0, 43.0, 38.0, 41.0, 39.0, 41.0, 41.0, 42.0, 41.0, 27.0, 37.0, 22.0, 27.0, 21.0, 27.0, 16.0, 17.0, 9.0, 11.0, 8.0, 5.0, 6.0, 7.0, 1.0, 8.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-79.05381774902344, -76.65140533447266, -74.24899291992188, -71.84658813476562, -69.44417572021484, -67.04176330566406, -64.63935089111328, -62.2369384765625, -59.834529876708984, -57.4321174621582, -55.02970886230469, -52.627296447753906, -50.224884033203125, -47.82247543334961, -45.42006301879883, -43.01765441894531, -40.61524200439453, -38.21282958984375, -35.810420989990234, -33.40800857543945, -31.005598068237305, -28.603187561035156, -26.200775146484375, -23.798364639282227, -21.395954132080078, -18.99354362487793, -16.59113311767578, -14.188720703125, -11.786310195922852, -9.383899688720703, -6.981488227844238, -4.579076766967773, -2.176666259765625, 0.22574472427368164, 2.6281557083129883, 5.030566692352295, 7.432977676391602, 9.83538818359375, 12.237799644470215, 14.64021110534668, 17.042621612548828, 19.445032119750977, 21.847442626953125, 24.249855041503906, 26.652265548706055, 29.054676055908203, 31.457088470458984, 33.8594970703125, 36.26190948486328, 38.66432189941406, 41.06673049926758, 43.46914291381836, 45.871551513671875, 48.273963928222656, 50.67637634277344, 53.07878875732422, 55.481197357177734, 57.883609771728516, 60.28601837158203, 62.68843078613281, 65.0908432006836, 67.49325561523438, 69.89566040039062, 72.2980728149414, 74.70048522949219]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 5.0, 9.0, 7.0, 7.0, 15.0, 8.0, 10.0, 14.0, 17.0, 16.0, 24.0, 37.0, 29.0, 35.0, 38.0, 62.0, 50.0, 70.0, 66.0, 68.0, 62.0, 55.0, 40.0, 35.0, 26.0, 20.0, 23.0, 28.0, 20.0, 17.0, 14.0, 13.0, 5.0, 8.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.3724365234375, -8.088623046875, -7.8048095703125, -7.52099609375, -7.2371826171875, -6.953369140625, -6.6695556640625, -6.3857421875, -6.1019287109375, -5.818115234375, -5.5343017578125, -5.25048828125, -4.9666748046875, -4.682861328125, -4.3990478515625, -4.115234375, -3.8314208984375, -3.547607421875, -3.2637939453125, -2.97998046875, -2.6961669921875, -2.412353515625, -2.1285400390625, -1.8447265625, -1.5609130859375, -1.277099609375, -0.9932861328125, -0.70947265625, -0.4256591796875, -0.141845703125, 0.1419677734375, 0.42578125, 0.7095947265625, 0.993408203125, 1.2772216796875, 1.56103515625, 1.8448486328125, 2.128662109375, 2.4124755859375, 2.6962890625, 2.9801025390625, 3.263916015625, 3.5477294921875, 3.83154296875, 4.1153564453125, 4.399169921875, 4.6829833984375, 4.966796875, 5.2506103515625, 5.534423828125, 5.8182373046875, 6.10205078125, 6.3858642578125, 6.669677734375, 6.9534912109375, 7.2373046875, 7.5211181640625, 7.804931640625, 8.0887451171875, 8.37255859375, 8.6563720703125, 8.940185546875, 9.2239990234375, 9.5078125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 13.0, 16.0, 21.0, 29.0, 42.0, 58.0, 92.0, 140.0, 198.0, 291.0, 383.0, 602.0, 903.0, 1415.0, 2069.0, 3244.0, 5069.0, 7863.0, 12682.0, 20447.0, 33906.0, 58124.0, 105139.0, 200613.0, 265556.0, 140401.0, 76671.0, 43141.0, 25716.0, 15952.0, 9848.0, 6182.0, 4023.0, 2674.0, 1643.0, 1087.0, 731.0, 520.0, 318.0, 222.0, 157.0, 115.0, 79.0, 51.0, 30.0, 30.0, 20.0, 8.0, 5.0, 8.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1685791015625, -0.16334915161132812, -0.15811920166015625, -0.15288925170898438, -0.1476593017578125, -0.14242935180664062, -0.13719940185546875, -0.13196945190429688, -0.126739501953125, -0.12150955200195312, -0.11627960205078125, -0.11104965209960938, -0.1058197021484375, -0.10058975219726562, -0.09535980224609375, -0.09012985229492188, -0.08489990234375, -0.07966995239257812, -0.07444000244140625, -0.06921005249023438, -0.0639801025390625, -0.058750152587890625, -0.05352020263671875, -0.048290252685546875, -0.043060302734375, -0.037830352783203125, -0.03260040283203125, -0.027370452880859375, -0.0221405029296875, -0.016910552978515625, -0.01168060302734375, -0.006450653076171875, -0.001220703125, 0.004009246826171875, 0.00923919677734375, 0.014469146728515625, 0.0196990966796875, 0.024929046630859375, 0.03015899658203125, 0.035388946533203125, 0.040618896484375, 0.045848846435546875, 0.05107879638671875, 0.056308746337890625, 0.0615386962890625, 0.06676864624023438, 0.07199859619140625, 0.07722854614257812, 0.08245849609375, 0.08768844604492188, 0.09291839599609375, 0.09814834594726562, 0.1033782958984375, 0.10860824584960938, 0.11383819580078125, 0.11906814575195312, 0.124298095703125, 0.12952804565429688, 0.13475799560546875, 0.13998794555664062, 0.1452178955078125, 0.15044784545898438, 0.15567779541015625, 0.16090774536132812, 0.1661376953125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 7.0, 6.0, 7.0, 6.0, 9.0, 11.0, 19.0, 19.0, 22.0, 18.0, 27.0, 32.0, 27.0, 42.0, 32.0, 32.0, 48.0, 47.0, 41.0, 1066.0, 52.0, 50.0, 41.0, 48.0, 34.0, 41.0, 33.0, 25.0, 28.0, 29.0, 22.0, 14.0, 14.0, 9.0, 12.0, 8.0, 12.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.50140380859375, -4.3660888671875, -4.23077392578125, -4.095458984375, -3.96014404296875, -3.8248291015625, -3.68951416015625, -3.55419921875, -3.41888427734375, -3.2835693359375, -3.14825439453125, -3.012939453125, -2.87762451171875, -2.7423095703125, -2.60699462890625, -2.4716796875, -2.33636474609375, -2.2010498046875, -2.06573486328125, -1.930419921875, -1.79510498046875, -1.6597900390625, -1.52447509765625, -1.38916015625, -1.25384521484375, -1.1185302734375, -0.98321533203125, -0.847900390625, -0.71258544921875, -0.5772705078125, -0.44195556640625, -0.306640625, -0.17132568359375, -0.0360107421875, 0.09930419921875, 0.234619140625, 0.36993408203125, 0.5052490234375, 0.64056396484375, 0.77587890625, 0.91119384765625, 1.0465087890625, 1.18182373046875, 1.317138671875, 1.45245361328125, 1.5877685546875, 1.72308349609375, 1.8583984375, 1.99371337890625, 2.1290283203125, 2.26434326171875, 2.399658203125, 2.53497314453125, 2.6702880859375, 2.80560302734375, 2.94091796875, 3.07623291015625, 3.2115478515625, 3.34686279296875, 3.482177734375, 3.61749267578125, 3.7528076171875, 3.88812255859375, 4.0234375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 7.0, 2.0, 7.0, 9.0, 12.0, 19.0, 30.0, 31.0, 67.0, 93.0, 134.0, 203.0, 246.0, 413.0, 540.0, 826.0, 1162.0, 1765.0, 2486.0, 3837.0, 5561.0, 8392.0, 12643.0, 18930.0, 28477.0, 43976.0, 66942.0, 106046.0, 169602.0, 1250352.0, 132505.0, 83545.0, 53693.0, 35029.0, 23111.0, 15461.0, 10020.0, 6748.0, 4483.0, 3084.0, 2017.0, 1439.0, 972.0, 729.0, 440.0, 329.0, 207.0, 162.0, 119.0, 81.0, 59.0, 44.0, 26.0, 9.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0650634765625, -0.06304550170898438, -0.06102752685546875, -0.059009552001953125, -0.0569915771484375, -0.054973602294921875, -0.05295562744140625, -0.050937652587890625, -0.048919677734375, -0.046901702880859375, -0.04488372802734375, -0.042865753173828125, -0.0408477783203125, -0.038829803466796875, -0.03681182861328125, -0.034793853759765625, -0.03277587890625, -0.030757904052734375, -0.02873992919921875, -0.026721954345703125, -0.0247039794921875, -0.022686004638671875, -0.02066802978515625, -0.018650054931640625, -0.016632080078125, -0.014614105224609375, -0.01259613037109375, -0.010578155517578125, -0.0085601806640625, -0.006542205810546875, -0.00452423095703125, -0.002506256103515625, -0.00048828125, 0.001529693603515625, 0.00354766845703125, 0.005565643310546875, 0.0075836181640625, 0.009601593017578125, 0.01161956787109375, 0.013637542724609375, 0.015655517578125, 0.017673492431640625, 0.01969146728515625, 0.021709442138671875, 0.0237274169921875, 0.025745391845703125, 0.02776336669921875, 0.029781341552734375, 0.03179931640625, 0.033817291259765625, 0.03583526611328125, 0.037853240966796875, 0.0398712158203125, 0.041889190673828125, 0.04390716552734375, 0.045925140380859375, 0.047943115234375, 0.049961090087890625, 0.05197906494140625, 0.053997039794921875, 0.0560150146484375, 0.058032989501953125, 0.06005096435546875, 0.062068939208984375, 0.0640869140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 4.0, 7.0, 7.0, 6.0, 12.0, 21.0, 18.0, 20.0, 26.0, 31.0, 38.0, 45.0, 62.0, 70.0, 74.0, 67.0, 77.0, 61.0, 60.0, 40.0, 50.0, 37.0, 30.0, 16.0, 25.0, 19.0, 17.0, 14.0, 5.0, 4.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.00015294551849365234, -0.00014812685549259186, -0.00014330819249153137, -0.00013848952949047089, -0.0001336708664894104, -0.00012885220348834991, -0.00012403354048728943, -0.00011921487748622894, -0.00011439621448516846, -0.00010957755148410797, -0.00010475888848304749, -9.9940225481987e-05, -9.512156248092651e-05, -9.030289947986603e-05, -8.548423647880554e-05, -8.066557347774506e-05, -7.584691047668457e-05, -7.102824747562408e-05, -6.62095844745636e-05, -6.139092147350311e-05, -5.657225847244263e-05, -5.175359547138214e-05, -4.6934932470321655e-05, -4.211626946926117e-05, -3.7297606468200684e-05, -3.24789434671402e-05, -2.7660280466079712e-05, -2.2841617465019226e-05, -1.802295446395874e-05, -1.3204291462898254e-05, -8.385628461837769e-06, -3.5669654607772827e-06, 1.2516975402832031e-06, 6.070360541343689e-06, 1.0889023542404175e-05, 1.570768654346466e-05, 2.0526349544525146e-05, 2.5345012545585632e-05, 3.0163675546646118e-05, 3.4982338547706604e-05, 3.980100154876709e-05, 4.4619664549827576e-05, 4.943832755088806e-05, 5.425699055194855e-05, 5.907565355300903e-05, 6.389431655406952e-05, 6.871297955513e-05, 7.353164255619049e-05, 7.835030555725098e-05, 8.316896855831146e-05, 8.798763155937195e-05, 9.280629456043243e-05, 9.762495756149292e-05, 0.0001024436205625534, 0.00010726228356361389, 0.00011208094656467438, 0.00011689960956573486, 0.00012171827256679535, 0.00012653693556785583, 0.00013135559856891632, 0.0001361742615699768, 0.0001409929245710373, 0.00014581158757209778, 0.00015063025057315826, 0.00015544891357421875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 11.0, 7.0, 13.0, 19.0, 15.0, 26.0, 16.0, 33.0, 36.0, 61.0, 78.0, 90.0, 87.0, 134.0, 173.0, 224.0, 349.0, 1076.0, 35244.0, 999309.0, 9600.0, 678.0, 299.0, 199.0, 152.0, 135.0, 100.0, 72.0, 69.0, 58.0, 45.0, 22.0, 22.0, 19.0, 18.0, 20.0, 10.0, 7.0, 3.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0], "bins": [-0.00244903564453125, -0.0023733675479888916, -0.002297699451446533, -0.002222031354904175, -0.0021463632583618164, -0.002070695161819458, -0.0019950270652770996, -0.0019193589687347412, -0.0018436908721923828, -0.0017680227756500244, -0.001692354679107666, -0.0016166865825653076, -0.0015410184860229492, -0.0014653503894805908, -0.0013896822929382324, -0.001314014196395874, -0.0012383460998535156, -0.0011626780033111572, -0.0010870099067687988, -0.0010113418102264404, -0.000935673713684082, -0.0008600056171417236, -0.0007843375205993652, -0.0007086694240570068, -0.0006330013275146484, -0.00055733323097229, -0.00048166513442993164, -0.00040599703788757324, -0.00033032894134521484, -0.00025466084480285645, -0.00017899274826049805, -0.00010332465171813965, -2.765655517578125e-05, 4.801154136657715e-05, 0.00012367963790893555, 0.00019934773445129395, 0.00027501583099365234, 0.00035068392753601074, 0.00042635202407836914, 0.0005020201206207275, 0.0005776882171630859, 0.0006533563137054443, 0.0007290244102478027, 0.0008046925067901611, 0.0008803606033325195, 0.0009560286998748779, 0.0010316967964172363, 0.0011073648929595947, 0.0011830329895019531, 0.0012587010860443115, 0.00133436918258667, 0.0014100372791290283, 0.0014857053756713867, 0.0015613734722137451, 0.0016370415687561035, 0.001712709665298462, 0.0017883777618408203, 0.0018640458583831787, 0.0019397139549255371, 0.0020153820514678955, 0.002091050148010254, 0.0021667182445526123, 0.0022423863410949707, 0.002318054437637329, 0.0023937225341796875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 21.0, 82.0, 391.0, 362.0, 85.0, 37.0, 12.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.0005354912136681378, -0.0005259194294922054, -0.0005163475871086121, -0.0005067758029326797, -0.0004972039605490863, -0.00048763214726932347, -0.0004780603339895606, -0.00046848852070979774, -0.0004589167074300349, -0.000449344894150272, -0.00043977308087050915, -0.0004302012675907463, -0.0004206294543109834, -0.00041105764103122056, -0.0004014858277514577, -0.0003919140144716948, -0.00038234220119193196, -0.0003727703879121691, -0.00036319857463240623, -0.00035362676135264337, -0.0003440549480728805, -0.00033448313479311764, -0.0003249113215133548, -0.0003153395082335919, -0.0003057677240576595, -0.00029619591077789664, -0.0002866240974981338, -0.0002770522842183709, -0.00026748047093860805, -0.0002579086576588452, -0.0002483368443790823, -0.00023876503109931946, -0.00022919323237147182, -0.00021962141909170896, -0.0002100496058119461, -0.00020047779253218323, -0.00019090597925242037, -0.0001813341659726575, -0.00017176236724480987, -0.000162190553965047, -0.00015261874068528414, -0.00014304692740552127, -0.0001334751141257584, -0.00012390330084599555, -0.00011433148756623268, -0.00010475967428646982, -9.518786828266457e-05, -8.56160550029017e-05, -7.604423444718122e-05, -6.647242116741836e-05, -5.6900607887655497e-05, -4.732879824587144e-05, -3.7756984966108575e-05, -2.818517168634571e-05, -1.8613362044561654e-05, -9.04154876479879e-06, 5.302645149640739e-07, 1.0102076885232236e-05, 1.96738892555004e-05, 2.924570071627386e-05, 3.881751399603672e-05, 4.838932727579959e-05, 5.7961136917583644e-05, 6.753295019734651e-05, 7.710476347710937e-05]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 8.0, 10.0, 10.0, 9.0, 10.0, 15.0, 23.0, 27.0, 28.0, 28.0, 27.0, 29.0, 36.0, 51.0, 48.0, 29.0, 51.0, 43.0, 48.0, 43.0, 39.0, 41.0, 41.0, 28.0, 34.0, 32.0, 22.0, 35.0, 31.0, 24.0, 10.0, 14.0, 11.0, 8.0, 13.0, 11.0, 4.0, 6.0, 6.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.738040924072266e-05, -8.438806980848312e-05, -8.139573037624359e-05, -7.840339094400406e-05, -7.541105151176453e-05, -7.2418712079525e-05, -6.942637264728546e-05, -6.643403321504593e-05, -6.34416937828064e-05, -6.0449354350566864e-05, -5.745701491832733e-05, -5.44646754860878e-05, -5.1472336053848267e-05, -4.8479996621608734e-05, -4.54876571893692e-05, -4.249531775712967e-05, -3.950297832489014e-05, -3.6510638892650604e-05, -3.351829946041107e-05, -3.052596002817154e-05, -2.7533620595932007e-05, -2.4541281163692474e-05, -2.1548941731452942e-05, -1.855660229921341e-05, -1.5564262866973877e-05, -1.2571923434734344e-05, -9.579584002494812e-06, -6.5872445702552795e-06, -3.594905138015747e-06, -6.025657057762146e-07, 2.389773726463318e-06, 5.38211315870285e-06, 8.374452590942383e-06, 1.1366792023181915e-05, 1.4359131455421448e-05, 1.735147088766098e-05, 2.0343810319900513e-05, 2.3336149752140045e-05, 2.6328489184379578e-05, 2.932082861661911e-05, 3.231316804885864e-05, 3.5305507481098175e-05, 3.829784691333771e-05, 4.129018634557724e-05, 4.428252577781677e-05, 4.7274865210056305e-05, 5.026720464229584e-05, 5.325954407453537e-05, 5.62518835067749e-05, 5.9244222939014435e-05, 6.223656237125397e-05, 6.52289018034935e-05, 6.822124123573303e-05, 7.121358066797256e-05, 7.42059201002121e-05, 7.719825953245163e-05, 8.019059896469116e-05, 8.31829383969307e-05, 8.617527782917023e-05, 8.916761726140976e-05, 9.215995669364929e-05, 9.515229612588882e-05, 9.814463555812836e-05, 0.00010113697499036789, 0.00010412931442260742]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 5.0, 9.0, 7.0, 7.0, 15.0, 8.0, 10.0, 14.0, 17.0, 16.0, 24.0, 37.0, 29.0, 35.0, 38.0, 62.0, 50.0, 70.0, 66.0, 68.0, 62.0, 55.0, 40.0, 35.0, 26.0, 20.0, 23.0, 28.0, 20.0, 17.0, 14.0, 13.0, 5.0, 8.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.3724365234375, -8.088623046875, -7.8048095703125, -7.52099609375, -7.2371826171875, -6.953369140625, -6.6695556640625, -6.3857421875, -6.1019287109375, -5.818115234375, -5.5343017578125, -5.25048828125, -4.9666748046875, -4.682861328125, -4.3990478515625, -4.115234375, -3.8314208984375, -3.547607421875, -3.2637939453125, -2.97998046875, -2.6961669921875, -2.412353515625, -2.1285400390625, -1.8447265625, -1.5609130859375, -1.277099609375, -0.9932861328125, -0.70947265625, -0.4256591796875, -0.141845703125, 0.1419677734375, 0.42578125, 0.7095947265625, 0.993408203125, 1.2772216796875, 1.56103515625, 1.8448486328125, 2.128662109375, 2.4124755859375, 2.6962890625, 2.9801025390625, 3.263916015625, 3.5477294921875, 3.83154296875, 4.1153564453125, 4.399169921875, 4.6829833984375, 4.966796875, 5.2506103515625, 5.534423828125, 5.8182373046875, 6.10205078125, 6.3858642578125, 6.669677734375, 6.9534912109375, 7.2373046875, 7.5211181640625, 7.804931640625, 8.0887451171875, 8.37255859375, 8.6563720703125, 8.940185546875, 9.2239990234375, 9.5078125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 2.0, 7.0, 3.0, 6.0, 9.0, 10.0, 21.0, 26.0, 39.0, 47.0, 93.0, 111.0, 172.0, 251.0, 364.0, 525.0, 771.0, 1273.0, 2559.0, 7108.0, 52627.0, 909271.0, 59406.0, 7361.0, 2642.0, 1369.0, 805.0, 507.0, 371.0, 247.0, 172.0, 117.0, 88.0, 47.0, 50.0, 17.0, 16.0, 14.0, 11.0, 5.0, 2.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.453125, -19.782958984375, -19.11279296875, -18.442626953125, -17.7724609375, -17.102294921875, -16.43212890625, -15.761962890625, -15.091796875, -14.421630859375, -13.75146484375, -13.081298828125, -12.4111328125, -11.740966796875, -11.07080078125, -10.400634765625, -9.73046875, -9.060302734375, -8.39013671875, -7.719970703125, -7.0498046875, -6.379638671875, -5.70947265625, -5.039306640625, -4.369140625, -3.698974609375, -3.02880859375, -2.358642578125, -1.6884765625, -1.018310546875, -0.34814453125, 0.322021484375, 0.9921875, 1.662353515625, 2.33251953125, 3.002685546875, 3.6728515625, 4.343017578125, 5.01318359375, 5.683349609375, 6.353515625, 7.023681640625, 7.69384765625, 8.364013671875, 9.0341796875, 9.704345703125, 10.37451171875, 11.044677734375, 11.71484375, 12.385009765625, 13.05517578125, 13.725341796875, 14.3955078125, 15.065673828125, 15.73583984375, 16.406005859375, 17.076171875, 17.746337890625, 18.41650390625, 19.086669921875, 19.7568359375, 20.427001953125, 21.09716796875, 21.767333984375, 22.4375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 6.0, 9.0, 11.0, 15.0, 14.0, 18.0, 33.0, 27.0, 29.0, 31.0, 40.0, 35.0, 34.0, 45.0, 60.0, 106.0, 1716.0, 268.0, 85.0, 54.0, 44.0, 54.0, 35.0, 42.0, 28.0, 28.0, 30.0, 20.0, 15.0, 14.0, 15.0, 20.0, 12.0, 9.0, 4.0, 7.0, 4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-30.640625, -29.706298828125, -28.77197265625, -27.837646484375, -26.9033203125, -25.968994140625, -25.03466796875, -24.100341796875, -23.166015625, -22.231689453125, -21.29736328125, -20.363037109375, -19.4287109375, -18.494384765625, -17.56005859375, -16.625732421875, -15.69140625, -14.757080078125, -13.82275390625, -12.888427734375, -11.9541015625, -11.019775390625, -10.08544921875, -9.151123046875, -8.216796875, -7.282470703125, -6.34814453125, -5.413818359375, -4.4794921875, -3.545166015625, -2.61083984375, -1.676513671875, -0.7421875, 0.192138671875, 1.12646484375, 2.060791015625, 2.9951171875, 3.929443359375, 4.86376953125, 5.798095703125, 6.732421875, 7.666748046875, 8.60107421875, 9.535400390625, 10.4697265625, 11.404052734375, 12.33837890625, 13.272705078125, 14.20703125, 15.141357421875, 16.07568359375, 17.010009765625, 17.9443359375, 18.878662109375, 19.81298828125, 20.747314453125, 21.681640625, 22.615966796875, 23.55029296875, 24.484619140625, 25.4189453125, 26.353271484375, 27.28759765625, 28.221923828125, 29.15625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 7.0, 17.0, 11.0, 18.0, 20.0, 21.0, 29.0, 27.0, 51.0, 71.0, 117.0, 219.0, 434.0, 974.0, 2438.0, 10508.0, 2923485.0, 198011.0, 5825.0, 1736.0, 754.0, 343.0, 178.0, 102.0, 67.0, 51.0, 49.0, 24.0, 23.0, 16.0, 15.0, 11.0, 6.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.5625, -46.02001953125, -44.4775390625, -42.93505859375, -41.392578125, -39.85009765625, -38.3076171875, -36.76513671875, -35.22265625, -33.68017578125, -32.1376953125, -30.59521484375, -29.052734375, -27.51025390625, -25.9677734375, -24.42529296875, -22.8828125, -21.34033203125, -19.7978515625, -18.25537109375, -16.712890625, -15.17041015625, -13.6279296875, -12.08544921875, -10.54296875, -9.00048828125, -7.4580078125, -5.91552734375, -4.373046875, -2.83056640625, -1.2880859375, 0.25439453125, 1.796875, 3.33935546875, 4.8818359375, 6.42431640625, 7.966796875, 9.50927734375, 11.0517578125, 12.59423828125, 14.13671875, 15.67919921875, 17.2216796875, 18.76416015625, 20.306640625, 21.84912109375, 23.3916015625, 24.93408203125, 26.4765625, 28.01904296875, 29.5615234375, 31.10400390625, 32.646484375, 34.18896484375, 35.7314453125, 37.27392578125, 38.81640625, 40.35888671875, 41.9013671875, 43.44384765625, 44.986328125, 46.52880859375, 48.0712890625, 49.61376953125, 51.15625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 54.0, 385.0, 496.0, 61.0, 11.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.58192443847656, -109.81767272949219, -104.05342864990234, -98.28917694091797, -92.52493286132812, -86.76068115234375, -80.99642944335938, -75.23218536376953, -69.46794128417969, -63.70369338989258, -57.93944549560547, -52.175193786621094, -46.41094970703125, -40.646697998046875, -34.882450103759766, -29.118202209472656, -23.35395050048828, -17.589702606201172, -11.825453758239746, -6.06120491027832, -0.29695701599121094, 5.467290878295898, 11.23154067993164, 16.99578857421875, 22.76003646850586, 28.52428436279297, 34.28853225708008, 40.05278015136719, 45.81703186035156, 51.581275939941406, 57.34552764892578, 63.10977554321289, 68.8740234375, 74.63827514648438, 80.40251922607422, 86.1667709350586, 91.93101501464844, 97.69526672363281, 103.45951843261719, 109.22376251220703, 114.98800659179688, 120.75225830078125, 126.5165023803711, 132.28074645996094, 138.0449981689453, 143.8092498779297, 149.57350158691406, 155.33773803710938, 161.10198974609375, 166.86624145507812, 172.6304931640625, 178.3947296142578, 184.1589813232422, 189.92323303222656, 195.68748474121094, 201.45172119140625, 207.2159881591797, 212.98023986816406, 218.74449157714844, 224.50872802734375, 230.27297973632812, 236.0372314453125, 241.80148315429688, 247.56573486328125, 253.32997131347656]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 7.0, 12.0, 13.0, 18.0, 26.0, 24.0, 21.0, 21.0, 22.0, 33.0, 31.0, 40.0, 42.0, 39.0, 34.0, 42.0, 52.0, 55.0, 36.0, 46.0, 33.0, 43.0, 33.0, 38.0, 35.0, 31.0, 28.0, 23.0, 25.0, 16.0, 6.0, 18.0, 8.0, 5.0, 9.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-103.51428985595703, -100.1222915649414, -96.73029327392578, -93.33828735351562, -89.9462890625, -86.55429077148438, -83.16229248046875, -79.77029418945312, -76.3782958984375, -72.98629760742188, -69.59429931640625, -66.20230102539062, -62.81029510498047, -59.418296813964844, -56.02629852294922, -52.634300231933594, -49.24229431152344, -45.85029602050781, -42.45829391479492, -39.0662956237793, -35.674293518066406, -32.28229522705078, -28.890296936035156, -25.4982967376709, -22.10629653930664, -18.714296340942383, -15.322297096252441, -11.9302978515625, -8.538297653198242, -5.146297454833984, -1.7542991638183594, 1.6377010345458984, 5.029701232910156, 8.421701431274414, 11.813700675964355, 15.205699920654297, 18.597700119018555, 21.989700317382812, 25.381698608398438, 28.773698806762695, 32.16569900512695, 35.55769729614258, 38.94969940185547, 42.341697692871094, 45.73369598388672, 49.12569808959961, 52.517696380615234, 55.909698486328125, 59.30169677734375, 62.693695068359375, 66.085693359375, 69.47769165039062, 72.86969757080078, 76.2616958618164, 79.65369415283203, 83.04569244384766, 86.43769836425781, 89.82969665527344, 93.22169494628906, 96.61369323730469, 100.00569915771484, 103.39769744873047, 106.7896957397461, 110.18169403076172, 113.57369232177734]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 2.0, 7.0, 4.0, 4.0, 7.0, 13.0, 8.0, 10.0, 14.0, 10.0, 17.0, 24.0, 22.0, 22.0, 41.0, 37.0, 46.0, 57.0, 54.0, 63.0, 71.0, 58.0, 64.0, 57.0, 42.0, 31.0, 32.0, 21.0, 29.0, 22.0, 17.0, 20.0, 11.0, 13.0, 9.0, 6.0, 4.0, 5.0, 7.0, 8.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.921875, -8.62890625, -8.3359375, -8.04296875, -7.75, -7.45703125, -7.1640625, -6.87109375, -6.578125, -6.28515625, -5.9921875, -5.69921875, -5.40625, -5.11328125, -4.8203125, -4.52734375, -4.234375, -3.94140625, -3.6484375, -3.35546875, -3.0625, -2.76953125, -2.4765625, -2.18359375, -1.890625, -1.59765625, -1.3046875, -1.01171875, -0.71875, -0.42578125, -0.1328125, 0.16015625, 0.453125, 0.74609375, 1.0390625, 1.33203125, 1.625, 1.91796875, 2.2109375, 2.50390625, 2.796875, 3.08984375, 3.3828125, 3.67578125, 3.96875, 4.26171875, 4.5546875, 4.84765625, 5.140625, 5.43359375, 5.7265625, 6.01953125, 6.3125, 6.60546875, 6.8984375, 7.19140625, 7.484375, 7.77734375, 8.0703125, 8.36328125, 8.65625, 8.94921875, 9.2421875, 9.53515625, 9.828125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 12.0, 6.0, 11.0, 22.0, 38.0, 41.0, 51.0, 74.0, 99.0, 162.0, 273.0, 332.0, 539.0, 841.0, 1310.0, 2376.0, 4371.0, 8819.0, 27489.0, 698260.0, 3317458.0, 104353.0, 13454.0, 5952.0, 3182.0, 1726.0, 1023.0, 659.0, 439.0, 286.0, 172.0, 140.0, 89.0, 59.0, 39.0, 29.0, 25.0, 16.0, 12.0, 10.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.234375, -30.201416015625, -29.16845703125, -28.135498046875, -27.1025390625, -26.069580078125, -25.03662109375, -24.003662109375, -22.970703125, -21.937744140625, -20.90478515625, -19.871826171875, -18.8388671875, -17.805908203125, -16.77294921875, -15.739990234375, -14.70703125, -13.674072265625, -12.64111328125, -11.608154296875, -10.5751953125, -9.542236328125, -8.50927734375, -7.476318359375, -6.443359375, -5.410400390625, -4.37744140625, -3.344482421875, -2.3115234375, -1.278564453125, -0.24560546875, 0.787353515625, 1.8203125, 2.853271484375, 3.88623046875, 4.919189453125, 5.9521484375, 6.985107421875, 8.01806640625, 9.051025390625, 10.083984375, 11.116943359375, 12.14990234375, 13.182861328125, 14.2158203125, 15.248779296875, 16.28173828125, 17.314697265625, 18.34765625, 19.380615234375, 20.41357421875, 21.446533203125, 22.4794921875, 23.512451171875, 24.54541015625, 25.578369140625, 26.611328125, 27.644287109375, 28.67724609375, 29.710205078125, 30.7431640625, 31.776123046875, 32.80908203125, 33.842041015625, 34.875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 11.0, 11.0, 21.0, 25.0, 42.0, 79.0, 156.0, 480.0, 1417.0, 1166.0, 349.0, 107.0, 55.0, 43.0, 29.0, 19.0, 15.0, 16.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.0625, -33.654296875, -32.24609375, -30.837890625, -29.4296875, -28.021484375, -26.61328125, -25.205078125, -23.796875, -22.388671875, -20.98046875, -19.572265625, -18.1640625, -16.755859375, -15.34765625, -13.939453125, -12.53125, -11.123046875, -9.71484375, -8.306640625, -6.8984375, -5.490234375, -4.08203125, -2.673828125, -1.265625, 0.142578125, 1.55078125, 2.958984375, 4.3671875, 5.775390625, 7.18359375, 8.591796875, 10.0, 11.408203125, 12.81640625, 14.224609375, 15.6328125, 17.041015625, 18.44921875, 19.857421875, 21.265625, 22.673828125, 24.08203125, 25.490234375, 26.8984375, 28.306640625, 29.71484375, 31.123046875, 32.53125, 33.939453125, 35.34765625, 36.755859375, 38.1640625, 39.572265625, 40.98046875, 42.388671875, 43.796875, 45.205078125, 46.61328125, 48.021484375, 49.4296875, 50.837890625, 52.24609375, 53.654296875, 55.0625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 15.0, 15.0, 33.0, 61.0, 90.0, 160.0, 396.0, 1100.0, 4279.0, 29231.0, 3601926.0, 536361.0, 16346.0, 2785.0, 837.0, 300.0, 136.0, 94.0, 48.0, 18.0, 17.0, 4.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.3125, -102.4560546875, -99.599609375, -96.7431640625, -93.88671875, -91.0302734375, -88.173828125, -85.3173828125, -82.4609375, -79.6044921875, -76.748046875, -73.8916015625, -71.03515625, -68.1787109375, -65.322265625, -62.4658203125, -59.609375, -56.7529296875, -53.896484375, -51.0400390625, -48.18359375, -45.3271484375, -42.470703125, -39.6142578125, -36.7578125, -33.9013671875, -31.044921875, -28.1884765625, -25.33203125, -22.4755859375, -19.619140625, -16.7626953125, -13.90625, -11.0498046875, -8.193359375, -5.3369140625, -2.48046875, 0.3759765625, 3.232421875, 6.0888671875, 8.9453125, 11.8017578125, 14.658203125, 17.5146484375, 20.37109375, 23.2275390625, 26.083984375, 28.9404296875, 31.796875, 34.6533203125, 37.509765625, 40.3662109375, 43.22265625, 46.0791015625, 48.935546875, 51.7919921875, 54.6484375, 57.5048828125, 60.361328125, 63.2177734375, 66.07421875, 68.9306640625, 71.787109375, 74.6435546875, 77.5]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 12.0, 67.0, 384.0, 447.0, 76.0, 26.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-348.3537902832031, -335.4908447265625, -322.6278991699219, -309.76495361328125, -296.9020080566406, -284.0390625, -271.1761474609375, -258.31317138671875, -245.4502410888672, -232.58729553222656, -219.72434997558594, -206.86141967773438, -193.99847412109375, -181.13552856445312, -168.2725830078125, -155.40963745117188, -142.54669189453125, -129.68374633789062, -116.82080078125, -103.9578628540039, -91.09491729736328, -78.23197174072266, -65.36903381347656, -52.50608825683594, -39.64314270019531, -26.78019905090332, -13.917255401611328, -1.0543136596679688, 11.808631896972656, 24.67157745361328, 37.534515380859375, 50.3974609375, 63.260406494140625, 76.12335205078125, 88.98629760742188, 101.84923553466797, 114.7121810913086, 127.57512664794922, 140.4380645751953, 153.30101013183594, 166.16395568847656, 179.0269012451172, 191.8898468017578, 204.75277709960938, 217.61572265625, 230.47866821289062, 243.34161376953125, 256.2045593261719, 269.0675048828125, 281.9304504394531, 294.79339599609375, 307.6563415527344, 320.519287109375, 333.3822326660156, 346.24517822265625, 359.10809326171875, 371.9710693359375, 384.8340148925781, 397.69696044921875, 410.5599060058594, 423.4228515625, 436.2857971191406, 449.14874267578125, 462.01165771484375, 474.8746032714844]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 10.0, 8.0, 7.0, 15.0, 11.0, 7.0, 18.0, 18.0, 14.0, 21.0, 30.0, 34.0, 24.0, 38.0, 40.0, 33.0, 21.0, 29.0, 41.0, 39.0, 35.0, 38.0, 44.0, 37.0, 37.0, 41.0, 29.0, 32.0, 27.0, 27.0, 35.0, 18.0, 20.0, 21.0, 14.0, 14.0, 14.0, 13.0, 10.0, 6.0, 9.0, 6.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-78.59513092041016, -76.32500457763672, -74.05488586425781, -71.78475952148438, -69.51463317871094, -67.2445068359375, -64.9743881225586, -62.704261779785156, -60.434139251708984, -58.16401672363281, -55.893890380859375, -53.6237678527832, -51.35364532470703, -49.083518981933594, -46.81339645385742, -44.54327392578125, -42.27314758300781, -40.00302505493164, -37.7328987121582, -35.46277618408203, -33.192649841308594, -30.922527313232422, -28.65240478515625, -26.382280349731445, -24.11215591430664, -21.842031478881836, -19.57190704345703, -17.30178451538086, -15.031660079956055, -12.76153564453125, -10.491412162780762, -8.221288681030273, -5.9511566162109375, -3.681032657623291, -1.4109086990356445, 0.859215259552002, 3.1293392181396484, 5.399463653564453, 7.669587135314941, 9.93971061706543, 12.209835052490234, 14.479959487915039, 16.750083923339844, 19.020206451416016, 21.29033088684082, 23.560455322265625, 25.830577850341797, 28.1007022857666, 30.370826721191406, 32.64094924926758, 34.911075592041016, 37.18119812011719, 39.451324462890625, 41.7214469909668, 43.99156951904297, 46.261695861816406, 48.53181838989258, 50.80194091796875, 53.07206726074219, 55.34218978881836, 57.61231231689453, 59.88243865966797, 62.15256118774414, 64.42268371582031, 66.69281005859375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 4.0, 6.0, 10.0, 11.0, 6.0, 14.0, 14.0, 12.0, 16.0, 26.0, 34.0, 21.0, 30.0, 45.0, 49.0, 44.0, 65.0, 53.0, 69.0, 48.0, 54.0, 55.0, 35.0, 41.0, 33.0, 39.0, 25.0, 18.0, 15.0, 18.0, 18.0, 9.0, 14.0, 10.0, 8.0, 4.0, 4.0, 2.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0859375, -8.8060302734375, -8.526123046875, -8.2462158203125, -7.96630859375, -7.6864013671875, -7.406494140625, -7.1265869140625, -6.8466796875, -6.5667724609375, -6.286865234375, -6.0069580078125, -5.72705078125, -5.4471435546875, -5.167236328125, -4.8873291015625, -4.607421875, -4.3275146484375, -4.047607421875, -3.7677001953125, -3.48779296875, -3.2078857421875, -2.927978515625, -2.6480712890625, -2.3681640625, -2.0882568359375, -1.808349609375, -1.5284423828125, -1.24853515625, -0.9686279296875, -0.688720703125, -0.4088134765625, -0.12890625, 0.1510009765625, 0.430908203125, 0.7108154296875, 0.99072265625, 1.2706298828125, 1.550537109375, 1.8304443359375, 2.1103515625, 2.3902587890625, 2.670166015625, 2.9500732421875, 3.22998046875, 3.5098876953125, 3.789794921875, 4.0697021484375, 4.349609375, 4.6295166015625, 4.909423828125, 5.1893310546875, 5.46923828125, 5.7491455078125, 6.029052734375, 6.3089599609375, 6.5888671875, 6.8687744140625, 7.148681640625, 7.4285888671875, 7.70849609375, 7.9884033203125, 8.268310546875, 8.5482177734375, 8.828125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 11.0, 23.0, 21.0, 42.0, 57.0, 54.0, 99.0, 119.0, 215.0, 306.0, 377.0, 536.0, 776.0, 1119.0, 1593.0, 2320.0, 3214.0, 4743.0, 7189.0, 10487.0, 16367.0, 25248.0, 40103.0, 64931.0, 107957.0, 178207.0, 218938.0, 138440.0, 83256.0, 50114.0, 31307.0, 19854.0, 13069.0, 8577.0, 5915.0, 3894.0, 2781.0, 1831.0, 1316.0, 948.0, 660.0, 451.0, 321.0, 230.0, 134.0, 113.0, 91.0, 71.0, 37.0, 29.0, 23.0, 17.0, 7.0, 8.0, 6.0, 3.0, 1.0, 2.0], "bins": [-0.147705078125, -0.14312362670898438, -0.13854217529296875, -0.13396072387695312, -0.1293792724609375, -0.12479782104492188, -0.12021636962890625, -0.11563491821289062, -0.111053466796875, -0.10647201538085938, -0.10189056396484375, -0.09730911254882812, -0.0927276611328125, -0.08814620971679688, -0.08356475830078125, -0.07898330688476562, -0.07440185546875, -0.06982040405273438, -0.06523895263671875, -0.060657501220703125, -0.0560760498046875, -0.051494598388671875, -0.04691314697265625, -0.042331695556640625, -0.037750244140625, -0.033168792724609375, -0.02858734130859375, -0.024005889892578125, -0.0194244384765625, -0.014842987060546875, -0.01026153564453125, -0.005680084228515625, -0.0010986328125, 0.003482818603515625, 0.00806427001953125, 0.012645721435546875, 0.0172271728515625, 0.021808624267578125, 0.02639007568359375, 0.030971527099609375, 0.035552978515625, 0.040134429931640625, 0.04471588134765625, 0.049297332763671875, 0.0538787841796875, 0.058460235595703125, 0.06304168701171875, 0.06762313842773438, 0.07220458984375, 0.07678604125976562, 0.08136749267578125, 0.08594894409179688, 0.0905303955078125, 0.09511184692382812, 0.09969329833984375, 0.10427474975585938, 0.108856201171875, 0.11343765258789062, 0.11801910400390625, 0.12260055541992188, 0.1271820068359375, 0.13176345825195312, 0.13634490966796875, 0.14092636108398438, 0.1455078125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 10.0, 6.0, 3.0, 8.0, 6.0, 13.0, 12.0, 12.0, 13.0, 17.0, 18.0, 22.0, 19.0, 22.0, 22.0, 33.0, 34.0, 40.0, 33.0, 40.0, 55.0, 43.0, 1060.0, 39.0, 32.0, 49.0, 35.0, 39.0, 34.0, 32.0, 31.0, 25.0, 18.0, 29.0, 15.0, 13.0, 17.0, 16.0, 11.0, 8.0, 12.0, 6.0, 6.0, 7.0, 7.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.1640625, -4.03155517578125, -3.8990478515625, -3.76654052734375, -3.634033203125, -3.50152587890625, -3.3690185546875, -3.23651123046875, -3.10400390625, -2.97149658203125, -2.8389892578125, -2.70648193359375, -2.573974609375, -2.44146728515625, -2.3089599609375, -2.17645263671875, -2.0439453125, -1.91143798828125, -1.7789306640625, -1.64642333984375, -1.513916015625, -1.38140869140625, -1.2489013671875, -1.11639404296875, -0.98388671875, -0.85137939453125, -0.7188720703125, -0.58636474609375, -0.453857421875, -0.32135009765625, -0.1888427734375, -0.05633544921875, 0.076171875, 0.20867919921875, 0.3411865234375, 0.47369384765625, 0.606201171875, 0.73870849609375, 0.8712158203125, 1.00372314453125, 1.13623046875, 1.26873779296875, 1.4012451171875, 1.53375244140625, 1.666259765625, 1.79876708984375, 1.9312744140625, 2.06378173828125, 2.1962890625, 2.32879638671875, 2.4613037109375, 2.59381103515625, 2.726318359375, 2.85882568359375, 2.9913330078125, 3.12384033203125, 3.25634765625, 3.38885498046875, 3.5213623046875, 3.65386962890625, 3.786376953125, 3.91888427734375, 4.0513916015625, 4.18389892578125, 4.31640625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 6.0, 20.0, 18.0, 28.0, 35.0, 75.0, 111.0, 142.0, 192.0, 304.0, 374.0, 552.0, 822.0, 1129.0, 1591.0, 2174.0, 3037.0, 4247.0, 5870.0, 8328.0, 11657.0, 16433.0, 22950.0, 32903.0, 46501.0, 67251.0, 98673.0, 143971.0, 1216559.0, 126525.0, 86144.0, 58743.0, 40545.0, 28828.0, 20181.0, 14312.0, 10166.0, 7416.0, 5186.0, 3760.0, 2686.0, 1893.0, 1375.0, 994.0, 678.0, 503.0, 376.0, 269.0, 170.0, 143.0, 96.0, 73.0, 42.0, 31.0, 16.0, 8.0, 13.0, 8.0, 3.0, 5.0], "bins": [-0.0596923828125, -0.0578455924987793, -0.055998802185058594, -0.05415201187133789, -0.05230522155761719, -0.050458431243896484, -0.04861164093017578, -0.04676485061645508, -0.044918060302734375, -0.04307126998901367, -0.04122447967529297, -0.039377689361572266, -0.03753089904785156, -0.03568410873413086, -0.033837318420410156, -0.03199052810668945, -0.03014373779296875, -0.028296947479248047, -0.026450157165527344, -0.02460336685180664, -0.022756576538085938, -0.020909786224365234, -0.01906299591064453, -0.017216205596923828, -0.015369415283203125, -0.013522624969482422, -0.011675834655761719, -0.009829044342041016, -0.007982254028320312, -0.006135463714599609, -0.004288673400878906, -0.002441883087158203, -0.0005950927734375, 0.0012516975402832031, 0.0030984878540039062, 0.004945278167724609, 0.0067920684814453125, 0.008638858795166016, 0.010485649108886719, 0.012332439422607422, 0.014179229736328125, 0.016026020050048828, 0.01787281036376953, 0.019719600677490234, 0.021566390991210938, 0.02341318130493164, 0.025259971618652344, 0.027106761932373047, 0.02895355224609375, 0.030800342559814453, 0.032647132873535156, 0.03449392318725586, 0.03634071350097656, 0.038187503814697266, 0.04003429412841797, 0.04188108444213867, 0.043727874755859375, 0.04557466506958008, 0.04742145538330078, 0.049268245697021484, 0.05111503601074219, 0.05296182632446289, 0.054808616638183594, 0.0566554069519043, 0.058502197265625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 7.0, 6.0, 17.0, 28.0, 19.0, 28.0, 36.0, 53.0, 43.0, 69.0, 72.0, 76.0, 70.0, 77.0, 80.0, 51.0, 64.0, 52.0, 32.0, 28.0, 29.0, 14.0, 10.0, 14.0, 6.0, 6.0, 4.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027441978454589844, -0.00026644766330718994, -0.00025847554206848145, -0.00025050342082977295, -0.00024253129959106445, -0.00023455917835235596, -0.00022658705711364746, -0.00021861493587493896, -0.00021064281463623047, -0.00020267069339752197, -0.00019469857215881348, -0.00018672645092010498, -0.00017875432968139648, -0.000170782208442688, -0.0001628100872039795, -0.000154837965965271, -0.0001468658447265625, -0.000138893723487854, -0.0001309216022491455, -0.000122949481010437, -0.00011497735977172852, -0.00010700523853302002, -9.903311729431152e-05, -9.106099605560303e-05, -8.308887481689453e-05, -7.511675357818604e-05, -6.714463233947754e-05, -5.917251110076904e-05, -5.120038986206055e-05, -4.322826862335205e-05, -3.5256147384643555e-05, -2.728402614593506e-05, -1.9311904907226562e-05, -1.1339783668518066e-05, -3.3676624298095703e-06, 4.604458808898926e-06, 1.2576580047607422e-05, 2.0548701286315918e-05, 2.8520822525024414e-05, 3.649294376373291e-05, 4.4465065002441406e-05, 5.24371862411499e-05, 6.04093074798584e-05, 6.83814287185669e-05, 7.635354995727539e-05, 8.432567119598389e-05, 9.229779243469238e-05, 0.00010026991367340088, 0.00010824203491210938, 0.00011621415615081787, 0.00012418627738952637, 0.00013215839862823486, 0.00014013051986694336, 0.00014810264110565186, 0.00015607476234436035, 0.00016404688358306885, 0.00017201900482177734, 0.00017999112606048584, 0.00018796324729919434, 0.00019593536853790283, 0.00020390748977661133, 0.00021187961101531982, 0.00021985173225402832, 0.00022782385349273682, 0.0002357959747314453]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 6.0, 4.0, 12.0, 19.0, 24.0, 33.0, 58.0, 70.0, 107.0, 131.0, 186.0, 252.0, 302.0, 746.0, 13932.0, 1024165.0, 6674.0, 629.0, 304.0, 258.0, 159.0, 126.0, 104.0, 69.0, 51.0, 41.0, 26.0, 17.0, 10.0, 11.0, 11.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003814697265625, -0.0036893486976623535, -0.003564000129699707, -0.0034386515617370605, -0.003313302993774414, -0.0031879544258117676, -0.003062605857849121, -0.0029372572898864746, -0.002811908721923828, -0.0026865601539611816, -0.002561211585998535, -0.0024358630180358887, -0.002310514450073242, -0.0021851658821105957, -0.0020598173141479492, -0.0019344687461853027, -0.0018091201782226562, -0.0016837716102600098, -0.0015584230422973633, -0.0014330744743347168, -0.0013077259063720703, -0.0011823773384094238, -0.0010570287704467773, -0.0009316802024841309, -0.0008063316345214844, -0.0006809830665588379, -0.0005556344985961914, -0.0004302859306335449, -0.00030493736267089844, -0.00017958879470825195, -5.424022674560547e-05, 7.110834121704102e-05, 0.0001964569091796875, 0.000321805477142334, 0.00044715404510498047, 0.000572502613067627, 0.0006978511810302734, 0.0008231997489929199, 0.0009485483169555664, 0.0010738968849182129, 0.0011992454528808594, 0.0013245940208435059, 0.0014499425888061523, 0.0015752911567687988, 0.0017006397247314453, 0.0018259882926940918, 0.0019513368606567383, 0.0020766854286193848, 0.0022020339965820312, 0.0023273825645446777, 0.0024527311325073242, 0.0025780797004699707, 0.002703428268432617, 0.0028287768363952637, 0.00295412540435791, 0.0030794739723205566, 0.003204822540283203, 0.0033301711082458496, 0.003455519676208496, 0.0035808682441711426, 0.003706216812133789, 0.0038315653800964355, 0.003956913948059082, 0.0040822625160217285, 0.004207611083984375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 19.0, 592.0, 376.0, 27.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009625245584174991, -0.0009280359954573214, -0.0008935473742894828, -0.0008590588113293052, -0.0008245701901614666, -0.0007900816272012889, -0.0007555930642411113, -0.0007211044430732727, -0.000686615880113095, -0.0006521273171529174, -0.0006176386959850788, -0.0005831501330249012, -0.0005486615700647235, -0.0005141729488968849, -0.00047968438593670726, -0.00044519579387269914, -0.000410707201808691, -0.0003762186097446829, -0.0003417300176806748, -0.00030724145472049713, -0.000272752862656489, -0.0002382642705924809, -0.000203775693080388, -0.00016928711556829512, -0.000134798523504287, -0.0001003099387162365, -6.5821353928186e-05, -3.13327691401355e-05, 3.1558156479150057e-06, 3.764440771192312e-05, 7.213298522401601e-05, 0.0001066215627361089, 0.0001411100383847952, 0.0001755986304488033, 0.0002100872079608962, 0.0002445757854729891, 0.0002790643775369972, 0.0003135529696010053, 0.000348041532561183, 0.0003825301246251911, 0.0004170187166891992, 0.0004515073087532073, 0.00048599590081721544, 0.0005204844637773931, 0.0005549730267375708, 0.0005894616479054093, 0.000623950210865587, 0.0006584387738257647, 0.0006929273949936032, 0.0007274159579537809, 0.0007619045791216195, 0.0007963931420817971, 0.0008308817632496357, 0.0008653703262098134, 0.000899858889169991, 0.0009343475103378296, 0.0009688360732980072, 0.001003324636258185, 0.0010378132574260235, 0.001072301878593862, 0.0011067903833463788, 0.0011412790045142174, 0.001175767625682056, 0.0012102561304345727, 0.0012447447516024113]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 6.0, 2.0, 12.0, 11.0, 15.0, 15.0, 18.0, 19.0, 25.0, 25.0, 25.0, 25.0, 29.0, 27.0, 49.0, 38.0, 32.0, 29.0, 32.0, 49.0, 33.0, 44.0, 29.0, 36.0, 32.0, 36.0, 25.0, 36.0, 30.0, 31.0, 20.0, 25.0, 21.0, 17.0, 21.0, 10.0, 14.0, 7.0, 5.0, 6.0, 6.0, 4.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0001232624053955078, -0.00011950545012950897, -0.00011574849486351013, -0.00011199153959751129, -0.00010823458433151245, -0.00010447762906551361, -0.00010072067379951477, -9.696371853351593e-05, -9.320676326751709e-05, -8.944980800151825e-05, -8.569285273551941e-05, -8.193589746952057e-05, -7.817894220352173e-05, -7.442198693752289e-05, -7.066503167152405e-05, -6.690807640552521e-05, -6.315112113952637e-05, -5.939416587352753e-05, -5.5637210607528687e-05, -5.1880255341529846e-05, -4.8123300075531006e-05, -4.4366344809532166e-05, -4.0609389543533325e-05, -3.6852434277534485e-05, -3.3095479011535645e-05, -2.9338523745536804e-05, -2.5581568479537964e-05, -2.1824613213539124e-05, -1.8067657947540283e-05, -1.4310702681541443e-05, -1.0553747415542603e-05, -6.796792149543762e-06, -3.039836883544922e-06, 7.171183824539185e-07, 4.474073648452759e-06, 8.231028914451599e-06, 1.198798418045044e-05, 1.574493944644928e-05, 1.950189471244812e-05, 2.325884997844696e-05, 2.70158052444458e-05, 3.077276051044464e-05, 3.452971577644348e-05, 3.828667104244232e-05, 4.204362630844116e-05, 4.580058157444e-05, 4.955753684043884e-05, 5.331449210643768e-05, 5.7071447372436523e-05, 6.0828402638435364e-05, 6.45853579044342e-05, 6.834231317043304e-05, 7.209926843643188e-05, 7.585622370243073e-05, 7.961317896842957e-05, 8.33701342344284e-05, 8.712708950042725e-05, 9.088404476642609e-05, 9.464100003242493e-05, 9.839795529842377e-05, 0.00010215491056442261, 0.00010591186583042145, 0.00010966882109642029, 0.00011342577636241913, 0.00011718273162841797]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 4.0, 6.0, 10.0, 11.0, 6.0, 14.0, 14.0, 12.0, 16.0, 26.0, 34.0, 21.0, 30.0, 45.0, 49.0, 44.0, 65.0, 53.0, 69.0, 48.0, 54.0, 55.0, 35.0, 41.0, 33.0, 39.0, 25.0, 18.0, 15.0, 18.0, 18.0, 9.0, 14.0, 10.0, 8.0, 4.0, 4.0, 2.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0859375, -8.8060302734375, -8.526123046875, -8.2462158203125, -7.96630859375, -7.6864013671875, -7.406494140625, -7.1265869140625, -6.8466796875, -6.5667724609375, -6.286865234375, -6.0069580078125, -5.72705078125, -5.4471435546875, -5.167236328125, -4.8873291015625, -4.607421875, -4.3275146484375, -4.047607421875, -3.7677001953125, -3.48779296875, -3.2078857421875, -2.927978515625, -2.6480712890625, -2.3681640625, -2.0882568359375, -1.808349609375, -1.5284423828125, -1.24853515625, -0.9686279296875, -0.688720703125, -0.4088134765625, -0.12890625, 0.1510009765625, 0.430908203125, 0.7108154296875, 0.99072265625, 1.2706298828125, 1.550537109375, 1.8304443359375, 2.1103515625, 2.3902587890625, 2.670166015625, 2.9500732421875, 3.22998046875, 3.5098876953125, 3.789794921875, 4.0697021484375, 4.349609375, 4.6295166015625, 4.909423828125, 5.1893310546875, 5.46923828125, 5.7491455078125, 6.029052734375, 6.3089599609375, 6.5888671875, 6.8687744140625, 7.148681640625, 7.4285888671875, 7.70849609375, 7.9884033203125, 8.268310546875, 8.5482177734375, 8.828125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 3.0, 6.0, 10.0, 18.0, 20.0, 25.0, 26.0, 45.0, 52.0, 88.0, 93.0, 125.0, 162.0, 255.0, 360.0, 546.0, 820.0, 1244.0, 2252.0, 4049.0, 7867.0, 20317.0, 133324.0, 795785.0, 52976.0, 13671.0, 6022.0, 3120.0, 1843.0, 1136.0, 685.0, 457.0, 285.0, 215.0, 150.0, 125.0, 89.0, 75.0, 53.0, 43.0, 25.0, 21.0, 14.0, 13.0, 16.0, 11.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.0625, -14.6103515625, -14.158203125, -13.7060546875, -13.25390625, -12.8017578125, -12.349609375, -11.8974609375, -11.4453125, -10.9931640625, -10.541015625, -10.0888671875, -9.63671875, -9.1845703125, -8.732421875, -8.2802734375, -7.828125, -7.3759765625, -6.923828125, -6.4716796875, -6.01953125, -5.5673828125, -5.115234375, -4.6630859375, -4.2109375, -3.7587890625, -3.306640625, -2.8544921875, -2.40234375, -1.9501953125, -1.498046875, -1.0458984375, -0.59375, -0.1416015625, 0.310546875, 0.7626953125, 1.21484375, 1.6669921875, 2.119140625, 2.5712890625, 3.0234375, 3.4755859375, 3.927734375, 4.3798828125, 4.83203125, 5.2841796875, 5.736328125, 6.1884765625, 6.640625, 7.0927734375, 7.544921875, 7.9970703125, 8.44921875, 8.9013671875, 9.353515625, 9.8056640625, 10.2578125, 10.7099609375, 11.162109375, 11.6142578125, 12.06640625, 12.5185546875, 12.970703125, 13.4228515625, 13.875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 6.0, 5.0, 5.0, 5.0, 8.0, 10.0, 18.0, 17.0, 19.0, 25.0, 20.0, 26.0, 44.0, 41.0, 44.0, 49.0, 56.0, 57.0, 109.0, 1715.0, 260.0, 87.0, 60.0, 43.0, 49.0, 40.0, 31.0, 24.0, 32.0, 28.0, 24.0, 17.0, 12.0, 14.0, 4.0, 8.0, 9.0, 6.0, 4.0, 5.0, 3.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-33.1875, -32.234375, -31.28125, -30.328125, -29.375, -28.421875, -27.46875, -26.515625, -25.5625, -24.609375, -23.65625, -22.703125, -21.75, -20.796875, -19.84375, -18.890625, -17.9375, -16.984375, -16.03125, -15.078125, -14.125, -13.171875, -12.21875, -11.265625, -10.3125, -9.359375, -8.40625, -7.453125, -6.5, -5.546875, -4.59375, -3.640625, -2.6875, -1.734375, -0.78125, 0.171875, 1.125, 2.078125, 3.03125, 3.984375, 4.9375, 5.890625, 6.84375, 7.796875, 8.75, 9.703125, 10.65625, 11.609375, 12.5625, 13.515625, 14.46875, 15.421875, 16.375, 17.328125, 18.28125, 19.234375, 20.1875, 21.140625, 22.09375, 23.046875, 24.0, 24.953125, 25.90625, 26.859375, 27.8125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 6.0, 5.0, 9.0, 7.0, 4.0, 13.0, 15.0, 21.0, 27.0, 37.0, 47.0, 65.0, 80.0, 126.0, 286.0, 601.0, 1521.0, 6901.0, 88240.0, 3002830.0, 38095.0, 4433.0, 1152.0, 473.0, 257.0, 134.0, 82.0, 52.0, 41.0, 31.0, 24.0, 23.0, 13.0, 14.0, 12.0, 5.0, 3.0, 6.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-40.78125, -39.39306640625, -38.0048828125, -36.61669921875, -35.228515625, -33.84033203125, -32.4521484375, -31.06396484375, -29.67578125, -28.28759765625, -26.8994140625, -25.51123046875, -24.123046875, -22.73486328125, -21.3466796875, -19.95849609375, -18.5703125, -17.18212890625, -15.7939453125, -14.40576171875, -13.017578125, -11.62939453125, -10.2412109375, -8.85302734375, -7.46484375, -6.07666015625, -4.6884765625, -3.30029296875, -1.912109375, -0.52392578125, 0.8642578125, 2.25244140625, 3.640625, 5.02880859375, 6.4169921875, 7.80517578125, 9.193359375, 10.58154296875, 11.9697265625, 13.35791015625, 14.74609375, 16.13427734375, 17.5224609375, 18.91064453125, 20.298828125, 21.68701171875, 23.0751953125, 24.46337890625, 25.8515625, 27.23974609375, 28.6279296875, 30.01611328125, 31.404296875, 32.79248046875, 34.1806640625, 35.56884765625, 36.95703125, 38.34521484375, 39.7333984375, 41.12158203125, 42.509765625, 43.89794921875, 45.2861328125, 46.67431640625, 48.0625]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [8.0, 784.0, 221.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.034774780273438, -11.262662887573242, 2.509449005126953, 16.28156280517578, 30.053672790527344, 43.825782775878906, 57.597900390625, 71.37001037597656, 85.14212036132812, 98.91423034667969, 112.68634033203125, 126.45845794677734, 140.23056030273438, 154.002685546875, 167.77479553222656, 181.54690551757812, 195.3190155029297, 209.09112548828125, 222.8632354736328, 236.63534545898438, 250.407470703125, 264.1795654296875, 277.9516906738281, 291.72381591796875, 305.49591064453125, 319.2680358886719, 333.0401306152344, 346.812255859375, 360.5843505859375, 374.3564758300781, 388.12860107421875, 401.90069580078125, 415.67279052734375, 429.4449157714844, 443.2170104980469, 456.9891357421875, 470.76123046875, 484.5333557128906, 498.30548095703125, 512.0775756835938, 525.8496704101562, 539.6217651367188, 553.3939208984375, 567.166015625, 580.9381103515625, 594.710205078125, 608.4823608398438, 622.2544555664062, 636.026611328125, 649.7987060546875, 663.5708618164062, 677.3429565429688, 691.1150512695312, 704.8871459960938, 718.6593017578125, 732.431396484375, 746.2034912109375, 759.9755859375, 773.7477416992188, 787.5198364257812, 801.2919311523438, 815.0640258789062, 828.836181640625, 842.6082763671875, 856.38037109375]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 6.0, 4.0, 4.0, 5.0, 6.0, 9.0, 9.0, 15.0, 12.0, 12.0, 24.0, 22.0, 30.0, 33.0, 32.0, 26.0, 34.0, 32.0, 40.0, 35.0, 44.0, 59.0, 43.0, 38.0, 39.0, 48.0, 44.0, 36.0, 35.0, 28.0, 34.0, 27.0, 20.0, 24.0, 15.0, 11.0, 12.0, 18.0, 8.0, 7.0, 3.0, 5.0, 7.0, 0.0, 6.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-100.16007232666016, -97.13978576660156, -94.11949920654297, -91.0992202758789, -88.07893371582031, -85.05864715576172, -82.03836059570312, -79.01808166503906, -75.99779510498047, -72.97750854492188, -69.95722198486328, -66.93694305419922, -63.916656494140625, -60.89636993408203, -57.87608337402344, -54.85580062866211, -51.835514068603516, -48.81522750854492, -45.794944763183594, -42.774658203125, -39.75437545776367, -36.73408889770508, -33.71380615234375, -30.693519592285156, -27.673234939575195, -24.652950286865234, -21.632665634155273, -18.612380981445312, -15.592095375061035, -12.571810722351074, -9.551525115966797, -6.531240463256836, -3.510955810546875, -0.49067091941833496, 2.529613971710205, 5.549899101257324, 8.570183753967285, 11.590468406677246, 14.610754013061523, 17.631038665771484, 20.651323318481445, 23.671607971191406, 26.691892623901367, 29.712177276611328, 32.73246383666992, 35.75274658203125, 38.773033142089844, 41.79331970214844, 44.813602447509766, 47.83388900756836, 50.85417175292969, 53.87445831298828, 56.89474105834961, 59.9150276184082, 62.93531036376953, 65.95559692382812, 68.97588348388672, 71.99617004394531, 75.0164566040039, 78.03673553466797, 81.05702209472656, 84.07730865478516, 87.09759521484375, 90.11787414550781, 93.1381607055664]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 10.0, 9.0, 12.0, 13.0, 7.0, 15.0, 17.0, 27.0, 24.0, 31.0, 33.0, 44.0, 39.0, 53.0, 52.0, 51.0, 69.0, 60.0, 53.0, 50.0, 46.0, 39.0, 36.0, 28.0, 31.0, 17.0, 21.0, 14.0, 15.0, 14.0, 18.0, 10.0, 9.0, 1.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.2734375, -8.989501953125, -8.70556640625, -8.421630859375, -8.1376953125, -7.853759765625, -7.56982421875, -7.285888671875, -7.001953125, -6.718017578125, -6.43408203125, -6.150146484375, -5.8662109375, -5.582275390625, -5.29833984375, -5.014404296875, -4.73046875, -4.446533203125, -4.16259765625, -3.878662109375, -3.5947265625, -3.310791015625, -3.02685546875, -2.742919921875, -2.458984375, -2.175048828125, -1.89111328125, -1.607177734375, -1.3232421875, -1.039306640625, -0.75537109375, -0.471435546875, -0.1875, 0.096435546875, 0.38037109375, 0.664306640625, 0.9482421875, 1.232177734375, 1.51611328125, 1.800048828125, 2.083984375, 2.367919921875, 2.65185546875, 2.935791015625, 3.2197265625, 3.503662109375, 3.78759765625, 4.071533203125, 4.35546875, 4.639404296875, 4.92333984375, 5.207275390625, 5.4912109375, 5.775146484375, 6.05908203125, 6.343017578125, 6.626953125, 6.910888671875, 7.19482421875, 7.478759765625, 7.7626953125, 8.046630859375, 8.33056640625, 8.614501953125, 8.8984375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 8.0, 14.0, 19.0, 21.0, 36.0, 49.0, 52.0, 123.0, 181.0, 282.0, 443.0, 717.0, 1189.0, 2148.0, 3988.0, 8250.0, 21876.0, 359691.0, 3592159.0, 170352.0, 17483.0, 7069.0, 3536.0, 1893.0, 1037.0, 646.0, 406.0, 192.0, 139.0, 80.0, 72.0, 30.0, 32.0, 21.0, 12.0, 5.0, 5.0, 2.0, 1.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.71875, -33.67919921875, -32.6396484375, -31.60009765625, -30.560546875, -29.52099609375, -28.4814453125, -27.44189453125, -26.40234375, -25.36279296875, -24.3232421875, -23.28369140625, -22.244140625, -21.20458984375, -20.1650390625, -19.12548828125, -18.0859375, -17.04638671875, -16.0068359375, -14.96728515625, -13.927734375, -12.88818359375, -11.8486328125, -10.80908203125, -9.76953125, -8.72998046875, -7.6904296875, -6.65087890625, -5.611328125, -4.57177734375, -3.5322265625, -2.49267578125, -1.453125, -0.41357421875, 0.6259765625, 1.66552734375, 2.705078125, 3.74462890625, 4.7841796875, 5.82373046875, 6.86328125, 7.90283203125, 8.9423828125, 9.98193359375, 11.021484375, 12.06103515625, 13.1005859375, 14.14013671875, 15.1796875, 16.21923828125, 17.2587890625, 18.29833984375, 19.337890625, 20.37744140625, 21.4169921875, 22.45654296875, 23.49609375, 24.53564453125, 25.5751953125, 26.61474609375, 27.654296875, 28.69384765625, 29.7333984375, 30.77294921875, 31.8125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 7.0, 8.0, 8.0, 5.0, 4.0, 10.0, 18.0, 13.0, 20.0, 25.0, 41.0, 39.0, 50.0, 99.0, 193.0, 373.0, 714.0, 961.0, 674.0, 317.0, 164.0, 71.0, 58.0, 27.0, 40.0, 24.0, 15.0, 26.0, 7.0, 11.0, 10.0, 6.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.296875, -24.516357421875, -23.73583984375, -22.955322265625, -22.1748046875, -21.394287109375, -20.61376953125, -19.833251953125, -19.052734375, -18.272216796875, -17.49169921875, -16.711181640625, -15.9306640625, -15.150146484375, -14.36962890625, -13.589111328125, -12.80859375, -12.028076171875, -11.24755859375, -10.467041015625, -9.6865234375, -8.906005859375, -8.12548828125, -7.344970703125, -6.564453125, -5.783935546875, -5.00341796875, -4.222900390625, -3.4423828125, -2.661865234375, -1.88134765625, -1.100830078125, -0.3203125, 0.460205078125, 1.24072265625, 2.021240234375, 2.8017578125, 3.582275390625, 4.36279296875, 5.143310546875, 5.923828125, 6.704345703125, 7.48486328125, 8.265380859375, 9.0458984375, 9.826416015625, 10.60693359375, 11.387451171875, 12.16796875, 12.948486328125, 13.72900390625, 14.509521484375, 15.2900390625, 16.070556640625, 16.85107421875, 17.631591796875, 18.412109375, 19.192626953125, 19.97314453125, 20.753662109375, 21.5341796875, 22.314697265625, 23.09521484375, 23.875732421875, 24.65625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 7.0, 6.0, 12.0, 15.0, 21.0, 24.0, 37.0, 55.0, 80.0, 112.0, 170.0, 239.0, 394.0, 579.0, 991.0, 1620.0, 2848.0, 5362.0, 10841.0, 24947.0, 76530.0, 751621.0, 3064432.0, 179383.0, 40918.0, 16001.0, 7619.0, 3890.0, 2113.0, 1257.0, 781.0, 501.0, 303.0, 168.0, 99.0, 63.0, 62.0, 46.0, 36.0, 27.0, 21.0, 12.0, 9.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-30.6875, -29.73583984375, -28.7841796875, -27.83251953125, -26.880859375, -25.92919921875, -24.9775390625, -24.02587890625, -23.07421875, -22.12255859375, -21.1708984375, -20.21923828125, -19.267578125, -18.31591796875, -17.3642578125, -16.41259765625, -15.4609375, -14.50927734375, -13.5576171875, -12.60595703125, -11.654296875, -10.70263671875, -9.7509765625, -8.79931640625, -7.84765625, -6.89599609375, -5.9443359375, -4.99267578125, -4.041015625, -3.08935546875, -2.1376953125, -1.18603515625, -0.234375, 0.71728515625, 1.6689453125, 2.62060546875, 3.572265625, 4.52392578125, 5.4755859375, 6.42724609375, 7.37890625, 8.33056640625, 9.2822265625, 10.23388671875, 11.185546875, 12.13720703125, 13.0888671875, 14.04052734375, 14.9921875, 15.94384765625, 16.8955078125, 17.84716796875, 18.798828125, 19.75048828125, 20.7021484375, 21.65380859375, 22.60546875, 23.55712890625, 24.5087890625, 25.46044921875, 26.412109375, 27.36376953125, 28.3154296875, 29.26708984375, 30.21875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 4.0, 10.0, 12.0, 26.0, 34.0, 68.0, 128.0, 190.0, 204.0, 133.0, 68.0, 56.0, 25.0, 17.0, 15.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.36418151855469, -74.26775360107422, -70.17131805419922, -66.07489013671875, -61.978458404541016, -57.88202667236328, -53.78559875488281, -49.68916702270508, -45.592735290527344, -41.49630355834961, -37.399871826171875, -33.303443908691406, -29.207012176513672, -25.110580444335938, -21.014150619506836, -16.917720794677734, -12.8212890625, -8.724858283996582, -4.628427505493164, -0.5319967269897461, 3.564434051513672, 7.660865783691406, 11.757295608520508, 15.85372543334961, 19.950157165527344, 24.046588897705078, 28.14301872253418, 32.23944854736328, 36.335880279541016, 40.43231201171875, 44.52873992919922, 48.62517166137695, 52.72160339355469, 56.81803512573242, 60.914466857910156, 65.01089477539062, 69.10733032226562, 73.2037582397461, 77.30018615722656, 81.39662170410156, 85.49304962158203, 89.5894775390625, 93.6859130859375, 97.78234100341797, 101.87876892089844, 105.97520446777344, 110.0716323852539, 114.16806030273438, 118.26449584960938, 122.36092376708984, 126.45735931396484, 130.5537872314453, 134.6502227783203, 138.74664306640625, 142.84307861328125, 146.93951416015625, 151.03594970703125, 155.13238525390625, 159.2288055419922, 163.3252410888672, 167.4216766357422, 171.51809692382812, 175.61453247070312, 179.71096801757812, 183.80738830566406]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 6.0, 1.0, 9.0, 5.0, 8.0, 13.0, 10.0, 15.0, 13.0, 19.0, 22.0, 21.0, 24.0, 28.0, 51.0, 38.0, 32.0, 39.0, 43.0, 54.0, 48.0, 43.0, 44.0, 51.0, 49.0, 33.0, 28.0, 35.0, 32.0, 24.0, 23.0, 20.0, 17.0, 25.0, 20.0, 17.0, 9.0, 8.0, 8.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.7494125366211, -75.25308990478516, -72.75676727294922, -70.26044464111328, -67.76412200927734, -65.2677993774414, -62.771480560302734, -60.2751579284668, -57.77883529663086, -55.28251266479492, -52.786190032958984, -50.28986740112305, -47.793548583984375, -45.29722595214844, -42.8009033203125, -40.30458068847656, -37.808258056640625, -35.31193542480469, -32.81561279296875, -30.319292068481445, -27.822969436645508, -25.32664680480957, -22.830326080322266, -20.334003448486328, -17.83768081665039, -15.341358184814453, -12.845036506652832, -10.348714828491211, -7.852392196655273, -5.356069564819336, -2.859747886657715, -0.36342620849609375, 2.132904052734375, 4.629226207733154, 7.125548362731934, 9.621870040893555, 12.118192672729492, 14.61451530456543, 17.110836029052734, 19.607158660888672, 22.10348129272461, 24.599803924560547, 27.096126556396484, 29.59244728088379, 32.088768005371094, 34.58509063720703, 37.08141326904297, 39.577735900878906, 42.074058532714844, 44.57038116455078, 47.06670379638672, 49.563026428222656, 52.059349060058594, 54.55567169189453, 57.0519905090332, 59.54831314086914, 62.04463577270508, 64.54095458984375, 67.03727722167969, 69.53359985351562, 72.02992248535156, 74.5262451171875, 77.02256774902344, 79.51889038085938, 82.01521301269531]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 3.0, 9.0, 15.0, 6.0, 14.0, 16.0, 18.0, 25.0, 24.0, 33.0, 39.0, 29.0, 44.0, 60.0, 36.0, 54.0, 54.0, 59.0, 49.0, 46.0, 44.0, 56.0, 33.0, 32.0, 29.0, 24.0, 29.0, 12.0, 19.0, 11.0, 15.0, 9.0, 13.0, 5.0, 4.0, 5.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.09375, -8.8184814453125, -8.543212890625, -8.2679443359375, -7.99267578125, -7.7174072265625, -7.442138671875, -7.1668701171875, -6.8916015625, -6.6163330078125, -6.341064453125, -6.0657958984375, -5.79052734375, -5.5152587890625, -5.239990234375, -4.9647216796875, -4.689453125, -4.4141845703125, -4.138916015625, -3.8636474609375, -3.58837890625, -3.3131103515625, -3.037841796875, -2.7625732421875, -2.4873046875, -2.2120361328125, -1.936767578125, -1.6614990234375, -1.38623046875, -1.1109619140625, -0.835693359375, -0.5604248046875, -0.28515625, -0.0098876953125, 0.265380859375, 0.5406494140625, 0.81591796875, 1.0911865234375, 1.366455078125, 1.6417236328125, 1.9169921875, 2.1922607421875, 2.467529296875, 2.7427978515625, 3.01806640625, 3.2933349609375, 3.568603515625, 3.8438720703125, 4.119140625, 4.3944091796875, 4.669677734375, 4.9449462890625, 5.22021484375, 5.4954833984375, 5.770751953125, 6.0460205078125, 6.3212890625, 6.5965576171875, 6.871826171875, 7.1470947265625, 7.42236328125, 7.6976318359375, 7.972900390625, 8.2481689453125, 8.5234375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 8.0, 6.0, 12.0, 22.0, 20.0, 42.0, 56.0, 89.0, 119.0, 148.0, 227.0, 332.0, 483.0, 707.0, 1091.0, 1575.0, 2533.0, 3892.0, 6016.0, 9637.0, 15729.0, 25848.0, 43997.0, 76285.0, 139091.0, 253598.0, 204781.0, 108949.0, 60888.0, 35645.0, 21217.0, 12990.0, 7984.0, 4994.0, 3230.0, 2090.0, 1364.0, 880.0, 654.0, 417.0, 278.0, 171.0, 150.0, 94.0, 78.0, 54.0, 25.0, 16.0, 15.0, 9.0, 9.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0], "bins": [-0.1756591796875, -0.170135498046875, -0.16461181640625, -0.159088134765625, -0.153564453125, -0.148040771484375, -0.14251708984375, -0.136993408203125, -0.1314697265625, -0.125946044921875, -0.12042236328125, -0.114898681640625, -0.109375, -0.103851318359375, -0.09832763671875, -0.092803955078125, -0.0872802734375, -0.081756591796875, -0.07623291015625, -0.070709228515625, -0.065185546875, -0.059661865234375, -0.05413818359375, -0.048614501953125, -0.0430908203125, -0.037567138671875, -0.03204345703125, -0.026519775390625, -0.02099609375, -0.015472412109375, -0.00994873046875, -0.004425048828125, 0.0010986328125, 0.006622314453125, 0.01214599609375, 0.017669677734375, 0.023193359375, 0.028717041015625, 0.03424072265625, 0.039764404296875, 0.0452880859375, 0.050811767578125, 0.05633544921875, 0.061859130859375, 0.0673828125, 0.072906494140625, 0.07843017578125, 0.083953857421875, 0.0894775390625, 0.095001220703125, 0.10052490234375, 0.106048583984375, 0.111572265625, 0.117095947265625, 0.12261962890625, 0.128143310546875, 0.1336669921875, 0.139190673828125, 0.14471435546875, 0.150238037109375, 0.15576171875, 0.161285400390625, 0.16680908203125, 0.172332763671875, 0.1778564453125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 7.0, 4.0, 7.0, 9.0, 12.0, 8.0, 9.0, 10.0, 20.0, 25.0, 23.0, 17.0, 20.0, 21.0, 42.0, 33.0, 36.0, 28.0, 23.0, 36.0, 44.0, 45.0, 1068.0, 40.0, 38.0, 45.0, 36.0, 34.0, 37.0, 30.0, 26.0, 25.0, 22.0, 20.0, 15.0, 17.0, 14.0, 15.0, 9.0, 10.0, 10.0, 12.0, 7.0, 3.0, 5.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.966796875, -3.832489013671875, -3.69818115234375, -3.563873291015625, -3.4295654296875, -3.295257568359375, -3.16094970703125, -3.026641845703125, -2.892333984375, -2.758026123046875, -2.62371826171875, -2.489410400390625, -2.3551025390625, -2.220794677734375, -2.08648681640625, -1.952178955078125, -1.81787109375, -1.683563232421875, -1.54925537109375, -1.414947509765625, -1.2806396484375, -1.146331787109375, -1.01202392578125, -0.877716064453125, -0.743408203125, -0.609100341796875, -0.47479248046875, -0.340484619140625, -0.2061767578125, -0.071868896484375, 0.06243896484375, 0.196746826171875, 0.3310546875, 0.465362548828125, 0.59967041015625, 0.733978271484375, 0.8682861328125, 1.002593994140625, 1.13690185546875, 1.271209716796875, 1.405517578125, 1.539825439453125, 1.67413330078125, 1.808441162109375, 1.9427490234375, 2.077056884765625, 2.21136474609375, 2.345672607421875, 2.47998046875, 2.614288330078125, 2.74859619140625, 2.882904052734375, 3.0172119140625, 3.151519775390625, 3.28582763671875, 3.420135498046875, 3.554443359375, 3.688751220703125, 3.82305908203125, 3.957366943359375, 4.0916748046875, 4.225982666015625, 4.36029052734375, 4.494598388671875, 4.62890625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 11.0, 21.0, 23.0, 41.0, 50.0, 96.0, 111.0, 176.0, 277.0, 358.0, 588.0, 831.0, 1226.0, 1828.0, 2790.0, 4219.0, 6322.0, 9228.0, 14474.0, 21146.0, 32230.0, 48487.0, 74877.0, 118717.0, 812722.0, 608040.0, 118561.0, 75053.0, 49034.0, 31870.0, 21376.0, 14130.0, 9433.0, 6196.0, 4052.0, 2791.0, 1875.0, 1230.0, 857.0, 595.0, 389.0, 265.0, 173.0, 117.0, 85.0, 53.0, 37.0, 27.0, 14.0, 12.0, 3.0, 7.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06988525390625, -0.06763076782226562, -0.06537628173828125, -0.06312179565429688, -0.0608673095703125, -0.058612823486328125, -0.05635833740234375, -0.054103851318359375, -0.051849365234375, -0.049594879150390625, -0.04734039306640625, -0.045085906982421875, -0.0428314208984375, -0.040576934814453125, -0.03832244873046875, -0.036067962646484375, -0.0338134765625, -0.031558990478515625, -0.02930450439453125, -0.027050018310546875, -0.0247955322265625, -0.022541046142578125, -0.02028656005859375, -0.018032073974609375, -0.015777587890625, -0.013523101806640625, -0.01126861572265625, -0.009014129638671875, -0.0067596435546875, -0.004505157470703125, -0.00225067138671875, 3.814697265625e-06, 0.00225830078125, 0.004512786865234375, 0.00676727294921875, 0.009021759033203125, 0.0112762451171875, 0.013530731201171875, 0.01578521728515625, 0.018039703369140625, 0.020294189453125, 0.022548675537109375, 0.02480316162109375, 0.027057647705078125, 0.0293121337890625, 0.031566619873046875, 0.03382110595703125, 0.036075592041015625, 0.038330078125, 0.040584564208984375, 0.04283905029296875, 0.045093536376953125, 0.0473480224609375, 0.049602508544921875, 0.05185699462890625, 0.054111480712890625, 0.056365966796875, 0.058620452880859375, 0.06087493896484375, 0.06312942504882812, 0.0653839111328125, 0.06763839721679688, 0.06989288330078125, 0.07214736938476562, 0.07440185546875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 7.0, 19.0, 17.0, 26.0, 30.0, 39.0, 52.0, 54.0, 88.0, 81.0, 71.0, 65.0, 76.0, 77.0, 77.0, 60.0, 43.0, 26.0, 25.0, 17.0, 17.0, 11.0, 10.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003476142883300781, -0.0003368891775608063, -0.0003261640667915344, -0.0003154389560222626, -0.0003047138452529907, -0.00029398873448371887, -0.000283263623714447, -0.00027253851294517517, -0.0002618134021759033, -0.00025108829140663147, -0.00024036318063735962, -0.00022963806986808777, -0.00021891295909881592, -0.00020818784832954407, -0.00019746273756027222, -0.00018673762679100037, -0.00017601251602172852, -0.00016528740525245667, -0.00015456229448318481, -0.00014383718371391296, -0.0001331120729446411, -0.00012238696217536926, -0.00011166185140609741, -0.00010093674063682556, -9.021162986755371e-05, -7.948651909828186e-05, -6.876140832901001e-05, -5.803629755973816e-05, -4.731118679046631e-05, -3.658607602119446e-05, -2.5860965251922607e-05, -1.5135854482650757e-05, -4.410743713378906e-06, 6.314367055892944e-06, 1.7039477825164795e-05, 2.7764588594436646e-05, 3.8489699363708496e-05, 4.921481013298035e-05, 5.99399209022522e-05, 7.066503167152405e-05, 8.13901424407959e-05, 9.211525321006775e-05, 0.0001028403639793396, 0.00011356547474861145, 0.0001242905855178833, 0.00013501569628715515, 0.000145740807056427, 0.00015646591782569885, 0.0001671910285949707, 0.00017791613936424255, 0.0001886412501335144, 0.00019936636090278625, 0.0002100914716720581, 0.00022081658244132996, 0.0002315416932106018, 0.00024226680397987366, 0.0002529919147491455, 0.00026371702551841736, 0.0002744421362876892, 0.00028516724705696106, 0.0002958923578262329, 0.00030661746859550476, 0.0003173425793647766, 0.00032806769013404846, 0.0003387928009033203]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 9.0, 13.0, 16.0, 19.0, 39.0, 70.0, 80.0, 125.0, 167.0, 250.0, 350.0, 727.0, 9486.0, 1025911.0, 9432.0, 773.0, 338.0, 215.0, 144.0, 126.0, 76.0, 61.0, 39.0, 35.0, 19.0, 7.0, 5.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0052642822265625, -0.005097150802612305, -0.004930019378662109, -0.004762887954711914, -0.004595756530761719, -0.0044286251068115234, -0.004261493682861328, -0.004094362258911133, -0.0039272308349609375, -0.003760099411010742, -0.003592967987060547, -0.0034258365631103516, -0.0032587051391601562, -0.003091573715209961, -0.0029244422912597656, -0.0027573108673095703, -0.002590179443359375, -0.0024230480194091797, -0.0022559165954589844, -0.002088785171508789, -0.0019216537475585938, -0.0017545223236083984, -0.0015873908996582031, -0.0014202594757080078, -0.0012531280517578125, -0.0010859966278076172, -0.0009188652038574219, -0.0007517337799072266, -0.0005846023559570312, -0.00041747093200683594, -0.0002503395080566406, -8.320808410644531e-05, 8.392333984375e-05, 0.0002510547637939453, 0.0004181861877441406, 0.0005853176116943359, 0.0007524490356445312, 0.0009195804595947266, 0.0010867118835449219, 0.0012538433074951172, 0.0014209747314453125, 0.0015881061553955078, 0.0017552375793457031, 0.0019223690032958984, 0.0020895004272460938, 0.002256631851196289, 0.0024237632751464844, 0.0025908946990966797, 0.002758026123046875, 0.0029251575469970703, 0.0030922889709472656, 0.003259420394897461, 0.0034265518188476562, 0.0035936832427978516, 0.003760814666748047, 0.003927946090698242, 0.0040950775146484375, 0.004262208938598633, 0.004429340362548828, 0.0045964717864990234, 0.004763603210449219, 0.004930734634399414, 0.005097866058349609, 0.005264997482299805, 0.00543212890625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 60.0, 900.0, 51.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.003988742362707853, -0.003920490853488445, -0.0038522391114383936, -0.003783987369388342, -0.003715735860168934, -0.003647484118118882, -0.003579232608899474, -0.0035109808668494225, -0.0034427293576300144, -0.0033744776155799627, -0.0033062261063605547, -0.003237974364310503, -0.003169722855091095, -0.0031014711130410433, -0.0030332196038216352, -0.0029649678617715836, -0.0028967163525521755, -0.002828464610502124, -0.002760213101282716, -0.002691961359232664, -0.002623709850013256, -0.0025554581079632044, -0.0024872065987437963, -0.0024189548566937447, -0.002350703114643693, -0.0022824513725936413, -0.0022141998633742332, -0.0021459481213241816, -0.0020776966121047735, -0.002009444870054722, -0.0019411933608353138, -0.001872941618785262, -0.0018046898767352104, -0.0017364382511004806, -0.0016681866254657507, -0.0015999349998310208, -0.001531683374196291, -0.001463431748561561, -0.0013951801229268312, -0.0013269283808767796, -0.0012586768716573715, -0.0011904252460226417, -0.0011221736203879118, -0.001053921994753182, -0.000985670369118452, -0.0009174187434837222, -0.0008491670596413314, -0.0007809154340066016, -0.0007126637501642108, -0.0006444121245294809, -0.0005761604988947511, -0.0005079088732600212, -0.0004396572185214609, -0.00037140559288673103, -0.0003031539381481707, -0.00023490231251344085, -0.00016665071598254144, -9.839908307185397e-05, -3.014745016116649e-05, 3.81041900254786e-05, 0.00010635581566020846, 0.00017460744129493833, 0.00024285909603349864, 0.0003111107216682285, 0.00037936234730295837]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 4.0, 1.0, 6.0, 7.0, 5.0, 5.0, 14.0, 12.0, 18.0, 27.0, 23.0, 20.0, 23.0, 33.0, 45.0, 41.0, 47.0, 43.0, 47.0, 44.0, 50.0, 45.0, 58.0, 44.0, 43.0, 42.0, 38.0, 32.0, 32.0, 25.0, 18.0, 22.0, 21.0, 18.0, 12.0, 10.0, 14.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001506805419921875, -0.0001443866640329361, -0.0001380927860736847, -0.0001317989081144333, -0.00012550503015518188, -0.00011921115219593048, -0.00011291727423667908, -0.00010662339627742767, -0.00010032951831817627, -9.403564035892487e-05, -8.774176239967346e-05, -8.144788444042206e-05, -7.515400648117065e-05, -6.886012852191925e-05, -6.256625056266785e-05, -5.627237260341644e-05, -4.997849464416504e-05, -4.3684616684913635e-05, -3.739073872566223e-05, -3.109686076641083e-05, -2.4802982807159424e-05, -1.850910484790802e-05, -1.2215226888656616e-05, -5.921348929405212e-06, 3.725290298461914e-07, 6.666406989097595e-06, 1.2960284948348999e-05, 1.9254162907600403e-05, 2.5548040866851807e-05, 3.184191882610321e-05, 3.8135796785354614e-05, 4.442967474460602e-05, 5.072355270385742e-05, 5.7017430663108826e-05, 6.331130862236023e-05, 6.960518658161163e-05, 7.589906454086304e-05, 8.219294250011444e-05, 8.848682045936584e-05, 9.478069841861725e-05, 0.00010107457637786865, 0.00010736845433712006, 0.00011366233229637146, 0.00011995621025562286, 0.00012625008821487427, 0.00013254396617412567, 0.00013883784413337708, 0.00014513172209262848, 0.00015142560005187988, 0.0001577194780111313, 0.0001640133559703827, 0.0001703072339296341, 0.0001766011118888855, 0.0001828949898481369, 0.0001891888678073883, 0.0001954827457666397, 0.0002017766237258911, 0.00020807050168514252, 0.00021436437964439392, 0.00022065825760364532, 0.00022695213556289673, 0.00023324601352214813, 0.00023953989148139954, 0.00024583376944065094, 0.00025212764739990234]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 3.0, 9.0, 15.0, 6.0, 14.0, 16.0, 18.0, 25.0, 24.0, 33.0, 39.0, 29.0, 44.0, 60.0, 36.0, 54.0, 54.0, 59.0, 49.0, 46.0, 44.0, 56.0, 33.0, 32.0, 29.0, 24.0, 29.0, 12.0, 19.0, 11.0, 15.0, 9.0, 13.0, 5.0, 4.0, 5.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.09375, -8.8184814453125, -8.543212890625, -8.2679443359375, -7.99267578125, -7.7174072265625, -7.442138671875, -7.1668701171875, -6.8916015625, -6.6163330078125, -6.341064453125, -6.0657958984375, -5.79052734375, -5.5152587890625, -5.239990234375, -4.9647216796875, -4.689453125, -4.4141845703125, -4.138916015625, -3.8636474609375, -3.58837890625, -3.3131103515625, -3.037841796875, -2.7625732421875, -2.4873046875, -2.2120361328125, -1.936767578125, -1.6614990234375, -1.38623046875, -1.1109619140625, -0.835693359375, -0.5604248046875, -0.28515625, -0.0098876953125, 0.265380859375, 0.5406494140625, 0.81591796875, 1.0911865234375, 1.366455078125, 1.6417236328125, 1.9169921875, 2.1922607421875, 2.467529296875, 2.7427978515625, 3.01806640625, 3.2933349609375, 3.568603515625, 3.8438720703125, 4.119140625, 4.3944091796875, 4.669677734375, 4.9449462890625, 5.22021484375, 5.4954833984375, 5.770751953125, 6.0460205078125, 6.3212890625, 6.5965576171875, 6.871826171875, 7.1470947265625, 7.42236328125, 7.6976318359375, 7.972900390625, 8.2481689453125, 8.5234375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 15.0, 11.0, 22.0, 29.0, 37.0, 62.0, 86.0, 113.0, 164.0, 235.0, 353.0, 473.0, 737.0, 1001.0, 1566.0, 2422.0, 3934.0, 6848.0, 14223.0, 38858.0, 296877.0, 592431.0, 51325.0, 16629.0, 7850.0, 4350.0, 2586.0, 1661.0, 1118.0, 775.0, 544.0, 379.0, 221.0, 199.0, 130.0, 95.0, 50.0, 40.0, 22.0, 21.0, 17.0, 18.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-17.765625, -17.1943359375, -16.623046875, -16.0517578125, -15.48046875, -14.9091796875, -14.337890625, -13.7666015625, -13.1953125, -12.6240234375, -12.052734375, -11.4814453125, -10.91015625, -10.3388671875, -9.767578125, -9.1962890625, -8.625, -8.0537109375, -7.482421875, -6.9111328125, -6.33984375, -5.7685546875, -5.197265625, -4.6259765625, -4.0546875, -3.4833984375, -2.912109375, -2.3408203125, -1.76953125, -1.1982421875, -0.626953125, -0.0556640625, 0.515625, 1.0869140625, 1.658203125, 2.2294921875, 2.80078125, 3.3720703125, 3.943359375, 4.5146484375, 5.0859375, 5.6572265625, 6.228515625, 6.7998046875, 7.37109375, 7.9423828125, 8.513671875, 9.0849609375, 9.65625, 10.2275390625, 10.798828125, 11.3701171875, 11.94140625, 12.5126953125, 13.083984375, 13.6552734375, 14.2265625, 14.7978515625, 15.369140625, 15.9404296875, 16.51171875, 17.0830078125, 17.654296875, 18.2255859375, 18.796875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 7.0, 13.0, 17.0, 17.0, 25.0, 12.0, 19.0, 23.0, 26.0, 34.0, 51.0, 56.0, 60.0, 79.0, 154.0, 1537.0, 315.0, 132.0, 67.0, 57.0, 48.0, 30.0, 21.0, 35.0, 38.0, 16.0, 19.0, 12.0, 19.0, 23.0, 14.0, 16.0, 13.0, 6.0, 13.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-31.8125, -30.873046875, -29.93359375, -28.994140625, -28.0546875, -27.115234375, -26.17578125, -25.236328125, -24.296875, -23.357421875, -22.41796875, -21.478515625, -20.5390625, -19.599609375, -18.66015625, -17.720703125, -16.78125, -15.841796875, -14.90234375, -13.962890625, -13.0234375, -12.083984375, -11.14453125, -10.205078125, -9.265625, -8.326171875, -7.38671875, -6.447265625, -5.5078125, -4.568359375, -3.62890625, -2.689453125, -1.75, -0.810546875, 0.12890625, 1.068359375, 2.0078125, 2.947265625, 3.88671875, 4.826171875, 5.765625, 6.705078125, 7.64453125, 8.583984375, 9.5234375, 10.462890625, 11.40234375, 12.341796875, 13.28125, 14.220703125, 15.16015625, 16.099609375, 17.0390625, 17.978515625, 18.91796875, 19.857421875, 20.796875, 21.736328125, 22.67578125, 23.615234375, 24.5546875, 25.494140625, 26.43359375, 27.373046875, 28.3125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 8.0, 6.0, 8.0, 13.0, 10.0, 20.0, 9.0, 26.0, 12.0, 22.0, 39.0, 61.0, 77.0, 106.0, 234.0, 533.0, 1433.0, 5015.0, 25698.0, 2263933.0, 821314.0, 20573.0, 4247.0, 1296.0, 489.0, 201.0, 110.0, 57.0, 32.0, 23.0, 17.0, 20.0, 19.0, 15.0, 6.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.84375, -40.4462890625, -39.048828125, -37.6513671875, -36.25390625, -34.8564453125, -33.458984375, -32.0615234375, -30.6640625, -29.2666015625, -27.869140625, -26.4716796875, -25.07421875, -23.6767578125, -22.279296875, -20.8818359375, -19.484375, -18.0869140625, -16.689453125, -15.2919921875, -13.89453125, -12.4970703125, -11.099609375, -9.7021484375, -8.3046875, -6.9072265625, -5.509765625, -4.1123046875, -2.71484375, -1.3173828125, 0.080078125, 1.4775390625, 2.875, 4.2724609375, 5.669921875, 7.0673828125, 8.46484375, 9.8623046875, 11.259765625, 12.6572265625, 14.0546875, 15.4521484375, 16.849609375, 18.2470703125, 19.64453125, 21.0419921875, 22.439453125, 23.8369140625, 25.234375, 26.6318359375, 28.029296875, 29.4267578125, 30.82421875, 32.2216796875, 33.619140625, 35.0166015625, 36.4140625, 37.8115234375, 39.208984375, 40.6064453125, 42.00390625, 43.4013671875, 44.798828125, 46.1962890625, 47.59375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 15.0, 36.0, 52.0, 68.0, 150.0, 181.0, 196.0, 139.0, 68.0, 40.0, 25.0, 10.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.12922668457031, -69.99588012695312, -67.86253356933594, -65.72918701171875, -63.59584426879883, -61.46249771118164, -59.32915115356445, -57.195804595947266, -55.062461853027344, -52.929115295410156, -50.79576873779297, -48.66242218017578, -46.52907943725586, -44.39573287963867, -42.262386322021484, -40.1290397644043, -37.99569320678711, -35.86234664916992, -33.729000091552734, -31.59565544128418, -29.462310791015625, -27.328964233398438, -25.19561767578125, -23.062271118164062, -20.928926467895508, -18.79557991027832, -16.662235260009766, -14.528888702392578, -12.395543098449707, -10.262197494506836, -8.128850936889648, -5.995505332946777, -3.8621597290039062, -1.728813886642456, 0.40453195571899414, 2.5378780364990234, 4.6712236404418945, 6.804569244384766, 8.937915802001953, 11.071261405944824, 13.204607009887695, 15.337952613830566, 17.471298217773438, 19.604644775390625, 21.737991333007812, 23.871335983276367, 26.004682540893555, 28.13802719116211, 30.271373748779297, 32.404720306396484, 34.53806686401367, 36.671409606933594, 38.80475616455078, 40.93810272216797, 43.071449279785156, 45.204795837402344, 47.33814239501953, 49.47148895263672, 51.604835510253906, 53.738182067871094, 55.871524810791016, 58.0048713684082, 60.13821792602539, 62.27156448364258, 64.4049072265625]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 7.0, 5.0, 7.0, 12.0, 13.0, 19.0, 17.0, 18.0, 18.0, 21.0, 30.0, 29.0, 28.0, 39.0, 29.0, 51.0, 33.0, 37.0, 29.0, 30.0, 46.0, 42.0, 40.0, 36.0, 28.0, 34.0, 27.0, 45.0, 19.0, 29.0, 24.0, 21.0, 23.0, 17.0, 15.0, 10.0, 9.0, 16.0, 8.0, 5.0, 7.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.57829284667969, -83.71070861816406, -80.84313201904297, -77.97555541992188, -75.10797119140625, -72.24038696289062, -69.37281036376953, -66.50523376464844, -63.63764953613281, -60.77006912231445, -57.902488708496094, -55.034908294677734, -52.167327880859375, -49.299747467041016, -46.432167053222656, -43.5645866394043, -40.69700622558594, -37.82942581176758, -34.96184539794922, -32.09426498413086, -29.2266845703125, -26.35910415649414, -23.49152374267578, -20.623943328857422, -17.756362915039062, -14.888782501220703, -12.021202087402344, -9.153621673583984, -6.286041259765625, -3.4184608459472656, -0.5508804321289062, 2.316699981689453, 5.184288024902344, 8.051868438720703, 10.919448852539062, 13.787029266357422, 16.65460968017578, 19.52219009399414, 22.3897705078125, 25.25735092163086, 28.12493133544922, 30.992511749267578, 33.86009216308594, 36.7276725769043, 39.595252990722656, 42.462833404541016, 45.330413818359375, 48.197994232177734, 51.065574645996094, 53.93315505981445, 56.80073547363281, 59.66831588745117, 62.53589630126953, 65.40347290039062, 68.27105712890625, 71.13864135742188, 74.00621795654297, 76.87379455566406, 79.74137878417969, 82.60896301269531, 85.4765396118164, 88.3441162109375, 91.21170043945312, 94.07928466796875, 96.94686126708984]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 7.0, 2.0, 4.0, 8.0, 15.0, 9.0, 16.0, 22.0, 11.0, 16.0, 34.0, 28.0, 29.0, 39.0, 33.0, 34.0, 40.0, 47.0, 56.0, 47.0, 54.0, 53.0, 41.0, 48.0, 41.0, 39.0, 39.0, 31.0, 21.0, 22.0, 15.0, 15.0, 13.0, 20.0, 9.0, 8.0, 6.0, 6.0, 5.0, 6.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.21875, -8.94580078125, -8.6728515625, -8.39990234375, -8.126953125, -7.85400390625, -7.5810546875, -7.30810546875, -7.03515625, -6.76220703125, -6.4892578125, -6.21630859375, -5.943359375, -5.67041015625, -5.3974609375, -5.12451171875, -4.8515625, -4.57861328125, -4.3056640625, -4.03271484375, -3.759765625, -3.48681640625, -3.2138671875, -2.94091796875, -2.66796875, -2.39501953125, -2.1220703125, -1.84912109375, -1.576171875, -1.30322265625, -1.0302734375, -0.75732421875, -0.484375, -0.21142578125, 0.0615234375, 0.33447265625, 0.607421875, 0.88037109375, 1.1533203125, 1.42626953125, 1.69921875, 1.97216796875, 2.2451171875, 2.51806640625, 2.791015625, 3.06396484375, 3.3369140625, 3.60986328125, 3.8828125, 4.15576171875, 4.4287109375, 4.70166015625, 4.974609375, 5.24755859375, 5.5205078125, 5.79345703125, 6.06640625, 6.33935546875, 6.6123046875, 6.88525390625, 7.158203125, 7.43115234375, 7.7041015625, 7.97705078125, 8.25]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 12.0, 14.0, 13.0, 11.0, 19.0, 33.0, 47.0, 62.0, 95.0, 136.0, 200.0, 272.0, 396.0, 711.0, 1036.0, 1809.0, 3270.0, 6465.0, 15968.0, 155846.0, 2938556.0, 996271.0, 51313.0, 10378.0, 4830.0, 2582.0, 1520.0, 880.0, 536.0, 319.0, 218.0, 129.0, 95.0, 76.0, 40.0, 32.0, 30.0, 10.0, 8.0, 11.0, 10.0, 6.0, 4.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.140625, -26.33740234375, -25.5341796875, -24.73095703125, -23.927734375, -23.12451171875, -22.3212890625, -21.51806640625, -20.71484375, -19.91162109375, -19.1083984375, -18.30517578125, -17.501953125, -16.69873046875, -15.8955078125, -15.09228515625, -14.2890625, -13.48583984375, -12.6826171875, -11.87939453125, -11.076171875, -10.27294921875, -9.4697265625, -8.66650390625, -7.86328125, -7.06005859375, -6.2568359375, -5.45361328125, -4.650390625, -3.84716796875, -3.0439453125, -2.24072265625, -1.4375, -0.63427734375, 0.1689453125, 0.97216796875, 1.775390625, 2.57861328125, 3.3818359375, 4.18505859375, 4.98828125, 5.79150390625, 6.5947265625, 7.39794921875, 8.201171875, 9.00439453125, 9.8076171875, 10.61083984375, 11.4140625, 12.21728515625, 13.0205078125, 13.82373046875, 14.626953125, 15.43017578125, 16.2333984375, 17.03662109375, 17.83984375, 18.64306640625, 19.4462890625, 20.24951171875, 21.052734375, 21.85595703125, 22.6591796875, 23.46240234375, 24.265625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 14.0, 7.0, 18.0, 31.0, 33.0, 43.0, 71.0, 109.0, 229.0, 532.0, 972.0, 972.0, 484.0, 200.0, 110.0, 71.0, 42.0, 26.0, 19.0, 18.0, 18.0, 9.0, 7.0, 7.0, 8.0, 7.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.21875, -27.27685546875, -26.3349609375, -25.39306640625, -24.451171875, -23.50927734375, -22.5673828125, -21.62548828125, -20.68359375, -19.74169921875, -18.7998046875, -17.85791015625, -16.916015625, -15.97412109375, -15.0322265625, -14.09033203125, -13.1484375, -12.20654296875, -11.2646484375, -10.32275390625, -9.380859375, -8.43896484375, -7.4970703125, -6.55517578125, -5.61328125, -4.67138671875, -3.7294921875, -2.78759765625, -1.845703125, -0.90380859375, 0.0380859375, 0.97998046875, 1.921875, 2.86376953125, 3.8056640625, 4.74755859375, 5.689453125, 6.63134765625, 7.5732421875, 8.51513671875, 9.45703125, 10.39892578125, 11.3408203125, 12.28271484375, 13.224609375, 14.16650390625, 15.1083984375, 16.05029296875, 16.9921875, 17.93408203125, 18.8759765625, 19.81787109375, 20.759765625, 21.70166015625, 22.6435546875, 23.58544921875, 24.52734375, 25.46923828125, 26.4111328125, 27.35302734375, 28.294921875, 29.23681640625, 30.1787109375, 31.12060546875, 32.0625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 12.0, 13.0, 18.0, 31.0, 38.0, 56.0, 89.0, 158.0, 240.0, 439.0, 845.0, 1727.0, 4080.0, 10167.0, 34134.0, 247548.0, 3588725.0, 253167.0, 34632.0, 10528.0, 3981.0, 1755.0, 772.0, 449.0, 293.0, 137.0, 102.0, 49.0, 32.0, 13.0, 14.0, 7.0, 5.0, 5.0, 4.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-41.78125, -40.5341796875, -39.287109375, -38.0400390625, -36.79296875, -35.5458984375, -34.298828125, -33.0517578125, -31.8046875, -30.5576171875, -29.310546875, -28.0634765625, -26.81640625, -25.5693359375, -24.322265625, -23.0751953125, -21.828125, -20.5810546875, -19.333984375, -18.0869140625, -16.83984375, -15.5927734375, -14.345703125, -13.0986328125, -11.8515625, -10.6044921875, -9.357421875, -8.1103515625, -6.86328125, -5.6162109375, -4.369140625, -3.1220703125, -1.875, -0.6279296875, 0.619140625, 1.8662109375, 3.11328125, 4.3603515625, 5.607421875, 6.8544921875, 8.1015625, 9.3486328125, 10.595703125, 11.8427734375, 13.08984375, 14.3369140625, 15.583984375, 16.8310546875, 18.078125, 19.3251953125, 20.572265625, 21.8193359375, 23.06640625, 24.3134765625, 25.560546875, 26.8076171875, 28.0546875, 29.3017578125, 30.548828125, 31.7958984375, 33.04296875, 34.2900390625, 35.537109375, 36.7841796875, 38.03125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 9.0, 12.0, 9.0, 22.0, 41.0, 58.0, 88.0, 121.0, 166.0, 130.0, 108.0, 70.0, 56.0, 34.0, 19.0, 18.0, 11.0, 8.0, 3.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-98.1707992553711, -95.26211547851562, -92.35343170166016, -89.44474792480469, -86.53606414794922, -83.62738037109375, -80.71870422363281, -77.81002044677734, -74.90133666992188, -71.9926528930664, -69.08396911621094, -66.17528533935547, -63.266605377197266, -60.3579216003418, -57.44923782348633, -54.540557861328125, -51.63187026977539, -48.72318649291992, -45.81450271606445, -42.90582275390625, -39.99713897705078, -37.08845520019531, -34.179771423339844, -31.271089553833008, -28.36240577697754, -25.45372200012207, -22.545040130615234, -19.636356353759766, -16.727672576904297, -13.818990707397461, -10.910306930541992, -8.001625061035156, -5.0929412841796875, -2.184258222579956, 0.7244248390197754, 3.633108139038086, 6.541790962219238, 9.45047378540039, 12.35915756225586, 15.267839431762695, 18.176523208618164, 21.085206985473633, 23.99388885498047, 26.902572631835938, 29.811256408691406, 32.719940185546875, 35.628623962402344, 38.53730392456055, 41.445987701416016, 44.354671478271484, 47.26335525512695, 50.172035217285156, 53.080718994140625, 55.989402770996094, 58.89808654785156, 61.80677032470703, 64.7154541015625, 67.62413787841797, 70.53282165527344, 73.4415054321289, 76.35018920898438, 79.25886535644531, 82.16755676269531, 85.07623291015625, 87.98491668701172]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 3.0, 6.0, 7.0, 10.0, 5.0, 12.0, 7.0, 15.0, 14.0, 15.0, 21.0, 19.0, 30.0, 23.0, 18.0, 33.0, 31.0, 23.0, 27.0, 34.0, 42.0, 41.0, 59.0, 40.0, 34.0, 35.0, 42.0, 40.0, 34.0, 27.0, 32.0, 27.0, 28.0, 30.0, 26.0, 13.0, 15.0, 10.0, 11.0, 13.0, 7.0, 10.0, 9.0, 9.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-57.083038330078125, -55.23347091674805, -53.38390350341797, -51.53433609008789, -49.68476867675781, -47.835201263427734, -45.985633850097656, -44.13606643676758, -42.2864990234375, -40.43693161010742, -38.587364196777344, -36.737796783447266, -34.88822937011719, -33.03866195678711, -31.18909454345703, -29.339527130126953, -27.489959716796875, -25.640392303466797, -23.79082489013672, -21.94125747680664, -20.091690063476562, -18.242122650146484, -16.392555236816406, -14.542987823486328, -12.69342041015625, -10.843852996826172, -8.994285583496094, -7.144718170166016, -5.2951507568359375, -3.4455833435058594, -1.5960159301757812, 0.2535514831542969, 2.103118896484375, 3.952686309814453, 5.802253723144531, 7.651821136474609, 9.501388549804688, 11.350955963134766, 13.200523376464844, 15.050090789794922, 16.899658203125, 18.749225616455078, 20.598793029785156, 22.448360443115234, 24.297927856445312, 26.14749526977539, 27.99706268310547, 29.846630096435547, 31.696197509765625, 33.5457649230957, 35.39533233642578, 37.24489974975586, 39.09446716308594, 40.944034576416016, 42.793601989746094, 44.64316940307617, 46.49273681640625, 48.34230422973633, 50.191871643066406, 52.041439056396484, 53.89100646972656, 55.74057388305664, 57.59014129638672, 59.4397087097168, 61.289276123046875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 2.0, 10.0, 11.0, 19.0, 10.0, 20.0, 19.0, 25.0, 24.0, 34.0, 41.0, 26.0, 41.0, 38.0, 45.0, 47.0, 51.0, 54.0, 61.0, 46.0, 35.0, 42.0, 35.0, 35.0, 44.0, 20.0, 24.0, 19.0, 20.0, 14.0, 12.0, 14.0, 6.0, 9.0, 4.0, 6.0, 10.0, 2.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.515625, -9.24456787109375, -8.9735107421875, -8.70245361328125, -8.431396484375, -8.16033935546875, -7.8892822265625, -7.61822509765625, -7.34716796875, -7.07611083984375, -6.8050537109375, -6.53399658203125, -6.262939453125, -5.99188232421875, -5.7208251953125, -5.44976806640625, -5.1787109375, -4.90765380859375, -4.6365966796875, -4.36553955078125, -4.094482421875, -3.82342529296875, -3.5523681640625, -3.28131103515625, -3.01025390625, -2.73919677734375, -2.4681396484375, -2.19708251953125, -1.926025390625, -1.65496826171875, -1.3839111328125, -1.11285400390625, -0.841796875, -0.57073974609375, -0.2996826171875, -0.02862548828125, 0.242431640625, 0.51348876953125, 0.7845458984375, 1.05560302734375, 1.32666015625, 1.59771728515625, 1.8687744140625, 2.13983154296875, 2.410888671875, 2.68194580078125, 2.9530029296875, 3.22406005859375, 3.4951171875, 3.76617431640625, 4.0372314453125, 4.30828857421875, 4.579345703125, 4.85040283203125, 5.1214599609375, 5.39251708984375, 5.66357421875, 5.93463134765625, 6.2056884765625, 6.47674560546875, 6.747802734375, 7.01885986328125, 7.2899169921875, 7.56097412109375, 7.83203125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 9.0, 5.0, 6.0, 14.0, 23.0, 37.0, 53.0, 62.0, 98.0, 184.0, 288.0, 404.0, 588.0, 923.0, 1443.0, 2385.0, 3636.0, 5755.0, 9205.0, 14914.0, 24916.0, 42030.0, 72262.0, 126349.0, 231862.0, 219852.0, 119918.0, 69119.0, 39985.0, 24009.0, 14231.0, 8772.0, 5536.0, 3443.0, 2188.0, 1465.0, 862.0, 606.0, 399.0, 257.0, 146.0, 109.0, 75.0, 50.0, 24.0, 20.0, 13.0, 15.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.2003173828125, -0.19441795349121094, -0.18851852416992188, -0.1826190948486328, -0.17671966552734375, -0.1708202362060547, -0.16492080688476562, -0.15902137756347656, -0.1531219482421875, -0.14722251892089844, -0.14132308959960938, -0.1354236602783203, -0.12952423095703125, -0.12362480163574219, -0.11772537231445312, -0.11182594299316406, -0.105926513671875, -0.10002708435058594, -0.09412765502929688, -0.08822822570800781, -0.08232879638671875, -0.07642936706542969, -0.07052993774414062, -0.06463050842285156, -0.0587310791015625, -0.05283164978027344, -0.046932220458984375, -0.04103279113769531, -0.03513336181640625, -0.029233932495117188, -0.023334503173828125, -0.017435073852539062, -0.01153564453125, -0.0056362152099609375, 0.000263214111328125, 0.0061626434326171875, 0.01206207275390625, 0.017961502075195312, 0.023860931396484375, 0.029760360717773438, 0.0356597900390625, 0.04155921936035156, 0.047458648681640625, 0.05335807800292969, 0.05925750732421875, 0.06515693664550781, 0.07105636596679688, 0.07695579528808594, 0.082855224609375, 0.08875465393066406, 0.09465408325195312, 0.10055351257324219, 0.10645294189453125, 0.11235237121582031, 0.11825180053710938, 0.12415122985839844, 0.1300506591796875, 0.13595008850097656, 0.14184951782226562, 0.1477489471435547, 0.15364837646484375, 0.1595478057861328, 0.16544723510742188, 0.17134666442871094, 0.17724609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 6.0, 8.0, 10.0, 10.0, 10.0, 12.0, 11.0, 15.0, 23.0, 22.0, 20.0, 22.0, 32.0, 33.0, 35.0, 36.0, 33.0, 30.0, 45.0, 35.0, 33.0, 1061.0, 36.0, 48.0, 35.0, 38.0, 35.0, 35.0, 27.0, 31.0, 23.0, 25.0, 19.0, 26.0, 20.0, 20.0, 9.0, 5.0, 9.0, 9.0, 6.0, 4.0, 10.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.27734375, -4.13043212890625, -3.9835205078125, -3.83660888671875, -3.689697265625, -3.54278564453125, -3.3958740234375, -3.24896240234375, -3.10205078125, -2.95513916015625, -2.8082275390625, -2.66131591796875, -2.514404296875, -2.36749267578125, -2.2205810546875, -2.07366943359375, -1.9267578125, -1.77984619140625, -1.6329345703125, -1.48602294921875, -1.339111328125, -1.19219970703125, -1.0452880859375, -0.89837646484375, -0.75146484375, -0.60455322265625, -0.4576416015625, -0.31072998046875, -0.163818359375, -0.01690673828125, 0.1300048828125, 0.27691650390625, 0.423828125, 0.57073974609375, 0.7176513671875, 0.86456298828125, 1.011474609375, 1.15838623046875, 1.3052978515625, 1.45220947265625, 1.59912109375, 1.74603271484375, 1.8929443359375, 2.03985595703125, 2.186767578125, 2.33367919921875, 2.4805908203125, 2.62750244140625, 2.7744140625, 2.92132568359375, 3.0682373046875, 3.21514892578125, 3.362060546875, 3.50897216796875, 3.6558837890625, 3.80279541015625, 3.94970703125, 4.09661865234375, 4.2435302734375, 4.39044189453125, 4.537353515625, 4.68426513671875, 4.8311767578125, 4.97808837890625, 5.125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 3.0, 13.0, 18.0, 26.0, 25.0, 60.0, 78.0, 111.0, 164.0, 264.0, 365.0, 504.0, 735.0, 1056.0, 1402.0, 2032.0, 3114.0, 4511.0, 6592.0, 9780.0, 14151.0, 20706.0, 30248.0, 45080.0, 67141.0, 100897.0, 152353.0, 1234573.0, 132065.0, 87679.0, 58175.0, 38976.0, 26663.0, 18272.0, 12224.0, 8459.0, 5728.0, 4027.0, 2795.0, 1886.0, 1312.0, 866.0, 627.0, 429.0, 303.0, 210.0, 138.0, 104.0, 60.0, 50.0, 40.0, 17.0, 12.0, 5.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.06927490234375, -0.0670633316040039, -0.06485176086425781, -0.06264019012451172, -0.060428619384765625, -0.05821704864501953, -0.05600547790527344, -0.053793907165527344, -0.05158233642578125, -0.049370765686035156, -0.04715919494628906, -0.04494762420654297, -0.042736053466796875, -0.04052448272705078, -0.03831291198730469, -0.036101341247558594, -0.0338897705078125, -0.031678199768066406, -0.029466629028320312, -0.02725505828857422, -0.025043487548828125, -0.02283191680908203, -0.020620346069335938, -0.018408775329589844, -0.01619720458984375, -0.013985633850097656, -0.011774063110351562, -0.009562492370605469, -0.007350921630859375, -0.005139350891113281, -0.0029277801513671875, -0.0007162094116210938, 0.001495361328125, 0.0037069320678710938, 0.0059185028076171875, 0.008130073547363281, 0.010341644287109375, 0.012553215026855469, 0.014764785766601562, 0.016976356506347656, 0.01918792724609375, 0.021399497985839844, 0.023611068725585938, 0.02582263946533203, 0.028034210205078125, 0.03024578094482422, 0.03245735168457031, 0.034668922424316406, 0.0368804931640625, 0.039092063903808594, 0.04130363464355469, 0.04351520538330078, 0.045726776123046875, 0.04793834686279297, 0.05014991760253906, 0.052361488342285156, 0.05457305908203125, 0.056784629821777344, 0.05899620056152344, 0.06120777130126953, 0.06341934204101562, 0.06563091278076172, 0.06784248352050781, 0.0700540542602539, 0.072265625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 5.0, 9.0, 10.0, 9.0, 14.0, 24.0, 33.0, 35.0, 44.0, 40.0, 46.0, 63.0, 65.0, 56.0, 62.0, 55.0, 50.0, 51.0, 58.0, 54.0, 35.0, 31.0, 29.0, 23.0, 20.0, 17.0, 16.0, 7.0, 5.0, 6.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030612945556640625, -0.00029597803950309753, -0.0002858266234397888, -0.0002756752073764801, -0.0002655237913131714, -0.00025537237524986267, -0.00024522095918655396, -0.00023506954312324524, -0.00022491812705993652, -0.0002147667109966278, -0.0002046152949333191, -0.00019446387887001038, -0.00018431246280670166, -0.00017416104674339294, -0.00016400963068008423, -0.0001538582146167755, -0.0001437067985534668, -0.00013355538249015808, -0.00012340396642684937, -0.00011325255036354065, -0.00010310113430023193, -9.294971823692322e-05, -8.27983021736145e-05, -7.264688611030579e-05, -6.249547004699707e-05, -5.2344053983688354e-05, -4.219263792037964e-05, -3.204122185707092e-05, -2.1889805793762207e-05, -1.1738389730453491e-05, -1.5869736671447754e-06, 8.56444239616394e-06, 1.8715858459472656e-05, 2.8867274522781372e-05, 3.901869058609009e-05, 4.9170106649398804e-05, 5.932152271270752e-05, 6.947293877601624e-05, 7.962435483932495e-05, 8.977577090263367e-05, 9.992718696594238e-05, 0.0001100786030292511, 0.00012023001909255981, 0.00013038143515586853, 0.00014053285121917725, 0.00015068426728248596, 0.00016083568334579468, 0.0001709870994091034, 0.0001811385154724121, 0.00019128993153572083, 0.00020144134759902954, 0.00021159276366233826, 0.00022174417972564697, 0.0002318955957889557, 0.0002420470118522644, 0.0002521984279155731, 0.00026234984397888184, 0.00027250126004219055, 0.00028265267610549927, 0.000292804092168808, 0.0003029555082321167, 0.0003131069242954254, 0.00032325834035873413, 0.00033340975642204285, 0.00034356117248535156]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 8.0, 8.0, 13.0, 15.0, 30.0, 41.0, 53.0, 66.0, 80.0, 137.0, 179.0, 239.0, 325.0, 660.0, 6876.0, 1008033.0, 29512.0, 853.0, 404.0, 260.0, 190.0, 162.0, 105.0, 90.0, 64.0, 33.0, 32.0, 22.0, 19.0, 11.0, 10.0, 6.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00583648681640625, -0.005662977695465088, -0.005489468574523926, -0.005315959453582764, -0.0051424503326416016, -0.0049689412117004395, -0.004795432090759277, -0.004621922969818115, -0.004448413848876953, -0.004274904727935791, -0.004101395606994629, -0.003927886486053467, -0.0037543773651123047, -0.0035808682441711426, -0.0034073591232299805, -0.0032338500022888184, -0.0030603408813476562, -0.002886831760406494, -0.002713322639465332, -0.00253981351852417, -0.002366304397583008, -0.0021927952766418457, -0.0020192861557006836, -0.0018457770347595215, -0.0016722679138183594, -0.0014987587928771973, -0.0013252496719360352, -0.001151740550994873, -0.000978231430053711, -0.0008047223091125488, -0.0006312131881713867, -0.0004577040672302246, -0.0002841949462890625, -0.00011068582534790039, 6.282329559326172e-05, 0.00023633241653442383, 0.00040984153747558594, 0.000583350658416748, 0.0007568597793579102, 0.0009303689002990723, 0.0011038780212402344, 0.0012773871421813965, 0.0014508962631225586, 0.0016244053840637207, 0.0017979145050048828, 0.001971423625946045, 0.002144932746887207, 0.002318441867828369, 0.0024919509887695312, 0.0026654601097106934, 0.0028389692306518555, 0.0030124783515930176, 0.0031859874725341797, 0.003359496593475342, 0.003533005714416504, 0.003706514835357666, 0.003880023956298828, 0.00405353307723999, 0.004227042198181152, 0.0044005513191223145, 0.0045740604400634766, 0.004747569561004639, 0.004921078681945801, 0.005094587802886963, 0.005268096923828125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 24.0, 515.0, 450.0, 22.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0032828235998749733, -0.0032251852098852396, -0.003167546819895506, -0.0031099081970751286, -0.003052269807085395, -0.002994631417095661, -0.0029369930271059275, -0.0028793546371161938, -0.00282171624712646, -0.0027640778571367264, -0.0027064394671469927, -0.002648801077157259, -0.0025911624543368816, -0.002533524064347148, -0.0024758856743574142, -0.0024182472843676805, -0.002360608661547303, -0.0023029702715575695, -0.002245331881567836, -0.002187693491578102, -0.0021300548687577248, -0.002072416478767991, -0.0020147780887782574, -0.0019571396987885237, -0.00189950130879879, -0.0018418629188090563, -0.0017842244124040008, -0.001726586022414267, -0.0016689476324245334, -0.0016113091260194778, -0.0015536707360297441, -0.0014960323460400105, -0.0014383939560502768, -0.001380755566060543, -0.0013231170596554875, -0.0012654786696657538, -0.0012078402796760201, -0.0011502017732709646, -0.001092563383281231, -0.0010349249932914972, -0.0009772864868864417, -0.0009196480386890471, -0.0008620096486993134, -0.0008043712005019188, -0.0007467327523045242, -0.0006890943041071296, -0.0006314559141173959, -0.0005738174659200013, -0.0005161790177226067, -0.0004585405986290425, -0.0004009021504316479, -0.00034326373133808374, -0.00028562528314068913, -0.00022798686404712498, -0.00017034844495356083, -0.00011270999675616622, -5.507157766260207e-05, 2.566852344898507e-06, 6.020528235239908e-05, 0.00011784370872192085, 0.00017548214236740023, 0.0002331205760128796, 0.00029075899510644376, 0.00034839744330383837, 0.0004060358623974025]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 6.0, 9.0, 10.0, 10.0, 24.0, 20.0, 20.0, 23.0, 30.0, 31.0, 33.0, 27.0, 49.0, 46.0, 41.0, 59.0, 48.0, 40.0, 48.0, 42.0, 41.0, 44.0, 32.0, 38.0, 27.0, 32.0, 26.0, 31.0, 21.0, 16.0, 14.0, 12.0, 15.0, 10.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0002675056457519531, -0.0002597291022539139, -0.00025195255875587463, -0.0002441760152578354, -0.00023639947175979614, -0.0002286229282617569, -0.00022084638476371765, -0.0002130698412656784, -0.00020529329776763916, -0.00019751675426959991, -0.00018974021077156067, -0.00018196366727352142, -0.00017418712377548218, -0.00016641058027744293, -0.0001586340367794037, -0.00015085749328136444, -0.0001430809497833252, -0.00013530440628528595, -0.0001275278627872467, -0.00011975131928920746, -0.00011197477579116821, -0.00010419823229312897, -9.642168879508972e-05, -8.864514529705048e-05, -8.086860179901123e-05, -7.309205830097198e-05, -6.531551480293274e-05, -5.7538971304893494e-05, -4.976242780685425e-05, -4.1985884308815e-05, -3.420934081077576e-05, -2.643279731273651e-05, -1.8656253814697266e-05, -1.087971031665802e-05, -3.1031668186187744e-06, 4.673376679420471e-06, 1.2449920177459717e-05, 2.0226463675498962e-05, 2.8003007173538208e-05, 3.5779550671577454e-05, 4.35560941696167e-05, 5.1332637667655945e-05, 5.910918116569519e-05, 6.688572466373444e-05, 7.466226816177368e-05, 8.243881165981293e-05, 9.021535515785217e-05, 9.799189865589142e-05, 0.00010576844215393066, 0.00011354498565196991, 0.00012132152915000916, 0.0001290980726480484, 0.00013687461614608765, 0.0001446511596441269, 0.00015242770314216614, 0.00016020424664020538, 0.00016798079013824463, 0.00017575733363628387, 0.00018353387713432312, 0.00019131042063236237, 0.0001990869641304016, 0.00020686350762844086, 0.0002146400511264801, 0.00022241659462451935, 0.0002301931381225586]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 2.0, 10.0, 11.0, 19.0, 10.0, 20.0, 19.0, 25.0, 24.0, 34.0, 41.0, 26.0, 41.0, 38.0, 45.0, 47.0, 51.0, 54.0, 61.0, 46.0, 35.0, 42.0, 35.0, 35.0, 44.0, 20.0, 24.0, 19.0, 20.0, 14.0, 12.0, 14.0, 6.0, 9.0, 4.0, 6.0, 10.0, 2.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.515625, -9.24456787109375, -8.9735107421875, -8.70245361328125, -8.431396484375, -8.16033935546875, -7.8892822265625, -7.61822509765625, -7.34716796875, -7.07611083984375, -6.8050537109375, -6.53399658203125, -6.262939453125, -5.99188232421875, -5.7208251953125, -5.44976806640625, -5.1787109375, -4.90765380859375, -4.6365966796875, -4.36553955078125, -4.094482421875, -3.82342529296875, -3.5523681640625, -3.28131103515625, -3.01025390625, -2.73919677734375, -2.4681396484375, -2.19708251953125, -1.926025390625, -1.65496826171875, -1.3839111328125, -1.11285400390625, -0.841796875, -0.57073974609375, -0.2996826171875, -0.02862548828125, 0.242431640625, 0.51348876953125, 0.7845458984375, 1.05560302734375, 1.32666015625, 1.59771728515625, 1.8687744140625, 2.13983154296875, 2.410888671875, 2.68194580078125, 2.9530029296875, 3.22406005859375, 3.4951171875, 3.76617431640625, 4.0372314453125, 4.30828857421875, 4.579345703125, 4.85040283203125, 5.1214599609375, 5.39251708984375, 5.66357421875, 5.93463134765625, 6.2056884765625, 6.47674560546875, 6.747802734375, 7.01885986328125, 7.2899169921875, 7.56097412109375, 7.83203125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 11.0, 12.0, 6.0, 23.0, 18.0, 25.0, 27.0, 39.0, 51.0, 67.0, 114.0, 170.0, 277.0, 453.0, 729.0, 1187.0, 2020.0, 3901.0, 8089.0, 22896.0, 163588.0, 771201.0, 48504.0, 12944.0, 5415.0, 2725.0, 1526.0, 908.0, 564.0, 344.0, 219.0, 153.0, 101.0, 71.0, 45.0, 38.0, 23.0, 10.0, 12.0, 8.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.96875, -25.080810546875, -24.19287109375, -23.304931640625, -22.4169921875, -21.529052734375, -20.64111328125, -19.753173828125, -18.865234375, -17.977294921875, -17.08935546875, -16.201416015625, -15.3134765625, -14.425537109375, -13.53759765625, -12.649658203125, -11.76171875, -10.873779296875, -9.98583984375, -9.097900390625, -8.2099609375, -7.322021484375, -6.43408203125, -5.546142578125, -4.658203125, -3.770263671875, -2.88232421875, -1.994384765625, -1.1064453125, -0.218505859375, 0.66943359375, 1.557373046875, 2.4453125, 3.333251953125, 4.22119140625, 5.109130859375, 5.9970703125, 6.885009765625, 7.77294921875, 8.660888671875, 9.548828125, 10.436767578125, 11.32470703125, 12.212646484375, 13.1005859375, 13.988525390625, 14.87646484375, 15.764404296875, 16.65234375, 17.540283203125, 18.42822265625, 19.316162109375, 20.2041015625, 21.092041015625, 21.97998046875, 22.867919921875, 23.755859375, 24.643798828125, 25.53173828125, 26.419677734375, 27.3076171875, 28.195556640625, 29.08349609375, 29.971435546875, 30.859375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 7.0, 11.0, 13.0, 15.0, 19.0, 21.0, 28.0, 33.0, 38.0, 44.0, 38.0, 34.0, 54.0, 86.0, 147.0, 1565.0, 315.0, 114.0, 68.0, 53.0, 32.0, 45.0, 28.0, 35.0, 36.0, 27.0, 18.0, 23.0, 22.0, 12.0, 6.0, 16.0, 7.0, 6.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-28.5625, -27.63525390625, -26.7080078125, -25.78076171875, -24.853515625, -23.92626953125, -22.9990234375, -22.07177734375, -21.14453125, -20.21728515625, -19.2900390625, -18.36279296875, -17.435546875, -16.50830078125, -15.5810546875, -14.65380859375, -13.7265625, -12.79931640625, -11.8720703125, -10.94482421875, -10.017578125, -9.09033203125, -8.1630859375, -7.23583984375, -6.30859375, -5.38134765625, -4.4541015625, -3.52685546875, -2.599609375, -1.67236328125, -0.7451171875, 0.18212890625, 1.109375, 2.03662109375, 2.9638671875, 3.89111328125, 4.818359375, 5.74560546875, 6.6728515625, 7.60009765625, 8.52734375, 9.45458984375, 10.3818359375, 11.30908203125, 12.236328125, 13.16357421875, 14.0908203125, 15.01806640625, 15.9453125, 16.87255859375, 17.7998046875, 18.72705078125, 19.654296875, 20.58154296875, 21.5087890625, 22.43603515625, 23.36328125, 24.29052734375, 25.2177734375, 26.14501953125, 27.072265625, 27.99951171875, 28.9267578125, 29.85400390625, 30.78125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 7.0, 4.0, 11.0, 5.0, 11.0, 18.0, 30.0, 32.0, 38.0, 58.0, 85.0, 129.0, 235.0, 521.0, 1173.0, 3109.0, 10721.0, 75919.0, 2939636.0, 96013.0, 12091.0, 3410.0, 1270.0, 506.0, 249.0, 133.0, 77.0, 61.0, 45.0, 27.0, 19.0, 13.0, 17.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-49.53125, -48.09716796875, -46.6630859375, -45.22900390625, -43.794921875, -42.36083984375, -40.9267578125, -39.49267578125, -38.05859375, -36.62451171875, -35.1904296875, -33.75634765625, -32.322265625, -30.88818359375, -29.4541015625, -28.02001953125, -26.5859375, -25.15185546875, -23.7177734375, -22.28369140625, -20.849609375, -19.41552734375, -17.9814453125, -16.54736328125, -15.11328125, -13.67919921875, -12.2451171875, -10.81103515625, -9.376953125, -7.94287109375, -6.5087890625, -5.07470703125, -3.640625, -2.20654296875, -0.7724609375, 0.66162109375, 2.095703125, 3.52978515625, 4.9638671875, 6.39794921875, 7.83203125, 9.26611328125, 10.7001953125, 12.13427734375, 13.568359375, 15.00244140625, 16.4365234375, 17.87060546875, 19.3046875, 20.73876953125, 22.1728515625, 23.60693359375, 25.041015625, 26.47509765625, 27.9091796875, 29.34326171875, 30.77734375, 32.21142578125, 33.6455078125, 35.07958984375, 36.513671875, 37.94775390625, 39.3818359375, 40.81591796875, 42.25]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [3.0, 25.0, 153.0, 563.0, 222.0, 39.0, 10.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.226104736328125, -21.176929473876953, -13.127754211425781, -5.078578948974609, 2.9705963134765625, 11.019771575927734, 19.068946838378906, 27.118122100830078, 35.16729736328125, 43.21647262573242, 51.265647888183594, 59.314823150634766, 67.36399841308594, 75.41317749023438, 83.46234893798828, 91.51152038574219, 99.56069946289062, 107.60987854003906, 115.65904998779297, 123.70822143554688, 131.7574005126953, 139.80657958984375, 147.85574340820312, 155.90492248535156, 163.9541015625, 172.00328063964844, 180.05245971679688, 188.10162353515625, 196.1508026123047, 204.19998168945312, 212.2491455078125, 220.29832458496094, 228.3475341796875, 236.39671325683594, 244.44589233398438, 252.49505615234375, 260.54425048828125, 268.5934143066406, 276.642578125, 284.6917724609375, 292.7409362792969, 300.79010009765625, 308.83929443359375, 316.8884582519531, 324.9376220703125, 332.98681640625, 341.0359802246094, 349.0851745605469, 357.13433837890625, 365.1835021972656, 373.2326965332031, 381.2818603515625, 389.3310546875, 397.3802185058594, 405.42938232421875, 413.47857666015625, 421.5277404785156, 429.576904296875, 437.6260986328125, 445.6752624511719, 453.72442626953125, 461.77362060546875, 469.8227844238281, 477.8719787597656, 485.921142578125]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 4.0, 9.0, 16.0, 7.0, 17.0, 14.0, 20.0, 29.0, 26.0, 28.0, 27.0, 22.0, 40.0, 33.0, 33.0, 43.0, 35.0, 41.0, 43.0, 44.0, 50.0, 40.0, 40.0, 37.0, 36.0, 37.0, 34.0, 36.0, 33.0, 12.0, 17.0, 13.0, 14.0, 11.0, 16.0, 4.0, 11.0, 5.0, 3.0, 6.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-90.70098876953125, -87.95838928222656, -85.21578979492188, -82.47319030761719, -79.7305908203125, -76.98799133300781, -74.24539184570312, -71.5027847290039, -68.76018524169922, -66.01758575439453, -63.274986267089844, -60.532386779785156, -57.7897834777832, -55.047183990478516, -52.30458450317383, -49.561981201171875, -46.81938552856445, -44.076786041259766, -41.33418655395508, -38.591583251953125, -35.84898376464844, -33.10638427734375, -30.363784790039062, -27.621183395385742, -24.878583908081055, -22.135984420776367, -19.393383026123047, -16.65078353881836, -13.908183097839355, -11.165582656860352, -8.422983169555664, -5.680381774902344, -2.9377822875976562, -0.19518208503723145, 2.5474181175231934, 5.290018081665039, 8.032618522644043, 10.775218963623047, 13.517818450927734, 16.260419845581055, 19.003019332885742, 21.74561882019043, 24.48822021484375, 27.230819702148438, 29.973419189453125, 32.71601867675781, 35.4586181640625, 38.20122146606445, 40.94382095336914, 43.68642044067383, 46.429019927978516, 49.17162322998047, 51.914222717285156, 54.656822204589844, 57.39942169189453, 60.14202117919922, 62.884620666503906, 65.6272201538086, 68.36981964111328, 71.11241912841797, 73.85501861572266, 76.59762573242188, 79.34022521972656, 82.08282470703125, 84.82542419433594]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 13.0, 11.0, 13.0, 14.0, 33.0, 19.0, 19.0, 30.0, 31.0, 36.0, 46.0, 32.0, 47.0, 39.0, 43.0, 56.0, 55.0, 42.0, 48.0, 45.0, 36.0, 39.0, 35.0, 29.0, 29.0, 23.0, 18.0, 15.0, 20.0, 8.0, 12.0, 8.0, 6.0, 3.0, 12.0, 4.0, 3.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-9.9921875, -9.7122802734375, -9.432373046875, -9.1524658203125, -8.87255859375, -8.5926513671875, -8.312744140625, -8.0328369140625, -7.7529296875, -7.4730224609375, -7.193115234375, -6.9132080078125, -6.63330078125, -6.3533935546875, -6.073486328125, -5.7935791015625, -5.513671875, -5.2337646484375, -4.953857421875, -4.6739501953125, -4.39404296875, -4.1141357421875, -3.834228515625, -3.5543212890625, -3.2744140625, -2.9945068359375, -2.714599609375, -2.4346923828125, -2.15478515625, -1.8748779296875, -1.594970703125, -1.3150634765625, -1.03515625, -0.7552490234375, -0.475341796875, -0.1954345703125, 0.08447265625, 0.3643798828125, 0.644287109375, 0.9241943359375, 1.2041015625, 1.4840087890625, 1.763916015625, 2.0438232421875, 2.32373046875, 2.6036376953125, 2.883544921875, 3.1634521484375, 3.443359375, 3.7232666015625, 4.003173828125, 4.2830810546875, 4.56298828125, 4.8428955078125, 5.122802734375, 5.4027099609375, 5.6826171875, 5.9625244140625, 6.242431640625, 6.5223388671875, 6.80224609375, 7.0821533203125, 7.362060546875, 7.6419677734375, 7.921875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 6.0, 8.0, 15.0, 17.0, 27.0, 30.0, 62.0, 69.0, 80.0, 126.0, 168.0, 243.0, 354.0, 519.0, 825.0, 1268.0, 2129.0, 3388.0, 6329.0, 13207.0, 46986.0, 471690.0, 2929203.0, 622923.0, 62956.0, 14921.0, 7000.0, 3668.0, 2220.0, 1325.0, 771.0, 582.0, 384.0, 243.0, 172.0, 108.0, 75.0, 65.0, 32.0, 25.0, 15.0, 15.0, 9.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0], "bins": [-23.328125, -22.68994140625, -22.0517578125, -21.41357421875, -20.775390625, -20.13720703125, -19.4990234375, -18.86083984375, -18.22265625, -17.58447265625, -16.9462890625, -16.30810546875, -15.669921875, -15.03173828125, -14.3935546875, -13.75537109375, -13.1171875, -12.47900390625, -11.8408203125, -11.20263671875, -10.564453125, -9.92626953125, -9.2880859375, -8.64990234375, -8.01171875, -7.37353515625, -6.7353515625, -6.09716796875, -5.458984375, -4.82080078125, -4.1826171875, -3.54443359375, -2.90625, -2.26806640625, -1.6298828125, -0.99169921875, -0.353515625, 0.28466796875, 0.9228515625, 1.56103515625, 2.19921875, 2.83740234375, 3.4755859375, 4.11376953125, 4.751953125, 5.39013671875, 6.0283203125, 6.66650390625, 7.3046875, 7.94287109375, 8.5810546875, 9.21923828125, 9.857421875, 10.49560546875, 11.1337890625, 11.77197265625, 12.41015625, 13.04833984375, 13.6865234375, 14.32470703125, 14.962890625, 15.60107421875, 16.2392578125, 16.87744140625, 17.515625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 1.0, 5.0, 4.0, 5.0, 4.0, 8.0, 6.0, 12.0, 21.0, 19.0, 26.0, 38.0, 44.0, 61.0, 97.0, 172.0, 361.0, 688.0, 888.0, 653.0, 394.0, 191.0, 113.0, 57.0, 39.0, 39.0, 21.0, 28.0, 13.0, 11.0, 12.0, 8.0, 10.0, 5.0, 2.0, 8.0, 2.0, 5.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.046875, -25.270263671875, -24.49365234375, -23.717041015625, -22.9404296875, -22.163818359375, -21.38720703125, -20.610595703125, -19.833984375, -19.057373046875, -18.28076171875, -17.504150390625, -16.7275390625, -15.950927734375, -15.17431640625, -14.397705078125, -13.62109375, -12.844482421875, -12.06787109375, -11.291259765625, -10.5146484375, -9.738037109375, -8.96142578125, -8.184814453125, -7.408203125, -6.631591796875, -5.85498046875, -5.078369140625, -4.3017578125, -3.525146484375, -2.74853515625, -1.971923828125, -1.1953125, -0.418701171875, 0.35791015625, 1.134521484375, 1.9111328125, 2.687744140625, 3.46435546875, 4.240966796875, 5.017578125, 5.794189453125, 6.57080078125, 7.347412109375, 8.1240234375, 8.900634765625, 9.67724609375, 10.453857421875, 11.23046875, 12.007080078125, 12.78369140625, 13.560302734375, 14.3369140625, 15.113525390625, 15.89013671875, 16.666748046875, 17.443359375, 18.219970703125, 18.99658203125, 19.773193359375, 20.5498046875, 21.326416015625, 22.10302734375, 22.879638671875, 23.65625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 9.0, 8.0, 27.0, 23.0, 35.0, 56.0, 67.0, 121.0, 164.0, 235.0, 450.0, 669.0, 1146.0, 1891.0, 3316.0, 6232.0, 12220.0, 27491.0, 79096.0, 563008.0, 3055936.0, 333827.0, 61755.0, 23047.0, 10693.0, 5328.0, 2979.0, 1704.0, 968.0, 596.0, 421.0, 259.0, 182.0, 96.0, 68.0, 48.0, 26.0, 22.0, 18.0, 13.0, 13.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.484375, -23.678955078125, -22.87353515625, -22.068115234375, -21.2626953125, -20.457275390625, -19.65185546875, -18.846435546875, -18.041015625, -17.235595703125, -16.43017578125, -15.624755859375, -14.8193359375, -14.013916015625, -13.20849609375, -12.403076171875, -11.59765625, -10.792236328125, -9.98681640625, -9.181396484375, -8.3759765625, -7.570556640625, -6.76513671875, -5.959716796875, -5.154296875, -4.348876953125, -3.54345703125, -2.738037109375, -1.9326171875, -1.127197265625, -0.32177734375, 0.483642578125, 1.2890625, 2.094482421875, 2.89990234375, 3.705322265625, 4.5107421875, 5.316162109375, 6.12158203125, 6.927001953125, 7.732421875, 8.537841796875, 9.34326171875, 10.148681640625, 10.9541015625, 11.759521484375, 12.56494140625, 13.370361328125, 14.17578125, 14.981201171875, 15.78662109375, 16.592041015625, 17.3974609375, 18.202880859375, 19.00830078125, 19.813720703125, 20.619140625, 21.424560546875, 22.22998046875, 23.035400390625, 23.8408203125, 24.646240234375, 25.45166015625, 26.257080078125, 27.0625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 35.0, 91.0, 262.0, 384.0, 162.0, 47.0, 16.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.69752502441406, -81.86127471923828, -73.02503204345703, -64.18878173828125, -55.352535247802734, -46.51628875732422, -37.68003845214844, -28.843791961669922, -20.007545471191406, -11.171298027038574, -2.335050582885742, 6.501197814941406, 15.337444305419922, 24.173690795898438, 33.00994110107422, 41.846187591552734, 50.68243408203125, 59.518680572509766, 68.35492706298828, 77.19117736816406, 86.02742004394531, 94.8636703491211, 103.69992065429688, 112.53616333007812, 121.3724136352539, 130.2086639404297, 139.04490661621094, 147.88116455078125, 156.7174072265625, 165.55364990234375, 174.389892578125, 183.2261505126953, 192.06240844726562, 200.89865112304688, 209.7349090576172, 218.57115173339844, 227.4073944091797, 236.24365234375, 245.07989501953125, 253.9161376953125, 262.75238037109375, 271.588623046875, 280.42486572265625, 289.2611083984375, 298.0973815917969, 306.9336242675781, 315.7698669433594, 324.6061096191406, 333.4423828125, 342.27862548828125, 351.1148681640625, 359.95111083984375, 368.7873840332031, 377.6236267089844, 386.4598693847656, 395.2961120605469, 404.1323547363281, 412.9685974121094, 421.8048400878906, 430.64111328125, 439.47735595703125, 448.3135986328125, 457.14984130859375, 465.986083984375, 474.82232666015625]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 7.0, 5.0, 7.0, 8.0, 14.0, 11.0, 21.0, 20.0, 16.0, 22.0, 28.0, 28.0, 30.0, 33.0, 44.0, 39.0, 36.0, 40.0, 44.0, 35.0, 41.0, 33.0, 46.0, 37.0, 33.0, 41.0, 28.0, 34.0, 25.0, 34.0, 23.0, 23.0, 25.0, 18.0, 7.0, 11.0, 5.0, 13.0, 7.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-68.72080993652344, -66.65535736083984, -64.58990478515625, -62.52445983886719, -60.459007263183594, -58.3935546875, -56.32810592651367, -54.262657165527344, -52.19720458984375, -50.131752014160156, -48.06630325317383, -46.0008544921875, -43.935401916503906, -41.86994934082031, -39.804500579833984, -37.739051818847656, -35.67359924316406, -33.60814666748047, -31.54269790649414, -29.47724723815918, -27.41179656982422, -25.346345901489258, -23.280895233154297, -21.215444564819336, -19.149993896484375, -17.084543228149414, -15.019092559814453, -12.953641891479492, -10.888191223144531, -8.82274055480957, -6.757289886474609, -4.691839218139648, -2.6263885498046875, -0.5609378814697266, 1.5045127868652344, 3.5699634552001953, 5.635414123535156, 7.700864791870117, 9.766315460205078, 11.831766128540039, 13.897216796875, 15.962667465209961, 18.028118133544922, 20.093568801879883, 22.159019470214844, 24.224470138549805, 26.289920806884766, 28.355371475219727, 30.420822143554688, 32.48627471923828, 34.55172348022461, 36.61717224121094, 38.68262481689453, 40.748077392578125, 42.81352615356445, 44.87897491455078, 46.944427490234375, 49.00988006591797, 51.0753288269043, 53.140777587890625, 55.20623016357422, 57.27168273925781, 59.33713150024414, 61.40258026123047, 63.46803283691406]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 5.0, 6.0, 10.0, 17.0, 11.0, 9.0, 16.0, 21.0, 20.0, 30.0, 29.0, 35.0, 39.0, 33.0, 41.0, 39.0, 55.0, 34.0, 38.0, 43.0, 49.0, 48.0, 46.0, 32.0, 36.0, 34.0, 25.0, 32.0, 28.0, 24.0, 19.0, 10.0, 16.0, 7.0, 11.0, 12.0, 6.0, 9.0, 3.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-9.5546875, -9.28680419921875, -9.0189208984375, -8.75103759765625, -8.483154296875, -8.21527099609375, -7.9473876953125, -7.67950439453125, -7.41162109375, -7.14373779296875, -6.8758544921875, -6.60797119140625, -6.340087890625, -6.07220458984375, -5.8043212890625, -5.53643798828125, -5.2685546875, -5.00067138671875, -4.7327880859375, -4.46490478515625, -4.197021484375, -3.92913818359375, -3.6612548828125, -3.39337158203125, -3.12548828125, -2.85760498046875, -2.5897216796875, -2.32183837890625, -2.053955078125, -1.78607177734375, -1.5181884765625, -1.25030517578125, -0.982421875, -0.71453857421875, -0.4466552734375, -0.17877197265625, 0.089111328125, 0.35699462890625, 0.6248779296875, 0.89276123046875, 1.16064453125, 1.42852783203125, 1.6964111328125, 1.96429443359375, 2.232177734375, 2.50006103515625, 2.7679443359375, 3.03582763671875, 3.3037109375, 3.57159423828125, 3.8394775390625, 4.10736083984375, 4.375244140625, 4.64312744140625, 4.9110107421875, 5.17889404296875, 5.44677734375, 5.71466064453125, 5.9825439453125, 6.25042724609375, 6.518310546875, 6.78619384765625, 7.0540771484375, 7.32196044921875, 7.58984375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 1.0, 6.0, 7.0, 6.0, 11.0, 21.0, 25.0, 47.0, 53.0, 105.0, 137.0, 198.0, 228.0, 347.0, 453.0, 694.0, 941.0, 1414.0, 2069.0, 3031.0, 4375.0, 6617.0, 9942.0, 15281.0, 23662.0, 37226.0, 59597.0, 96489.0, 158861.0, 222728.0, 151581.0, 92177.0, 56968.0, 35597.0, 22982.0, 14834.0, 9638.0, 6352.0, 4185.0, 2967.0, 2014.0, 1423.0, 1015.0, 695.0, 458.0, 341.0, 241.0, 164.0, 117.0, 65.0, 59.0, 33.0, 27.0, 17.0, 14.0, 9.0, 8.0, 7.0, 2.0, 2.0], "bins": [-0.1878662109375, -0.1822509765625, -0.1766357421875, -0.1710205078125, -0.1654052734375, -0.1597900390625, -0.1541748046875, -0.1485595703125, -0.1429443359375, -0.1373291015625, -0.1317138671875, -0.1260986328125, -0.1204833984375, -0.1148681640625, -0.1092529296875, -0.1036376953125, -0.0980224609375, -0.0924072265625, -0.0867919921875, -0.0811767578125, -0.0755615234375, -0.0699462890625, -0.0643310546875, -0.0587158203125, -0.0531005859375, -0.0474853515625, -0.0418701171875, -0.0362548828125, -0.0306396484375, -0.0250244140625, -0.0194091796875, -0.0137939453125, -0.0081787109375, -0.0025634765625, 0.0030517578125, 0.0086669921875, 0.0142822265625, 0.0198974609375, 0.0255126953125, 0.0311279296875, 0.0367431640625, 0.0423583984375, 0.0479736328125, 0.0535888671875, 0.0592041015625, 0.0648193359375, 0.0704345703125, 0.0760498046875, 0.0816650390625, 0.0872802734375, 0.0928955078125, 0.0985107421875, 0.1041259765625, 0.1097412109375, 0.1153564453125, 0.1209716796875, 0.1265869140625, 0.1322021484375, 0.1378173828125, 0.1434326171875, 0.1490478515625, 0.1546630859375, 0.1602783203125, 0.1658935546875, 0.1715087890625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 8.0, 9.0, 10.0, 11.0, 10.0, 16.0, 12.0, 14.0, 24.0, 17.0, 28.0, 28.0, 36.0, 27.0, 30.0, 31.0, 31.0, 31.0, 35.0, 35.0, 1070.0, 39.0, 27.0, 44.0, 28.0, 46.0, 42.0, 26.0, 31.0, 26.0, 29.0, 19.0, 16.0, 25.0, 14.0, 10.0, 17.0, 11.0, 14.0, 4.0, 14.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0], "bins": [-5.1953125, -5.03619384765625, -4.8770751953125, -4.71795654296875, -4.558837890625, -4.39971923828125, -4.2406005859375, -4.08148193359375, -3.92236328125, -3.76324462890625, -3.6041259765625, -3.44500732421875, -3.285888671875, -3.12677001953125, -2.9676513671875, -2.80853271484375, -2.6494140625, -2.49029541015625, -2.3311767578125, -2.17205810546875, -2.012939453125, -1.85382080078125, -1.6947021484375, -1.53558349609375, -1.37646484375, -1.21734619140625, -1.0582275390625, -0.89910888671875, -0.739990234375, -0.58087158203125, -0.4217529296875, -0.26263427734375, -0.103515625, 0.05560302734375, 0.2147216796875, 0.37384033203125, 0.532958984375, 0.69207763671875, 0.8511962890625, 1.01031494140625, 1.16943359375, 1.32855224609375, 1.4876708984375, 1.64678955078125, 1.805908203125, 1.96502685546875, 2.1241455078125, 2.28326416015625, 2.4423828125, 2.60150146484375, 2.7606201171875, 2.91973876953125, 3.078857421875, 3.23797607421875, 3.3970947265625, 3.55621337890625, 3.71533203125, 3.87445068359375, 4.0335693359375, 4.19268798828125, 4.351806640625, 4.51092529296875, 4.6700439453125, 4.82916259765625, 4.98828125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 7.0, 9.0, 13.0, 9.0, 25.0, 38.0, 44.0, 83.0, 102.0, 144.0, 184.0, 316.0, 453.0, 682.0, 929.0, 1320.0, 1859.0, 2735.0, 4058.0, 5818.0, 8463.0, 12004.0, 17327.0, 24558.0, 35361.0, 50418.0, 72972.0, 107421.0, 165542.0, 1205452.0, 117356.0, 79724.0, 55293.0, 38362.0, 26893.0, 18773.0, 12894.0, 8941.0, 6372.0, 4322.0, 3013.0, 2126.0, 1457.0, 977.0, 686.0, 489.0, 362.0, 253.0, 153.0, 114.0, 80.0, 55.0, 37.0, 23.0, 11.0, 13.0, 7.0, 6.0, 6.0, 2.0, 1.0], "bins": [-0.07403564453125, -0.0717306137084961, -0.06942558288574219, -0.06712055206298828, -0.06481552124023438, -0.06251049041748047, -0.06020545959472656, -0.057900428771972656, -0.05559539794921875, -0.053290367126464844, -0.05098533630371094, -0.04868030548095703, -0.046375274658203125, -0.04407024383544922, -0.04176521301269531, -0.039460182189941406, -0.0371551513671875, -0.034850120544433594, -0.03254508972167969, -0.03024005889892578, -0.027935028076171875, -0.02562999725341797, -0.023324966430664062, -0.021019935607910156, -0.01871490478515625, -0.016409873962402344, -0.014104843139648438, -0.011799812316894531, -0.009494781494140625, -0.007189750671386719, -0.0048847198486328125, -0.0025796890258789062, -0.000274658203125, 0.0020303726196289062, 0.0043354034423828125, 0.006640434265136719, 0.008945465087890625, 0.011250495910644531, 0.013555526733398438, 0.015860557556152344, 0.01816558837890625, 0.020470619201660156, 0.022775650024414062, 0.02508068084716797, 0.027385711669921875, 0.02969074249267578, 0.03199577331542969, 0.034300804138183594, 0.0366058349609375, 0.038910865783691406, 0.04121589660644531, 0.04352092742919922, 0.045825958251953125, 0.04813098907470703, 0.05043601989746094, 0.052741050720214844, 0.05504608154296875, 0.057351112365722656, 0.05965614318847656, 0.06196117401123047, 0.06426620483398438, 0.06657123565673828, 0.06887626647949219, 0.0711812973022461, 0.073486328125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 3.0, 15.0, 14.0, 15.0, 16.0, 21.0, 23.0, 21.0, 36.0, 47.0, 50.0, 57.0, 60.0, 68.0, 62.0, 59.0, 59.0, 58.0, 52.0, 47.0, 43.0, 36.0, 20.0, 20.0, 19.0, 14.0, 15.0, 10.0, 6.0, 8.0, 4.0, 10.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0008215904235839844, -0.0007985308766365051, -0.0007754713296890259, -0.0007524117827415466, -0.0007293522357940674, -0.0007062926888465881, -0.0006832331418991089, -0.0006601735949516296, -0.0006371140480041504, -0.0006140545010566711, -0.0005909949541091919, -0.0005679354071617126, -0.0005448758602142334, -0.0005218163132667542, -0.0004987567663192749, -0.00047569721937179565, -0.0004526376724243164, -0.00042957812547683716, -0.0004065185785293579, -0.00038345903158187866, -0.0003603994846343994, -0.00033733993768692017, -0.0003142803907394409, -0.00029122084379196167, -0.0002681612968444824, -0.0002451017498970032, -0.00022204220294952393, -0.00019898265600204468, -0.00017592310905456543, -0.00015286356210708618, -0.00012980401515960693, -0.00010674446821212769, -8.368492126464844e-05, -6.062537431716919e-05, -3.756582736968994e-05, -1.4506280422210693e-05, 8.553266525268555e-06, 3.16128134727478e-05, 5.467236042022705e-05, 7.77319073677063e-05, 0.00010079145431518555, 0.0001238510012626648, 0.00014691054821014404, 0.0001699700951576233, 0.00019302964210510254, 0.0002160891890525818, 0.00023914873600006104, 0.0002622082829475403, 0.00028526782989501953, 0.0003083273768424988, 0.00033138692378997803, 0.0003544464707374573, 0.0003775060176849365, 0.00040056556463241577, 0.000423625111579895, 0.00044668465852737427, 0.0004697442054748535, 0.0004928037524223328, 0.000515863299369812, 0.0005389228463172913, 0.0005619823932647705, 0.0005850419402122498, 0.000608101487159729, 0.0006311610341072083, 0.0006542205810546875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 5.0, 9.0, 6.0, 15.0, 15.0, 15.0, 21.0, 41.0, 31.0, 60.0, 86.0, 140.0, 161.0, 229.0, 417.0, 1007.0, 26295.0, 1011221.0, 6912.0, 742.0, 356.0, 224.0, 150.0, 106.0, 76.0, 62.0, 42.0, 31.0, 25.0, 17.0, 18.0, 4.0, 4.0, 6.0, 5.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01171112060546875, -0.011298298835754395, -0.010885477066040039, -0.010472655296325684, -0.010059833526611328, -0.009647011756896973, -0.009234189987182617, -0.008821368217468262, -0.008408546447753906, -0.00799572467803955, -0.007582902908325195, -0.00717008113861084, -0.006757259368896484, -0.006344437599182129, -0.0059316158294677734, -0.005518794059753418, -0.0051059722900390625, -0.004693150520324707, -0.0042803287506103516, -0.003867506980895996, -0.0034546852111816406, -0.003041863441467285, -0.0026290416717529297, -0.0022162199020385742, -0.0018033981323242188, -0.0013905763626098633, -0.0009777545928955078, -0.0005649328231811523, -0.00015211105346679688, 0.0002607107162475586, 0.0006735324859619141, 0.0010863542556762695, 0.001499176025390625, 0.0019119977951049805, 0.002324819564819336, 0.0027376413345336914, 0.003150463104248047, 0.0035632848739624023, 0.003976106643676758, 0.004388928413391113, 0.004801750183105469, 0.005214571952819824, 0.00562739372253418, 0.006040215492248535, 0.006453037261962891, 0.006865859031677246, 0.0072786808013916016, 0.007691502571105957, 0.008104324340820312, 0.008517146110534668, 0.008929967880249023, 0.009342789649963379, 0.009755611419677734, 0.01016843318939209, 0.010581254959106445, 0.0109940767288208, 0.011406898498535156, 0.011819720268249512, 0.012232542037963867, 0.012645363807678223, 0.013058185577392578, 0.013471007347106934, 0.013883829116821289, 0.014296650886535645, 0.01470947265625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 925.0, 84.0, 0.0, 1.0], "bins": [-0.025905147194862366, -0.025479130446910858, -0.02505311369895935, -0.024627096951007843, -0.024201078340411186, -0.02377506159245968, -0.02334904484450817, -0.022923028096556664, -0.022497011348605156, -0.02207099460065365, -0.02164497785270214, -0.021218961104750633, -0.020792942494153976, -0.02036692574620247, -0.01994090899825096, -0.019514892250299454, -0.019088875502347946, -0.01866285875439644, -0.01823684200644493, -0.017810825258493423, -0.017384806647896767, -0.01695878989994526, -0.01653277315199375, -0.016106756404042244, -0.015680739656090736, -0.015254722908139229, -0.014828705228865147, -0.014402688480913639, -0.013976671732962132, -0.01355065405368805, -0.013124637305736542, -0.012698620557785034, -0.012272601947188377, -0.01184658519923687, -0.011420567519962788, -0.01099455077201128, -0.010568534024059772, -0.01014251634478569, -0.009716499596834183, -0.009290482848882675, -0.008864466100931168, -0.00843844935297966, -0.008012431673705578, -0.00758641492575407, -0.007160398177802563, -0.006734380964189768, -0.006308363750576973, -0.005882347002625465, -0.005456330254673958, -0.005030313041061163, -0.004604296293109655, -0.0041782790794968605, -0.003752262331545353, -0.003326245117932558, -0.002900228137150407, -0.0024742111563682556, -0.0020481941755861044, -0.0016221771948039532, -0.001196160214021802, -0.0007701431168243289, -0.0003441261360421777, 8.189096115529537e-05, 0.0005079079419374466, 0.0009339249227195978, 0.001359941903501749]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 12.0, 8.0, 11.0, 20.0, 14.0, 41.0, 46.0, 60.0, 61.0, 74.0, 79.0, 85.0, 81.0, 68.0, 61.0, 64.0, 59.0, 39.0, 32.0, 27.0, 27.0, 15.0, 13.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008486509323120117, -0.0008117500692605972, -0.0007748492062091827, -0.0007379483431577682, -0.0007010474801063538, -0.0006641466170549393, -0.0006272457540035248, -0.0005903448909521103, -0.0005534440279006958, -0.0005165431648492813, -0.0004796423017978668, -0.00044274143874645233, -0.00040584057569503784, -0.00036893971264362335, -0.00033203884959220886, -0.00029513798654079437, -0.0002582371234893799, -0.0002213362604379654, -0.0001844353973865509, -0.00014753453433513641, -0.00011063367128372192, -7.373280823230743e-05, -3.6831945180892944e-05, 6.891787052154541e-08, 3.6969780921936035e-05, 7.387064397335052e-05, 0.00011077150702476501, 0.0001476723700761795, 0.000184573233127594, 0.00022147409617900848, 0.000258374959230423, 0.00029527582228183746, 0.00033217668533325195, 0.00036907754838466644, 0.00040597841143608093, 0.0004428792744874954, 0.0004797801375389099, 0.0005166810005903244, 0.0005535818636417389, 0.0005904827266931534, 0.0006273835897445679, 0.0006642844527959824, 0.0007011853158473969, 0.0007380861788988113, 0.0007749870419502258, 0.0008118879050016403, 0.0008487887680530548, 0.0008856896311044693, 0.0009225904941558838, 0.0009594913572072983, 0.0009963922202587128, 0.0010332930833101273, 0.0010701939463615417, 0.0011070948094129562, 0.0011439956724643707, 0.0011808965355157852, 0.0012177973985671997, 0.0012546982616186142, 0.0012915991246700287, 0.0013284999877214432, 0.0013654008507728577, 0.0014023017138242722, 0.0014392025768756866, 0.0014761034399271011, 0.0015130043029785156]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 5.0, 6.0, 10.0, 17.0, 11.0, 9.0, 16.0, 21.0, 20.0, 30.0, 29.0, 35.0, 39.0, 33.0, 41.0, 39.0, 55.0, 34.0, 38.0, 43.0, 49.0, 48.0, 46.0, 32.0, 36.0, 34.0, 25.0, 32.0, 28.0, 24.0, 19.0, 10.0, 16.0, 7.0, 11.0, 12.0, 6.0, 9.0, 3.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-9.5546875, -9.28680419921875, -9.0189208984375, -8.75103759765625, -8.483154296875, -8.21527099609375, -7.9473876953125, -7.67950439453125, -7.41162109375, -7.14373779296875, -6.8758544921875, -6.60797119140625, -6.340087890625, -6.07220458984375, -5.8043212890625, -5.53643798828125, -5.2685546875, -5.00067138671875, -4.7327880859375, -4.46490478515625, -4.197021484375, -3.92913818359375, -3.6612548828125, -3.39337158203125, -3.12548828125, -2.85760498046875, -2.5897216796875, -2.32183837890625, -2.053955078125, -1.78607177734375, -1.5181884765625, -1.25030517578125, -0.982421875, -0.71453857421875, -0.4466552734375, -0.17877197265625, 0.089111328125, 0.35699462890625, 0.6248779296875, 0.89276123046875, 1.16064453125, 1.42852783203125, 1.6964111328125, 1.96429443359375, 2.232177734375, 2.50006103515625, 2.7679443359375, 3.03582763671875, 3.3037109375, 3.57159423828125, 3.8394775390625, 4.10736083984375, 4.375244140625, 4.64312744140625, 4.9110107421875, 5.17889404296875, 5.44677734375, 5.71466064453125, 5.9825439453125, 6.25042724609375, 6.518310546875, 6.78619384765625, 7.0540771484375, 7.32196044921875, 7.58984375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 11.0, 2.0, 2.0, 9.0, 11.0, 7.0, 12.0, 22.0, 30.0, 54.0, 58.0, 74.0, 108.0, 144.0, 199.0, 315.0, 424.0, 593.0, 866.0, 1339.0, 2117.0, 3457.0, 5796.0, 11233.0, 25894.0, 183710.0, 739638.0, 39274.0, 14551.0, 7086.0, 4091.0, 2462.0, 1636.0, 1008.0, 668.0, 522.0, 348.0, 214.0, 159.0, 94.0, 94.0, 72.0, 48.0, 31.0, 16.0, 18.0, 16.0, 2.0, 9.0, 10.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-17.765625, -17.135009765625, -16.50439453125, -15.873779296875, -15.2431640625, -14.612548828125, -13.98193359375, -13.351318359375, -12.720703125, -12.090087890625, -11.45947265625, -10.828857421875, -10.1982421875, -9.567626953125, -8.93701171875, -8.306396484375, -7.67578125, -7.045166015625, -6.41455078125, -5.783935546875, -5.1533203125, -4.522705078125, -3.89208984375, -3.261474609375, -2.630859375, -2.000244140625, -1.36962890625, -0.739013671875, -0.1083984375, 0.522216796875, 1.15283203125, 1.783447265625, 2.4140625, 3.044677734375, 3.67529296875, 4.305908203125, 4.9365234375, 5.567138671875, 6.19775390625, 6.828369140625, 7.458984375, 8.089599609375, 8.72021484375, 9.350830078125, 9.9814453125, 10.612060546875, 11.24267578125, 11.873291015625, 12.50390625, 13.134521484375, 13.76513671875, 14.395751953125, 15.0263671875, 15.656982421875, 16.28759765625, 16.918212890625, 17.548828125, 18.179443359375, 18.81005859375, 19.440673828125, 20.0712890625, 20.701904296875, 21.33251953125, 21.963134765625, 22.59375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 9.0, 4.0, 10.0, 12.0, 12.0, 18.0, 19.0, 12.0, 16.0, 24.0, 32.0, 24.0, 33.0, 41.0, 47.0, 52.0, 63.0, 102.0, 195.0, 1676.0, 104.0, 85.0, 56.0, 51.0, 51.0, 41.0, 35.0, 32.0, 24.0, 30.0, 26.0, 17.0, 16.0, 16.0, 15.0, 13.0, 5.0, 7.0, 4.0, 5.0, 1.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.671875, -26.785400390625, -25.89892578125, -25.012451171875, -24.1259765625, -23.239501953125, -22.35302734375, -21.466552734375, -20.580078125, -19.693603515625, -18.80712890625, -17.920654296875, -17.0341796875, -16.147705078125, -15.26123046875, -14.374755859375, -13.48828125, -12.601806640625, -11.71533203125, -10.828857421875, -9.9423828125, -9.055908203125, -8.16943359375, -7.282958984375, -6.396484375, -5.510009765625, -4.62353515625, -3.737060546875, -2.8505859375, -1.964111328125, -1.07763671875, -0.191162109375, 0.6953125, 1.581787109375, 2.46826171875, 3.354736328125, 4.2412109375, 5.127685546875, 6.01416015625, 6.900634765625, 7.787109375, 8.673583984375, 9.56005859375, 10.446533203125, 11.3330078125, 12.219482421875, 13.10595703125, 13.992431640625, 14.87890625, 15.765380859375, 16.65185546875, 17.538330078125, 18.4248046875, 19.311279296875, 20.19775390625, 21.084228515625, 21.970703125, 22.857177734375, 23.74365234375, 24.630126953125, 25.5166015625, 26.403076171875, 27.28955078125, 28.176025390625, 29.0625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 3.0, 6.0, 8.0, 8.0, 13.0, 16.0, 17.0, 26.0, 38.0, 42.0, 51.0, 55.0, 95.0, 130.0, 190.0, 445.0, 1245.0, 5268.0, 31459.0, 2813722.0, 271290.0, 16682.0, 3204.0, 841.0, 291.0, 159.0, 95.0, 77.0, 64.0, 35.0, 20.0, 16.0, 15.0, 11.0, 15.0, 13.0, 8.0, 9.0, 7.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.0, -56.23388671875, -54.4677734375, -52.70166015625, -50.935546875, -49.16943359375, -47.4033203125, -45.63720703125, -43.87109375, -42.10498046875, -40.3388671875, -38.57275390625, -36.806640625, -35.04052734375, -33.2744140625, -31.50830078125, -29.7421875, -27.97607421875, -26.2099609375, -24.44384765625, -22.677734375, -20.91162109375, -19.1455078125, -17.37939453125, -15.61328125, -13.84716796875, -12.0810546875, -10.31494140625, -8.548828125, -6.78271484375, -5.0166015625, -3.25048828125, -1.484375, 0.28173828125, 2.0478515625, 3.81396484375, 5.580078125, 7.34619140625, 9.1123046875, 10.87841796875, 12.64453125, 14.41064453125, 16.1767578125, 17.94287109375, 19.708984375, 21.47509765625, 23.2412109375, 25.00732421875, 26.7734375, 28.53955078125, 30.3056640625, 32.07177734375, 33.837890625, 35.60400390625, 37.3701171875, 39.13623046875, 40.90234375, 42.66845703125, 44.4345703125, 46.20068359375, 47.966796875, 49.73291015625, 51.4990234375, 53.26513671875, 55.03125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 10.0, 228.0, 721.0, 54.0, 3.0, 1.0, 1.0], "bins": [-819.880126953125, -806.0418090820312, -792.2034912109375, -778.3651733398438, -764.5269165039062, -750.6885986328125, -736.8502807617188, -723.011962890625, -709.1736450195312, -695.3353271484375, -681.4970092773438, -667.65869140625, -653.8204345703125, -639.9821166992188, -626.143798828125, -612.3054809570312, -598.4671630859375, -584.6288452148438, -570.79052734375, -556.9522094726562, -543.1139526367188, -529.275634765625, -515.4373168945312, -501.5989990234375, -487.7607116699219, -473.9223937988281, -460.0841064453125, -446.24578857421875, -432.407470703125, -418.56915283203125, -404.7308654785156, -390.8925476074219, -377.05419921875, -363.21588134765625, -349.3775939941406, -335.5392761230469, -321.7009582519531, -307.8626708984375, -294.02435302734375, -280.18603515625, -266.34771728515625, -252.50941467285156, -238.6710968017578, -224.83279418945312, -210.99447631835938, -197.1561737060547, -183.31787109375, -169.47955322265625, -155.64126586914062, -141.80296325683594, -127.96464538574219, -114.1263427734375, -100.28802490234375, -86.44972229003906, -72.61141204833984, -58.773101806640625, -44.934783935546875, -31.096473693847656, -17.25816535949707, -3.4198570251464844, 10.418453216552734, 24.256759643554688, 38.095069885253906, 51.933380126953125, 65.77169036865234]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 3.0, 7.0, 10.0, 8.0, 18.0, 27.0, 18.0, 16.0, 21.0, 32.0, 36.0, 41.0, 29.0, 28.0, 37.0, 37.0, 37.0, 33.0, 47.0, 53.0, 40.0, 33.0, 42.0, 36.0, 33.0, 35.0, 32.0, 24.0, 21.0, 26.0, 15.0, 23.0, 15.0, 11.0, 12.0, 10.0, 7.0, 5.0, 6.0, 11.0, 7.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-75.90670776367188, -73.55231475830078, -71.19792175292969, -68.84353637695312, -66.48914337158203, -64.13475036621094, -61.78036117553711, -59.42597198486328, -57.07157897949219, -54.717185974121094, -52.362796783447266, -50.00840759277344, -47.654014587402344, -45.29962158203125, -42.94523239135742, -40.590843200683594, -38.2364501953125, -35.882057189941406, -33.52766799926758, -31.173276901245117, -28.818885803222656, -26.464494705200195, -24.110103607177734, -21.755712509155273, -19.401321411132812, -17.04693031311035, -14.69253921508789, -12.33814811706543, -9.983757019042969, -7.629365921020508, -5.274974822998047, -2.920583724975586, -0.5661849975585938, 1.7882061004638672, 4.142597198486328, 6.496988296508789, 8.85137939453125, 11.205770492553711, 13.560161590576172, 15.914552688598633, 18.268943786621094, 20.623334884643555, 22.977725982666016, 25.332117080688477, 27.686508178710938, 30.0408992767334, 32.39529037475586, 34.74967956542969, 37.10407257080078, 39.458465576171875, 41.8128547668457, 44.16724395751953, 46.521636962890625, 48.87602996826172, 51.23041915893555, 53.584808349609375, 55.93920135498047, 58.29359436035156, 60.64798355102539, 63.00237274169922, 65.35676574707031, 67.7111587524414, 70.0655517578125, 72.41993713378906, 74.77433013916016]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 3.0, 7.0, 11.0, 11.0, 7.0, 15.0, 12.0, 23.0, 19.0, 21.0, 33.0, 28.0, 32.0, 43.0, 35.0, 39.0, 28.0, 55.0, 32.0, 48.0, 33.0, 60.0, 29.0, 41.0, 33.0, 33.0, 34.0, 38.0, 29.0, 24.0, 16.0, 21.0, 16.0, 14.0, 9.0, 10.0, 9.0, 12.0, 4.0, 8.0, 6.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0], "bins": [-9.75, -9.4827880859375, -9.215576171875, -8.9483642578125, -8.68115234375, -8.4139404296875, -8.146728515625, -7.8795166015625, -7.6123046875, -7.3450927734375, -7.077880859375, -6.8106689453125, -6.54345703125, -6.2762451171875, -6.009033203125, -5.7418212890625, -5.474609375, -5.2073974609375, -4.940185546875, -4.6729736328125, -4.40576171875, -4.1385498046875, -3.871337890625, -3.6041259765625, -3.3369140625, -3.0697021484375, -2.802490234375, -2.5352783203125, -2.26806640625, -2.0008544921875, -1.733642578125, -1.4664306640625, -1.19921875, -0.9320068359375, -0.664794921875, -0.3975830078125, -0.13037109375, 0.1368408203125, 0.404052734375, 0.6712646484375, 0.9384765625, 1.2056884765625, 1.472900390625, 1.7401123046875, 2.00732421875, 2.2745361328125, 2.541748046875, 2.8089599609375, 3.076171875, 3.3433837890625, 3.610595703125, 3.8778076171875, 4.14501953125, 4.4122314453125, 4.679443359375, 4.9466552734375, 5.2138671875, 5.4810791015625, 5.748291015625, 6.0155029296875, 6.28271484375, 6.5499267578125, 6.817138671875, 7.0843505859375, 7.3515625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 4.0, 11.0, 15.0, 15.0, 12.0, 22.0, 34.0, 57.0, 68.0, 96.0, 182.0, 251.0, 438.0, 821.0, 1523.0, 3208.0, 7767.0, 23776.0, 437568.0, 3552986.0, 137312.0, 16442.0, 6118.0, 2630.0, 1255.0, 663.0, 381.0, 211.0, 120.0, 91.0, 47.0, 38.0, 25.0, 12.0, 14.0, 18.0, 8.0, 9.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-41.65625, -40.510498046875, -39.36474609375, -38.218994140625, -37.0732421875, -35.927490234375, -34.78173828125, -33.635986328125, -32.490234375, -31.344482421875, -30.19873046875, -29.052978515625, -27.9072265625, -26.761474609375, -25.61572265625, -24.469970703125, -23.32421875, -22.178466796875, -21.03271484375, -19.886962890625, -18.7412109375, -17.595458984375, -16.44970703125, -15.303955078125, -14.158203125, -13.012451171875, -11.86669921875, -10.720947265625, -9.5751953125, -8.429443359375, -7.28369140625, -6.137939453125, -4.9921875, -3.846435546875, -2.70068359375, -1.554931640625, -0.4091796875, 0.736572265625, 1.88232421875, 3.028076171875, 4.173828125, 5.319580078125, 6.46533203125, 7.611083984375, 8.7568359375, 9.902587890625, 11.04833984375, 12.194091796875, 13.33984375, 14.485595703125, 15.63134765625, 16.777099609375, 17.9228515625, 19.068603515625, 20.21435546875, 21.360107421875, 22.505859375, 23.651611328125, 24.79736328125, 25.943115234375, 27.0888671875, 28.234619140625, 29.38037109375, 30.526123046875, 31.671875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 4.0, 15.0, 12.0, 15.0, 17.0, 17.0, 24.0, 38.0, 53.0, 71.0, 132.0, 229.0, 444.0, 746.0, 794.0, 574.0, 324.0, 178.0, 100.0, 70.0, 48.0, 29.0, 27.0, 19.0, 14.0, 18.0, 8.0, 2.0, 3.0, 8.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.015625, -24.2841796875, -23.552734375, -22.8212890625, -22.08984375, -21.3583984375, -20.626953125, -19.8955078125, -19.1640625, -18.4326171875, -17.701171875, -16.9697265625, -16.23828125, -15.5068359375, -14.775390625, -14.0439453125, -13.3125, -12.5810546875, -11.849609375, -11.1181640625, -10.38671875, -9.6552734375, -8.923828125, -8.1923828125, -7.4609375, -6.7294921875, -5.998046875, -5.2666015625, -4.53515625, -3.8037109375, -3.072265625, -2.3408203125, -1.609375, -0.8779296875, -0.146484375, 0.5849609375, 1.31640625, 2.0478515625, 2.779296875, 3.5107421875, 4.2421875, 4.9736328125, 5.705078125, 6.4365234375, 7.16796875, 7.8994140625, 8.630859375, 9.3623046875, 10.09375, 10.8251953125, 11.556640625, 12.2880859375, 13.01953125, 13.7509765625, 14.482421875, 15.2138671875, 15.9453125, 16.6767578125, 17.408203125, 18.1396484375, 18.87109375, 19.6025390625, 20.333984375, 21.0654296875, 21.796875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 1.0, 6.0, 3.0, 3.0, 9.0, 14.0, 23.0, 30.0, 48.0, 81.0, 208.0, 443.0, 1143.0, 3506.0, 12403.0, 68974.0, 3424518.0, 638717.0, 32670.0, 7762.0, 2304.0, 775.0, 284.0, 132.0, 75.0, 39.0, 17.0, 20.0, 15.0, 11.0, 6.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.0, -53.1552734375, -51.310546875, -49.4658203125, -47.62109375, -45.7763671875, -43.931640625, -42.0869140625, -40.2421875, -38.3974609375, -36.552734375, -34.7080078125, -32.86328125, -31.0185546875, -29.173828125, -27.3291015625, -25.484375, -23.6396484375, -21.794921875, -19.9501953125, -18.10546875, -16.2607421875, -14.416015625, -12.5712890625, -10.7265625, -8.8818359375, -7.037109375, -5.1923828125, -3.34765625, -1.5029296875, 0.341796875, 2.1865234375, 4.03125, 5.8759765625, 7.720703125, 9.5654296875, 11.41015625, 13.2548828125, 15.099609375, 16.9443359375, 18.7890625, 20.6337890625, 22.478515625, 24.3232421875, 26.16796875, 28.0126953125, 29.857421875, 31.7021484375, 33.546875, 35.3916015625, 37.236328125, 39.0810546875, 40.92578125, 42.7705078125, 44.615234375, 46.4599609375, 48.3046875, 50.1494140625, 51.994140625, 53.8388671875, 55.68359375, 57.5283203125, 59.373046875, 61.2177734375, 63.0625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 15.0, 40.0, 86.0, 210.0, 314.0, 184.0, 99.0, 24.0, 27.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-196.27145385742188, -189.37081909179688, -182.47018432617188, -175.56954956054688, -168.66891479492188, -161.76828002929688, -154.86764526367188, -147.96701049804688, -141.06637573242188, -134.16574096679688, -127.26510620117188, -120.36447143554688, -113.46383666992188, -106.56320190429688, -99.66256713867188, -92.76193237304688, -85.8613052368164, -78.9606704711914, -72.0600357055664, -65.1594009399414, -58.258766174316406, -51.35813522338867, -44.45750045776367, -37.55686569213867, -30.656230926513672, -23.755596160888672, -16.854961395263672, -9.954328536987305, -3.0536937713623047, 3.8469390869140625, 10.747573852539062, 17.648208618164062, 24.548843383789062, 31.449478149414062, 38.35011291503906, 45.25074768066406, 52.15138244628906, 59.0520133972168, 65.95265197753906, 72.85328674316406, 79.75392150878906, 86.65455627441406, 93.55519104003906, 100.45582580566406, 107.35646057128906, 114.25709533691406, 121.15773010253906, 128.05836486816406, 134.958984375, 141.859619140625, 148.76025390625, 155.660888671875, 162.5615234375, 169.462158203125, 176.36279296875, 183.263427734375, 190.1640625, 197.064697265625, 203.96533203125, 210.865966796875, 217.7666015625, 224.667236328125, 231.56787109375, 238.468505859375, 245.369140625]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 7.0, 11.0, 6.0, 10.0, 9.0, 7.0, 10.0, 17.0, 26.0, 30.0, 27.0, 28.0, 32.0, 30.0, 27.0, 36.0, 43.0, 42.0, 41.0, 38.0, 53.0, 38.0, 33.0, 44.0, 44.0, 43.0, 29.0, 22.0, 38.0, 25.0, 19.0, 15.0, 20.0, 23.0, 10.0, 13.0, 11.0, 14.0, 13.0, 3.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-74.88423156738281, -72.79228210449219, -70.70033264160156, -68.60838317871094, -66.51644134521484, -64.42449188232422, -62.332542419433594, -60.24059295654297, -58.148643493652344, -56.05669403076172, -53.96474838256836, -51.872798919677734, -49.78084945678711, -47.68890380859375, -45.596954345703125, -43.5050048828125, -41.41305923461914, -39.321109771728516, -37.229164123535156, -35.13721466064453, -33.045265197753906, -30.953317642211914, -28.861370086669922, -26.769420623779297, -24.677473068237305, -22.585525512695312, -20.493576049804688, -18.401628494262695, -16.309680938720703, -14.217731475830078, -12.125783920288086, -10.033835411071777, -7.941886901855469, -5.84993839263916, -3.7579903602600098, -1.6660423278808594, 0.4259061813354492, 2.517854690551758, 4.60980224609375, 6.701750755310059, 8.793699264526367, 10.885647773742676, 12.977596282958984, 15.069543838500977, 17.16149139404297, 19.253440856933594, 21.345388412475586, 23.437335968017578, 25.529285430908203, 27.621232986450195, 29.71318244934082, 31.805130004882812, 33.89707946777344, 35.98902893066406, 38.08097457885742, 40.17292404174805, 42.264869689941406, 44.35681915283203, 46.44876480102539, 48.540714263916016, 50.63266372680664, 52.724609375, 54.816558837890625, 56.90850830078125, 59.000457763671875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 13.0, 10.0, 10.0, 12.0, 13.0, 18.0, 15.0, 22.0, 23.0, 28.0, 30.0, 21.0, 37.0, 38.0, 50.0, 42.0, 52.0, 50.0, 41.0, 47.0, 46.0, 36.0, 41.0, 32.0, 39.0, 24.0, 42.0, 15.0, 18.0, 23.0, 21.0, 10.0, 11.0, 8.0, 10.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0], "bins": [-10.09375, -9.81988525390625, -9.5460205078125, -9.27215576171875, -8.998291015625, -8.72442626953125, -8.4505615234375, -8.17669677734375, -7.90283203125, -7.62896728515625, -7.3551025390625, -7.08123779296875, -6.807373046875, -6.53350830078125, -6.2596435546875, -5.98577880859375, -5.7119140625, -5.43804931640625, -5.1641845703125, -4.89031982421875, -4.616455078125, -4.34259033203125, -4.0687255859375, -3.79486083984375, -3.52099609375, -3.24713134765625, -2.9732666015625, -2.69940185546875, -2.425537109375, -2.15167236328125, -1.8778076171875, -1.60394287109375, -1.330078125, -1.05621337890625, -0.7823486328125, -0.50848388671875, -0.234619140625, 0.03924560546875, 0.3131103515625, 0.58697509765625, 0.86083984375, 1.13470458984375, 1.4085693359375, 1.68243408203125, 1.956298828125, 2.23016357421875, 2.5040283203125, 2.77789306640625, 3.0517578125, 3.32562255859375, 3.5994873046875, 3.87335205078125, 4.147216796875, 4.42108154296875, 4.6949462890625, 4.96881103515625, 5.24267578125, 5.51654052734375, 5.7904052734375, 6.06427001953125, 6.338134765625, 6.61199951171875, 6.8858642578125, 7.15972900390625, 7.43359375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 1.0, 1.0, 7.0, 20.0, 17.0, 34.0, 47.0, 69.0, 93.0, 124.0, 181.0, 264.0, 393.0, 505.0, 738.0, 1009.0, 1464.0, 2066.0, 3055.0, 4376.0, 6269.0, 8951.0, 13424.0, 19406.0, 28473.0, 42531.0, 64072.0, 97826.0, 151342.0, 200244.0, 134636.0, 88194.0, 58135.0, 38539.0, 25528.0, 17286.0, 12057.0, 8230.0, 5719.0, 3911.0, 2701.0, 1952.0, 1444.0, 928.0, 693.0, 463.0, 328.0, 237.0, 154.0, 119.0, 88.0, 67.0, 40.0, 46.0, 28.0, 8.0, 13.0, 7.0, 2.0, 8.0, 3.0], "bins": [-0.1748046875, -0.1694049835205078, -0.16400527954101562, -0.15860557556152344, -0.15320587158203125, -0.14780616760253906, -0.14240646362304688, -0.1370067596435547, -0.1316070556640625, -0.1262073516845703, -0.12080764770507812, -0.11540794372558594, -0.11000823974609375, -0.10460853576660156, -0.09920883178710938, -0.09380912780761719, -0.088409423828125, -0.08300971984863281, -0.07761001586914062, -0.07221031188964844, -0.06681060791015625, -0.06141090393066406, -0.056011199951171875, -0.05061149597167969, -0.0452117919921875, -0.03981208801269531, -0.034412384033203125, -0.029012680053710938, -0.02361297607421875, -0.018213272094726562, -0.012813568115234375, -0.0074138641357421875, -0.00201416015625, 0.0033855438232421875, 0.008785247802734375, 0.014184951782226562, 0.01958465576171875, 0.024984359741210938, 0.030384063720703125, 0.03578376770019531, 0.0411834716796875, 0.04658317565917969, 0.051982879638671875, 0.05738258361816406, 0.06278228759765625, 0.06818199157714844, 0.07358169555664062, 0.07898139953613281, 0.084381103515625, 0.08978080749511719, 0.09518051147460938, 0.10058021545410156, 0.10597991943359375, 0.11137962341308594, 0.11677932739257812, 0.12217903137207031, 0.1275787353515625, 0.1329784393310547, 0.13837814331054688, 0.14377784729003906, 0.14917755126953125, 0.15457725524902344, 0.15997695922851562, 0.1653766632080078, 0.1707763671875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 5.0, 3.0, 7.0, 4.0, 10.0, 15.0, 13.0, 17.0, 18.0, 25.0, 32.0, 25.0, 28.0, 31.0, 41.0, 42.0, 35.0, 51.0, 48.0, 1069.0, 42.0, 55.0, 38.0, 43.0, 39.0, 49.0, 35.0, 31.0, 31.0, 30.0, 13.0, 19.0, 22.0, 15.0, 12.0, 7.0, 11.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.078125, -5.85986328125, -5.6416015625, -5.42333984375, -5.205078125, -4.98681640625, -4.7685546875, -4.55029296875, -4.33203125, -4.11376953125, -3.8955078125, -3.67724609375, -3.458984375, -3.24072265625, -3.0224609375, -2.80419921875, -2.5859375, -2.36767578125, -2.1494140625, -1.93115234375, -1.712890625, -1.49462890625, -1.2763671875, -1.05810546875, -0.83984375, -0.62158203125, -0.4033203125, -0.18505859375, 0.033203125, 0.25146484375, 0.4697265625, 0.68798828125, 0.90625, 1.12451171875, 1.3427734375, 1.56103515625, 1.779296875, 1.99755859375, 2.2158203125, 2.43408203125, 2.65234375, 2.87060546875, 3.0888671875, 3.30712890625, 3.525390625, 3.74365234375, 3.9619140625, 4.18017578125, 4.3984375, 4.61669921875, 4.8349609375, 5.05322265625, 5.271484375, 5.48974609375, 5.7080078125, 5.92626953125, 6.14453125, 6.36279296875, 6.5810546875, 6.79931640625, 7.017578125, 7.23583984375, 7.4541015625, 7.67236328125, 7.890625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 17.0, 7.0, 20.0, 31.0, 38.0, 83.0, 112.0, 166.0, 242.0, 401.0, 580.0, 948.0, 1546.0, 2628.0, 4222.0, 6810.0, 11519.0, 18829.0, 31381.0, 52477.0, 87954.0, 150086.0, 1282605.0, 181280.0, 105781.0, 62148.0, 37637.0, 22703.0, 13740.0, 8270.0, 4869.0, 3094.0, 1859.0, 1127.0, 695.0, 425.0, 293.0, 170.0, 121.0, 74.0, 51.0, 35.0, 19.0, 16.0, 10.0, 10.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1103515625, -0.10686779022216797, -0.10338401794433594, -0.0999002456665039, -0.09641647338867188, -0.09293270111083984, -0.08944892883300781, -0.08596515655517578, -0.08248138427734375, -0.07899761199951172, -0.07551383972167969, -0.07203006744384766, -0.06854629516601562, -0.0650625228881836, -0.06157875061035156, -0.05809497833251953, -0.0546112060546875, -0.05112743377685547, -0.04764366149902344, -0.044159889221191406, -0.040676116943359375, -0.037192344665527344, -0.03370857238769531, -0.03022480010986328, -0.02674102783203125, -0.02325725555419922, -0.019773483276367188, -0.016289710998535156, -0.012805938720703125, -0.009322166442871094, -0.0058383941650390625, -0.0023546218872070312, 0.001129150390625, 0.004612922668457031, 0.008096694946289062, 0.011580467224121094, 0.015064239501953125, 0.018548011779785156, 0.022031784057617188, 0.02551555633544922, 0.02899932861328125, 0.03248310089111328, 0.03596687316894531, 0.039450645446777344, 0.042934417724609375, 0.046418190002441406, 0.04990196228027344, 0.05338573455810547, 0.0568695068359375, 0.06035327911376953, 0.06383705139160156, 0.0673208236694336, 0.07080459594726562, 0.07428836822509766, 0.07777214050292969, 0.08125591278076172, 0.08473968505859375, 0.08822345733642578, 0.09170722961425781, 0.09519100189208984, 0.09867477416992188, 0.1021585464477539, 0.10564231872558594, 0.10912609100341797, 0.11260986328125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 10.0, 5.0, 6.0, 20.0, 16.0, 32.0, 24.0, 32.0, 34.0, 32.0, 45.0, 49.0, 51.0, 46.0, 50.0, 59.0, 53.0, 47.0, 56.0, 40.0, 30.0, 42.0, 29.0, 31.0, 16.0, 26.0, 16.0, 17.0, 17.0, 9.0, 12.0, 4.0, 7.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0008707046508789062, -0.000844612717628479, -0.0008185207843780518, -0.0007924288511276245, -0.0007663369178771973, -0.00074024498462677, -0.0007141530513763428, -0.0006880611181259155, -0.0006619691848754883, -0.000635877251625061, -0.0006097853183746338, -0.0005836933851242065, -0.0005576014518737793, -0.000531509518623352, -0.0005054175853729248, -0.00047932565212249756, -0.0004532337188720703, -0.00042714178562164307, -0.0004010498523712158, -0.0003749579191207886, -0.00034886598587036133, -0.0003227740526199341, -0.00029668211936950684, -0.0002705901861190796, -0.00024449825286865234, -0.0002184063196182251, -0.00019231438636779785, -0.0001662224531173706, -0.00014013051986694336, -0.00011403858661651611, -8.794665336608887e-05, -6.185472011566162e-05, -3.5762786865234375e-05, -9.670853614807129e-06, 1.6421079635620117e-05, 4.251301288604736e-05, 6.860494613647461e-05, 9.469687938690186e-05, 0.0001207888126373291, 0.00014688074588775635, 0.0001729726791381836, 0.00019906461238861084, 0.00022515654563903809, 0.00025124847888946533, 0.0002773404121398926, 0.0003034323453903198, 0.00032952427864074707, 0.0003556162118911743, 0.00038170814514160156, 0.0004078000783920288, 0.00043389201164245605, 0.0004599839448928833, 0.00048607587814331055, 0.0005121678113937378, 0.000538259744644165, 0.0005643516778945923, 0.0005904436111450195, 0.0006165355443954468, 0.000642627477645874, 0.0006687194108963013, 0.0006948113441467285, 0.0007209032773971558, 0.000746995210647583, 0.0007730871438980103, 0.0007991790771484375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 5.0, 11.0, 13.0, 19.0, 24.0, 16.0, 39.0, 31.0, 45.0, 72.0, 88.0, 135.0, 273.0, 415.0, 882.0, 7228.0, 985463.0, 50863.0, 1447.0, 498.0, 285.0, 204.0, 133.0, 95.0, 56.0, 51.0, 44.0, 26.0, 17.0, 10.0, 10.0, 9.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.01458740234375, -0.014112234115600586, -0.013637065887451172, -0.013161897659301758, -0.012686729431152344, -0.01221156120300293, -0.011736392974853516, -0.011261224746704102, -0.010786056518554688, -0.010310888290405273, -0.00983572006225586, -0.009360551834106445, -0.008885383605957031, -0.008410215377807617, -0.007935047149658203, -0.007459878921508789, -0.006984710693359375, -0.006509542465209961, -0.006034374237060547, -0.005559206008911133, -0.005084037780761719, -0.004608869552612305, -0.004133701324462891, -0.0036585330963134766, -0.0031833648681640625, -0.0027081966400146484, -0.0022330284118652344, -0.0017578601837158203, -0.0012826919555664062, -0.0008075237274169922, -0.0003323554992675781, 0.00014281272888183594, 0.00061798095703125, 0.001093149185180664, 0.0015683174133300781, 0.002043485641479492, 0.0025186538696289062, 0.0029938220977783203, 0.0034689903259277344, 0.0039441585540771484, 0.0044193267822265625, 0.0048944950103759766, 0.005369663238525391, 0.005844831466674805, 0.006319999694824219, 0.006795167922973633, 0.007270336151123047, 0.007745504379272461, 0.008220672607421875, 0.008695840835571289, 0.009171009063720703, 0.009646177291870117, 0.010121345520019531, 0.010596513748168945, 0.01107168197631836, 0.011546850204467773, 0.012022018432617188, 0.012497186660766602, 0.012972354888916016, 0.01344752311706543, 0.013922691345214844, 0.014397859573364258, 0.014873027801513672, 0.015348196029663086, 0.0158233642578125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 105.0, 876.0, 28.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.017937416210770607, -0.017613166943192482, -0.017288919538259506, -0.01696467027068138, -0.016640421003103256, -0.01631617359817028, -0.015991924330592155, -0.01566767506301403, -0.01534342672675848, -0.01501917839050293, -0.014694929122924805, -0.014370680786669254, -0.014046432450413704, -0.013722183182835579, -0.013397934846580029, -0.013073686510324478, -0.012749437242746353, -0.012425188906490803, -0.012100939638912678, -0.011776691302657127, -0.011452442035079002, -0.011128193698823452, -0.010803945362567902, -0.010479696094989777, -0.010155447758734226, -0.009831199422478676, -0.00950695015490055, -0.009182701818645, -0.00885845348238945, -0.008534204214811325, -0.008209955878555775, -0.007885707542300224, -0.007561459206044674, -0.007237210404127836, -0.0069129616022109985, -0.006588713265955448, -0.0062644644640386105, -0.005940215662121773, -0.005615967325866222, -0.005291718523949385, -0.004967469722032547, -0.004643220920115709, -0.004318972118198872, -0.003994723781943321, -0.0036704749800264835, -0.003346226178109646, -0.003021977609023452, -0.0026977290399372578, -0.0023734800051897764, -0.0020492314361035824, -0.0017249826341867447, -0.0014007339486852288, -0.001076485263183713, -0.0007522365776821971, -0.00042798789218068123, -0.00010373932309448719, 0.0002205094788223505, 0.0005447581643238664, 0.0008690068498253822, 0.001193255535326898, 0.001517504220828414, 0.0018417529063299298, 0.0021660015918314457, 0.0024902501609176397, 0.0028144989628344774]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 14.0, 16.0, 16.0, 29.0, 17.0, 28.0, 31.0, 42.0, 40.0, 52.0, 39.0, 45.0, 40.0, 58.0, 48.0, 45.0, 48.0, 54.0, 63.0, 46.0, 46.0, 34.0, 22.0, 21.0, 20.0, 12.0, 13.0, 11.0, 14.0, 9.0, 6.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00109100341796875, -0.0010572606697678566, -0.0010235179215669632, -0.0009897751733660698, -0.0009560324251651764, -0.000922289676964283, -0.0008885469287633896, -0.0008548041805624962, -0.0008210614323616028, -0.0007873186841607094, -0.000753575935959816, -0.0007198331877589226, -0.0006860904395580292, -0.0006523476913571358, -0.0006186049431562424, -0.000584862194955349, -0.0005511194467544556, -0.0005173766985535622, -0.00048363395035266876, -0.00044989120215177536, -0.00041614845395088196, -0.00038240570574998856, -0.00034866295754909515, -0.00031492020934820175, -0.00028117746114730835, -0.00024743471294641495, -0.00021369196474552155, -0.00017994921654462814, -0.00014620646834373474, -0.00011246372014284134, -7.872097194194794e-05, -4.4978223741054535e-05, -1.1235475540161133e-05, 2.250727266073227e-05, 5.625002086162567e-05, 8.999276906251907e-05, 0.00012373551726341248, 0.00015747826546430588, 0.00019122101366519928, 0.00022496376186609268, 0.0002587065100669861, 0.0002924492582678795, 0.0003261920064687729, 0.0003599347546696663, 0.0003936775028705597, 0.0004274202510714531, 0.0004611629992723465, 0.0004949057474732399, 0.0005286484956741333, 0.0005623912438750267, 0.0005961339920759201, 0.0006298767402768135, 0.0006636194884777069, 0.0006973622366786003, 0.0007311049848794937, 0.0007648477330803871, 0.0007985904812812805, 0.0008323332294821739, 0.0008660759776830673, 0.0008998187258839607, 0.0009335614740848541, 0.0009673042222857475, 0.001001046970486641, 0.0010347897186875343, 0.0010685324668884277]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 13.0, 10.0, 10.0, 12.0, 13.0, 18.0, 15.0, 22.0, 23.0, 28.0, 30.0, 21.0, 37.0, 38.0, 50.0, 42.0, 52.0, 50.0, 41.0, 47.0, 46.0, 36.0, 41.0, 32.0, 39.0, 24.0, 42.0, 15.0, 18.0, 23.0, 21.0, 10.0, 11.0, 8.0, 10.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0], "bins": [-10.09375, -9.81988525390625, -9.5460205078125, -9.27215576171875, -8.998291015625, -8.72442626953125, -8.4505615234375, -8.17669677734375, -7.90283203125, -7.62896728515625, -7.3551025390625, -7.08123779296875, -6.807373046875, -6.53350830078125, -6.2596435546875, -5.98577880859375, -5.7119140625, -5.43804931640625, -5.1641845703125, -4.89031982421875, -4.616455078125, -4.34259033203125, -4.0687255859375, -3.79486083984375, -3.52099609375, -3.24713134765625, -2.9732666015625, -2.69940185546875, -2.425537109375, -2.15167236328125, -1.8778076171875, -1.60394287109375, -1.330078125, -1.05621337890625, -0.7823486328125, -0.50848388671875, -0.234619140625, 0.03924560546875, 0.3131103515625, 0.58697509765625, 0.86083984375, 1.13470458984375, 1.4085693359375, 1.68243408203125, 1.956298828125, 2.23016357421875, 2.5040283203125, 2.77789306640625, 3.0517578125, 3.32562255859375, 3.5994873046875, 3.87335205078125, 4.147216796875, 4.42108154296875, 4.6949462890625, 4.96881103515625, 5.24267578125, 5.51654052734375, 5.7904052734375, 6.06427001953125, 6.338134765625, 6.61199951171875, 6.8858642578125, 7.15972900390625, 7.43359375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 2.0, 3.0, 6.0, 17.0, 12.0, 29.0, 30.0, 39.0, 49.0, 79.0, 101.0, 141.0, 187.0, 277.0, 410.0, 602.0, 999.0, 1652.0, 2833.0, 5441.0, 12591.0, 40454.0, 603973.0, 321894.0, 33530.0, 11141.0, 5022.0, 2613.0, 1537.0, 946.0, 615.0, 412.0, 297.0, 171.0, 132.0, 81.0, 72.0, 41.0, 28.0, 24.0, 13.0, 13.0, 15.0, 8.0, 3.0, 9.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.203125, -23.36669921875, -22.5302734375, -21.69384765625, -20.857421875, -20.02099609375, -19.1845703125, -18.34814453125, -17.51171875, -16.67529296875, -15.8388671875, -15.00244140625, -14.166015625, -13.32958984375, -12.4931640625, -11.65673828125, -10.8203125, -9.98388671875, -9.1474609375, -8.31103515625, -7.474609375, -6.63818359375, -5.8017578125, -4.96533203125, -4.12890625, -3.29248046875, -2.4560546875, -1.61962890625, -0.783203125, 0.05322265625, 0.8896484375, 1.72607421875, 2.5625, 3.39892578125, 4.2353515625, 5.07177734375, 5.908203125, 6.74462890625, 7.5810546875, 8.41748046875, 9.25390625, 10.09033203125, 10.9267578125, 11.76318359375, 12.599609375, 13.43603515625, 14.2724609375, 15.10888671875, 15.9453125, 16.78173828125, 17.6181640625, 18.45458984375, 19.291015625, 20.12744140625, 20.9638671875, 21.80029296875, 22.63671875, 23.47314453125, 24.3095703125, 25.14599609375, 25.982421875, 26.81884765625, 27.6552734375, 28.49169921875, 29.328125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 8.0, 3.0, 5.0, 7.0, 8.0, 5.0, 11.0, 10.0, 19.0, 27.0, 19.0, 36.0, 29.0, 36.0, 34.0, 45.0, 45.0, 51.0, 98.0, 171.0, 1685.0, 175.0, 88.0, 64.0, 34.0, 47.0, 36.0, 38.0, 40.0, 31.0, 29.0, 16.0, 19.0, 24.0, 9.0, 16.0, 8.0, 6.0, 4.0, 5.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.09375, -33.07666015625, -32.0595703125, -31.04248046875, -30.025390625, -29.00830078125, -27.9912109375, -26.97412109375, -25.95703125, -24.93994140625, -23.9228515625, -22.90576171875, -21.888671875, -20.87158203125, -19.8544921875, -18.83740234375, -17.8203125, -16.80322265625, -15.7861328125, -14.76904296875, -13.751953125, -12.73486328125, -11.7177734375, -10.70068359375, -9.68359375, -8.66650390625, -7.6494140625, -6.63232421875, -5.615234375, -4.59814453125, -3.5810546875, -2.56396484375, -1.546875, -0.52978515625, 0.4873046875, 1.50439453125, 2.521484375, 3.53857421875, 4.5556640625, 5.57275390625, 6.58984375, 7.60693359375, 8.6240234375, 9.64111328125, 10.658203125, 11.67529296875, 12.6923828125, 13.70947265625, 14.7265625, 15.74365234375, 16.7607421875, 17.77783203125, 18.794921875, 19.81201171875, 20.8291015625, 21.84619140625, 22.86328125, 23.88037109375, 24.8974609375, 25.91455078125, 26.931640625, 27.94873046875, 28.9658203125, 29.98291015625, 31.0]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 6.0, 5.0, 3.0, 6.0, 6.0, 3.0, 12.0, 6.0, 17.0, 14.0, 31.0, 37.0, 30.0, 39.0, 104.0, 133.0, 281.0, 532.0, 1206.0, 3287.0, 11054.0, 77604.0, 2945764.0, 87569.0, 11888.0, 3543.0, 1342.0, 528.0, 235.0, 117.0, 81.0, 54.0, 37.0, 33.0, 25.0, 11.0, 17.0, 11.0, 10.0, 8.0, 7.0, 7.0, 3.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-50.4375, -48.6689453125, -46.900390625, -45.1318359375, -43.36328125, -41.5947265625, -39.826171875, -38.0576171875, -36.2890625, -34.5205078125, -32.751953125, -30.9833984375, -29.21484375, -27.4462890625, -25.677734375, -23.9091796875, -22.140625, -20.3720703125, -18.603515625, -16.8349609375, -15.06640625, -13.2978515625, -11.529296875, -9.7607421875, -7.9921875, -6.2236328125, -4.455078125, -2.6865234375, -0.91796875, 0.8505859375, 2.619140625, 4.3876953125, 6.15625, 7.9248046875, 9.693359375, 11.4619140625, 13.23046875, 14.9990234375, 16.767578125, 18.5361328125, 20.3046875, 22.0732421875, 23.841796875, 25.6103515625, 27.37890625, 29.1474609375, 30.916015625, 32.6845703125, 34.453125, 36.2216796875, 37.990234375, 39.7587890625, 41.52734375, 43.2958984375, 45.064453125, 46.8330078125, 48.6015625, 50.3701171875, 52.138671875, 53.9072265625, 55.67578125, 57.4443359375, 59.212890625, 60.9814453125, 62.75]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 41.0, 905.0, 74.0, 0.0, 1.0], "bins": [-1604.9996337890625, -1578.48681640625, -1551.973876953125, -1525.4610595703125, -1498.9482421875, -1472.435302734375, -1445.9224853515625, -1419.40966796875, -1392.896728515625, -1366.3839111328125, -1339.8709716796875, -1313.358154296875, -1286.8453369140625, -1260.3323974609375, -1233.819580078125, -1207.3067626953125, -1180.7939453125, -1154.2811279296875, -1127.7681884765625, -1101.25537109375, -1074.7425537109375, -1048.2296142578125, -1021.716796875, -995.2039794921875, -968.6910400390625, -942.1781616210938, -915.6653442382812, -889.1524658203125, -862.6395874023438, -836.1267700195312, -809.6138916015625, -783.10107421875, -756.5881958007812, -730.0753173828125, -703.5625, -677.0496215820312, -650.5367431640625, -624.02392578125, -597.5110473632812, -570.9981689453125, -544.4853515625, -517.9724731445312, -491.4596252441406, -464.94677734375, -438.4339294433594, -411.92108154296875, -385.408203125, -358.8953552246094, -332.3824768066406, -305.86962890625, -279.35675048828125, -252.84390258789062, -226.3310546875, -199.8181915283203, -173.30532836914062, -146.79248046875, -120.27960968017578, -93.76675415039062, -67.25389099121094, -40.74103546142578, -14.228179931640625, 12.284675598144531, 38.79753875732422, 65.31038665771484, 91.82324981689453]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 4.0, 6.0, 5.0, 4.0, 12.0, 13.0, 13.0, 26.0, 14.0, 19.0, 21.0, 27.0, 23.0, 37.0, 28.0, 40.0, 42.0, 29.0, 41.0, 22.0, 38.0, 32.0, 43.0, 49.0, 45.0, 31.0, 37.0, 34.0, 26.0, 23.0, 31.0, 29.0, 23.0, 20.0, 16.0, 14.0, 16.0, 15.0, 8.0, 8.0, 6.0, 5.0, 9.0, 8.0, 1.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.74593353271484, -77.18772888183594, -74.62952423095703, -72.07131958007812, -69.51311492919922, -66.95491027832031, -64.3967056274414, -61.8385009765625, -59.280296325683594, -56.72209167480469, -54.16388702392578, -51.605682373046875, -49.04747772216797, -46.48927307128906, -43.931068420410156, -41.37286376953125, -38.814659118652344, -36.25645446777344, -33.69824981689453, -31.140045166015625, -28.58184051513672, -26.023635864257812, -23.465431213378906, -20.9072265625, -18.349021911621094, -15.790817260742188, -13.232612609863281, -10.674407958984375, -8.116203308105469, -5.5579986572265625, -2.9997940063476562, -0.44158935546875, 2.116607666015625, 4.674812316894531, 7.2330169677734375, 9.791221618652344, 12.34942626953125, 14.907630920410156, 17.465835571289062, 20.02404022216797, 22.582244873046875, 25.14044952392578, 27.698654174804688, 30.256858825683594, 32.8150634765625, 35.373268127441406, 37.93147277832031, 40.48967742919922, 43.047882080078125, 45.60608673095703, 48.16429138183594, 50.722496032714844, 53.28070068359375, 55.838905334472656, 58.39710998535156, 60.95531463623047, 63.513519287109375, 66.07172393798828, 68.62992858886719, 71.1881332397461, 73.746337890625, 76.3045425415039, 78.86274719238281, 81.42095184326172, 83.97915649414062]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 4.0, 6.0, 10.0, 9.0, 9.0, 8.0, 13.0, 13.0, 17.0, 21.0, 17.0, 19.0, 39.0, 29.0, 35.0, 23.0, 49.0, 43.0, 52.0, 40.0, 33.0, 50.0, 46.0, 40.0, 48.0, 43.0, 36.0, 33.0, 27.0, 30.0, 21.0, 16.0, 24.0, 18.0, 10.0, 11.0, 11.0, 11.0, 3.0, 11.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0], "bins": [-11.0859375, -10.7911376953125, -10.496337890625, -10.2015380859375, -9.90673828125, -9.6119384765625, -9.317138671875, -9.0223388671875, -8.7275390625, -8.4327392578125, -8.137939453125, -7.8431396484375, -7.54833984375, -7.2535400390625, -6.958740234375, -6.6639404296875, -6.369140625, -6.0743408203125, -5.779541015625, -5.4847412109375, -5.18994140625, -4.8951416015625, -4.600341796875, -4.3055419921875, -4.0107421875, -3.7159423828125, -3.421142578125, -3.1263427734375, -2.83154296875, -2.5367431640625, -2.241943359375, -1.9471435546875, -1.65234375, -1.3575439453125, -1.062744140625, -0.7679443359375, -0.47314453125, -0.1783447265625, 0.116455078125, 0.4112548828125, 0.7060546875, 1.0008544921875, 1.295654296875, 1.5904541015625, 1.88525390625, 2.1800537109375, 2.474853515625, 2.7696533203125, 3.064453125, 3.3592529296875, 3.654052734375, 3.9488525390625, 4.24365234375, 4.5384521484375, 4.833251953125, 5.1280517578125, 5.4228515625, 5.7176513671875, 6.012451171875, 6.3072509765625, 6.60205078125, 6.8968505859375, 7.191650390625, 7.4864501953125, 7.78125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 13.0, 10.0, 14.0, 12.0, 25.0, 33.0, 32.0, 57.0, 64.0, 73.0, 134.0, 181.0, 224.0, 320.0, 443.0, 570.0, 811.0, 1209.0, 1734.0, 2636.0, 4021.0, 6601.0, 11650.0, 23663.0, 105516.0, 713560.0, 2444780.0, 706215.0, 110818.0, 27797.0, 11982.0, 6706.0, 4052.0, 2649.0, 1754.0, 1129.0, 821.0, 567.0, 398.0, 285.0, 234.0, 138.0, 94.0, 78.0, 60.0, 35.0, 28.0, 27.0, 9.0, 8.0, 6.0, 3.0, 1.0, 1.0], "bins": [-19.03125, -18.5098876953125, -17.988525390625, -17.4671630859375, -16.94580078125, -16.4244384765625, -15.903076171875, -15.3817138671875, -14.8603515625, -14.3389892578125, -13.817626953125, -13.2962646484375, -12.77490234375, -12.2535400390625, -11.732177734375, -11.2108154296875, -10.689453125, -10.1680908203125, -9.646728515625, -9.1253662109375, -8.60400390625, -8.0826416015625, -7.561279296875, -7.0399169921875, -6.5185546875, -5.9971923828125, -5.475830078125, -4.9544677734375, -4.43310546875, -3.9117431640625, -3.390380859375, -2.8690185546875, -2.34765625, -1.8262939453125, -1.304931640625, -0.7835693359375, -0.26220703125, 0.2591552734375, 0.780517578125, 1.3018798828125, 1.8232421875, 2.3446044921875, 2.865966796875, 3.3873291015625, 3.90869140625, 4.4300537109375, 4.951416015625, 5.4727783203125, 5.994140625, 6.5155029296875, 7.036865234375, 7.5582275390625, 8.07958984375, 8.6009521484375, 9.122314453125, 9.6436767578125, 10.1650390625, 10.6864013671875, 11.207763671875, 11.7291259765625, 12.25048828125, 12.7718505859375, 13.293212890625, 13.8145751953125, 14.3359375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 10.0, 6.0, 8.0, 9.0, 10.0, 17.0, 20.0, 34.0, 45.0, 45.0, 83.0, 159.0, 280.0, 540.0, 933.0, 876.0, 426.0, 205.0, 122.0, 71.0, 46.0, 33.0, 12.0, 14.0, 23.0, 13.0, 6.0, 5.0, 6.0, 7.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.1875, -29.267578125, -28.34765625, -27.427734375, -26.5078125, -25.587890625, -24.66796875, -23.748046875, -22.828125, -21.908203125, -20.98828125, -20.068359375, -19.1484375, -18.228515625, -17.30859375, -16.388671875, -15.46875, -14.548828125, -13.62890625, -12.708984375, -11.7890625, -10.869140625, -9.94921875, -9.029296875, -8.109375, -7.189453125, -6.26953125, -5.349609375, -4.4296875, -3.509765625, -2.58984375, -1.669921875, -0.75, 0.169921875, 1.08984375, 2.009765625, 2.9296875, 3.849609375, 4.76953125, 5.689453125, 6.609375, 7.529296875, 8.44921875, 9.369140625, 10.2890625, 11.208984375, 12.12890625, 13.048828125, 13.96875, 14.888671875, 15.80859375, 16.728515625, 17.6484375, 18.568359375, 19.48828125, 20.408203125, 21.328125, 22.248046875, 23.16796875, 24.087890625, 25.0078125, 25.927734375, 26.84765625, 27.767578125, 28.6875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 9.0, 10.0, 12.0, 19.0, 51.0, 47.0, 87.0, 137.0, 303.0, 674.0, 1636.0, 4902.0, 18757.0, 129255.0, 3709487.0, 290481.0, 27887.0, 6676.0, 2196.0, 792.0, 374.0, 195.0, 106.0, 70.0, 34.0, 25.0, 19.0, 10.0, 9.0, 11.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.34375, -53.59375, -51.84375, -50.09375, -48.34375, -46.59375, -44.84375, -43.09375, -41.34375, -39.59375, -37.84375, -36.09375, -34.34375, -32.59375, -30.84375, -29.09375, -27.34375, -25.59375, -23.84375, -22.09375, -20.34375, -18.59375, -16.84375, -15.09375, -13.34375, -11.59375, -9.84375, -8.09375, -6.34375, -4.59375, -2.84375, -1.09375, 0.65625, 2.40625, 4.15625, 5.90625, 7.65625, 9.40625, 11.15625, 12.90625, 14.65625, 16.40625, 18.15625, 19.90625, 21.65625, 23.40625, 25.15625, 26.90625, 28.65625, 30.40625, 32.15625, 33.90625, 35.65625, 37.40625, 39.15625, 40.90625, 42.65625, 44.40625, 46.15625, 47.90625, 49.65625, 51.40625, 53.15625, 54.90625, 56.65625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 15.0, 27.0, 76.0, 109.0, 251.0, 253.0, 145.0, 53.0, 36.0, 20.0, 9.0, 8.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.91897583007812, -145.04087829589844, -138.16278076171875, -131.28468322753906, -124.40658569335938, -117.52848815917969, -110.650390625, -103.77229309082031, -96.89419555664062, -90.01609802246094, -83.13800048828125, -76.25990295410156, -69.38180541992188, -62.50370407104492, -55.625606536865234, -48.74750900268555, -41.869407653808594, -34.991310119628906, -28.11321258544922, -21.2351131439209, -14.357015609741211, -7.478916168212891, -0.6008186340332031, 6.277278900146484, 13.155376434326172, 20.03347396850586, 26.911571502685547, 33.7896728515625, 40.66777038574219, 47.545867919921875, 54.42396545410156, 61.30206298828125, 68.18016052246094, 75.05825805664062, 81.93635559082031, 88.814453125, 95.69255065917969, 102.57064819335938, 109.44874572753906, 116.32684326171875, 123.20494079589844, 130.08303833007812, 136.9611358642578, 143.8392333984375, 150.7173309326172, 157.59542846679688, 164.47352600097656, 171.35162353515625, 178.229736328125, 185.1078338623047, 191.98593139648438, 198.86402893066406, 205.74212646484375, 212.62022399902344, 219.49832153320312, 226.3764190673828, 233.2545166015625, 240.1326141357422, 247.01071166992188, 253.88880920410156, 260.76690673828125, 267.64501953125, 274.5231018066406, 281.4012145996094, 288.279296875]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 5.0, 12.0, 9.0, 10.0, 10.0, 20.0, 25.0, 9.0, 16.0, 26.0, 19.0, 25.0, 32.0, 40.0, 28.0, 41.0, 42.0, 36.0, 45.0, 40.0, 40.0, 36.0, 34.0, 39.0, 42.0, 33.0, 29.0, 27.0, 36.0, 20.0, 27.0, 23.0, 18.0, 18.0, 14.0, 8.0, 13.0, 11.0, 9.0, 8.0, 4.0, 6.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-65.20747375488281, -63.1240234375, -61.04057312011719, -58.957122802734375, -56.8736686706543, -54.790218353271484, -52.70676803588867, -50.62331771850586, -48.53986358642578, -46.45641326904297, -44.372962951660156, -42.289512634277344, -40.206058502197266, -38.12260818481445, -36.03915786743164, -33.95570755004883, -31.872257232666016, -29.788806915283203, -27.705354690551758, -25.621904373168945, -23.5384521484375, -21.455001831054688, -19.371551513671875, -17.288101196289062, -15.204648971557617, -13.121197700500488, -11.03774642944336, -8.954296112060547, -6.870844841003418, -4.787393569946289, -2.7039432525634766, -0.6204919815063477, 1.4629592895507812, 3.546410322189331, 5.629861354827881, 7.713312149047852, 9.79676342010498, 11.88021469116211, 13.963665008544922, 16.047115325927734, 18.13056755065918, 20.214017868041992, 22.297470092773438, 24.38092041015625, 26.464370727539062, 28.547822952270508, 30.63127326965332, 32.714725494384766, 34.79817581176758, 36.88162612915039, 38.9650764465332, 41.04853057861328, 43.131980895996094, 45.215431213378906, 47.29888153076172, 49.38233184814453, 51.465782165527344, 53.549232482910156, 55.63268280029297, 57.71613311767578, 59.79958724975586, 61.88303756713867, 63.966487884521484, 66.04994201660156, 68.13339233398438]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 5.0, 7.0, 5.0, 7.0, 5.0, 16.0, 14.0, 13.0, 14.0, 13.0, 21.0, 18.0, 25.0, 37.0, 26.0, 24.0, 41.0, 32.0, 31.0, 42.0, 47.0, 45.0, 49.0, 51.0, 42.0, 43.0, 37.0, 27.0, 35.0, 34.0, 25.0, 26.0, 17.0, 18.0, 21.0, 17.0, 14.0, 17.0, 9.0, 6.0, 5.0, 2.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-10.375, -10.085205078125, -9.79541015625, -9.505615234375, -9.2158203125, -8.926025390625, -8.63623046875, -8.346435546875, -8.056640625, -7.766845703125, -7.47705078125, -7.187255859375, -6.8974609375, -6.607666015625, -6.31787109375, -6.028076171875, -5.73828125, -5.448486328125, -5.15869140625, -4.868896484375, -4.5791015625, -4.289306640625, -3.99951171875, -3.709716796875, -3.419921875, -3.130126953125, -2.84033203125, -2.550537109375, -2.2607421875, -1.970947265625, -1.68115234375, -1.391357421875, -1.1015625, -0.811767578125, -0.52197265625, -0.232177734375, 0.0576171875, 0.347412109375, 0.63720703125, 0.927001953125, 1.216796875, 1.506591796875, 1.79638671875, 2.086181640625, 2.3759765625, 2.665771484375, 2.95556640625, 3.245361328125, 3.53515625, 3.824951171875, 4.11474609375, 4.404541015625, 4.6943359375, 4.984130859375, 5.27392578125, 5.563720703125, 5.853515625, 6.143310546875, 6.43310546875, 6.722900390625, 7.0126953125, 7.302490234375, 7.59228515625, 7.882080078125, 8.171875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 10.0, 14.0, 20.0, 25.0, 42.0, 72.0, 88.0, 129.0, 188.0, 327.0, 497.0, 747.0, 1119.0, 1762.0, 2568.0, 3867.0, 5786.0, 9041.0, 13290.0, 19871.0, 29675.0, 45765.0, 71796.0, 114046.0, 182441.0, 197268.0, 123555.0, 78405.0, 50117.0, 32502.0, 21442.0, 14371.0, 9249.0, 6104.0, 4169.0, 2805.0, 1818.0, 1197.0, 772.0, 532.0, 345.0, 228.0, 160.0, 110.0, 60.0, 50.0, 22.0, 31.0, 24.0, 8.0, 11.0, 4.0, 10.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.1983642578125, -0.1919841766357422, -0.18560409545898438, -0.17922401428222656, -0.17284393310546875, -0.16646385192871094, -0.16008377075195312, -0.1537036895751953, -0.1473236083984375, -0.1409435272216797, -0.13456344604492188, -0.12818336486816406, -0.12180328369140625, -0.11542320251464844, -0.10904312133789062, -0.10266304016113281, -0.096282958984375, -0.08990287780761719, -0.08352279663085938, -0.07714271545410156, -0.07076263427734375, -0.06438255310058594, -0.058002471923828125, -0.05162239074707031, -0.0452423095703125, -0.03886222839355469, -0.032482147216796875, -0.026102066040039062, -0.01972198486328125, -0.013341903686523438, -0.006961822509765625, -0.0005817413330078125, 0.00579833984375, 0.012178421020507812, 0.018558502197265625, 0.024938583374023438, 0.03131866455078125, 0.03769874572753906, 0.044078826904296875, 0.05045890808105469, 0.0568389892578125, 0.06321907043457031, 0.06959915161132812, 0.07597923278808594, 0.08235931396484375, 0.08873939514160156, 0.09511947631835938, 0.10149955749511719, 0.107879638671875, 0.11425971984863281, 0.12063980102539062, 0.12701988220214844, 0.13339996337890625, 0.13978004455566406, 0.14616012573242188, 0.1525402069091797, 0.1589202880859375, 0.1653003692626953, 0.17168045043945312, 0.17806053161621094, 0.18444061279296875, 0.19082069396972656, 0.19720077514648438, 0.2035808563232422, 0.2099609375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 7.0, 6.0, 10.0, 7.0, 7.0, 17.0, 12.0, 11.0, 22.0, 24.0, 22.0, 29.0, 27.0, 25.0, 28.0, 26.0, 36.0, 45.0, 32.0, 45.0, 45.0, 1062.0, 40.0, 26.0, 34.0, 38.0, 33.0, 25.0, 33.0, 31.0, 21.0, 26.0, 32.0, 22.0, 21.0, 12.0, 12.0, 14.0, 16.0, 5.0, 15.0, 2.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.625, -6.41632080078125, -6.2076416015625, -5.99896240234375, -5.790283203125, -5.58160400390625, -5.3729248046875, -5.16424560546875, -4.95556640625, -4.74688720703125, -4.5382080078125, -4.32952880859375, -4.120849609375, -3.91217041015625, -3.7034912109375, -3.49481201171875, -3.2861328125, -3.07745361328125, -2.8687744140625, -2.66009521484375, -2.451416015625, -2.24273681640625, -2.0340576171875, -1.82537841796875, -1.61669921875, -1.40802001953125, -1.1993408203125, -0.99066162109375, -0.781982421875, -0.57330322265625, -0.3646240234375, -0.15594482421875, 0.052734375, 0.26141357421875, 0.4700927734375, 0.67877197265625, 0.887451171875, 1.09613037109375, 1.3048095703125, 1.51348876953125, 1.72216796875, 1.93084716796875, 2.1395263671875, 2.34820556640625, 2.556884765625, 2.76556396484375, 2.9742431640625, 3.18292236328125, 3.3916015625, 3.60028076171875, 3.8089599609375, 4.01763916015625, 4.226318359375, 4.43499755859375, 4.6436767578125, 4.85235595703125, 5.06103515625, 5.26971435546875, 5.4783935546875, 5.68707275390625, 5.895751953125, 6.10443115234375, 6.3131103515625, 6.52178955078125, 6.73046875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 8.0, 8.0, 13.0, 12.0, 23.0, 35.0, 37.0, 63.0, 95.0, 117.0, 174.0, 255.0, 344.0, 534.0, 687.0, 1041.0, 1453.0, 2057.0, 2982.0, 4537.0, 6308.0, 9226.0, 13232.0, 19364.0, 28493.0, 41017.0, 59968.0, 88889.0, 133187.0, 1227620.0, 146327.0, 98426.0, 66002.0, 44808.0, 31213.0, 21449.0, 14731.0, 9805.0, 6926.0, 4777.0, 3335.0, 2264.0, 1522.0, 1153.0, 769.0, 534.0, 372.0, 253.0, 214.0, 146.0, 82.0, 90.0, 55.0, 33.0, 29.0, 14.0, 13.0, 9.0, 4.0, 6.0, 3.0, 3.0], "bins": [-0.08935546875, -0.08652973175048828, -0.08370399475097656, -0.08087825775146484, -0.07805252075195312, -0.0752267837524414, -0.07240104675292969, -0.06957530975341797, -0.06674957275390625, -0.06392383575439453, -0.06109809875488281, -0.058272361755371094, -0.055446624755859375, -0.052620887756347656, -0.04979515075683594, -0.04696941375732422, -0.0441436767578125, -0.04131793975830078, -0.03849220275878906, -0.035666465759277344, -0.032840728759765625, -0.030014991760253906, -0.027189254760742188, -0.02436351776123047, -0.02153778076171875, -0.01871204376220703, -0.015886306762695312, -0.013060569763183594, -0.010234832763671875, -0.007409095764160156, -0.0045833587646484375, -0.0017576217651367188, 0.001068115234375, 0.0038938522338867188, 0.0067195892333984375, 0.009545326232910156, 0.012371063232421875, 0.015196800231933594, 0.018022537231445312, 0.02084827423095703, 0.02367401123046875, 0.02649974822998047, 0.029325485229492188, 0.032151222229003906, 0.034976959228515625, 0.037802696228027344, 0.04062843322753906, 0.04345417022705078, 0.0462799072265625, 0.04910564422607422, 0.05193138122558594, 0.054757118225097656, 0.057582855224609375, 0.060408592224121094, 0.06323432922363281, 0.06606006622314453, 0.06888580322265625, 0.07171154022216797, 0.07453727722167969, 0.0773630142211914, 0.08018875122070312, 0.08301448822021484, 0.08584022521972656, 0.08866596221923828, 0.09149169921875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 6.0, 9.0, 8.0, 13.0, 10.0, 16.0, 15.0, 18.0, 29.0, 35.0, 31.0, 40.0, 52.0, 44.0, 55.0, 49.0, 56.0, 55.0, 39.0, 40.0, 43.0, 43.0, 42.0, 42.0, 36.0, 21.0, 30.0, 19.0, 14.0, 17.0, 9.0, 8.0, 12.0, 7.0, 2.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0010166168212890625, -0.0009859949350357056, -0.0009553730487823486, -0.0009247511625289917, -0.0008941292762756348, -0.0008635073900222778, -0.0008328855037689209, -0.000802263617515564, -0.000771641731262207, -0.0007410198450088501, -0.0007103979587554932, -0.0006797760725021362, -0.0006491541862487793, -0.0006185322999954224, -0.0005879104137420654, -0.0005572885274887085, -0.0005266666412353516, -0.0004960447549819946, -0.0004654228687286377, -0.00043480098247528076, -0.00040417909622192383, -0.0003735572099685669, -0.00034293532371520996, -0.00031231343746185303, -0.0002816915512084961, -0.00025106966495513916, -0.00022044777870178223, -0.0001898258924484253, -0.00015920400619506836, -0.00012858211994171143, -9.796023368835449e-05, -6.733834743499756e-05, -3.6716461181640625e-05, -6.094574928283691e-06, 2.4527311325073242e-05, 5.5149197578430176e-05, 8.577108383178711e-05, 0.00011639297008514404, 0.00014701485633850098, 0.0001776367425918579, 0.00020825862884521484, 0.00023888051509857178, 0.0002695024013519287, 0.00030012428760528564, 0.0003307461738586426, 0.0003613680601119995, 0.00039198994636535645, 0.0004226118326187134, 0.0004532337188720703, 0.00048385560512542725, 0.0005144774913787842, 0.0005450993776321411, 0.000575721263885498, 0.000606343150138855, 0.0006369650363922119, 0.0006675869226455688, 0.0006982088088989258, 0.0007288306951522827, 0.0007594525814056396, 0.0007900744676589966, 0.0008206963539123535, 0.0008513182401657104, 0.0008819401264190674, 0.0009125620126724243, 0.0009431838989257812]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 2.0, 7.0, 5.0, 7.0, 9.0, 14.0, 13.0, 14.0, 18.0, 22.0, 28.0, 35.0, 75.0, 103.0, 158.0, 244.0, 480.0, 1127.0, 28473.0, 1008390.0, 7349.0, 879.0, 402.0, 216.0, 134.0, 83.0, 58.0, 50.0, 32.0, 25.0, 22.0, 12.0, 9.0, 11.0, 10.0, 7.0, 5.0, 10.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0184173583984375, -0.017810821533203125, -0.01720428466796875, -0.016597747802734375, -0.0159912109375, -0.015384674072265625, -0.01477813720703125, -0.014171600341796875, -0.0135650634765625, -0.012958526611328125, -0.01235198974609375, -0.011745452880859375, -0.011138916015625, -0.010532379150390625, -0.00992584228515625, -0.009319305419921875, -0.0087127685546875, -0.008106231689453125, -0.00749969482421875, -0.006893157958984375, -0.00628662109375, -0.005680084228515625, -0.00507354736328125, -0.004467010498046875, -0.0038604736328125, -0.003253936767578125, -0.00264739990234375, -0.002040863037109375, -0.001434326171875, -0.000827789306640625, -0.00022125244140625, 0.000385284423828125, 0.0009918212890625, 0.001598358154296875, 0.00220489501953125, 0.002811431884765625, 0.00341796875, 0.004024505615234375, 0.00463104248046875, 0.005237579345703125, 0.0058441162109375, 0.006450653076171875, 0.00705718994140625, 0.007663726806640625, 0.008270263671875, 0.008876800537109375, 0.00948333740234375, 0.010089874267578125, 0.0106964111328125, 0.011302947998046875, 0.01190948486328125, 0.012516021728515625, 0.01312255859375, 0.013729095458984375, 0.01433563232421875, 0.014942169189453125, 0.0155487060546875, 0.016155242919921875, 0.01676177978515625, 0.017368316650390625, 0.017974853515625, 0.018581390380859375, 0.01918792724609375, 0.019794464111328125, 0.0204010009765625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 353.0, 658.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03300518915057182, -0.032426510006189346, -0.03184782713651657, -0.031269147992134094, -0.03069046512246132, -0.030111784115433693, -0.029533103108406067, -0.02895442396402359, -0.028375741094350815, -0.02779706008732319, -0.027218379080295563, -0.026639698073267937, -0.02606101706624031, -0.025482336059212685, -0.02490365505218506, -0.024324975907802582, -0.023746294900774956, -0.02316761389374733, -0.022588932886719704, -0.022010251879692078, -0.02143157087266445, -0.020852889865636826, -0.0202742088586092, -0.019695527851581573, -0.019116848707199097, -0.01853816770017147, -0.017959486693143845, -0.01738080568611622, -0.016802124679088593, -0.016223443672060966, -0.01564476266503334, -0.015066082589328289, -0.014487400650978088, -0.013908719643950462, -0.013330038636922836, -0.01275135762989521, -0.012172676622867584, -0.011593995615839958, -0.011015315540134907, -0.01043663453310728, -0.009857953526079655, -0.009279272519052029, -0.008700591512024403, -0.008121910504996777, -0.007543229963630438, -0.006964548956602812, -0.006385868415236473, -0.005807187408208847, -0.005228506401181221, -0.004649825394153595, -0.004071144387125969, -0.00349246384575963, -0.002913782838732004, -0.002335101831704378, -0.0017564210575073957, -0.0011777402833104134, -0.0005990592762827873, -2.0378385670483112e-05, 0.0005583025049418211, 0.0011369833955541253, 0.0017156642861664295, 0.0022943452931940556, 0.002873026067391038, 0.0034517068415880203, 0.004030387848615646]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 9.0, 12.0, 19.0, 19.0, 25.0, 21.0, 25.0, 35.0, 29.0, 41.0, 61.0, 56.0, 63.0, 64.0, 75.0, 64.0, 49.0, 62.0, 55.0, 37.0, 25.0, 27.0, 34.0, 18.0, 20.0, 16.0, 11.0, 4.0, 3.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001224815845489502, -0.0011795097962021828, -0.0011342037469148636, -0.0010888976976275444, -0.0010435916483402252, -0.000998285599052906, -0.0009529795497655869, -0.0009076735004782677, -0.0008623674511909485, -0.0008170614019036293, -0.0007717553526163101, -0.0007264493033289909, -0.0006811432540416718, -0.0006358372047543526, -0.0005905311554670334, -0.0005452251061797142, -0.000499919056892395, -0.00045461300760507584, -0.00040930695831775665, -0.00036400090903043747, -0.0003186948597431183, -0.0002733888104557991, -0.00022808276116847992, -0.00018277671188116074, -0.00013747066259384155, -9.216461330652237e-05, -4.6858564019203186e-05, -1.5525147318840027e-06, 4.375353455543518e-05, 8.905958384275436e-05, 0.00013436563313007355, 0.00017967168241739273, 0.00022497773170471191, 0.0002702837809920311, 0.0003155898302793503, 0.00036089587956666946, 0.00040620192885398865, 0.00045150797814130783, 0.000496814027428627, 0.0005421200767159462, 0.0005874261260032654, 0.0006327321752905846, 0.0006780382245779037, 0.0007233442738652229, 0.0007686503231525421, 0.0008139563724398613, 0.0008592624217271805, 0.0009045684710144997, 0.0009498745203018188, 0.000995180569589138, 0.0010404866188764572, 0.0010857926681637764, 0.0011310987174510956, 0.0011764047667384148, 0.001221710816025734, 0.0012670168653130531, 0.0013123229146003723, 0.0013576289638876915, 0.0014029350131750107, 0.0014482410624623299, 0.001493547111749649, 0.0015388531610369682, 0.0015841592103242874, 0.0016294652596116066, 0.0016747713088989258]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 5.0, 7.0, 5.0, 7.0, 5.0, 16.0, 14.0, 13.0, 14.0, 13.0, 21.0, 18.0, 25.0, 37.0, 26.0, 24.0, 41.0, 32.0, 31.0, 42.0, 47.0, 45.0, 49.0, 51.0, 42.0, 43.0, 37.0, 27.0, 35.0, 34.0, 25.0, 26.0, 17.0, 18.0, 21.0, 17.0, 14.0, 17.0, 9.0, 6.0, 5.0, 2.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-10.375, -10.085205078125, -9.79541015625, -9.505615234375, -9.2158203125, -8.926025390625, -8.63623046875, -8.346435546875, -8.056640625, -7.766845703125, -7.47705078125, -7.187255859375, -6.8974609375, -6.607666015625, -6.31787109375, -6.028076171875, -5.73828125, -5.448486328125, -5.15869140625, -4.868896484375, -4.5791015625, -4.289306640625, -3.99951171875, -3.709716796875, -3.419921875, -3.130126953125, -2.84033203125, -2.550537109375, -2.2607421875, -1.970947265625, -1.68115234375, -1.391357421875, -1.1015625, -0.811767578125, -0.52197265625, -0.232177734375, 0.0576171875, 0.347412109375, 0.63720703125, 0.927001953125, 1.216796875, 1.506591796875, 1.79638671875, 2.086181640625, 2.3759765625, 2.665771484375, 2.95556640625, 3.245361328125, 3.53515625, 3.824951171875, 4.11474609375, 4.404541015625, 4.6943359375, 4.984130859375, 5.27392578125, 5.563720703125, 5.853515625, 6.143310546875, 6.43310546875, 6.722900390625, 7.0126953125, 7.302490234375, 7.59228515625, 7.882080078125, 8.171875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 11.0, 11.0, 9.0, 22.0, 26.0, 38.0, 46.0, 56.0, 117.0, 130.0, 179.0, 292.0, 352.0, 610.0, 869.0, 1427.0, 2291.0, 3905.0, 7545.0, 16775.0, 48818.0, 246793.0, 578209.0, 90315.0, 25894.0, 10732.0, 5056.0, 2949.0, 1746.0, 1094.0, 707.0, 445.0, 322.0, 222.0, 151.0, 124.0, 72.0, 55.0, 28.0, 38.0, 16.0, 11.0, 11.0, 12.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-18.65625, -18.1265869140625, -17.596923828125, -17.0672607421875, -16.53759765625, -16.0079345703125, -15.478271484375, -14.9486083984375, -14.4189453125, -13.8892822265625, -13.359619140625, -12.8299560546875, -12.30029296875, -11.7706298828125, -11.240966796875, -10.7113037109375, -10.181640625, -9.6519775390625, -9.122314453125, -8.5926513671875, -8.06298828125, -7.5333251953125, -7.003662109375, -6.4739990234375, -5.9443359375, -5.4146728515625, -4.885009765625, -4.3553466796875, -3.82568359375, -3.2960205078125, -2.766357421875, -2.2366943359375, -1.70703125, -1.1773681640625, -0.647705078125, -0.1180419921875, 0.41162109375, 0.9412841796875, 1.470947265625, 2.0006103515625, 2.5302734375, 3.0599365234375, 3.589599609375, 4.1192626953125, 4.64892578125, 5.1785888671875, 5.708251953125, 6.2379150390625, 6.767578125, 7.2972412109375, 7.826904296875, 8.3565673828125, 8.88623046875, 9.4158935546875, 9.945556640625, 10.4752197265625, 11.0048828125, 11.5345458984375, 12.064208984375, 12.5938720703125, 13.12353515625, 13.6531982421875, 14.182861328125, 14.7125244140625, 15.2421875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 8.0, 2.0, 4.0, 7.0, 10.0, 10.0, 12.0, 20.0, 15.0, 25.0, 33.0, 33.0, 38.0, 44.0, 54.0, 86.0, 106.0, 231.0, 1662.0, 180.0, 93.0, 72.0, 42.0, 55.0, 32.0, 36.0, 29.0, 22.0, 16.0, 19.0, 11.0, 15.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.625, -36.29736328125, -34.9697265625, -33.64208984375, -32.314453125, -30.98681640625, -29.6591796875, -28.33154296875, -27.00390625, -25.67626953125, -24.3486328125, -23.02099609375, -21.693359375, -20.36572265625, -19.0380859375, -17.71044921875, -16.3828125, -15.05517578125, -13.7275390625, -12.39990234375, -11.072265625, -9.74462890625, -8.4169921875, -7.08935546875, -5.76171875, -4.43408203125, -3.1064453125, -1.77880859375, -0.451171875, 0.87646484375, 2.2041015625, 3.53173828125, 4.859375, 6.18701171875, 7.5146484375, 8.84228515625, 10.169921875, 11.49755859375, 12.8251953125, 14.15283203125, 15.48046875, 16.80810546875, 18.1357421875, 19.46337890625, 20.791015625, 22.11865234375, 23.4462890625, 24.77392578125, 26.1015625, 27.42919921875, 28.7568359375, 30.08447265625, 31.412109375, 32.73974609375, 34.0673828125, 35.39501953125, 36.72265625, 38.05029296875, 39.3779296875, 40.70556640625, 42.033203125, 43.36083984375, 44.6884765625, 46.01611328125, 47.34375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 6.0, 11.0, 15.0, 19.0, 27.0, 33.0, 52.0, 66.0, 73.0, 112.0, 198.0, 388.0, 1237.0, 9768.0, 761521.0, 2356929.0, 12689.0, 1465.0, 416.0, 170.0, 124.0, 96.0, 71.0, 39.0, 44.0, 34.0, 24.0, 17.0, 12.0, 7.0, 4.0, 6.0, 11.0, 6.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-84.8125, -82.4599609375, -80.107421875, -77.7548828125, -75.40234375, -73.0498046875, -70.697265625, -68.3447265625, -65.9921875, -63.6396484375, -61.287109375, -58.9345703125, -56.58203125, -54.2294921875, -51.876953125, -49.5244140625, -47.171875, -44.8193359375, -42.466796875, -40.1142578125, -37.76171875, -35.4091796875, -33.056640625, -30.7041015625, -28.3515625, -25.9990234375, -23.646484375, -21.2939453125, -18.94140625, -16.5888671875, -14.236328125, -11.8837890625, -9.53125, -7.1787109375, -4.826171875, -2.4736328125, -0.12109375, 2.2314453125, 4.583984375, 6.9365234375, 9.2890625, 11.6416015625, 13.994140625, 16.3466796875, 18.69921875, 21.0517578125, 23.404296875, 25.7568359375, 28.109375, 30.4619140625, 32.814453125, 35.1669921875, 37.51953125, 39.8720703125, 42.224609375, 44.5771484375, 46.9296875, 49.2822265625, 51.634765625, 53.9873046875, 56.33984375, 58.6923828125, 61.044921875, 63.3974609375, 65.75]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 266.0, 751.0], "bins": [-1739.109375, -1711.553466796875, -1683.9976806640625, -1656.4417724609375, -1628.8858642578125, -1601.3299560546875, -1573.774169921875, -1546.21826171875, -1518.662353515625, -1491.1064453125, -1463.5506591796875, -1435.9947509765625, -1408.4388427734375, -1380.8829345703125, -1353.3271484375, -1325.771240234375, -1298.21533203125, -1270.659423828125, -1243.1036376953125, -1215.5477294921875, -1187.9918212890625, -1160.4359130859375, -1132.880126953125, -1105.32421875, -1077.7684326171875, -1050.2125244140625, -1022.6566772460938, -995.100830078125, -967.544921875, -939.9890747070312, -912.4332275390625, -884.8773193359375, -857.3213500976562, -829.7655029296875, -802.2095947265625, -774.6537475585938, -747.0978393554688, -719.5419921875, -691.986083984375, -664.4302368164062, -636.8743896484375, -609.3185424804688, -581.7626342773438, -554.206787109375, -526.65087890625, -499.09503173828125, -471.5391540527344, -443.9832763671875, -416.4273986816406, -388.87152099609375, -361.3156433105469, -333.759765625, -306.20391845703125, -278.64801025390625, -251.0921630859375, -223.53628540039062, -195.9803924560547, -168.4245147705078, -140.86865234375, -113.31277465820312, -85.75689697265625, -58.201019287109375, -30.645156860351562, -3.0892791748046875, 24.466596603393555]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 11.0, 7.0, 7.0, 12.0, 10.0, 10.0, 10.0, 22.0, 16.0, 32.0, 28.0, 36.0, 34.0, 44.0, 38.0, 36.0, 48.0, 30.0, 39.0, 49.0, 37.0, 42.0, 38.0, 37.0, 40.0, 36.0, 36.0, 25.0, 37.0, 19.0, 21.0, 17.0, 16.0, 12.0, 12.0, 10.0, 10.0, 15.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-83.80767822265625, -81.05241394042969, -78.29714965820312, -75.5418930053711, -72.78662872314453, -70.03136444091797, -67.27610778808594, -64.52084350585938, -61.76557922363281, -59.01031494140625, -56.25505447387695, -53.499794006347656, -50.744529724121094, -47.98926544189453, -45.234004974365234, -42.47874450683594, -39.723480224609375, -36.96821594238281, -34.212955474853516, -31.457693099975586, -28.702430725097656, -25.947168350219727, -23.191905975341797, -20.436643600463867, -17.681381225585938, -14.926118850708008, -12.170856475830078, -9.415594100952148, -6.660331726074219, -3.905069351196289, -1.1498069763183594, 1.6054553985595703, 4.3607177734375, 7.11598014831543, 9.87124252319336, 12.626504898071289, 15.381767272949219, 18.13702964782715, 20.892292022705078, 23.647554397583008, 26.402816772460938, 29.158079147338867, 31.913341522216797, 34.668601989746094, 37.423866271972656, 40.17913055419922, 42.934391021728516, 45.68965148925781, 48.444915771484375, 51.20018005371094, 53.955440521240234, 56.71070098876953, 59.465965270996094, 62.221229553222656, 64.97648620605469, 67.73175048828125, 70.48701477050781, 73.24227905273438, 75.99754333496094, 78.75279998779297, 81.50806427001953, 84.2633285522461, 87.01858520507812, 89.77384948730469, 92.52911376953125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 10.0, 2.0, 3.0, 6.0, 11.0, 11.0, 9.0, 16.0, 16.0, 20.0, 17.0, 20.0, 32.0, 23.0, 32.0, 29.0, 40.0, 31.0, 42.0, 50.0, 53.0, 41.0, 42.0, 46.0, 46.0, 49.0, 42.0, 31.0, 28.0, 30.0, 27.0, 17.0, 17.0, 20.0, 16.0, 15.0, 19.0, 11.0, 6.0, 8.0, 4.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.8046875, -11.4803466796875, -11.156005859375, -10.8316650390625, -10.50732421875, -10.1829833984375, -9.858642578125, -9.5343017578125, -9.2099609375, -8.8856201171875, -8.561279296875, -8.2369384765625, -7.91259765625, -7.5882568359375, -7.263916015625, -6.9395751953125, -6.615234375, -6.2908935546875, -5.966552734375, -5.6422119140625, -5.31787109375, -4.9935302734375, -4.669189453125, -4.3448486328125, -4.0205078125, -3.6961669921875, -3.371826171875, -3.0474853515625, -2.72314453125, -2.3988037109375, -2.074462890625, -1.7501220703125, -1.42578125, -1.1014404296875, -0.777099609375, -0.4527587890625, -0.12841796875, 0.1959228515625, 0.520263671875, 0.8446044921875, 1.1689453125, 1.4932861328125, 1.817626953125, 2.1419677734375, 2.46630859375, 2.7906494140625, 3.114990234375, 3.4393310546875, 3.763671875, 4.0880126953125, 4.412353515625, 4.7366943359375, 5.06103515625, 5.3853759765625, 5.709716796875, 6.0340576171875, 6.3583984375, 6.6827392578125, 7.007080078125, 7.3314208984375, 7.65576171875, 7.9801025390625, 8.304443359375, 8.6287841796875, 8.953125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 8.0, 7.0, 7.0, 5.0, 12.0, 10.0, 21.0, 24.0, 27.0, 33.0, 46.0, 66.0, 96.0, 192.0, 257.0, 472.0, 994.0, 2276.0, 5838.0, 18281.0, 221331.0, 3653669.0, 261517.0, 19055.0, 5786.0, 2169.0, 935.0, 429.0, 262.0, 119.0, 85.0, 62.0, 47.0, 28.0, 30.0, 17.0, 26.0, 15.0, 8.0, 3.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.40625, -46.10791015625, -44.8095703125, -43.51123046875, -42.212890625, -40.91455078125, -39.6162109375, -38.31787109375, -37.01953125, -35.72119140625, -34.4228515625, -33.12451171875, -31.826171875, -30.52783203125, -29.2294921875, -27.93115234375, -26.6328125, -25.33447265625, -24.0361328125, -22.73779296875, -21.439453125, -20.14111328125, -18.8427734375, -17.54443359375, -16.24609375, -14.94775390625, -13.6494140625, -12.35107421875, -11.052734375, -9.75439453125, -8.4560546875, -7.15771484375, -5.859375, -4.56103515625, -3.2626953125, -1.96435546875, -0.666015625, 0.63232421875, 1.9306640625, 3.22900390625, 4.52734375, 5.82568359375, 7.1240234375, 8.42236328125, 9.720703125, 11.01904296875, 12.3173828125, 13.61572265625, 14.9140625, 16.21240234375, 17.5107421875, 18.80908203125, 20.107421875, 21.40576171875, 22.7041015625, 24.00244140625, 25.30078125, 26.59912109375, 27.8974609375, 29.19580078125, 30.494140625, 31.79248046875, 33.0908203125, 34.38916015625, 35.6875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 3.0, 6.0, 11.0, 6.0, 16.0, 11.0, 18.0, 22.0, 30.0, 37.0, 56.0, 95.0, 166.0, 329.0, 648.0, 833.0, 773.0, 420.0, 222.0, 125.0, 61.0, 41.0, 36.0, 20.0, 19.0, 21.0, 19.0, 8.0, 7.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.09375, -33.166015625, -32.23828125, -31.310546875, -30.3828125, -29.455078125, -28.52734375, -27.599609375, -26.671875, -25.744140625, -24.81640625, -23.888671875, -22.9609375, -22.033203125, -21.10546875, -20.177734375, -19.25, -18.322265625, -17.39453125, -16.466796875, -15.5390625, -14.611328125, -13.68359375, -12.755859375, -11.828125, -10.900390625, -9.97265625, -9.044921875, -8.1171875, -7.189453125, -6.26171875, -5.333984375, -4.40625, -3.478515625, -2.55078125, -1.623046875, -0.6953125, 0.232421875, 1.16015625, 2.087890625, 3.015625, 3.943359375, 4.87109375, 5.798828125, 6.7265625, 7.654296875, 8.58203125, 9.509765625, 10.4375, 11.365234375, 12.29296875, 13.220703125, 14.1484375, 15.076171875, 16.00390625, 16.931640625, 17.859375, 18.787109375, 19.71484375, 20.642578125, 21.5703125, 22.498046875, 23.42578125, 24.353515625, 25.28125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 12.0, 18.0, 31.0, 28.0, 48.0, 96.0, 175.0, 447.0, 1269.0, 4109.0, 18060.0, 158441.0, 3820213.0, 166582.0, 18326.0, 4249.0, 1276.0, 438.0, 178.0, 105.0, 51.0, 22.0, 19.0, 20.0, 19.0, 7.0, 11.0, 3.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.59375, -53.57275390625, -51.5517578125, -49.53076171875, -47.509765625, -45.48876953125, -43.4677734375, -41.44677734375, -39.42578125, -37.40478515625, -35.3837890625, -33.36279296875, -31.341796875, -29.32080078125, -27.2998046875, -25.27880859375, -23.2578125, -21.23681640625, -19.2158203125, -17.19482421875, -15.173828125, -13.15283203125, -11.1318359375, -9.11083984375, -7.08984375, -5.06884765625, -3.0478515625, -1.02685546875, 0.994140625, 3.01513671875, 5.0361328125, 7.05712890625, 9.078125, 11.09912109375, 13.1201171875, 15.14111328125, 17.162109375, 19.18310546875, 21.2041015625, 23.22509765625, 25.24609375, 27.26708984375, 29.2880859375, 31.30908203125, 33.330078125, 35.35107421875, 37.3720703125, 39.39306640625, 41.4140625, 43.43505859375, 45.4560546875, 47.47705078125, 49.498046875, 51.51904296875, 53.5400390625, 55.56103515625, 57.58203125, 59.60302734375, 61.6240234375, 63.64501953125, 65.666015625, 67.68701171875, 69.7080078125, 71.72900390625, 73.75]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 6.0, 7.0, 8.0, 12.0, 30.0, 25.0, 35.0, 64.0, 82.0, 110.0, 143.0, 130.0, 110.0, 88.0, 49.0, 40.0, 22.0, 22.0, 12.0, 4.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.06134033203125, -50.48974609375, -46.91815185546875, -43.346561431884766, -39.774967193603516, -36.203372955322266, -32.63178253173828, -29.06018829345703, -25.48859405517578, -21.91699981689453, -18.345407485961914, -14.77381420135498, -11.202220916748047, -7.630626678466797, -4.05903434753418, -0.4874420166015625, 3.0841522216796875, 6.655745506286621, 10.227338790893555, 13.798932075500488, 17.370525360107422, 20.942119598388672, 24.51371192932129, 28.085304260253906, 31.656898498535156, 35.228492736816406, 38.800086975097656, 42.37167739868164, 45.94327163696289, 49.51486587524414, 53.086456298828125, 56.658050537109375, 60.229644775390625, 63.801239013671875, 67.37283325195312, 70.94442749023438, 74.51602172851562, 78.08761596679688, 81.6592025756836, 85.23079681396484, 88.8023910522461, 92.37398529052734, 95.9455795288086, 99.51717376708984, 103.08876037597656, 106.66035461425781, 110.23194885253906, 113.80354309082031, 117.37513732910156, 120.94673156738281, 124.51832580566406, 128.0899200439453, 131.66151428222656, 135.2331085205078, 138.80470275878906, 142.37628173828125, 145.9478759765625, 149.51947021484375, 153.091064453125, 156.66265869140625, 160.2342529296875, 163.80584716796875, 167.37744140625, 170.94903564453125, 174.5206298828125]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 3.0, 5.0, 9.0, 12.0, 17.0, 18.0, 20.0, 13.0, 20.0, 16.0, 26.0, 24.0, 23.0, 22.0, 31.0, 40.0, 40.0, 34.0, 36.0, 35.0, 41.0, 36.0, 41.0, 40.0, 34.0, 50.0, 34.0, 34.0, 34.0, 29.0, 18.0, 14.0, 24.0, 19.0, 9.0, 19.0, 18.0, 9.0, 7.0, 5.0, 6.0, 4.0, 6.0, 5.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-70.21063995361328, -68.07457733154297, -65.93851470947266, -63.802452087402344, -61.6663932800293, -59.530330657958984, -57.39426803588867, -55.25820541381836, -53.12214660644531, -50.986083984375, -48.85002136230469, -46.713958740234375, -44.57789993286133, -42.441837310791016, -40.3057746887207, -38.16971206665039, -36.03364944458008, -33.897586822509766, -31.761526107788086, -29.625463485717773, -27.489402770996094, -25.35334014892578, -23.21727752685547, -21.081214904785156, -18.945154190063477, -16.809091567993164, -14.673030853271484, -12.536968231201172, -10.400906562805176, -8.26484489440918, -6.128782272338867, -3.992720603942871, -1.856658935546875, 0.2794029712677002, 2.4154648780822754, 4.55152702331543, 6.687588691711426, 8.823650360107422, 10.959712982177734, 13.09577465057373, 15.231836318969727, 17.36789894104004, 19.50395965576172, 21.64002227783203, 23.776084899902344, 25.912145614624023, 28.048208236694336, 30.184268951416016, 32.32033157348633, 34.45639419555664, 36.59245681762695, 38.728515625, 40.86457824707031, 43.000640869140625, 45.13670349121094, 47.27276611328125, 49.40882873535156, 51.544891357421875, 53.68095397949219, 55.8170166015625, 57.95307540893555, 60.08913803100586, 62.22520065307617, 64.36125946044922, 66.49732208251953]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 5.0, 6.0, 5.0, 6.0, 14.0, 6.0, 14.0, 17.0, 19.0, 25.0, 20.0, 27.0, 24.0, 30.0, 23.0, 32.0, 36.0, 32.0, 42.0, 41.0, 48.0, 37.0, 35.0, 42.0, 37.0, 30.0, 37.0, 38.0, 41.0, 31.0, 28.0, 25.0, 18.0, 16.0, 13.0, 9.0, 21.0, 12.0, 6.0, 13.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.234375, -9.9442138671875, -9.654052734375, -9.3638916015625, -9.07373046875, -8.7835693359375, -8.493408203125, -8.2032470703125, -7.9130859375, -7.6229248046875, -7.332763671875, -7.0426025390625, -6.75244140625, -6.4622802734375, -6.172119140625, -5.8819580078125, -5.591796875, -5.3016357421875, -5.011474609375, -4.7213134765625, -4.43115234375, -4.1409912109375, -3.850830078125, -3.5606689453125, -3.2705078125, -2.9803466796875, -2.690185546875, -2.4000244140625, -2.10986328125, -1.8197021484375, -1.529541015625, -1.2393798828125, -0.94921875, -0.6590576171875, -0.368896484375, -0.0787353515625, 0.21142578125, 0.5015869140625, 0.791748046875, 1.0819091796875, 1.3720703125, 1.6622314453125, 1.952392578125, 2.2425537109375, 2.53271484375, 2.8228759765625, 3.113037109375, 3.4031982421875, 3.693359375, 3.9835205078125, 4.273681640625, 4.5638427734375, 4.85400390625, 5.1441650390625, 5.434326171875, 5.7244873046875, 6.0146484375, 6.3048095703125, 6.594970703125, 6.8851318359375, 7.17529296875, 7.4654541015625, 7.755615234375, 8.0457763671875, 8.3359375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 15.0, 18.0, 30.0, 42.0, 77.0, 97.0, 165.0, 222.0, 309.0, 433.0, 668.0, 907.0, 1284.0, 1815.0, 2550.0, 3673.0, 5007.0, 7467.0, 10665.0, 15277.0, 22079.0, 32237.0, 48584.0, 73283.0, 114971.0, 178679.0, 180405.0, 116513.0, 74597.0, 49311.0, 33248.0, 22388.0, 15369.0, 10885.0, 7527.0, 5285.0, 3703.0, 2666.0, 1840.0, 1258.0, 956.0, 685.0, 436.0, 307.0, 197.0, 125.0, 120.0, 76.0, 39.0, 14.0, 14.0, 19.0, 9.0, 6.0, 2.0, 3.0], "bins": [-0.211669921875, -0.20544815063476562, -0.19922637939453125, -0.19300460815429688, -0.1867828369140625, -0.18056106567382812, -0.17433929443359375, -0.16811752319335938, -0.161895751953125, -0.15567398071289062, -0.14945220947265625, -0.14323043823242188, -0.1370086669921875, -0.13078689575195312, -0.12456512451171875, -0.11834335327148438, -0.11212158203125, -0.10589981079101562, -0.09967803955078125, -0.09345626831054688, -0.0872344970703125, -0.08101272583007812, -0.07479095458984375, -0.06856918334960938, -0.062347412109375, -0.056125640869140625, -0.04990386962890625, -0.043682098388671875, -0.0374603271484375, -0.031238555908203125, -0.02501678466796875, -0.018795013427734375, -0.0125732421875, -0.006351470947265625, -0.00012969970703125, 0.006092071533203125, 0.0123138427734375, 0.018535614013671875, 0.02475738525390625, 0.030979156494140625, 0.037200927734375, 0.043422698974609375, 0.04964447021484375, 0.055866241455078125, 0.0620880126953125, 0.06830978393554688, 0.07453155517578125, 0.08075332641601562, 0.08697509765625, 0.09319686889648438, 0.09941864013671875, 0.10564041137695312, 0.1118621826171875, 0.11808395385742188, 0.12430572509765625, 0.13052749633789062, 0.136749267578125, 0.14297103881835938, 0.14919281005859375, 0.15541458129882812, 0.1616363525390625, 0.16785812377929688, 0.17407989501953125, 0.18030166625976562, 0.1865234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 5.0, 6.0, 8.0, 8.0, 13.0, 14.0, 15.0, 19.0, 25.0, 28.0, 28.0, 31.0, 42.0, 29.0, 34.0, 38.0, 44.0, 39.0, 39.0, 1077.0, 47.0, 45.0, 42.0, 42.0, 43.0, 28.0, 33.0, 30.0, 21.0, 28.0, 18.0, 13.0, 11.0, 15.0, 14.0, 7.0, 13.0, 6.0, 5.0, 4.0, 6.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.234375, -6.9774169921875, -6.720458984375, -6.4635009765625, -6.20654296875, -5.9495849609375, -5.692626953125, -5.4356689453125, -5.1787109375, -4.9217529296875, -4.664794921875, -4.4078369140625, -4.15087890625, -3.8939208984375, -3.636962890625, -3.3800048828125, -3.123046875, -2.8660888671875, -2.609130859375, -2.3521728515625, -2.09521484375, -1.8382568359375, -1.581298828125, -1.3243408203125, -1.0673828125, -0.8104248046875, -0.553466796875, -0.2965087890625, -0.03955078125, 0.2174072265625, 0.474365234375, 0.7313232421875, 0.98828125, 1.2452392578125, 1.502197265625, 1.7591552734375, 2.01611328125, 2.2730712890625, 2.530029296875, 2.7869873046875, 3.0439453125, 3.3009033203125, 3.557861328125, 3.8148193359375, 4.07177734375, 4.3287353515625, 4.585693359375, 4.8426513671875, 5.099609375, 5.3565673828125, 5.613525390625, 5.8704833984375, 6.12744140625, 6.3843994140625, 6.641357421875, 6.8983154296875, 7.1552734375, 7.4122314453125, 7.669189453125, 7.9261474609375, 8.18310546875, 8.4400634765625, 8.697021484375, 8.9539794921875, 9.2109375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 14.0, 21.0, 25.0, 42.0, 67.0, 91.0, 125.0, 213.0, 281.0, 399.0, 617.0, 870.0, 1297.0, 1905.0, 2792.0, 4256.0, 6508.0, 9810.0, 14706.0, 22952.0, 35822.0, 55471.0, 91191.0, 152594.0, 1269645.0, 161718.0, 96723.0, 59217.0, 37749.0, 24023.0, 15623.0, 10245.0, 6714.0, 4399.0, 2856.0, 1891.0, 1326.0, 871.0, 654.0, 427.0, 301.0, 211.0, 150.0, 111.0, 64.0, 43.0, 40.0, 15.0, 16.0, 7.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 3.0, 4.0], "bins": [-0.110107421875, -0.10650444030761719, -0.10290145874023438, -0.09929847717285156, -0.09569549560546875, -0.09209251403808594, -0.08848953247070312, -0.08488655090332031, -0.0812835693359375, -0.07768058776855469, -0.07407760620117188, -0.07047462463378906, -0.06687164306640625, -0.06326866149902344, -0.059665679931640625, -0.05606269836425781, -0.052459716796875, -0.04885673522949219, -0.045253753662109375, -0.04165077209472656, -0.03804779052734375, -0.03444480895996094, -0.030841827392578125, -0.027238845825195312, -0.0236358642578125, -0.020032882690429688, -0.016429901123046875, -0.012826919555664062, -0.00922393798828125, -0.0056209564208984375, -0.002017974853515625, 0.0015850067138671875, 0.00518798828125, 0.008790969848632812, 0.012393951416015625, 0.015996932983398438, 0.01959991455078125, 0.023202896118164062, 0.026805877685546875, 0.030408859252929688, 0.0340118408203125, 0.03761482238769531, 0.041217803955078125, 0.04482078552246094, 0.04842376708984375, 0.05202674865722656, 0.055629730224609375, 0.05923271179199219, 0.062835693359375, 0.06643867492675781, 0.07004165649414062, 0.07364463806152344, 0.07724761962890625, 0.08085060119628906, 0.08445358276367188, 0.08805656433105469, 0.0916595458984375, 0.09526252746582031, 0.09886550903320312, 0.10246849060058594, 0.10607147216796875, 0.10967445373535156, 0.11327743530273438, 0.11688041687011719, 0.1204833984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 13.0, 10.0, 9.0, 14.0, 15.0, 16.0, 15.0, 35.0, 36.0, 50.0, 39.0, 72.0, 73.0, 74.0, 76.0, 68.0, 68.0, 55.0, 54.0, 45.0, 27.0, 28.0, 20.0, 17.0, 18.0, 11.0, 9.0, 3.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0013179779052734375, -0.0012768656015396118, -0.0012357532978057861, -0.0011946409940719604, -0.0011535286903381348, -0.001112416386604309, -0.0010713040828704834, -0.0010301917791366577, -0.000989079475402832, -0.0009479671716690063, -0.0009068548679351807, -0.000865742564201355, -0.0008246302604675293, -0.0007835179567337036, -0.0007424056529998779, -0.0007012933492660522, -0.0006601810455322266, -0.0006190687417984009, -0.0005779564380645752, -0.0005368441343307495, -0.0004957318305969238, -0.00045461952686309814, -0.00041350722312927246, -0.0003723949193954468, -0.0003312826156616211, -0.0002901703119277954, -0.0002490580081939697, -0.00020794570446014404, -0.00016683340072631836, -0.00012572109699249268, -8.460879325866699e-05, -4.349648952484131e-05, -2.384185791015625e-06, 3.872811794281006e-05, 7.984042167663574e-05, 0.00012095272541046143, 0.0001620650291442871, 0.0002031773328781128, 0.0002442896366119385, 0.00028540194034576416, 0.00032651424407958984, 0.00036762654781341553, 0.0004087388515472412, 0.0004498511552810669, 0.0004909634590148926, 0.0005320757627487183, 0.0005731880664825439, 0.0006143003702163696, 0.0006554126739501953, 0.000696524977684021, 0.0007376372814178467, 0.0007787495851516724, 0.000819861888885498, 0.0008609741926193237, 0.0009020864963531494, 0.0009431988000869751, 0.0009843111038208008, 0.0010254234075546265, 0.0010665357112884521, 0.0011076480150222778, 0.0011487603187561035, 0.0011898726224899292, 0.0012309849262237549, 0.0012720972299575806, 0.0013132095336914062]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 6.0, 3.0, 10.0, 10.0, 14.0, 21.0, 23.0, 34.0, 35.0, 66.0, 116.0, 206.0, 445.0, 1739.0, 931753.0, 112000.0, 1200.0, 391.0, 164.0, 77.0, 75.0, 40.0, 18.0, 23.0, 15.0, 15.0, 9.0, 10.0, 11.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027862548828125, -0.026988983154296875, -0.02611541748046875, -0.025241851806640625, -0.0243682861328125, -0.023494720458984375, -0.02262115478515625, -0.021747589111328125, -0.0208740234375, -0.020000457763671875, -0.01912689208984375, -0.018253326416015625, -0.0173797607421875, -0.016506195068359375, -0.01563262939453125, -0.014759063720703125, -0.013885498046875, -0.013011932373046875, -0.01213836669921875, -0.011264801025390625, -0.0103912353515625, -0.009517669677734375, -0.00864410400390625, -0.007770538330078125, -0.00689697265625, -0.006023406982421875, -0.00514984130859375, -0.004276275634765625, -0.0034027099609375, -0.002529144287109375, -0.00165557861328125, -0.000782012939453125, 9.1552734375e-05, 0.000965118408203125, 0.00183868408203125, 0.002712249755859375, 0.0035858154296875, 0.004459381103515625, 0.00533294677734375, 0.006206512451171875, 0.007080078125, 0.007953643798828125, 0.00882720947265625, 0.009700775146484375, 0.0105743408203125, 0.011447906494140625, 0.01232147216796875, 0.013195037841796875, 0.014068603515625, 0.014942169189453125, 0.01581573486328125, 0.016689300537109375, 0.0175628662109375, 0.018436431884765625, 0.01930999755859375, 0.020183563232421875, 0.02105712890625, 0.021930694580078125, 0.02280426025390625, 0.023677825927734375, 0.0245513916015625, 0.025424957275390625, 0.02629852294921875, 0.027172088623046875, 0.028045654296875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 28.0, 967.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03016747534275055, -0.02961399033665657, -0.029060503467917442, -0.028507018461823463, -0.027953531593084335, -0.027400046586990356, -0.02684655971825123, -0.02629307471215725, -0.02573958784341812, -0.025186102837324142, -0.024632615968585014, -0.024079130962491035, -0.023525644093751907, -0.02297215908765793, -0.0224186722189188, -0.02186518721282482, -0.021311702206730843, -0.020758217200636864, -0.020204730331897736, -0.019651245325803757, -0.01909775845706463, -0.01854427345097065, -0.01799078658223152, -0.017437301576137543, -0.016883816570043564, -0.016330331563949585, -0.015776844695210457, -0.015223358757793903, -0.01466987282037735, -0.014116387814283371, -0.013562901876866817, -0.013009415939450264, -0.012455929070711136, -0.011902443133294582, -0.011348957195878029, -0.010795471258461475, -0.010241985321044922, -0.009688500314950943, -0.00913501437753439, -0.008581528440117836, -0.008028042502701283, -0.007474556565284729, -0.0069210706278681755, -0.006367585156112909, -0.005814099218696356, -0.005260613281279802, -0.004707127809524536, -0.004153641872107983, -0.003600155934691429, -0.0030466699972748756, -0.002493184292688966, -0.0019396984716877341, -0.0013862126506865025, -0.000832726713269949, -0.0002792410086840391, 0.00027424469590187073, 0.0008277306333184242, 0.001381216454319656, 0.0019347022753208876, 0.0024881879799067974, 0.003041673917323351, 0.0035951598547399044, 0.004148645326495171, 0.004702131263911724, 0.005255617201328278]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 0.0, 5.0, 1.0, 3.0, 2.0, 6.0, 9.0, 6.0, 8.0, 8.0, 17.0, 21.0, 17.0, 25.0, 25.0, 28.0, 37.0, 47.0, 36.0, 37.0, 41.0, 44.0, 36.0, 47.0, 44.0, 53.0, 50.0, 39.0, 50.0, 28.0, 41.0, 26.0, 26.0, 27.0, 25.0, 15.0, 18.0, 10.0, 15.0, 14.0, 5.0, 5.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010303258895874023, -0.0009916974231600761, -0.0009530689567327499, -0.0009144404903054237, -0.0008758120238780975, -0.0008371835574507713, -0.0007985550910234451, -0.0007599266245961189, -0.0007212981581687927, -0.0006826696917414665, -0.0006440412253141403, -0.0006054127588868141, -0.0005667842924594879, -0.0005281558260321617, -0.0004895273596048355, -0.0004508988931775093, -0.0004122704267501831, -0.0003736419603228569, -0.0003350134938955307, -0.0002963850274682045, -0.0002577565610408783, -0.0002191280946135521, -0.0001804996281862259, -0.0001418711617588997, -0.00010324269533157349, -6.461422890424728e-05, -2.598576247692108e-05, 1.2642703950405121e-05, 5.127117037773132e-05, 8.989963680505753e-05, 0.00012852810323238373, 0.00016715656965970993, 0.00020578503608703613, 0.00024441350251436234, 0.00028304196894168854, 0.00032167043536901474, 0.00036029890179634094, 0.00039892736822366714, 0.00043755583465099335, 0.00047618430107831955, 0.0005148127675056458, 0.000553441233932972, 0.0005920697003602982, 0.0006306981667876244, 0.0006693266332149506, 0.0007079550996422768, 0.000746583566069603, 0.0007852120324969292, 0.0008238404989242554, 0.0008624689653515816, 0.0009010974317789078, 0.000939725898206234, 0.0009783543646335602, 0.0010169828310608864, 0.0010556112974882126, 0.0010942397639155388, 0.001132868230342865, 0.0011714966967701912, 0.0012101251631975174, 0.0012487536296248436, 0.0012873820960521698, 0.001326010562479496, 0.0013646390289068222, 0.0014032674953341484, 0.0014418959617614746]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 8.0, 5.0, 3.0, 5.0, 6.0, 5.0, 6.0, 14.0, 6.0, 14.0, 17.0, 19.0, 25.0, 20.0, 27.0, 24.0, 30.0, 23.0, 32.0, 36.0, 32.0, 42.0, 41.0, 48.0, 37.0, 35.0, 42.0, 37.0, 30.0, 37.0, 38.0, 41.0, 31.0, 28.0, 25.0, 18.0, 16.0, 13.0, 9.0, 21.0, 12.0, 6.0, 13.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.234375, -9.9442138671875, -9.654052734375, -9.3638916015625, -9.07373046875, -8.7835693359375, -8.493408203125, -8.2032470703125, -7.9130859375, -7.6229248046875, -7.332763671875, -7.0426025390625, -6.75244140625, -6.4622802734375, -6.172119140625, -5.8819580078125, -5.591796875, -5.3016357421875, -5.011474609375, -4.7213134765625, -4.43115234375, -4.1409912109375, -3.850830078125, -3.5606689453125, -3.2705078125, -2.9803466796875, -2.690185546875, -2.4000244140625, -2.10986328125, -1.8197021484375, -1.529541015625, -1.2393798828125, -0.94921875, -0.6590576171875, -0.368896484375, -0.0787353515625, 0.21142578125, 0.5015869140625, 0.791748046875, 1.0819091796875, 1.3720703125, 1.6622314453125, 1.952392578125, 2.2425537109375, 2.53271484375, 2.8228759765625, 3.113037109375, 3.4031982421875, 3.693359375, 3.9835205078125, 4.273681640625, 4.5638427734375, 4.85400390625, 5.1441650390625, 5.434326171875, 5.7244873046875, 6.0146484375, 6.3048095703125, 6.594970703125, 6.8851318359375, 7.17529296875, 7.4654541015625, 7.755615234375, 8.0457763671875, 8.3359375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 10.0, 18.0, 20.0, 27.0, 33.0, 52.0, 66.0, 106.0, 152.0, 215.0, 267.0, 434.0, 598.0, 917.0, 1269.0, 2167.0, 3378.0, 5230.0, 8896.0, 16607.0, 39525.0, 225401.0, 622552.0, 68457.0, 22757.0, 11284.0, 6499.0, 3900.0, 2588.0, 1620.0, 1113.0, 718.0, 507.0, 368.0, 247.0, 182.0, 103.0, 96.0, 48.0, 37.0, 29.0, 21.0, 12.0, 9.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.453125, -18.787109375, -18.12109375, -17.455078125, -16.7890625, -16.123046875, -15.45703125, -14.791015625, -14.125, -13.458984375, -12.79296875, -12.126953125, -11.4609375, -10.794921875, -10.12890625, -9.462890625, -8.796875, -8.130859375, -7.46484375, -6.798828125, -6.1328125, -5.466796875, -4.80078125, -4.134765625, -3.46875, -2.802734375, -2.13671875, -1.470703125, -0.8046875, -0.138671875, 0.52734375, 1.193359375, 1.859375, 2.525390625, 3.19140625, 3.857421875, 4.5234375, 5.189453125, 5.85546875, 6.521484375, 7.1875, 7.853515625, 8.51953125, 9.185546875, 9.8515625, 10.517578125, 11.18359375, 11.849609375, 12.515625, 13.181640625, 13.84765625, 14.513671875, 15.1796875, 15.845703125, 16.51171875, 17.177734375, 17.84375, 18.509765625, 19.17578125, 19.841796875, 20.5078125, 21.173828125, 21.83984375, 22.505859375, 23.171875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 4.0, 6.0, 8.0, 6.0, 11.0, 16.0, 17.0, 13.0, 22.0, 21.0, 29.0, 32.0, 37.0, 34.0, 39.0, 39.0, 54.0, 58.0, 104.0, 287.0, 1579.0, 138.0, 70.0, 43.0, 34.0, 42.0, 32.0, 29.0, 33.0, 25.0, 23.0, 17.0, 19.0, 23.0, 10.0, 17.0, 9.0, 5.0, 6.0, 7.0, 6.0, 3.0, 5.0, 8.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-30.859375, -29.956298828125, -29.05322265625, -28.150146484375, -27.2470703125, -26.343994140625, -25.44091796875, -24.537841796875, -23.634765625, -22.731689453125, -21.82861328125, -20.925537109375, -20.0224609375, -19.119384765625, -18.21630859375, -17.313232421875, -16.41015625, -15.507080078125, -14.60400390625, -13.700927734375, -12.7978515625, -11.894775390625, -10.99169921875, -10.088623046875, -9.185546875, -8.282470703125, -7.37939453125, -6.476318359375, -5.5732421875, -4.670166015625, -3.76708984375, -2.864013671875, -1.9609375, -1.057861328125, -0.15478515625, 0.748291015625, 1.6513671875, 2.554443359375, 3.45751953125, 4.360595703125, 5.263671875, 6.166748046875, 7.06982421875, 7.972900390625, 8.8759765625, 9.779052734375, 10.68212890625, 11.585205078125, 12.48828125, 13.391357421875, 14.29443359375, 15.197509765625, 16.1005859375, 17.003662109375, 17.90673828125, 18.809814453125, 19.712890625, 20.615966796875, 21.51904296875, 22.422119140625, 23.3251953125, 24.228271484375, 25.13134765625, 26.034423828125, 26.9375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [6.0, 1.0, 3.0, 6.0, 5.0, 4.0, 2.0, 10.0, 8.0, 9.0, 2.0, 17.0, 13.0, 18.0, 30.0, 24.0, 27.0, 37.0, 45.0, 54.0, 91.0, 123.0, 243.0, 454.0, 1152.0, 3349.0, 12321.0, 88925.0, 2947977.0, 73954.0, 11136.0, 3324.0, 1153.0, 433.0, 201.0, 134.0, 92.0, 68.0, 50.0, 38.0, 26.0, 30.0, 18.0, 16.0, 22.0, 15.0, 9.0, 6.0, 6.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-49.90625, -48.1533203125, -46.400390625, -44.6474609375, -42.89453125, -41.1416015625, -39.388671875, -37.6357421875, -35.8828125, -34.1298828125, -32.376953125, -30.6240234375, -28.87109375, -27.1181640625, -25.365234375, -23.6123046875, -21.859375, -20.1064453125, -18.353515625, -16.6005859375, -14.84765625, -13.0947265625, -11.341796875, -9.5888671875, -7.8359375, -6.0830078125, -4.330078125, -2.5771484375, -0.82421875, 0.9287109375, 2.681640625, 4.4345703125, 6.1875, 7.9404296875, 9.693359375, 11.4462890625, 13.19921875, 14.9521484375, 16.705078125, 18.4580078125, 20.2109375, 21.9638671875, 23.716796875, 25.4697265625, 27.22265625, 28.9755859375, 30.728515625, 32.4814453125, 34.234375, 35.9873046875, 37.740234375, 39.4931640625, 41.24609375, 42.9990234375, 44.751953125, 46.5048828125, 48.2578125, 50.0107421875, 51.763671875, 53.5166015625, 55.26953125, 57.0224609375, 58.775390625, 60.5283203125, 62.28125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 33.0, 162.0, 486.0, 261.0, 59.0, 11.0], "bins": [-482.2396240234375, -474.2826232910156, -466.32562255859375, -458.36865234375, -450.4116516113281, -442.45465087890625, -434.4976501464844, -426.5406799316406, -418.58367919921875, -410.6266784667969, -402.669677734375, -394.71270751953125, -386.7557067871094, -378.7987060546875, -370.8417053222656, -362.8847351074219, -354.927734375, -346.9707336425781, -339.01373291015625, -331.0567626953125, -323.0997619628906, -315.14276123046875, -307.1857604980469, -299.2287902832031, -291.27178955078125, -283.3147888183594, -275.3577880859375, -267.40081787109375, -259.4438171386719, -251.48681640625, -243.5298309326172, -235.5728302001953, -227.61582946777344, -219.65882873535156, -211.70184326171875, -203.74484252929688, -195.78785705566406, -187.8308563232422, -179.87387084960938, -171.9168701171875, -163.9598846435547, -156.0028839111328, -148.0458984375, -140.08889770507812, -132.1319122314453, -124.17491149902344, -116.21792602539062, -108.26092529296875, -100.3039321899414, -92.34693908691406, -84.38994598388672, -76.43295288085938, -68.47595977783203, -60.51896286010742, -52.56196975708008, -44.604976654052734, -36.64798355102539, -28.690990447998047, -20.733997344970703, -12.777002334594727, -4.820009231567383, 3.1369857788085938, 11.093978881835938, 19.05097198486328, 27.007965087890625]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 9.0, 8.0, 11.0, 18.0, 27.0, 24.0, 14.0, 31.0, 37.0, 30.0, 35.0, 38.0, 43.0, 55.0, 46.0, 44.0, 46.0, 44.0, 45.0, 41.0, 37.0, 29.0, 28.0, 33.0, 43.0, 29.0, 21.0, 19.0, 17.0, 22.0, 4.0, 14.0, 7.0, 10.0, 6.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.95658111572266, -89.61892700195312, -86.28126525878906, -82.94361114501953, -79.60595703125, -76.26829528808594, -72.9306411743164, -69.59298706054688, -66.25532531738281, -62.917667388916016, -59.58000946044922, -56.24235534667969, -52.90469741821289, -49.567039489746094, -46.22938537597656, -42.891727447509766, -39.55406951904297, -36.21641159057617, -32.878753662109375, -29.541099548339844, -26.203441619873047, -22.86578369140625, -19.528127670288086, -16.190471649169922, -12.852813720703125, -9.515156745910645, -6.177499771118164, -2.8398427963256836, 0.4978141784667969, 3.8354721069335938, 7.173128128051758, 10.510784149169922, 13.84844970703125, 17.186107635498047, 20.52376365661621, 23.861419677734375, 27.199077606201172, 30.53673553466797, 33.8743896484375, 37.2120475769043, 40.549705505371094, 43.88736343383789, 47.22502136230469, 50.56267547607422, 53.900333404541016, 57.23799133300781, 60.575645446777344, 63.91330337524414, 67.25096130371094, 70.58861541748047, 73.92627716064453, 77.26393127441406, 80.60159301757812, 83.93924713134766, 87.27690124511719, 90.61456298828125, 93.95221710205078, 97.28987121582031, 100.62753295898438, 103.9651870727539, 107.30284118652344, 110.6405029296875, 113.97815704345703, 117.31581115722656, 120.65347290039062]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 4.0, 5.0, 4.0, 4.0, 3.0, 7.0, 8.0, 12.0, 10.0, 14.0, 12.0, 15.0, 18.0, 25.0, 20.0, 28.0, 33.0, 38.0, 24.0, 34.0, 37.0, 41.0, 47.0, 37.0, 46.0, 31.0, 38.0, 32.0, 29.0, 40.0, 55.0, 26.0, 35.0, 34.0, 18.0, 20.0, 15.0, 13.0, 14.0, 17.0, 19.0, 9.0, 6.0, 6.0, 5.0, 3.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.03125, -10.7103271484375, -10.389404296875, -10.0684814453125, -9.74755859375, -9.4266357421875, -9.105712890625, -8.7847900390625, -8.4638671875, -8.1429443359375, -7.822021484375, -7.5010986328125, -7.18017578125, -6.8592529296875, -6.538330078125, -6.2174072265625, -5.896484375, -5.5755615234375, -5.254638671875, -4.9337158203125, -4.61279296875, -4.2918701171875, -3.970947265625, -3.6500244140625, -3.3291015625, -3.0081787109375, -2.687255859375, -2.3663330078125, -2.04541015625, -1.7244873046875, -1.403564453125, -1.0826416015625, -0.76171875, -0.4407958984375, -0.119873046875, 0.2010498046875, 0.52197265625, 0.8428955078125, 1.163818359375, 1.4847412109375, 1.8056640625, 2.1265869140625, 2.447509765625, 2.7684326171875, 3.08935546875, 3.4102783203125, 3.731201171875, 4.0521240234375, 4.373046875, 4.6939697265625, 5.014892578125, 5.3358154296875, 5.65673828125, 5.9776611328125, 6.298583984375, 6.6195068359375, 6.9404296875, 7.2613525390625, 7.582275390625, 7.9031982421875, 8.22412109375, 8.5450439453125, 8.865966796875, 9.1868896484375, 9.5078125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 4.0, 10.0, 15.0, 13.0, 9.0, 17.0, 19.0, 20.0, 34.0, 55.0, 82.0, 154.0, 246.0, 432.0, 856.0, 1734.0, 3905.0, 9767.0, 33470.0, 564452.0, 3260179.0, 280625.0, 24716.0, 7663.0, 3050.0, 1313.0, 612.0, 321.0, 161.0, 92.0, 56.0, 40.0, 34.0, 21.0, 13.0, 21.0, 12.0, 11.0, 9.0, 4.0, 6.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.25, -34.22509765625, -33.2001953125, -32.17529296875, -31.150390625, -30.12548828125, -29.1005859375, -28.07568359375, -27.05078125, -26.02587890625, -25.0009765625, -23.97607421875, -22.951171875, -21.92626953125, -20.9013671875, -19.87646484375, -18.8515625, -17.82666015625, -16.8017578125, -15.77685546875, -14.751953125, -13.72705078125, -12.7021484375, -11.67724609375, -10.65234375, -9.62744140625, -8.6025390625, -7.57763671875, -6.552734375, -5.52783203125, -4.5029296875, -3.47802734375, -2.453125, -1.42822265625, -0.4033203125, 0.62158203125, 1.646484375, 2.67138671875, 3.6962890625, 4.72119140625, 5.74609375, 6.77099609375, 7.7958984375, 8.82080078125, 9.845703125, 10.87060546875, 11.8955078125, 12.92041015625, 13.9453125, 14.97021484375, 15.9951171875, 17.02001953125, 18.044921875, 19.06982421875, 20.0947265625, 21.11962890625, 22.14453125, 23.16943359375, 24.1943359375, 25.21923828125, 26.244140625, 27.26904296875, 28.2939453125, 29.31884765625, 30.34375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 3.0, 7.0, 6.0, 18.0, 8.0, 19.0, 24.0, 26.0, 37.0, 44.0, 69.0, 123.0, 141.0, 255.0, 444.0, 656.0, 797.0, 564.0, 310.0, 168.0, 106.0, 61.0, 36.0, 32.0, 25.0, 15.0, 18.0, 9.0, 11.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.296875, -23.5146484375, -22.732421875, -21.9501953125, -21.16796875, -20.3857421875, -19.603515625, -18.8212890625, -18.0390625, -17.2568359375, -16.474609375, -15.6923828125, -14.91015625, -14.1279296875, -13.345703125, -12.5634765625, -11.78125, -10.9990234375, -10.216796875, -9.4345703125, -8.65234375, -7.8701171875, -7.087890625, -6.3056640625, -5.5234375, -4.7412109375, -3.958984375, -3.1767578125, -2.39453125, -1.6123046875, -0.830078125, -0.0478515625, 0.734375, 1.5166015625, 2.298828125, 3.0810546875, 3.86328125, 4.6455078125, 5.427734375, 6.2099609375, 6.9921875, 7.7744140625, 8.556640625, 9.3388671875, 10.12109375, 10.9033203125, 11.685546875, 12.4677734375, 13.25, 14.0322265625, 14.814453125, 15.5966796875, 16.37890625, 17.1611328125, 17.943359375, 18.7255859375, 19.5078125, 20.2900390625, 21.072265625, 21.8544921875, 22.63671875, 23.4189453125, 24.201171875, 24.9833984375, 25.765625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 13.0, 10.0, 16.0, 17.0, 28.0, 35.0, 70.0, 118.0, 289.0, 926.0, 3886.0, 34057.0, 3632592.0, 504462.0, 14393.0, 2196.0, 577.0, 221.0, 128.0, 54.0, 36.0, 34.0, 22.0, 16.0, 13.0, 16.0, 4.0, 8.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-92.5625, -89.7431640625, -86.923828125, -84.1044921875, -81.28515625, -78.4658203125, -75.646484375, -72.8271484375, -70.0078125, -67.1884765625, -64.369140625, -61.5498046875, -58.73046875, -55.9111328125, -53.091796875, -50.2724609375, -47.453125, -44.6337890625, -41.814453125, -38.9951171875, -36.17578125, -33.3564453125, -30.537109375, -27.7177734375, -24.8984375, -22.0791015625, -19.259765625, -16.4404296875, -13.62109375, -10.8017578125, -7.982421875, -5.1630859375, -2.34375, 0.4755859375, 3.294921875, 6.1142578125, 8.93359375, 11.7529296875, 14.572265625, 17.3916015625, 20.2109375, 23.0302734375, 25.849609375, 28.6689453125, 31.48828125, 34.3076171875, 37.126953125, 39.9462890625, 42.765625, 45.5849609375, 48.404296875, 51.2236328125, 54.04296875, 56.8623046875, 59.681640625, 62.5009765625, 65.3203125, 68.1396484375, 70.958984375, 73.7783203125, 76.59765625, 79.4169921875, 82.236328125, 85.0556640625, 87.875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 22.0, 62.0, 279.0, 402.0, 168.0, 58.0, 16.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-568.2228393554688, -556.716796875, -545.2108154296875, -533.7047729492188, -522.19873046875, -510.6927490234375, -499.18670654296875, -487.6806945800781, -476.1746826171875, -464.6686706542969, -453.1626281738281, -441.6566162109375, -430.1506042480469, -418.64459228515625, -407.1385498046875, -395.6325378417969, -384.1264953613281, -372.6204833984375, -361.11444091796875, -349.6084289550781, -338.1024169921875, -326.59637451171875, -315.0903625488281, -303.5843505859375, -292.07830810546875, -280.5722961425781, -269.0662536621094, -257.56024169921875, -246.05422973632812, -234.54820251464844, -223.04217529296875, -211.53616333007812, -200.03016662597656, -188.52413940429688, -177.01812744140625, -165.51210021972656, -154.00607299804688, -142.50006103515625, -130.99403381347656, -119.4880142211914, -107.98199462890625, -96.4759750366211, -84.96995544433594, -73.46392822265625, -61.957908630371094, -50.45188903808594, -38.94586181640625, -27.439842224121094, -15.933822631835938, -4.427801132202148, 7.078220367431641, 18.584243774414062, 30.09026336669922, 41.596282958984375, 53.10231018066406, 64.60832977294922, 76.11434936523438, 87.62036895751953, 99.12638854980469, 110.63241577148438, 122.13843536376953, 133.6444549560547, 145.15048217773438, 156.656494140625, 168.1625213623047]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 12.0, 9.0, 10.0, 8.0, 15.0, 13.0, 10.0, 24.0, 21.0, 13.0, 30.0, 16.0, 20.0, 28.0, 26.0, 29.0, 44.0, 39.0, 36.0, 46.0, 24.0, 37.0, 31.0, 33.0, 41.0, 29.0, 48.0, 37.0, 35.0, 31.0, 28.0, 22.0, 25.0, 18.0, 21.0, 16.0, 16.0, 6.0, 15.0, 3.0, 13.0, 6.0, 2.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-74.22453308105469, -72.0906982421875, -69.95685577392578, -67.8230209350586, -65.6891860961914, -63.55534744262695, -61.4215087890625, -59.28767395019531, -57.15383529663086, -55.019996643066406, -52.88616180419922, -50.752323150634766, -48.61848449707031, -46.484649658203125, -44.35081100463867, -42.21697235107422, -40.08313751220703, -37.94929885864258, -35.81546401977539, -33.68162536621094, -31.547788619995117, -29.413951873779297, -27.280113220214844, -25.146276473999023, -23.012439727783203, -20.878602981567383, -18.744766235351562, -16.61092758178711, -14.477090835571289, -12.343254089355469, -10.209416389465332, -8.075578689575195, -5.941741943359375, -3.8079047203063965, -1.674067497253418, 0.45976972579956055, 2.593606948852539, 4.727443695068359, 6.861281394958496, 8.995119094848633, 11.128955841064453, 13.262792587280273, 15.39663028717041, 17.530467987060547, 19.664304733276367, 21.798141479492188, 23.93198013305664, 26.06581687927246, 28.19965362548828, 30.3334903717041, 32.46732711791992, 34.601165771484375, 36.73500061035156, 38.868839263916016, 41.00267791748047, 43.136512756347656, 45.27035140991211, 47.40419006347656, 49.53802490234375, 51.6718635559082, 53.805702209472656, 55.939537048339844, 58.0733757019043, 60.20721435546875, 62.34104919433594]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 8.0, 10.0, 6.0, 7.0, 21.0, 14.0, 19.0, 24.0, 29.0, 22.0, 31.0, 31.0, 40.0, 38.0, 21.0, 39.0, 33.0, 44.0, 36.0, 37.0, 33.0, 35.0, 36.0, 46.0, 25.0, 33.0, 30.0, 36.0, 32.0, 20.0, 17.0, 16.0, 13.0, 19.0, 13.0, 17.0, 11.0, 13.0, 3.0, 5.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.375, -10.0693359375, -9.763671875, -9.4580078125, -9.15234375, -8.8466796875, -8.541015625, -8.2353515625, -7.9296875, -7.6240234375, -7.318359375, -7.0126953125, -6.70703125, -6.4013671875, -6.095703125, -5.7900390625, -5.484375, -5.1787109375, -4.873046875, -4.5673828125, -4.26171875, -3.9560546875, -3.650390625, -3.3447265625, -3.0390625, -2.7333984375, -2.427734375, -2.1220703125, -1.81640625, -1.5107421875, -1.205078125, -0.8994140625, -0.59375, -0.2880859375, 0.017578125, 0.3232421875, 0.62890625, 0.9345703125, 1.240234375, 1.5458984375, 1.8515625, 2.1572265625, 2.462890625, 2.7685546875, 3.07421875, 3.3798828125, 3.685546875, 3.9912109375, 4.296875, 4.6025390625, 4.908203125, 5.2138671875, 5.51953125, 5.8251953125, 6.130859375, 6.4365234375, 6.7421875, 7.0478515625, 7.353515625, 7.6591796875, 7.96484375, 8.2705078125, 8.576171875, 8.8818359375, 9.1875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 12.0, 8.0, 26.0, 27.0, 45.0, 75.0, 111.0, 137.0, 224.0, 311.0, 401.0, 711.0, 971.0, 1532.0, 2163.0, 3288.0, 4933.0, 7351.0, 11536.0, 18125.0, 27815.0, 43626.0, 69351.0, 113528.0, 181669.0, 204458.0, 132235.0, 81488.0, 50587.0, 32094.0, 20744.0, 13403.0, 8697.0, 5718.0, 3680.0, 2470.0, 1582.0, 1136.0, 773.0, 475.0, 324.0, 225.0, 163.0, 116.0, 74.0, 45.0, 30.0, 22.0, 17.0, 8.0, 10.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.230224609375, -0.22259140014648438, -0.21495819091796875, -0.20732498168945312, -0.1996917724609375, -0.19205856323242188, -0.18442535400390625, -0.17679214477539062, -0.169158935546875, -0.16152572631835938, -0.15389251708984375, -0.14625930786132812, -0.1386260986328125, -0.13099288940429688, -0.12335968017578125, -0.11572647094726562, -0.10809326171875, -0.10046005249023438, -0.09282684326171875, -0.08519363403320312, -0.0775604248046875, -0.06992721557617188, -0.06229400634765625, -0.054660797119140625, -0.047027587890625, -0.039394378662109375, -0.03176116943359375, -0.024127960205078125, -0.0164947509765625, -0.008861541748046875, -0.00122833251953125, 0.006404876708984375, 0.0140380859375, 0.021671295166015625, 0.02930450439453125, 0.036937713623046875, 0.0445709228515625, 0.052204132080078125, 0.05983734130859375, 0.06747055053710938, 0.075103759765625, 0.08273696899414062, 0.09037017822265625, 0.09800338745117188, 0.1056365966796875, 0.11326980590820312, 0.12090301513671875, 0.12853622436523438, 0.13616943359375, 0.14380264282226562, 0.15143585205078125, 0.15906906127929688, 0.1667022705078125, 0.17433547973632812, 0.18196868896484375, 0.18960189819335938, 0.197235107421875, 0.20486831665039062, 0.21250152587890625, 0.22013473510742188, 0.2277679443359375, 0.23540115356445312, 0.24303436279296875, 0.2506675720214844, 0.25830078125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 6.0, 11.0, 4.0, 10.0, 11.0, 15.0, 10.0, 23.0, 24.0, 27.0, 18.0, 28.0, 44.0, 31.0, 45.0, 41.0, 44.0, 37.0, 38.0, 38.0, 1063.0, 49.0, 43.0, 34.0, 39.0, 37.0, 39.0, 32.0, 24.0, 24.0, 18.0, 20.0, 15.0, 19.0, 10.0, 12.0, 12.0, 9.0, 8.0, 7.0, 2.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9609375, -7.6976318359375, -7.434326171875, -7.1710205078125, -6.90771484375, -6.6444091796875, -6.381103515625, -6.1177978515625, -5.8544921875, -5.5911865234375, -5.327880859375, -5.0645751953125, -4.80126953125, -4.5379638671875, -4.274658203125, -4.0113525390625, -3.748046875, -3.4847412109375, -3.221435546875, -2.9581298828125, -2.69482421875, -2.4315185546875, -2.168212890625, -1.9049072265625, -1.6416015625, -1.3782958984375, -1.114990234375, -0.8516845703125, -0.58837890625, -0.3250732421875, -0.061767578125, 0.2015380859375, 0.46484375, 0.7281494140625, 0.991455078125, 1.2547607421875, 1.51806640625, 1.7813720703125, 2.044677734375, 2.3079833984375, 2.5712890625, 2.8345947265625, 3.097900390625, 3.3612060546875, 3.62451171875, 3.8878173828125, 4.151123046875, 4.4144287109375, 4.677734375, 4.9410400390625, 5.204345703125, 5.4676513671875, 5.73095703125, 5.9942626953125, 6.257568359375, 6.5208740234375, 6.7841796875, 7.0474853515625, 7.310791015625, 7.5740966796875, 7.83740234375, 8.1007080078125, 8.364013671875, 8.6273193359375, 8.890625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 11.0, 19.0, 17.0, 24.0, 41.0, 91.0, 97.0, 142.0, 200.0, 311.0, 472.0, 639.0, 1054.0, 1389.0, 2194.0, 3200.0, 4898.0, 7488.0, 11487.0, 17695.0, 27607.0, 43115.0, 68410.0, 111839.0, 190023.0, 1256078.0, 129643.0, 79537.0, 49504.0, 31792.0, 20409.0, 12986.0, 8249.0, 5482.0, 3626.0, 2380.0, 1547.0, 1063.0, 693.0, 556.0, 360.0, 237.0, 173.0, 117.0, 67.0, 53.0, 47.0, 25.0, 15.0, 11.0, 9.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.12237548828125, -0.11856842041015625, -0.1147613525390625, -0.11095428466796875, -0.107147216796875, -0.10334014892578125, -0.0995330810546875, -0.09572601318359375, -0.0919189453125, -0.08811187744140625, -0.0843048095703125, -0.08049774169921875, -0.076690673828125, -0.07288360595703125, -0.0690765380859375, -0.06526947021484375, -0.06146240234375, -0.05765533447265625, -0.0538482666015625, -0.05004119873046875, -0.046234130859375, -0.04242706298828125, -0.0386199951171875, -0.03481292724609375, -0.031005859375, -0.02719879150390625, -0.0233917236328125, -0.01958465576171875, -0.015777587890625, -0.01197052001953125, -0.0081634521484375, -0.00435638427734375, -0.00054931640625, 0.00325775146484375, 0.0070648193359375, 0.01087188720703125, 0.014678955078125, 0.01848602294921875, 0.0222930908203125, 0.02610015869140625, 0.0299072265625, 0.03371429443359375, 0.0375213623046875, 0.04132843017578125, 0.045135498046875, 0.04894256591796875, 0.0527496337890625, 0.05655670166015625, 0.06036376953125, 0.06417083740234375, 0.0679779052734375, 0.07178497314453125, 0.075592041015625, 0.07939910888671875, 0.0832061767578125, 0.08701324462890625, 0.0908203125, 0.09462738037109375, 0.0984344482421875, 0.10224151611328125, 0.106048583984375, 0.10985565185546875, 0.1136627197265625, 0.11746978759765625, 0.12127685546875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 7.0, 4.0, 10.0, 12.0, 15.0, 17.0, 23.0, 18.0, 20.0, 22.0, 25.0, 37.0, 41.0, 44.0, 47.0, 54.0, 63.0, 55.0, 56.0, 57.0, 55.0, 44.0, 36.0, 40.0, 28.0, 35.0, 20.0, 18.0, 17.0, 20.0, 13.0, 6.0, 7.0, 9.0, 8.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011873245239257812, -0.0011524409055709839, -0.0011175572872161865, -0.0010826736688613892, -0.0010477900505065918, -0.0010129064321517944, -0.000978022813796997, -0.0009431391954421997, -0.0009082555770874023, -0.000873371958732605, -0.0008384883403778076, -0.0008036047220230103, -0.0007687211036682129, -0.0007338374853134155, -0.0006989538669586182, -0.0006640702486038208, -0.0006291866302490234, -0.0005943030118942261, -0.0005594193935394287, -0.0005245357751846313, -0.000489652156829834, -0.0004547685384750366, -0.00041988492012023926, -0.0003850013017654419, -0.00035011768341064453, -0.00031523406505584717, -0.0002803504467010498, -0.00024546682834625244, -0.00021058320999145508, -0.00017569959163665771, -0.00014081597328186035, -0.00010593235492706299, -7.104873657226562e-05, -3.616511821746826e-05, -1.2814998626708984e-06, 3.3602118492126465e-05, 6.848573684692383e-05, 0.00010336935520172119, 0.00013825297355651855, 0.00017313659191131592, 0.00020802021026611328, 0.00024290382862091064, 0.000277787446975708, 0.00031267106533050537, 0.00034755468368530273, 0.0003824383020401001, 0.00041732192039489746, 0.0004522055387496948, 0.0004870891571044922, 0.0005219727754592896, 0.0005568563938140869, 0.0005917400121688843, 0.0006266236305236816, 0.000661507248878479, 0.0006963908672332764, 0.0007312744855880737, 0.0007661581039428711, 0.0008010417222976685, 0.0008359253406524658, 0.0008708089590072632, 0.0009056925773620605, 0.0009405761957168579, 0.0009754598140716553, 0.0010103434324264526, 0.00104522705078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 6.0, 8.0, 11.0, 19.0, 17.0, 18.0, 21.0, 35.0, 32.0, 55.0, 91.0, 186.0, 503.0, 1515.0, 636541.0, 407003.0, 1444.0, 458.0, 190.0, 98.0, 50.0, 40.0, 26.0, 25.0, 22.0, 17.0, 22.0, 15.0, 19.0, 11.0, 9.0, 4.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0230712890625, -0.022301912307739258, -0.021532535552978516, -0.020763158798217773, -0.01999378204345703, -0.01922440528869629, -0.018455028533935547, -0.017685651779174805, -0.016916275024414062, -0.01614689826965332, -0.015377521514892578, -0.014608144760131836, -0.013838768005371094, -0.013069391250610352, -0.01230001449584961, -0.011530637741088867, -0.010761260986328125, -0.009991884231567383, -0.00922250747680664, -0.008453130722045898, -0.007683753967285156, -0.006914377212524414, -0.006145000457763672, -0.00537562370300293, -0.0046062469482421875, -0.0038368701934814453, -0.003067493438720703, -0.002298116683959961, -0.0015287399291992188, -0.0007593631744384766, 1.0013580322265625e-05, 0.0007793903350830078, 0.00154876708984375, 0.002318143844604492, 0.0030875205993652344, 0.0038568973541259766, 0.004626274108886719, 0.005395650863647461, 0.006165027618408203, 0.006934404373168945, 0.0077037811279296875, 0.00847315788269043, 0.009242534637451172, 0.010011911392211914, 0.010781288146972656, 0.011550664901733398, 0.01232004165649414, 0.013089418411254883, 0.013858795166015625, 0.014628171920776367, 0.01539754867553711, 0.01616692543029785, 0.016936302185058594, 0.017705678939819336, 0.018475055694580078, 0.01924443244934082, 0.020013809204101562, 0.020783185958862305, 0.021552562713623047, 0.02232193946838379, 0.02309131622314453, 0.023860692977905273, 0.024630069732666016, 0.025399446487426758, 0.0261688232421875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 995.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04389767348766327, -0.04310816153883934, -0.04231865331530571, -0.04152914136648178, -0.04073963314294815, -0.03995012119412422, -0.03916060924530029, -0.03837110102176666, -0.037581589072942734, -0.036792077124118805, -0.036002568900585175, -0.035213056951761246, -0.03442354500293732, -0.033634036779403687, -0.03284452483057976, -0.03205501660704613, -0.0312655046582222, -0.03047599457204342, -0.02968648448586464, -0.02889697253704071, -0.02810746245086193, -0.02731795236468315, -0.026528440415859222, -0.025738930329680443, -0.024949420243501663, -0.024159910157322884, -0.023370400071144104, -0.022580888122320175, -0.021791378036141396, -0.021001867949962616, -0.020212356001138687, -0.019422845914959908, -0.018633335828781128, -0.01784382574260235, -0.01705431565642357, -0.01626480370759964, -0.01547529362142086, -0.01468578353524208, -0.013896272517740726, -0.013106761500239372, -0.012317251414060593, -0.011527741327881813, -0.010738230310380459, -0.009948719292879105, -0.009159209206700325, -0.008369699120521545, -0.007580188103020191, -0.006790677551180124, -0.00600116653367877, -0.005211655981838703, -0.004422145429998636, -0.0036326348781585693, -0.0028431243263185024, -0.0020536137744784355, -0.0012641032226383686, -0.0004745926707983017, 0.0003149178810417652, 0.0011044284328818321, 0.001893938984721899, 0.002683449536561966, 0.003472960088402033, 0.0042624706402421, 0.005051981192082167, 0.005841491743922234, 0.0066310022957623005]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 13.0, 7.0, 10.0, 14.0, 16.0, 30.0, 32.0, 31.0, 37.0, 46.0, 50.0, 51.0, 54.0, 52.0, 57.0, 47.0, 57.0, 49.0, 54.0, 52.0, 44.0, 27.0, 41.0, 25.0, 25.0, 26.0, 12.0, 11.0, 13.0, 9.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011968016624450684, -0.001146787777543068, -0.0010967738926410675, -0.001046760007739067, -0.0009967461228370667, -0.0009467322379350662, -0.0008967183530330658, -0.0008467044681310654, -0.0007966905832290649, -0.0007466766983270645, -0.0006966628134250641, -0.0006466489285230637, -0.0005966350436210632, -0.0005466211587190628, -0.0004966072738170624, -0.00044659338891506195, -0.0003965795040130615, -0.0003465656191110611, -0.00029655173420906067, -0.00024653784930706024, -0.00019652396440505981, -0.0001465100795030594, -9.649619460105896e-05, -4.648230969905853e-05, 3.5315752029418945e-06, 5.354546010494232e-05, 0.00010355934500694275, 0.00015357322990894318, 0.0002035871148109436, 0.00025360099971294403, 0.00030361488461494446, 0.0003536287695169449, 0.0004036426544189453, 0.00045365653932094574, 0.0005036704242229462, 0.0005536843091249466, 0.000603698194026947, 0.0006537120789289474, 0.0007037259638309479, 0.0007537398487329483, 0.0008037537336349487, 0.0008537676185369492, 0.0009037815034389496, 0.00095379538834095, 0.0010038092732429504, 0.0010538231581449509, 0.0011038370430469513, 0.0011538509279489517, 0.0012038648128509521, 0.0012538786977529526, 0.001303892582654953, 0.0013539064675569534, 0.0014039203524589539, 0.0014539342373609543, 0.0015039481222629547, 0.0015539620071649551, 0.0016039758920669556, 0.001653989776968956, 0.0017040036618709564, 0.0017540175467729568, 0.0018040314316749573, 0.0018540453165769577, 0.0019040592014789581, 0.0019540730863809586, 0.002004086971282959]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 8.0, 10.0, 6.0, 7.0, 21.0, 14.0, 19.0, 24.0, 29.0, 22.0, 31.0, 31.0, 40.0, 38.0, 21.0, 39.0, 33.0, 44.0, 36.0, 37.0, 33.0, 35.0, 36.0, 46.0, 25.0, 33.0, 30.0, 36.0, 32.0, 20.0, 17.0, 16.0, 13.0, 19.0, 13.0, 17.0, 11.0, 13.0, 3.0, 5.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.375, -10.0693359375, -9.763671875, -9.4580078125, -9.15234375, -8.8466796875, -8.541015625, -8.2353515625, -7.9296875, -7.6240234375, -7.318359375, -7.0126953125, -6.70703125, -6.4013671875, -6.095703125, -5.7900390625, -5.484375, -5.1787109375, -4.873046875, -4.5673828125, -4.26171875, -3.9560546875, -3.650390625, -3.3447265625, -3.0390625, -2.7333984375, -2.427734375, -2.1220703125, -1.81640625, -1.5107421875, -1.205078125, -0.8994140625, -0.59375, -0.2880859375, 0.017578125, 0.3232421875, 0.62890625, 0.9345703125, 1.240234375, 1.5458984375, 1.8515625, 2.1572265625, 2.462890625, 2.7685546875, 3.07421875, 3.3798828125, 3.685546875, 3.9912109375, 4.296875, 4.6025390625, 4.908203125, 5.2138671875, 5.51953125, 5.8251953125, 6.130859375, 6.4365234375, 6.7421875, 7.0478515625, 7.353515625, 7.6591796875, 7.96484375, 8.2705078125, 8.576171875, 8.8818359375, 9.1875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 9.0, 6.0, 10.0, 19.0, 23.0, 26.0, 37.0, 54.0, 88.0, 94.0, 125.0, 196.0, 275.0, 353.0, 537.0, 721.0, 1021.0, 1511.0, 2156.0, 3350.0, 4873.0, 7661.0, 12315.0, 20738.0, 45198.0, 485957.0, 365725.0, 41618.0, 19696.0, 11756.0, 7414.0, 4731.0, 3174.0, 2113.0, 1478.0, 1012.0, 693.0, 507.0, 364.0, 256.0, 182.0, 133.0, 104.0, 69.0, 55.0, 28.0, 29.0, 19.0, 19.0, 13.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-17.6875, -17.134033203125, -16.58056640625, -16.027099609375, -15.4736328125, -14.920166015625, -14.36669921875, -13.813232421875, -13.259765625, -12.706298828125, -12.15283203125, -11.599365234375, -11.0458984375, -10.492431640625, -9.93896484375, -9.385498046875, -8.83203125, -8.278564453125, -7.72509765625, -7.171630859375, -6.6181640625, -6.064697265625, -5.51123046875, -4.957763671875, -4.404296875, -3.850830078125, -3.29736328125, -2.743896484375, -2.1904296875, -1.636962890625, -1.08349609375, -0.530029296875, 0.0234375, 0.576904296875, 1.13037109375, 1.683837890625, 2.2373046875, 2.790771484375, 3.34423828125, 3.897705078125, 4.451171875, 5.004638671875, 5.55810546875, 6.111572265625, 6.6650390625, 7.218505859375, 7.77197265625, 8.325439453125, 8.87890625, 9.432373046875, 9.98583984375, 10.539306640625, 11.0927734375, 11.646240234375, 12.19970703125, 12.753173828125, 13.306640625, 13.860107421875, 14.41357421875, 14.967041015625, 15.5205078125, 16.073974609375, 16.62744140625, 17.180908203125, 17.734375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 9.0, 7.0, 12.0, 12.0, 14.0, 17.0, 16.0, 20.0, 33.0, 17.0, 34.0, 35.0, 38.0, 52.0, 43.0, 79.0, 131.0, 1648.0, 281.0, 98.0, 72.0, 57.0, 51.0, 36.0, 28.0, 35.0, 27.0, 19.0, 20.0, 20.0, 6.0, 7.0, 14.0, 10.0, 10.0, 4.0, 6.0, 6.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.15625, -35.01806640625, -33.8798828125, -32.74169921875, -31.603515625, -30.46533203125, -29.3271484375, -28.18896484375, -27.05078125, -25.91259765625, -24.7744140625, -23.63623046875, -22.498046875, -21.35986328125, -20.2216796875, -19.08349609375, -17.9453125, -16.80712890625, -15.6689453125, -14.53076171875, -13.392578125, -12.25439453125, -11.1162109375, -9.97802734375, -8.83984375, -7.70166015625, -6.5634765625, -5.42529296875, -4.287109375, -3.14892578125, -2.0107421875, -0.87255859375, 0.265625, 1.40380859375, 2.5419921875, 3.68017578125, 4.818359375, 5.95654296875, 7.0947265625, 8.23291015625, 9.37109375, 10.50927734375, 11.6474609375, 12.78564453125, 13.923828125, 15.06201171875, 16.2001953125, 17.33837890625, 18.4765625, 19.61474609375, 20.7529296875, 21.89111328125, 23.029296875, 24.16748046875, 25.3056640625, 26.44384765625, 27.58203125, 28.72021484375, 29.8583984375, 30.99658203125, 32.134765625, 33.27294921875, 34.4111328125, 35.54931640625, 36.6875]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 5.0, 14.0, 19.0, 18.0, 35.0, 32.0, 37.0, 44.0, 68.0, 102.0, 123.0, 228.0, 481.0, 1618.0, 7972.0, 73557.0, 3010436.0, 42776.0, 5825.0, 1201.0, 376.0, 188.0, 127.0, 82.0, 71.0, 46.0, 47.0, 32.0, 31.0, 21.0, 21.0, 13.0, 14.0, 3.0, 8.0, 4.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-75.125, -72.654296875, -70.18359375, -67.712890625, -65.2421875, -62.771484375, -60.30078125, -57.830078125, -55.359375, -52.888671875, -50.41796875, -47.947265625, -45.4765625, -43.005859375, -40.53515625, -38.064453125, -35.59375, -33.123046875, -30.65234375, -28.181640625, -25.7109375, -23.240234375, -20.76953125, -18.298828125, -15.828125, -13.357421875, -10.88671875, -8.416015625, -5.9453125, -3.474609375, -1.00390625, 1.466796875, 3.9375, 6.408203125, 8.87890625, 11.349609375, 13.8203125, 16.291015625, 18.76171875, 21.232421875, 23.703125, 26.173828125, 28.64453125, 31.115234375, 33.5859375, 36.056640625, 38.52734375, 40.998046875, 43.46875, 45.939453125, 48.41015625, 50.880859375, 53.3515625, 55.822265625, 58.29296875, 60.763671875, 63.234375, 65.705078125, 68.17578125, 70.646484375, 73.1171875, 75.587890625, 78.05859375, 80.529296875, 83.0]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 57.0, 115.0, 327.0, 268.0, 162.0, 52.0, 13.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.46795654296875, -282.6966857910156, -276.9254455566406, -271.1541748046875, -265.3829345703125, -259.6116638183594, -253.84042358398438, -248.0691680908203, -242.29791259765625, -236.5266571044922, -230.75540161132812, -224.98414611816406, -219.212890625, -213.44163513183594, -207.67037963867188, -201.8991241455078, -196.12786865234375, -190.3566131591797, -184.58535766601562, -178.81410217285156, -173.0428466796875, -167.27159118652344, -161.50033569335938, -155.7290802001953, -149.9578094482422, -144.18655395507812, -138.41529846191406, -132.64404296875, -126.87278747558594, -121.10153198242188, -115.33027648925781, -109.55902099609375, -103.78777313232422, -98.01651763916016, -92.2452621459961, -86.47400665283203, -80.70275115966797, -74.9314956665039, -69.16023254394531, -63.388980865478516, -57.61772537231445, -51.84646987915039, -46.07521438598633, -40.303955078125, -34.53269958496094, -28.761445999145508, -22.990188598632812, -17.21893310546875, -11.447677612304688, -5.676421642303467, 0.0948343276977539, 5.866090774536133, 11.637346267700195, 17.408601760864258, 23.179859161376953, 28.951114654541016, 34.72237014770508, 40.49362564086914, 46.2648811340332, 52.03614044189453, 57.807395935058594, 63.578651428222656, 69.34990692138672, 75.12116241455078, 80.89241790771484]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 5.0, 3.0, 10.0, 5.0, 11.0, 15.0, 17.0, 17.0, 18.0, 22.0, 15.0, 19.0, 25.0, 21.0, 28.0, 36.0, 29.0, 43.0, 29.0, 38.0, 39.0, 43.0, 41.0, 44.0, 36.0, 34.0, 39.0, 43.0, 39.0, 32.0, 29.0, 19.0, 21.0, 24.0, 13.0, 20.0, 17.0, 12.0, 13.0, 8.0, 6.0, 6.0, 3.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-83.98104095458984, -81.23321533203125, -78.48538970947266, -75.7375717163086, -72.98974609375, -70.2419204711914, -67.49409484863281, -64.74627685546875, -61.998451232910156, -59.25062561035156, -56.502803802490234, -53.75497817993164, -51.00715637207031, -48.25933074951172, -45.511505126953125, -42.7636833190918, -40.0158576965332, -37.26803207397461, -34.52021026611328, -31.772384643554688, -29.02456283569336, -26.276737213134766, -23.528913497924805, -20.781089782714844, -18.033266067504883, -15.285442352294922, -12.537618637084961, -9.789793968200684, -7.041970252990723, -4.294146537780762, -1.5463218688964844, 1.2015018463134766, 3.9493255615234375, 6.697149276733398, 9.44497299194336, 12.192797660827637, 14.940621376037598, 17.688446044921875, 20.436269760131836, 23.184093475341797, 25.931917190551758, 28.67974090576172, 31.42756462097168, 34.17538833618164, 36.923213958740234, 39.67103576660156, 42.418861389160156, 45.16668701171875, 47.91450881958008, 50.66233444213867, 53.41015625, 56.157981872558594, 58.90580368041992, 61.653629302978516, 64.40145111083984, 67.14927673339844, 69.89710235595703, 72.64492797851562, 75.39275360107422, 78.14057159423828, 80.88839721679688, 83.63622283935547, 86.38404846191406, 89.13186645507812, 91.87969207763672]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 6.0, 8.0, 7.0, 3.0, 8.0, 15.0, 18.0, 20.0, 28.0, 29.0, 32.0, 30.0, 38.0, 30.0, 49.0, 36.0, 38.0, 38.0, 46.0, 49.0, 34.0, 35.0, 39.0, 29.0, 45.0, 35.0, 34.0, 27.0, 38.0, 19.0, 17.0, 20.0, 16.0, 18.0, 14.0, 10.0, 6.0, 6.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.0806884765625, -11.716064453125, -11.3514404296875, -10.98681640625, -10.6221923828125, -10.257568359375, -9.8929443359375, -9.5283203125, -9.1636962890625, -8.799072265625, -8.4344482421875, -8.06982421875, -7.7052001953125, -7.340576171875, -6.9759521484375, -6.611328125, -6.2467041015625, -5.882080078125, -5.5174560546875, -5.15283203125, -4.7882080078125, -4.423583984375, -4.0589599609375, -3.6943359375, -3.3297119140625, -2.965087890625, -2.6004638671875, -2.23583984375, -1.8712158203125, -1.506591796875, -1.1419677734375, -0.77734375, -0.4127197265625, -0.048095703125, 0.3165283203125, 0.68115234375, 1.0457763671875, 1.410400390625, 1.7750244140625, 2.1396484375, 2.5042724609375, 2.868896484375, 3.2335205078125, 3.59814453125, 3.9627685546875, 4.327392578125, 4.6920166015625, 5.056640625, 5.4212646484375, 5.785888671875, 6.1505126953125, 6.51513671875, 6.8797607421875, 7.244384765625, 7.6090087890625, 7.9736328125, 8.3382568359375, 8.702880859375, 9.0675048828125, 9.43212890625, 9.7967529296875, 10.161376953125, 10.5260009765625, 10.890625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 4.0, 9.0, 5.0, 6.0, 10.0, 17.0, 27.0, 18.0, 34.0, 32.0, 45.0, 59.0, 83.0, 85.0, 144.0, 222.0, 382.0, 672.0, 1366.0, 3198.0, 8733.0, 31378.0, 570900.0, 3307796.0, 235309.0, 22153.0, 6558.0, 2448.0, 1068.0, 529.0, 273.0, 177.0, 118.0, 106.0, 67.0, 54.0, 53.0, 43.0, 20.0, 17.0, 15.0, 12.0, 17.0, 6.0, 2.0, 7.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.53125, -36.40673828125, -35.2822265625, -34.15771484375, -33.033203125, -31.90869140625, -30.7841796875, -29.65966796875, -28.53515625, -27.41064453125, -26.2861328125, -25.16162109375, -24.037109375, -22.91259765625, -21.7880859375, -20.66357421875, -19.5390625, -18.41455078125, -17.2900390625, -16.16552734375, -15.041015625, -13.91650390625, -12.7919921875, -11.66748046875, -10.54296875, -9.41845703125, -8.2939453125, -7.16943359375, -6.044921875, -4.92041015625, -3.7958984375, -2.67138671875, -1.546875, -0.42236328125, 0.7021484375, 1.82666015625, 2.951171875, 4.07568359375, 5.2001953125, 6.32470703125, 7.44921875, 8.57373046875, 9.6982421875, 10.82275390625, 11.947265625, 13.07177734375, 14.1962890625, 15.32080078125, 16.4453125, 17.56982421875, 18.6943359375, 19.81884765625, 20.943359375, 22.06787109375, 23.1923828125, 24.31689453125, 25.44140625, 26.56591796875, 27.6904296875, 28.81494140625, 29.939453125, 31.06396484375, 32.1884765625, 33.31298828125, 34.4375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 12.0, 12.0, 18.0, 20.0, 24.0, 32.0, 44.0, 55.0, 80.0, 129.0, 254.0, 441.0, 778.0, 852.0, 567.0, 304.0, 137.0, 89.0, 56.0, 44.0, 30.0, 26.0, 17.0, 12.0, 7.0, 4.0, 5.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.734375, -27.8125, -26.890625, -25.96875, -25.046875, -24.125, -23.203125, -22.28125, -21.359375, -20.4375, -19.515625, -18.59375, -17.671875, -16.75, -15.828125, -14.90625, -13.984375, -13.0625, -12.140625, -11.21875, -10.296875, -9.375, -8.453125, -7.53125, -6.609375, -5.6875, -4.765625, -3.84375, -2.921875, -2.0, -1.078125, -0.15625, 0.765625, 1.6875, 2.609375, 3.53125, 4.453125, 5.375, 6.296875, 7.21875, 8.140625, 9.0625, 9.984375, 10.90625, 11.828125, 12.75, 13.671875, 14.59375, 15.515625, 16.4375, 17.359375, 18.28125, 19.203125, 20.125, 21.046875, 21.96875, 22.890625, 23.8125, 24.734375, 25.65625, 26.578125, 27.5, 28.421875, 29.34375, 30.265625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 4.0, 11.0, 24.0, 29.0, 46.0, 68.0, 123.0, 218.0, 700.0, 3311.0, 41140.0, 3933711.0, 205214.0, 7665.0, 1170.0, 338.0, 181.0, 105.0, 47.0, 46.0, 29.0, 18.0, 15.0, 17.0, 8.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-105.0, -101.7890625, -98.578125, -95.3671875, -92.15625, -88.9453125, -85.734375, -82.5234375, -79.3125, -76.1015625, -72.890625, -69.6796875, -66.46875, -63.2578125, -60.046875, -56.8359375, -53.625, -50.4140625, -47.203125, -43.9921875, -40.78125, -37.5703125, -34.359375, -31.1484375, -27.9375, -24.7265625, -21.515625, -18.3046875, -15.09375, -11.8828125, -8.671875, -5.4609375, -2.25, 0.9609375, 4.171875, 7.3828125, 10.59375, 13.8046875, 17.015625, 20.2265625, 23.4375, 26.6484375, 29.859375, 33.0703125, 36.28125, 39.4921875, 42.703125, 45.9140625, 49.125, 52.3359375, 55.546875, 58.7578125, 61.96875, 65.1796875, 68.390625, 71.6015625, 74.8125, 78.0234375, 81.234375, 84.4453125, 87.65625, 90.8671875, 94.078125, 97.2890625, 100.5]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 21.0, 37.0, 85.0, 142.0, 232.0, 217.0, 135.0, 70.0, 33.0, 18.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.5796890258789, -107.28607940673828, -100.99246215820312, -94.6988525390625, -88.40523529052734, -82.11162567138672, -75.81800842285156, -69.52439880371094, -63.23078536987305, -56.937171936035156, -50.643558502197266, -44.349945068359375, -38.05633544921875, -31.762720108032227, -25.46910858154297, -19.175495147705078, -12.881881713867188, -6.588268756866455, -0.29465579986572266, 5.998956680297852, 12.292570114135742, 18.586183547973633, 24.87979507446289, 31.17340850830078, 37.46702194213867, 43.76063537597656, 50.05424880981445, 56.347862243652344, 62.64147186279297, 68.93508911132812, 75.22869873046875, 81.52230834960938, 87.81593322753906, 94.10954284667969, 100.40316009521484, 106.69676971435547, 112.99038696289062, 119.28399658203125, 125.57760620117188, 131.8712158203125, 138.1648406982422, 144.4584503173828, 150.75205993652344, 157.04568481445312, 163.33929443359375, 169.63290405273438, 175.926513671875, 182.22012329101562, 188.51373291015625, 194.80734252929688, 201.1009521484375, 207.3945770263672, 213.6881866455078, 219.98179626464844, 226.27540588378906, 232.56903076171875, 238.86264038085938, 245.15625, 251.44985961914062, 257.74346923828125, 264.0370788574219, 270.3307189941406, 276.62432861328125, 282.9179382324219, 289.2115478515625]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 9.0, 12.0, 14.0, 11.0, 14.0, 23.0, 17.0, 19.0, 16.0, 30.0, 24.0, 38.0, 33.0, 32.0, 41.0, 36.0, 40.0, 36.0, 39.0, 39.0, 49.0, 27.0, 36.0, 45.0, 29.0, 34.0, 29.0, 24.0, 22.0, 29.0, 24.0, 27.0, 13.0, 14.0, 8.0, 12.0, 8.0, 8.0, 8.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-65.63673400878906, -63.30698776245117, -60.97724533081055, -58.647499084472656, -56.31775665283203, -53.98801040649414, -51.65826416015625, -49.328521728515625, -46.998775482177734, -44.669029235839844, -42.33928680419922, -40.00954055786133, -37.67979431152344, -35.35005187988281, -33.02030563354492, -30.690561294555664, -28.360816955566406, -26.03107261657715, -23.70132827758789, -21.37158203125, -19.041837692260742, -16.712093353271484, -14.38234806060791, -12.052602767944336, -9.722858428955078, -7.393113613128662, -5.063368797302246, -2.73362398147583, -0.40387916564941406, 1.9258651733398438, 4.255610466003418, 6.585355758666992, 8.91510009765625, 11.244844436645508, 13.574589729309082, 15.904335021972656, 18.234079360961914, 20.563823699951172, 22.893569946289062, 25.22331428527832, 27.553058624267578, 29.882802963256836, 32.212547302246094, 34.542293548583984, 36.872039794921875, 39.2017822265625, 41.53152847290039, 43.86127471923828, 46.191017150878906, 48.5207633972168, 50.85050582885742, 53.18025207519531, 55.50999450683594, 57.83974075317383, 60.16948699951172, 62.499229431152344, 64.8289794921875, 67.15872192382812, 69.48847198486328, 71.8182144165039, 74.14795684814453, 76.47770690917969, 78.80744934082031, 81.13719177246094, 83.46693420410156]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 5.0, 11.0, 12.0, 10.0, 15.0, 15.0, 21.0, 23.0, 28.0, 25.0, 36.0, 36.0, 36.0, 34.0, 35.0, 32.0, 50.0, 50.0, 36.0, 46.0, 33.0, 40.0, 24.0, 31.0, 44.0, 29.0, 27.0, 34.0, 17.0, 24.0, 24.0, 13.0, 14.0, 10.0, 11.0, 11.0, 10.0, 4.0, 6.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-11.90625, -11.570068359375, -11.23388671875, -10.897705078125, -10.5615234375, -10.225341796875, -9.88916015625, -9.552978515625, -9.216796875, -8.880615234375, -8.54443359375, -8.208251953125, -7.8720703125, -7.535888671875, -7.19970703125, -6.863525390625, -6.52734375, -6.191162109375, -5.85498046875, -5.518798828125, -5.1826171875, -4.846435546875, -4.51025390625, -4.174072265625, -3.837890625, -3.501708984375, -3.16552734375, -2.829345703125, -2.4931640625, -2.156982421875, -1.82080078125, -1.484619140625, -1.1484375, -0.812255859375, -0.47607421875, -0.139892578125, 0.1962890625, 0.532470703125, 0.86865234375, 1.204833984375, 1.541015625, 1.877197265625, 2.21337890625, 2.549560546875, 2.8857421875, 3.221923828125, 3.55810546875, 3.894287109375, 4.23046875, 4.566650390625, 4.90283203125, 5.239013671875, 5.5751953125, 5.911376953125, 6.24755859375, 6.583740234375, 6.919921875, 7.256103515625, 7.59228515625, 7.928466796875, 8.2646484375, 8.600830078125, 8.93701171875, 9.273193359375, 9.609375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 6.0, 15.0, 13.0, 16.0, 36.0, 43.0, 84.0, 125.0, 181.0, 316.0, 498.0, 824.0, 1199.0, 2013.0, 3313.0, 5221.0, 8644.0, 14412.0, 24489.0, 42307.0, 73871.0, 133143.0, 238699.0, 217301.0, 119529.0, 67412.0, 38504.0, 22531.0, 13167.0, 8006.0, 4710.0, 2983.0, 1874.0, 1120.0, 724.0, 440.0, 295.0, 174.0, 114.0, 73.0, 44.0, 31.0, 28.0, 7.0, 12.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.32666015625, -0.3170280456542969, -0.30739593505859375, -0.2977638244628906, -0.2881317138671875, -0.2784996032714844, -0.26886749267578125, -0.2592353820800781, -0.249603271484375, -0.23997116088867188, -0.23033905029296875, -0.22070693969726562, -0.2110748291015625, -0.20144271850585938, -0.19181060791015625, -0.18217849731445312, -0.17254638671875, -0.16291427612304688, -0.15328216552734375, -0.14365005493164062, -0.1340179443359375, -0.12438583374023438, -0.11475372314453125, -0.10512161254882812, -0.095489501953125, -0.08585739135742188, -0.07622528076171875, -0.06659317016601562, -0.0569610595703125, -0.047328948974609375, -0.03769683837890625, -0.028064727783203125, -0.0184326171875, -0.008800506591796875, 0.00083160400390625, 0.010463714599609375, 0.0200958251953125, 0.029727935791015625, 0.03936004638671875, 0.048992156982421875, 0.058624267578125, 0.06825637817382812, 0.07788848876953125, 0.08752059936523438, 0.0971527099609375, 0.10678482055664062, 0.11641693115234375, 0.12604904174804688, 0.13568115234375, 0.14531326293945312, 0.15494537353515625, 0.16457748413085938, 0.1742095947265625, 0.18384170532226562, 0.19347381591796875, 0.20310592651367188, 0.212738037109375, 0.22237014770507812, 0.23200225830078125, 0.24163436889648438, 0.2512664794921875, 0.2608985900878906, 0.27053070068359375, 0.2801628112792969, 0.289794921875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 6.0, 5.0, 6.0, 10.0, 13.0, 11.0, 14.0, 17.0, 27.0, 21.0, 30.0, 25.0, 37.0, 38.0, 37.0, 32.0, 31.0, 39.0, 32.0, 51.0, 1067.0, 39.0, 47.0, 36.0, 42.0, 36.0, 39.0, 28.0, 31.0, 31.0, 24.0, 16.0, 26.0, 12.0, 12.0, 15.0, 9.0, 9.0, 5.0, 4.0, 6.0, 9.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.75, -9.458984375, -9.16796875, -8.876953125, -8.5859375, -8.294921875, -8.00390625, -7.712890625, -7.421875, -7.130859375, -6.83984375, -6.548828125, -6.2578125, -5.966796875, -5.67578125, -5.384765625, -5.09375, -4.802734375, -4.51171875, -4.220703125, -3.9296875, -3.638671875, -3.34765625, -3.056640625, -2.765625, -2.474609375, -2.18359375, -1.892578125, -1.6015625, -1.310546875, -1.01953125, -0.728515625, -0.4375, -0.146484375, 0.14453125, 0.435546875, 0.7265625, 1.017578125, 1.30859375, 1.599609375, 1.890625, 2.181640625, 2.47265625, 2.763671875, 3.0546875, 3.345703125, 3.63671875, 3.927734375, 4.21875, 4.509765625, 4.80078125, 5.091796875, 5.3828125, 5.673828125, 5.96484375, 6.255859375, 6.546875, 6.837890625, 7.12890625, 7.419921875, 7.7109375, 8.001953125, 8.29296875, 8.583984375, 8.875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 5.0, 2.0, 4.0, 3.0, 7.0, 14.0, 14.0, 12.0, 16.0, 39.0, 59.0, 61.0, 113.0, 156.0, 228.0, 322.0, 471.0, 650.0, 899.0, 1292.0, 1877.0, 2677.0, 3955.0, 5607.0, 8550.0, 13106.0, 19830.0, 30262.0, 46790.0, 72628.0, 116999.0, 311714.0, 1123449.0, 119730.0, 75081.0, 47820.0, 31141.0, 20526.0, 13401.0, 8696.0, 5947.0, 3919.0, 2728.0, 1902.0, 1266.0, 909.0, 671.0, 440.0, 350.0, 252.0, 169.0, 112.0, 85.0, 63.0, 49.0, 29.0, 20.0, 13.0, 4.0, 5.0, 3.0, 0.0, 5.0], "bins": [-0.1302490234375, -0.12630558013916016, -0.12236213684082031, -0.11841869354248047, -0.11447525024414062, -0.11053180694580078, -0.10658836364746094, -0.1026449203491211, -0.09870147705078125, -0.0947580337524414, -0.09081459045410156, -0.08687114715576172, -0.08292770385742188, -0.07898426055908203, -0.07504081726074219, -0.07109737396240234, -0.0671539306640625, -0.06321048736572266, -0.05926704406738281, -0.05532360076904297, -0.051380157470703125, -0.04743671417236328, -0.04349327087402344, -0.039549827575683594, -0.03560638427734375, -0.031662940979003906, -0.027719497680664062, -0.02377605438232422, -0.019832611083984375, -0.01588916778564453, -0.011945724487304688, -0.008002281188964844, -0.004058837890625, -0.00011539459228515625, 0.0038280487060546875, 0.007771492004394531, 0.011714935302734375, 0.01565837860107422, 0.019601821899414062, 0.023545265197753906, 0.02748870849609375, 0.031432151794433594, 0.03537559509277344, 0.03931903839111328, 0.043262481689453125, 0.04720592498779297, 0.05114936828613281, 0.055092811584472656, 0.0590362548828125, 0.06297969818115234, 0.06692314147949219, 0.07086658477783203, 0.07481002807617188, 0.07875347137451172, 0.08269691467285156, 0.0866403579711914, 0.09058380126953125, 0.0945272445678711, 0.09847068786621094, 0.10241413116455078, 0.10635757446289062, 0.11030101776123047, 0.11424446105957031, 0.11818790435791016, 0.12213134765625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 7.0, 3.0, 1.0, 6.0, 9.0, 13.0, 12.0, 9.0, 16.0, 17.0, 17.0, 20.0, 15.0, 37.0, 30.0, 34.0, 36.0, 49.0, 41.0, 43.0, 62.0, 59.0, 51.0, 44.0, 52.0, 42.0, 43.0, 28.0, 33.0, 30.0, 27.0, 13.0, 16.0, 13.0, 16.0, 8.0, 13.0, 6.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0009794235229492188, -0.0009486228227615356, -0.0009178221225738525, -0.0008870214223861694, -0.0008562207221984863, -0.0008254200220108032, -0.0007946193218231201, -0.000763818621635437, -0.0007330179214477539, -0.0007022172212600708, -0.0006714165210723877, -0.0006406158208847046, -0.0006098151206970215, -0.0005790144205093384, -0.0005482137203216553, -0.0005174130201339722, -0.00048661231994628906, -0.00045581161975860596, -0.00042501091957092285, -0.00039421021938323975, -0.00036340951919555664, -0.00033260881900787354, -0.00030180811882019043, -0.0002710074186325073, -0.00024020671844482422, -0.0002094060182571411, -0.000178605318069458, -0.0001478046178817749, -0.0001170039176940918, -8.620321750640869e-05, -5.5402517318725586e-05, -2.460181713104248e-05, 6.198883056640625e-06, 3.699958324432373e-05, 6.780028343200684e-05, 9.860098361968994e-05, 0.00012940168380737305, 0.00016020238399505615, 0.00019100308418273926, 0.00022180378437042236, 0.00025260448455810547, 0.0002834051847457886, 0.0003142058849334717, 0.0003450065851211548, 0.0003758072853088379, 0.000406607985496521, 0.0004374086856842041, 0.0004682093858718872, 0.0004990100860595703, 0.0005298107862472534, 0.0005606114864349365, 0.0005914121866226196, 0.0006222128868103027, 0.0006530135869979858, 0.0006838142871856689, 0.000714614987373352, 0.0007454156875610352, 0.0007762163877487183, 0.0008070170879364014, 0.0008378177881240845, 0.0008686184883117676, 0.0008994191884994507, 0.0009302198886871338, 0.0009610205888748169, 0.0009918212890625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 7.0, 7.0, 11.0, 8.0, 17.0, 12.0, 15.0, 16.0, 28.0, 35.0, 35.0, 44.0, 89.0, 180.0, 401.0, 1119.0, 55831.0, 986733.0, 2675.0, 581.0, 232.0, 115.0, 68.0, 53.0, 33.0, 35.0, 18.0, 19.0, 18.0, 20.0, 14.0, 9.0, 11.0, 14.0, 8.0, 6.0, 2.0, 3.0, 6.0, 9.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0220184326171875, -0.02133488655090332, -0.02065134048461914, -0.01996779441833496, -0.01928424835205078, -0.0186007022857666, -0.017917156219482422, -0.017233610153198242, -0.016550064086914062, -0.015866518020629883, -0.015182971954345703, -0.014499425888061523, -0.013815879821777344, -0.013132333755493164, -0.012448787689208984, -0.011765241622924805, -0.011081695556640625, -0.010398149490356445, -0.009714603424072266, -0.009031057357788086, -0.008347511291503906, -0.0076639652252197266, -0.006980419158935547, -0.006296873092651367, -0.0056133270263671875, -0.004929780960083008, -0.004246234893798828, -0.0035626888275146484, -0.0028791427612304688, -0.002195596694946289, -0.0015120506286621094, -0.0008285045623779297, -0.00014495849609375, 0.0005385875701904297, 0.0012221336364746094, 0.001905679702758789, 0.0025892257690429688, 0.0032727718353271484, 0.003956317901611328, 0.004639863967895508, 0.0053234100341796875, 0.006006956100463867, 0.006690502166748047, 0.0073740482330322266, 0.008057594299316406, 0.008741140365600586, 0.009424686431884766, 0.010108232498168945, 0.010791778564453125, 0.011475324630737305, 0.012158870697021484, 0.012842416763305664, 0.013525962829589844, 0.014209508895874023, 0.014893054962158203, 0.015576601028442383, 0.016260147094726562, 0.016943693161010742, 0.017627239227294922, 0.0183107852935791, 0.01899433135986328, 0.01967787742614746, 0.02036142349243164, 0.02104496955871582, 0.021728515625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 397.0, 613.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022900115698575974, -0.022442439571022987, -0.02198476344347, -0.021527087315917015, -0.02106941118836403, -0.020611733198165894, -0.020154058933258057, -0.01969638094305992, -0.019238704815506935, -0.01878102868795395, -0.018323352560400963, -0.017865676432847977, -0.01740800030529499, -0.016950324177742004, -0.01649264618754387, -0.016034970059990883, -0.015577294863760471, -0.015119618736207485, -0.014661942608654499, -0.014204265549778938, -0.013746589422225952, -0.013288913294672966, -0.01283123716711998, -0.012373561039566994, -0.011915884912014008, -0.011458208784461021, -0.011000532656908035, -0.01054285652935505, -0.010085179470479488, -0.009627503342926502, -0.009169827215373516, -0.00871215108782053, -0.008254473097622395, -0.007796796970069408, -0.007339120376855135, -0.006881444249302149, -0.006423767656087875, -0.005966091528534889, -0.005508415400981903, -0.005050739273428917, -0.0045930626802146435, -0.004135386552661657, -0.003677709959447384, -0.0032200338318943977, -0.002762357471510768, -0.002304681111127138, -0.001847004983574152, -0.0013893286231905222, -0.0009316522628068924, -0.0004739759606309235, -1.6299658454954624e-05, 0.00044137658551335335, 0.0008990529458969831, 0.001356729306280613, 0.001814405433833599, 0.002272081794217229, 0.0027297581546008587, 0.0031874345149844885, 0.0036451108753681183, 0.004102787002921104, 0.004560463130474091, 0.005018139723688364, 0.00547581585124135, 0.005933492444455624, 0.00639116857200861]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 6.0, 9.0, 12.0, 16.0, 13.0, 24.0, 25.0, 34.0, 29.0, 31.0, 35.0, 40.0, 49.0, 55.0, 52.0, 48.0, 44.0, 56.0, 47.0, 43.0, 33.0, 49.0, 43.0, 35.0, 31.0, 28.0, 19.0, 14.0, 15.0, 14.0, 12.0, 8.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010987520217895508, -0.0010580597445368767, -0.0010173674672842026, -0.0009766751900315285, -0.0009359829127788544, -0.0008952906355261803, -0.0008545983582735062, -0.0008139060810208321, -0.000773213803768158, -0.0007325215265154839, -0.0006918292492628098, -0.0006511369720101357, -0.0006104446947574615, -0.0005697524175047874, -0.0005290601402521133, -0.0004883678629994392, -0.00044767558574676514, -0.00040698330849409103, -0.00036629103124141693, -0.00032559875398874283, -0.0002849064767360687, -0.0002442141994833946, -0.00020352192223072052, -0.00016282964497804642, -0.00012213736772537231, -8.144509047269821e-05, -4.075281322002411e-05, -6.05359673500061e-08, 4.06317412853241e-05, 8.13240185379982e-05, 0.0001220162957906723, 0.0001627085730433464, 0.0002034008502960205, 0.0002440931275486946, 0.0002847854048013687, 0.0003254776820540428, 0.0003661699593067169, 0.000406862236559391, 0.0004475545138120651, 0.00048824679106473923, 0.0005289390683174133, 0.0005696313455700874, 0.0006103236228227615, 0.0006510159000754356, 0.0006917081773281097, 0.0007324004545807838, 0.000773092731833458, 0.000813785009086132, 0.0008544772863388062, 0.0008951695635914803, 0.0009358618408441544, 0.0009765541180968285, 0.0010172463953495026, 0.0010579386726021767, 0.0010986309498548508, 0.0011393232271075249, 0.001180015504360199, 0.001220707781612873, 0.0012614000588655472, 0.0013020923361182213, 0.0013427846133708954, 0.0013834768906235695, 0.0014241691678762436, 0.0014648614451289177, 0.0015055537223815918]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 5.0, 11.0, 12.0, 10.0, 15.0, 15.0, 21.0, 23.0, 28.0, 25.0, 36.0, 36.0, 36.0, 34.0, 35.0, 32.0, 50.0, 50.0, 36.0, 46.0, 33.0, 40.0, 24.0, 31.0, 44.0, 29.0, 27.0, 34.0, 17.0, 24.0, 24.0, 13.0, 14.0, 10.0, 11.0, 11.0, 10.0, 4.0, 6.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-11.90625, -11.570068359375, -11.23388671875, -10.897705078125, -10.5615234375, -10.225341796875, -9.88916015625, -9.552978515625, -9.216796875, -8.880615234375, -8.54443359375, -8.208251953125, -7.8720703125, -7.535888671875, -7.19970703125, -6.863525390625, -6.52734375, -6.191162109375, -5.85498046875, -5.518798828125, -5.1826171875, -4.846435546875, -4.51025390625, -4.174072265625, -3.837890625, -3.501708984375, -3.16552734375, -2.829345703125, -2.4931640625, -2.156982421875, -1.82080078125, -1.484619140625, -1.1484375, -0.812255859375, -0.47607421875, -0.139892578125, 0.1962890625, 0.532470703125, 0.86865234375, 1.204833984375, 1.541015625, 1.877197265625, 2.21337890625, 2.549560546875, 2.8857421875, 3.221923828125, 3.55810546875, 3.894287109375, 4.23046875, 4.566650390625, 4.90283203125, 5.239013671875, 5.5751953125, 5.911376953125, 6.24755859375, 6.583740234375, 6.919921875, 7.256103515625, 7.59228515625, 7.928466796875, 8.2646484375, 8.600830078125, 8.93701171875, 9.273193359375, 9.609375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 11.0, 11.0, 17.0, 22.0, 31.0, 37.0, 67.0, 80.0, 126.0, 149.0, 221.0, 327.0, 492.0, 777.0, 1082.0, 1694.0, 2586.0, 4183.0, 7570.0, 15172.0, 48859.0, 613288.0, 289859.0, 32559.0, 12322.0, 6343.0, 3751.0, 2301.0, 1478.0, 991.0, 644.0, 457.0, 302.0, 218.0, 176.0, 94.0, 64.0, 64.0, 32.0, 26.0, 10.0, 21.0, 8.0, 12.0, 3.0, 3.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-17.015625, -16.51318359375, -16.0107421875, -15.50830078125, -15.005859375, -14.50341796875, -14.0009765625, -13.49853515625, -12.99609375, -12.49365234375, -11.9912109375, -11.48876953125, -10.986328125, -10.48388671875, -9.9814453125, -9.47900390625, -8.9765625, -8.47412109375, -7.9716796875, -7.46923828125, -6.966796875, -6.46435546875, -5.9619140625, -5.45947265625, -4.95703125, -4.45458984375, -3.9521484375, -3.44970703125, -2.947265625, -2.44482421875, -1.9423828125, -1.43994140625, -0.9375, -0.43505859375, 0.0673828125, 0.56982421875, 1.072265625, 1.57470703125, 2.0771484375, 2.57958984375, 3.08203125, 3.58447265625, 4.0869140625, 4.58935546875, 5.091796875, 5.59423828125, 6.0966796875, 6.59912109375, 7.1015625, 7.60400390625, 8.1064453125, 8.60888671875, 9.111328125, 9.61376953125, 10.1162109375, 10.61865234375, 11.12109375, 11.62353515625, 12.1259765625, 12.62841796875, 13.130859375, 13.63330078125, 14.1357421875, 14.63818359375, 15.140625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 9.0, 11.0, 9.0, 13.0, 10.0, 15.0, 18.0, 17.0, 26.0, 30.0, 32.0, 46.0, 53.0, 33.0, 46.0, 58.0, 80.0, 378.0, 1619.0, 92.0, 65.0, 55.0, 44.0, 38.0, 29.0, 41.0, 25.0, 34.0, 18.0, 18.0, 13.0, 17.0, 8.0, 6.0, 11.0, 5.0, 3.0, 6.0, 9.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.6875, -34.41650390625, -33.1455078125, -31.87451171875, -30.603515625, -29.33251953125, -28.0615234375, -26.79052734375, -25.51953125, -24.24853515625, -22.9775390625, -21.70654296875, -20.435546875, -19.16455078125, -17.8935546875, -16.62255859375, -15.3515625, -14.08056640625, -12.8095703125, -11.53857421875, -10.267578125, -8.99658203125, -7.7255859375, -6.45458984375, -5.18359375, -3.91259765625, -2.6416015625, -1.37060546875, -0.099609375, 1.17138671875, 2.4423828125, 3.71337890625, 4.984375, 6.25537109375, 7.5263671875, 8.79736328125, 10.068359375, 11.33935546875, 12.6103515625, 13.88134765625, 15.15234375, 16.42333984375, 17.6943359375, 18.96533203125, 20.236328125, 21.50732421875, 22.7783203125, 24.04931640625, 25.3203125, 26.59130859375, 27.8623046875, 29.13330078125, 30.404296875, 31.67529296875, 32.9462890625, 34.21728515625, 35.48828125, 36.75927734375, 38.0302734375, 39.30126953125, 40.572265625, 41.84326171875, 43.1142578125, 44.38525390625, 45.65625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 10.0, 7.0, 7.0, 11.0, 12.0, 8.0, 12.0, 19.0, 27.0, 25.0, 40.0, 61.0, 75.0, 90.0, 101.0, 150.0, 266.0, 698.0, 2972.0, 23391.0, 2989555.0, 118163.0, 7421.0, 1394.0, 388.0, 205.0, 135.0, 109.0, 77.0, 66.0, 47.0, 39.0, 31.0, 20.0, 12.0, 12.0, 10.0, 13.0, 9.0, 11.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-82.8125, -80.49609375, -78.1796875, -75.86328125, -73.546875, -71.23046875, -68.9140625, -66.59765625, -64.28125, -61.96484375, -59.6484375, -57.33203125, -55.015625, -52.69921875, -50.3828125, -48.06640625, -45.75, -43.43359375, -41.1171875, -38.80078125, -36.484375, -34.16796875, -31.8515625, -29.53515625, -27.21875, -24.90234375, -22.5859375, -20.26953125, -17.953125, -15.63671875, -13.3203125, -11.00390625, -8.6875, -6.37109375, -4.0546875, -1.73828125, 0.578125, 2.89453125, 5.2109375, 7.52734375, 9.84375, 12.16015625, 14.4765625, 16.79296875, 19.109375, 21.42578125, 23.7421875, 26.05859375, 28.375, 30.69140625, 33.0078125, 35.32421875, 37.640625, 39.95703125, 42.2734375, 44.58984375, 46.90625, 49.22265625, 51.5390625, 53.85546875, 56.171875, 58.48828125, 60.8046875, 63.12109375, 65.4375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 28.0, 447.0, 512.0, 33.0], "bins": [-662.664794921875, -651.9754638671875, -641.2861938476562, -630.5968627929688, -619.9075927734375, -609.21826171875, -598.5289916992188, -587.8396606445312, -577.150390625, -566.4610595703125, -555.7717895507812, -545.0824584960938, -534.3931884765625, -523.703857421875, -513.0145874023438, -502.3252868652344, -491.635986328125, -480.9466857910156, -470.25738525390625, -459.5680847167969, -448.8787841796875, -438.1894836425781, -427.50018310546875, -416.8108825683594, -406.1215515136719, -395.4322509765625, -384.7429504394531, -374.05364990234375, -363.3643493652344, -352.675048828125, -341.9857482910156, -331.29644775390625, -320.6071472167969, -309.9178466796875, -299.2285461425781, -288.53924560546875, -277.8499450683594, -267.16064453125, -256.4713439941406, -245.78204345703125, -235.09274291992188, -224.4034423828125, -213.71414184570312, -203.02484130859375, -192.33554077148438, -181.646240234375, -170.95693969726562, -160.26763916015625, -149.57833862304688, -138.8890380859375, -128.19973754882812, -117.51043701171875, -106.82113647460938, -96.1318359375, -85.4425277709961, -74.75322723388672, -64.06391906738281, -53.37461853027344, -42.68531799316406, -31.996013641357422, -21.306713104248047, -10.617412567138672, 0.07189178466796875, 10.761192321777344, 21.450489044189453]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 4.0, 6.0, 6.0, 12.0, 10.0, 15.0, 11.0, 16.0, 19.0, 21.0, 24.0, 40.0, 35.0, 28.0, 24.0, 32.0, 28.0, 40.0, 43.0, 40.0, 34.0, 35.0, 32.0, 35.0, 37.0, 35.0, 41.0, 32.0, 33.0, 34.0, 31.0, 22.0, 17.0, 11.0, 20.0, 10.0, 14.0, 12.0, 5.0, 13.0, 8.0, 6.0, 5.0, 5.0, 7.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.49776458740234, -78.55269622802734, -75.60762786865234, -72.66256713867188, -69.71749877929688, -66.77243041992188, -63.827362060546875, -60.88229751586914, -57.937232971191406, -54.992164611816406, -52.04710006713867, -49.10203170776367, -46.15696716308594, -43.21189880371094, -40.26683044433594, -37.3217658996582, -34.3766975402832, -31.431631088256836, -28.48656463623047, -25.54149627685547, -22.596431732177734, -19.651363372802734, -16.706296920776367, -13.76123046875, -10.816164016723633, -7.871097564697266, -4.92603063583374, -1.9809637069702148, 0.9641027450561523, 3.9091691970825195, 6.854236602783203, 9.79930305480957, 12.744369506835938, 15.689435958862305, 18.634502410888672, 21.579570770263672, 24.524635314941406, 27.469703674316406, 30.414770126342773, 33.35983657836914, 36.304901123046875, 39.249969482421875, 42.19503402709961, 45.14010238647461, 48.085166931152344, 51.030235290527344, 53.975303649902344, 56.92036819458008, 59.86543655395508, 62.81050491333008, 65.75556945800781, 68.70063781738281, 71.64570617675781, 74.59076690673828, 77.53583526611328, 80.48090362548828, 83.42597198486328, 86.37104034423828, 89.31610870361328, 92.26116943359375, 95.20623779296875, 98.15130615234375, 101.09637451171875, 104.04144287109375, 106.98650360107422]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 11.0, 11.0, 16.0, 18.0, 14.0, 14.0, 23.0, 37.0, 34.0, 39.0, 32.0, 39.0, 37.0, 36.0, 55.0, 44.0, 44.0, 41.0, 52.0, 33.0, 30.0, 34.0, 47.0, 24.0, 28.0, 23.0, 36.0, 20.0, 22.0, 13.0, 10.0, 13.0, 11.0, 8.0, 10.0, 4.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-13.3125, -12.939453125, -12.56640625, -12.193359375, -11.8203125, -11.447265625, -11.07421875, -10.701171875, -10.328125, -9.955078125, -9.58203125, -9.208984375, -8.8359375, -8.462890625, -8.08984375, -7.716796875, -7.34375, -6.970703125, -6.59765625, -6.224609375, -5.8515625, -5.478515625, -5.10546875, -4.732421875, -4.359375, -3.986328125, -3.61328125, -3.240234375, -2.8671875, -2.494140625, -2.12109375, -1.748046875, -1.375, -1.001953125, -0.62890625, -0.255859375, 0.1171875, 0.490234375, 0.86328125, 1.236328125, 1.609375, 1.982421875, 2.35546875, 2.728515625, 3.1015625, 3.474609375, 3.84765625, 4.220703125, 4.59375, 4.966796875, 5.33984375, 5.712890625, 6.0859375, 6.458984375, 6.83203125, 7.205078125, 7.578125, 7.951171875, 8.32421875, 8.697265625, 9.0703125, 9.443359375, 9.81640625, 10.189453125, 10.5625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 4.0, 2.0, 7.0, 10.0, 7.0, 14.0, 13.0, 12.0, 24.0, 35.0, 31.0, 55.0, 92.0, 91.0, 125.0, 195.0, 303.0, 472.0, 828.0, 1396.0, 2610.0, 5371.0, 12949.0, 42954.0, 442248.0, 2901188.0, 692827.0, 60820.0, 15952.0, 6480.0, 3049.0, 1582.0, 910.0, 530.0, 327.0, 234.0, 156.0, 100.0, 67.0, 48.0, 32.0, 28.0, 27.0, 21.0, 17.0, 11.0, 11.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-29.03125, -28.19189453125, -27.3525390625, -26.51318359375, -25.673828125, -24.83447265625, -23.9951171875, -23.15576171875, -22.31640625, -21.47705078125, -20.6376953125, -19.79833984375, -18.958984375, -18.11962890625, -17.2802734375, -16.44091796875, -15.6015625, -14.76220703125, -13.9228515625, -13.08349609375, -12.244140625, -11.40478515625, -10.5654296875, -9.72607421875, -8.88671875, -8.04736328125, -7.2080078125, -6.36865234375, -5.529296875, -4.68994140625, -3.8505859375, -3.01123046875, -2.171875, -1.33251953125, -0.4931640625, 0.34619140625, 1.185546875, 2.02490234375, 2.8642578125, 3.70361328125, 4.54296875, 5.38232421875, 6.2216796875, 7.06103515625, 7.900390625, 8.73974609375, 9.5791015625, 10.41845703125, 11.2578125, 12.09716796875, 12.9365234375, 13.77587890625, 14.615234375, 15.45458984375, 16.2939453125, 17.13330078125, 17.97265625, 18.81201171875, 19.6513671875, 20.49072265625, 21.330078125, 22.16943359375, 23.0087890625, 23.84814453125, 24.6875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 2.0, 7.0, 7.0, 6.0, 5.0, 11.0, 12.0, 6.0, 16.0, 17.0, 21.0, 32.0, 45.0, 51.0, 64.0, 79.0, 139.0, 201.0, 310.0, 549.0, 640.0, 610.0, 426.0, 243.0, 151.0, 91.0, 80.0, 60.0, 39.0, 37.0, 20.0, 16.0, 17.0, 12.0, 5.0, 5.0, 9.0, 8.0, 5.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.421875, -20.747314453125, -20.07275390625, -19.398193359375, -18.7236328125, -18.049072265625, -17.37451171875, -16.699951171875, -16.025390625, -15.350830078125, -14.67626953125, -14.001708984375, -13.3271484375, -12.652587890625, -11.97802734375, -11.303466796875, -10.62890625, -9.954345703125, -9.27978515625, -8.605224609375, -7.9306640625, -7.256103515625, -6.58154296875, -5.906982421875, -5.232421875, -4.557861328125, -3.88330078125, -3.208740234375, -2.5341796875, -1.859619140625, -1.18505859375, -0.510498046875, 0.1640625, 0.838623046875, 1.51318359375, 2.187744140625, 2.8623046875, 3.536865234375, 4.21142578125, 4.885986328125, 5.560546875, 6.235107421875, 6.90966796875, 7.584228515625, 8.2587890625, 8.933349609375, 9.60791015625, 10.282470703125, 10.95703125, 11.631591796875, 12.30615234375, 12.980712890625, 13.6552734375, 14.329833984375, 15.00439453125, 15.678955078125, 16.353515625, 17.028076171875, 17.70263671875, 18.377197265625, 19.0517578125, 19.726318359375, 20.40087890625, 21.075439453125, 21.75]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 7.0, 4.0, 5.0, 9.0, 6.0, 8.0, 7.0, 8.0, 12.0, 17.0, 17.0, 26.0, 40.0, 52.0, 79.0, 105.0, 191.0, 467.0, 2148.0, 22950.0, 3268477.0, 883111.0, 14082.0, 1440.0, 416.0, 171.0, 108.0, 66.0, 65.0, 45.0, 23.0, 25.0, 20.0, 12.0, 9.0, 8.0, 12.0, 4.0, 9.0, 4.0, 5.0, 6.0, 4.0, 1.0, 6.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-101.125, -97.9560546875, -94.787109375, -91.6181640625, -88.44921875, -85.2802734375, -82.111328125, -78.9423828125, -75.7734375, -72.6044921875, -69.435546875, -66.2666015625, -63.09765625, -59.9287109375, -56.759765625, -53.5908203125, -50.421875, -47.2529296875, -44.083984375, -40.9150390625, -37.74609375, -34.5771484375, -31.408203125, -28.2392578125, -25.0703125, -21.9013671875, -18.732421875, -15.5634765625, -12.39453125, -9.2255859375, -6.056640625, -2.8876953125, 0.28125, 3.4501953125, 6.619140625, 9.7880859375, 12.95703125, 16.1259765625, 19.294921875, 22.4638671875, 25.6328125, 28.8017578125, 31.970703125, 35.1396484375, 38.30859375, 41.4775390625, 44.646484375, 47.8154296875, 50.984375, 54.1533203125, 57.322265625, 60.4912109375, 63.66015625, 66.8291015625, 69.998046875, 73.1669921875, 76.3359375, 79.5048828125, 82.673828125, 85.8427734375, 89.01171875, 92.1806640625, 95.349609375, 98.5185546875, 101.6875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 23.0, 83.0, 186.0, 327.0, 268.0, 78.0, 29.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-413.9048156738281, -404.8369140625, -395.76898193359375, -386.7010803222656, -377.6331481933594, -368.56524658203125, -359.497314453125, -350.4294128417969, -341.36151123046875, -332.2936096191406, -323.2256774902344, -314.15777587890625, -305.08984375, -296.0219421386719, -286.9540100097656, -277.8861083984375, -268.81817626953125, -259.7502746582031, -250.68234252929688, -241.6144256591797, -232.5465087890625, -223.47860717773438, -214.4106903076172, -205.3427734375, -196.2748565673828, -187.20693969726562, -178.13902282714844, -169.07110595703125, -160.00320434570312, -150.93527221679688, -141.86737060546875, -132.79945373535156, -123.73152160644531, -114.66360473632812, -105.59568786621094, -96.52777862548828, -87.4598617553711, -78.3919448852539, -69.32403564453125, -60.25611877441406, -51.188201904296875, -42.12028503417969, -33.052371978759766, -23.98445701599121, -14.916542053222656, -5.848625183105469, 3.219287872314453, 12.287200927734375, 21.355117797851562, 30.423032760620117, 39.49094772338867, 48.558860778808594, 57.62677764892578, 66.69469451904297, 75.76260375976562, 84.83052062988281, 93.8984375, 102.96635437011719, 112.03427124023438, 121.10218048095703, 130.17010498046875, 139.23800659179688, 148.30592346191406, 157.37384033203125, 166.44175720214844]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 8.0, 11.0, 16.0, 16.0, 17.0, 22.0, 26.0, 27.0, 34.0, 25.0, 36.0, 34.0, 40.0, 63.0, 46.0, 64.0, 54.0, 38.0, 51.0, 42.0, 40.0, 38.0, 30.0, 41.0, 32.0, 24.0, 26.0, 21.0, 19.0, 10.0, 14.0, 7.0, 5.0, 4.0, 3.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-102.3641586303711, -99.72129821777344, -97.07844543457031, -94.43558502197266, -91.792724609375, -89.14987182617188, -86.50701141357422, -83.86415100097656, -81.22129821777344, -78.57843780517578, -75.93558502197266, -73.292724609375, -70.64987182617188, -68.00701141357422, -65.36415100097656, -62.72129440307617, -60.07843780517578, -57.43558120727539, -54.792724609375, -52.149864196777344, -49.50700759887695, -46.86415100097656, -44.221290588378906, -41.578433990478516, -38.935577392578125, -36.292720794677734, -33.649864196777344, -31.007003784179688, -28.364147186279297, -25.721290588378906, -23.078432083129883, -20.43557357788086, -17.792709350585938, -15.14985179901123, -12.506994247436523, -9.864136695861816, -7.221279144287109, -4.578421592712402, -1.9355640411376953, 0.7072944641113281, 3.3501510620117188, 5.993008613586426, 8.635866165161133, 11.27872371673584, 13.921581268310547, 16.564437866210938, 19.20729637145996, 21.850154876708984, 24.493011474609375, 27.135868072509766, 29.77872657775879, 32.42158508300781, 35.0644416809082, 37.707298278808594, 40.35015869140625, 42.99301528930664, 45.63587188720703, 48.27872848510742, 50.92158508300781, 53.56444549560547, 56.20730209350586, 58.85015869140625, 61.493019104003906, 64.13587951660156, 66.77873229980469]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 7.0, 6.0, 16.0, 21.0, 17.0, 16.0, 20.0, 28.0, 33.0, 29.0, 47.0, 46.0, 42.0, 48.0, 47.0, 49.0, 42.0, 50.0, 43.0, 47.0, 46.0, 41.0, 46.0, 34.0, 29.0, 22.0, 17.0, 23.0, 9.0, 8.0, 11.0, 10.0, 12.0, 10.0, 7.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.53125, -11.1387939453125, -10.746337890625, -10.3538818359375, -9.96142578125, -9.5689697265625, -9.176513671875, -8.7840576171875, -8.3916015625, -7.9991455078125, -7.606689453125, -7.2142333984375, -6.82177734375, -6.4293212890625, -6.036865234375, -5.6444091796875, -5.251953125, -4.8594970703125, -4.467041015625, -4.0745849609375, -3.68212890625, -3.2896728515625, -2.897216796875, -2.5047607421875, -2.1123046875, -1.7198486328125, -1.327392578125, -0.9349365234375, -0.54248046875, -0.1500244140625, 0.242431640625, 0.6348876953125, 1.02734375, 1.4197998046875, 1.812255859375, 2.2047119140625, 2.59716796875, 2.9896240234375, 3.382080078125, 3.7745361328125, 4.1669921875, 4.5594482421875, 4.951904296875, 5.3443603515625, 5.73681640625, 6.1292724609375, 6.521728515625, 6.9141845703125, 7.306640625, 7.6990966796875, 8.091552734375, 8.4840087890625, 8.87646484375, 9.2689208984375, 9.661376953125, 10.0538330078125, 10.4462890625, 10.8387451171875, 11.231201171875, 11.6236572265625, 12.01611328125, 12.4085693359375, 12.801025390625, 13.1934814453125, 13.5859375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 3.0, 3.0, 11.0, 7.0, 13.0, 38.0, 38.0, 70.0, 83.0, 119.0, 185.0, 288.0, 435.0, 612.0, 927.0, 1298.0, 2105.0, 2925.0, 4443.0, 6616.0, 10037.0, 15429.0, 23526.0, 36663.0, 57985.0, 94546.0, 162413.0, 228635.0, 152367.0, 90258.0, 54912.0, 35018.0, 22679.0, 14549.0, 9752.0, 6357.0, 4305.0, 2929.0, 1901.0, 1252.0, 919.0, 632.0, 421.0, 293.0, 185.0, 125.0, 82.0, 55.0, 44.0, 25.0, 20.0, 19.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2421875, -0.23423385620117188, -0.22628021240234375, -0.21832656860351562, -0.2103729248046875, -0.20241928100585938, -0.19446563720703125, -0.18651199340820312, -0.178558349609375, -0.17060470581054688, -0.16265106201171875, -0.15469741821289062, -0.1467437744140625, -0.13879013061523438, -0.13083648681640625, -0.12288284301757812, -0.11492919921875, -0.10697555541992188, -0.09902191162109375, -0.09106826782226562, -0.0831146240234375, -0.07516098022460938, -0.06720733642578125, -0.059253692626953125, -0.051300048828125, -0.043346405029296875, -0.03539276123046875, -0.027439117431640625, -0.0194854736328125, -0.011531829833984375, -0.00357818603515625, 0.004375457763671875, 0.0123291015625, 0.020282745361328125, 0.02823638916015625, 0.036190032958984375, 0.0441436767578125, 0.052097320556640625, 0.06005096435546875, 0.06800460815429688, 0.075958251953125, 0.08391189575195312, 0.09186553955078125, 0.09981918334960938, 0.1077728271484375, 0.11572647094726562, 0.12368011474609375, 0.13163375854492188, 0.13958740234375, 0.14754104614257812, 0.15549468994140625, 0.16344833374023438, 0.1714019775390625, 0.17935562133789062, 0.18730926513671875, 0.19526290893554688, 0.203216552734375, 0.21117019653320312, 0.21912384033203125, 0.22707748413085938, 0.2350311279296875, 0.24298477172851562, 0.25093841552734375, 0.2588920593261719, 0.266845703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 3.0, 3.0, 9.0, 8.0, 14.0, 13.0, 15.0, 16.0, 15.0, 14.0, 20.0, 22.0, 30.0, 29.0, 36.0, 44.0, 41.0, 47.0, 39.0, 47.0, 42.0, 1073.0, 33.0, 51.0, 33.0, 32.0, 31.0, 32.0, 28.0, 28.0, 23.0, 19.0, 23.0, 28.0, 23.0, 15.0, 11.0, 5.0, 9.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.265625, -8.9947509765625, -8.723876953125, -8.4530029296875, -8.18212890625, -7.9112548828125, -7.640380859375, -7.3695068359375, -7.0986328125, -6.8277587890625, -6.556884765625, -6.2860107421875, -6.01513671875, -5.7442626953125, -5.473388671875, -5.2025146484375, -4.931640625, -4.6607666015625, -4.389892578125, -4.1190185546875, -3.84814453125, -3.5772705078125, -3.306396484375, -3.0355224609375, -2.7646484375, -2.4937744140625, -2.222900390625, -1.9520263671875, -1.68115234375, -1.4102783203125, -1.139404296875, -0.8685302734375, -0.59765625, -0.3267822265625, -0.055908203125, 0.2149658203125, 0.48583984375, 0.7567138671875, 1.027587890625, 1.2984619140625, 1.5693359375, 1.8402099609375, 2.111083984375, 2.3819580078125, 2.65283203125, 2.9237060546875, 3.194580078125, 3.4654541015625, 3.736328125, 4.0072021484375, 4.278076171875, 4.5489501953125, 4.81982421875, 5.0906982421875, 5.361572265625, 5.6324462890625, 5.9033203125, 6.1741943359375, 6.445068359375, 6.7159423828125, 6.98681640625, 7.2576904296875, 7.528564453125, 7.7994384765625, 8.0703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 13.0, 23.0, 29.0, 39.0, 64.0, 86.0, 101.0, 133.0, 204.0, 325.0, 452.0, 638.0, 959.0, 1282.0, 1958.0, 2712.0, 4097.0, 6002.0, 9216.0, 13708.0, 20504.0, 31385.0, 48777.0, 74989.0, 122619.0, 1209038.0, 222482.0, 116616.0, 72149.0, 46336.0, 30170.0, 19723.0, 12773.0, 8714.0, 5930.0, 4035.0, 2754.0, 1911.0, 1282.0, 882.0, 626.0, 426.0, 286.0, 212.0, 131.0, 102.0, 76.0, 54.0, 33.0, 24.0, 14.0, 13.0, 4.0, 5.0, 6.0, 3.0, 2.0], "bins": [-0.1263427734375, -0.12250804901123047, -0.11867332458496094, -0.1148386001586914, -0.11100387573242188, -0.10716915130615234, -0.10333442687988281, -0.09949970245361328, -0.09566497802734375, -0.09183025360107422, -0.08799552917480469, -0.08416080474853516, -0.08032608032226562, -0.0764913558959961, -0.07265663146972656, -0.06882190704345703, -0.0649871826171875, -0.06115245819091797, -0.05731773376464844, -0.053483009338378906, -0.049648284912109375, -0.045813560485839844, -0.04197883605957031, -0.03814411163330078, -0.03430938720703125, -0.03047466278076172, -0.026639938354492188, -0.022805213928222656, -0.018970489501953125, -0.015135765075683594, -0.011301040649414062, -0.007466316223144531, -0.003631591796875, 0.00020313262939453125, 0.0040378570556640625, 0.007872581481933594, 0.011707305908203125, 0.015542030334472656, 0.019376754760742188, 0.02321147918701172, 0.02704620361328125, 0.03088092803955078, 0.03471565246582031, 0.038550376892089844, 0.042385101318359375, 0.046219825744628906, 0.05005455017089844, 0.05388927459716797, 0.0577239990234375, 0.06155872344970703, 0.06539344787597656, 0.0692281723022461, 0.07306289672851562, 0.07689762115478516, 0.08073234558105469, 0.08456707000732422, 0.08840179443359375, 0.09223651885986328, 0.09607124328613281, 0.09990596771240234, 0.10374069213867188, 0.1075754165649414, 0.11141014099121094, 0.11524486541748047, 0.11907958984375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 13.0, 7.0, 16.0, 17.0, 24.0, 13.0, 40.0, 33.0, 42.0, 46.0, 57.0, 51.0, 53.0, 79.0, 55.0, 62.0, 61.0, 51.0, 51.0, 28.0, 30.0, 20.0, 22.0, 21.0, 23.0, 20.0, 7.0, 9.0, 7.0, 1.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007834434509277344, -0.0007560700178146362, -0.0007286965847015381, -0.0007013231515884399, -0.0006739497184753418, -0.0006465762853622437, -0.0006192028522491455, -0.0005918294191360474, -0.0005644559860229492, -0.0005370825529098511, -0.0005097091197967529, -0.0004823356866836548, -0.00045496225357055664, -0.0004275888204574585, -0.00040021538734436035, -0.0003728419542312622, -0.00034546852111816406, -0.0003180950880050659, -0.0002907216548919678, -0.00026334822177886963, -0.00023597478866577148, -0.00020860135555267334, -0.0001812279224395752, -0.00015385448932647705, -0.0001264810562133789, -9.910762310028076e-05, -7.173418998718262e-05, -4.436075687408447e-05, -1.6987323760986328e-05, 1.0386109352111816e-05, 3.775954246520996e-05, 6.51329755783081e-05, 9.250640869140625e-05, 0.0001198798418045044, 0.00014725327491760254, 0.00017462670803070068, 0.00020200014114379883, 0.00022937357425689697, 0.0002567470073699951, 0.00028412044048309326, 0.0003114938735961914, 0.00033886730670928955, 0.0003662407398223877, 0.00039361417293548584, 0.000420987606048584, 0.00044836103916168213, 0.0004757344722747803, 0.0005031079053878784, 0.0005304813385009766, 0.0005578547716140747, 0.0005852282047271729, 0.000612601637840271, 0.0006399750709533691, 0.0006673485040664673, 0.0006947219371795654, 0.0007220953702926636, 0.0007494688034057617, 0.0007768422365188599, 0.000804215669631958, 0.0008315891027450562, 0.0008589625358581543, 0.0008863359689712524, 0.0009137094020843506, 0.0009410828351974487, 0.0009684562683105469]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 3.0, 3.0, 10.0, 9.0, 13.0, 27.0, 14.0, 31.0, 22.0, 32.0, 28.0, 64.0, 95.0, 194.0, 506.0, 4028.0, 1033124.0, 9130.0, 632.0, 205.0, 98.0, 58.0, 45.0, 48.0, 16.0, 24.0, 16.0, 15.0, 9.0, 11.0, 8.0, 6.0, 6.0, 2.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0225067138671875, -0.021874189376831055, -0.02124166488647461, -0.020609140396118164, -0.01997661590576172, -0.019344091415405273, -0.018711566925048828, -0.018079042434692383, -0.017446517944335938, -0.016813993453979492, -0.016181468963623047, -0.015548944473266602, -0.014916419982910156, -0.014283895492553711, -0.013651371002197266, -0.01301884651184082, -0.012386322021484375, -0.01175379753112793, -0.011121273040771484, -0.010488748550415039, -0.009856224060058594, -0.009223699569702148, -0.008591175079345703, -0.007958650588989258, -0.0073261260986328125, -0.006693601608276367, -0.006061077117919922, -0.0054285526275634766, -0.004796028137207031, -0.004163503646850586, -0.0035309791564941406, -0.0028984546661376953, -0.00226593017578125, -0.0016334056854248047, -0.0010008811950683594, -0.00036835670471191406, 0.00026416778564453125, 0.0008966922760009766, 0.0015292167663574219, 0.002161741256713867, 0.0027942657470703125, 0.003426790237426758, 0.004059314727783203, 0.0046918392181396484, 0.005324363708496094, 0.005956888198852539, 0.006589412689208984, 0.00722193717956543, 0.007854461669921875, 0.00848698616027832, 0.009119510650634766, 0.009752035140991211, 0.010384559631347656, 0.011017084121704102, 0.011649608612060547, 0.012282133102416992, 0.012914657592773438, 0.013547182083129883, 0.014179706573486328, 0.014812231063842773, 0.015444755554199219, 0.016077280044555664, 0.01670980453491211, 0.017342329025268555, 0.017974853515625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 305.0, 707.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022845227271318436, -0.02241465635597706, -0.02198408544063568, -0.021553512662649155, -0.021122941747307777, -0.0206923708319664, -0.020261799916625023, -0.019831229001283646, -0.01940065808594227, -0.01897008717060089, -0.018539516255259514, -0.018108945339918137, -0.01767837256193161, -0.017247801646590233, -0.016817230731248856, -0.01638665981590748, -0.0159560889005661, -0.015525517985224724, -0.015094946138560772, -0.014664375223219395, -0.014233804307878017, -0.013803232461214066, -0.013372661545872688, -0.012942090630531311, -0.012511517852544785, -0.012080946937203407, -0.011650375090539455, -0.011219804175198078, -0.010789233259856701, -0.010358661413192749, -0.009928090497851372, -0.009497519582509995, -0.009066947735846043, -0.008636376820504665, -0.008205804973840714, -0.007775234058499336, -0.007344663143157959, -0.006914091762155294, -0.00648352038115263, -0.006052949465811253, -0.005622378084808588, -0.0051918067038059235, -0.004761235788464546, -0.004330664407461882, -0.0039000932592898607, -0.00346952211111784, -0.0030389507301151752, -0.0026083795819431543, -0.0021778084337711334, -0.0017472372855991125, -0.0013166660210117698, -0.000886094756424427, -0.0004555236082524061, -2.4952460080385208e-05, 0.00040561892092227936, 0.0008361900690943003, 0.0012667612172663212, 0.001697332365438342, 0.002127903513610363, 0.0025584748946130276, 0.0029890460427850485, 0.0034196171909570694, 0.003850188571959734, 0.0042807599529623985, 0.004711330868303776]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 10.0, 13.0, 16.0, 9.0, 22.0, 25.0, 22.0, 30.0, 41.0, 31.0, 39.0, 54.0, 34.0, 63.0, 53.0, 39.0, 52.0, 55.0, 54.0, 33.0, 30.0, 41.0, 32.0, 35.0, 20.0, 20.0, 27.0, 19.0, 19.0, 17.0, 9.0, 12.0, 4.0, 7.0, 3.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007668137550354004, -0.0007376745343208313, -0.0007085353136062622, -0.0006793960928916931, -0.000650256872177124, -0.0006211176514625549, -0.0005919784307479858, -0.0005628392100334167, -0.0005336999893188477, -0.0005045607686042786, -0.00047542154788970947, -0.0004462823271751404, -0.0004171431064605713, -0.0003880038857460022, -0.0003588646650314331, -0.000329725444316864, -0.0003005862236022949, -0.00027144700288772583, -0.00024230778217315674, -0.00021316856145858765, -0.00018402934074401855, -0.00015489012002944946, -0.00012575089931488037, -9.661167860031128e-05, -6.747245788574219e-05, -3.8333237171173096e-05, -9.194016456604004e-06, 1.9945204257965088e-05, 4.908442497253418e-05, 7.822364568710327e-05, 0.00010736286640167236, 0.00013650208711624146, 0.00016564130783081055, 0.00019478052854537964, 0.00022391974925994873, 0.0002530589699745178, 0.0002821981906890869, 0.000311337411403656, 0.0003404766321182251, 0.0003696158528327942, 0.0003987550735473633, 0.0004278942942619324, 0.00045703351497650146, 0.00048617273569107056, 0.0005153119564056396, 0.0005444511771202087, 0.0005735903978347778, 0.0006027296185493469, 0.000631868839263916, 0.0006610080599784851, 0.0006901472806930542, 0.0007192865014076233, 0.0007484257221221924, 0.0007775649428367615, 0.0008067041635513306, 0.0008358433842658997, 0.0008649826049804688, 0.0008941218256950378, 0.0009232610464096069, 0.000952400267124176, 0.0009815394878387451, 0.0010106787085533142, 0.0010398179292678833, 0.0010689571499824524, 0.0010980963706970215]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 7.0, 6.0, 16.0, 21.0, 17.0, 16.0, 20.0, 28.0, 33.0, 29.0, 47.0, 46.0, 42.0, 48.0, 47.0, 49.0, 42.0, 50.0, 43.0, 47.0, 46.0, 41.0, 46.0, 34.0, 29.0, 22.0, 17.0, 23.0, 9.0, 8.0, 11.0, 10.0, 12.0, 10.0, 7.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.53125, -11.1387939453125, -10.746337890625, -10.3538818359375, -9.96142578125, -9.5689697265625, -9.176513671875, -8.7840576171875, -8.3916015625, -7.9991455078125, -7.606689453125, -7.2142333984375, -6.82177734375, -6.4293212890625, -6.036865234375, -5.6444091796875, -5.251953125, -4.8594970703125, -4.467041015625, -4.0745849609375, -3.68212890625, -3.2896728515625, -2.897216796875, -2.5047607421875, -2.1123046875, -1.7198486328125, -1.327392578125, -0.9349365234375, -0.54248046875, -0.1500244140625, 0.242431640625, 0.6348876953125, 1.02734375, 1.4197998046875, 1.812255859375, 2.2047119140625, 2.59716796875, 2.9896240234375, 3.382080078125, 3.7745361328125, 4.1669921875, 4.5594482421875, 4.951904296875, 5.3443603515625, 5.73681640625, 6.1292724609375, 6.521728515625, 6.9141845703125, 7.306640625, 7.6990966796875, 8.091552734375, 8.4840087890625, 8.87646484375, 9.2689208984375, 9.661376953125, 10.0538330078125, 10.4462890625, 10.8387451171875, 11.231201171875, 11.6236572265625, 12.01611328125, 12.4085693359375, 12.801025390625, 13.1934814453125, 13.5859375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 11.0, 10.0, 11.0, 11.0, 19.0, 23.0, 45.0, 54.0, 79.0, 106.0, 149.0, 172.0, 232.0, 339.0, 483.0, 698.0, 1030.0, 1402.0, 2091.0, 3260.0, 4902.0, 8415.0, 16188.0, 39790.0, 139154.0, 623795.0, 129454.0, 37939.0, 15742.0, 8023.0, 4955.0, 3124.0, 2086.0, 1351.0, 961.0, 699.0, 482.0, 352.0, 231.0, 187.0, 141.0, 91.0, 76.0, 43.0, 35.0, 31.0, 20.0, 18.0, 19.0, 4.0, 14.0, 8.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-13.3984375, -12.9727783203125, -12.547119140625, -12.1214599609375, -11.69580078125, -11.2701416015625, -10.844482421875, -10.4188232421875, -9.9931640625, -9.5675048828125, -9.141845703125, -8.7161865234375, -8.29052734375, -7.8648681640625, -7.439208984375, -7.0135498046875, -6.587890625, -6.1622314453125, -5.736572265625, -5.3109130859375, -4.88525390625, -4.4595947265625, -4.033935546875, -3.6082763671875, -3.1826171875, -2.7569580078125, -2.331298828125, -1.9056396484375, -1.47998046875, -1.0543212890625, -0.628662109375, -0.2030029296875, 0.22265625, 0.6483154296875, 1.073974609375, 1.4996337890625, 1.92529296875, 2.3509521484375, 2.776611328125, 3.2022705078125, 3.6279296875, 4.0535888671875, 4.479248046875, 4.9049072265625, 5.33056640625, 5.7562255859375, 6.181884765625, 6.6075439453125, 7.033203125, 7.4588623046875, 7.884521484375, 8.3101806640625, 8.73583984375, 9.1614990234375, 9.587158203125, 10.0128173828125, 10.4384765625, 10.8641357421875, 11.289794921875, 11.7154541015625, 12.14111328125, 12.5667724609375, 12.992431640625, 13.4180908203125, 13.84375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 4.0, 6.0, 8.0, 8.0, 9.0, 14.0, 9.0, 19.0, 20.0, 21.0, 21.0, 19.0, 30.0, 21.0, 33.0, 42.0, 38.0, 50.0, 50.0, 91.0, 177.0, 1736.0, 150.0, 68.0, 48.0, 48.0, 35.0, 39.0, 36.0, 25.0, 31.0, 29.0, 26.0, 23.0, 18.0, 10.0, 14.0, 5.0, 6.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.9375, -36.73095703125, -35.5244140625, -34.31787109375, -33.111328125, -31.90478515625, -30.6982421875, -29.49169921875, -28.28515625, -27.07861328125, -25.8720703125, -24.66552734375, -23.458984375, -22.25244140625, -21.0458984375, -19.83935546875, -18.6328125, -17.42626953125, -16.2197265625, -15.01318359375, -13.806640625, -12.60009765625, -11.3935546875, -10.18701171875, -8.98046875, -7.77392578125, -6.5673828125, -5.36083984375, -4.154296875, -2.94775390625, -1.7412109375, -0.53466796875, 0.671875, 1.87841796875, 3.0849609375, 4.29150390625, 5.498046875, 6.70458984375, 7.9111328125, 9.11767578125, 10.32421875, 11.53076171875, 12.7373046875, 13.94384765625, 15.150390625, 16.35693359375, 17.5634765625, 18.77001953125, 19.9765625, 21.18310546875, 22.3896484375, 23.59619140625, 24.802734375, 26.00927734375, 27.2158203125, 28.42236328125, 29.62890625, 30.83544921875, 32.0419921875, 33.24853515625, 34.455078125, 35.66162109375, 36.8681640625, 38.07470703125, 39.28125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 6.0, 9.0, 14.0, 17.0, 21.0, 29.0, 31.0, 34.0, 45.0, 50.0, 91.0, 140.0, 146.0, 229.0, 645.0, 2103.0, 13423.0, 2467508.0, 647140.0, 10784.0, 1814.0, 515.0, 238.0, 146.0, 115.0, 86.0, 49.0, 48.0, 39.0, 37.0, 31.0, 35.0, 11.0, 9.0, 13.0, 10.0, 8.0, 4.0, 7.0, 5.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.8125, -86.271484375, -83.73046875, -81.189453125, -78.6484375, -76.107421875, -73.56640625, -71.025390625, -68.484375, -65.943359375, -63.40234375, -60.861328125, -58.3203125, -55.779296875, -53.23828125, -50.697265625, -48.15625, -45.615234375, -43.07421875, -40.533203125, -37.9921875, -35.451171875, -32.91015625, -30.369140625, -27.828125, -25.287109375, -22.74609375, -20.205078125, -17.6640625, -15.123046875, -12.58203125, -10.041015625, -7.5, -4.958984375, -2.41796875, 0.123046875, 2.6640625, 5.205078125, 7.74609375, 10.287109375, 12.828125, 15.369140625, 17.91015625, 20.451171875, 22.9921875, 25.533203125, 28.07421875, 30.615234375, 33.15625, 35.697265625, 38.23828125, 40.779296875, 43.3203125, 45.861328125, 48.40234375, 50.943359375, 53.484375, 56.025390625, 58.56640625, 61.107421875, 63.6484375, 66.189453125, 68.73046875, 71.271484375, 73.8125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 42.0, 218.0, 542.0, 161.0, 36.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.95651245117188, -108.3705062866211, -101.78450012207031, -95.19850158691406, -88.61249542236328, -82.0264892578125, -75.44048309326172, -68.85447692871094, -62.26847457885742, -55.68246841430664, -49.096466064453125, -42.510459899902344, -35.92445373535156, -29.338451385498047, -22.752445220947266, -16.16644287109375, -9.580436706542969, -2.994431972503662, 3.5915727615356445, 10.17757797241211, 16.763582229614258, 23.349586486816406, 29.935592651367188, 36.5215950012207, 43.107601165771484, 49.693607330322266, 56.27960968017578, 62.86561584472656, 69.45162200927734, 76.03762817382812, 82.62362670898438, 89.20963287353516, 95.79563903808594, 102.38164520263672, 108.9676513671875, 115.55364990234375, 122.13965606689453, 128.7256622314453, 135.31167602539062, 141.89767456054688, 148.48367309570312, 155.06967163085938, 161.6556854248047, 168.24168395996094, 174.82769775390625, 181.4136962890625, 187.99969482421875, 194.58570861816406, 201.17172241210938, 207.75772094726562, 214.34373474121094, 220.9297332763672, 227.5157470703125, 234.10174560546875, 240.687744140625, 247.2737579345703, 253.85975646972656, 260.4457702636719, 267.0317687988281, 273.6177673339844, 280.2037658691406, 286.789794921875, 293.37579345703125, 299.9617919921875, 306.54779052734375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 10.0, 6.0, 11.0, 14.0, 11.0, 8.0, 7.0, 14.0, 12.0, 39.0, 31.0, 39.0, 25.0, 37.0, 41.0, 44.0, 44.0, 42.0, 43.0, 43.0, 43.0, 35.0, 41.0, 35.0, 47.0, 27.0, 38.0, 35.0, 18.0, 21.0, 18.0, 22.0, 13.0, 18.0, 17.0, 11.0, 7.0, 7.0, 7.0, 6.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-88.6780776977539, -85.90892791748047, -83.13977813720703, -80.37063598632812, -77.60148620605469, -74.83233642578125, -72.06318664550781, -69.29403686523438, -66.52489471435547, -63.75574493408203, -60.98659896850586, -58.21744918823242, -55.44830322265625, -52.67915344238281, -49.910003662109375, -47.1408576965332, -44.371707916259766, -41.60255813598633, -38.833412170410156, -36.06426239013672, -33.29511642456055, -30.52596664428711, -27.756818771362305, -24.9876708984375, -22.218523025512695, -19.44937515258789, -16.680227279663086, -13.911078453063965, -11.14193058013916, -8.372782707214355, -5.603633880615234, -2.8344860076904297, -0.065338134765625, 2.703809976577759, 5.472958087921143, 8.242106437683105, 11.01125431060791, 13.780402183532715, 16.549551010131836, 19.31869888305664, 22.087846755981445, 24.85699462890625, 27.626142501831055, 30.39529037475586, 33.1644401550293, 35.93358612060547, 38.702735900878906, 41.471885681152344, 44.241031646728516, 47.01018142700195, 49.779327392578125, 52.54847717285156, 55.317623138427734, 58.08677291870117, 60.855918884277344, 63.62506866455078, 66.39421844482422, 69.16336822509766, 71.9325180053711, 74.70166015625, 77.47080993652344, 80.23995971679688, 83.00910949707031, 85.77825927734375, 88.54740142822266]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 5.0, 4.0, 6.0, 15.0, 14.0, 16.0, 16.0, 18.0, 15.0, 26.0, 25.0, 34.0, 44.0, 44.0, 45.0, 47.0, 46.0, 34.0, 51.0, 50.0, 46.0, 38.0, 34.0, 41.0, 47.0, 39.0, 29.0, 30.0, 23.0, 25.0, 11.0, 15.0, 11.0, 9.0, 8.0, 3.0, 9.0, 5.0, 7.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9921875, -11.604736328125, -11.21728515625, -10.829833984375, -10.4423828125, -10.054931640625, -9.66748046875, -9.280029296875, -8.892578125, -8.505126953125, -8.11767578125, -7.730224609375, -7.3427734375, -6.955322265625, -6.56787109375, -6.180419921875, -5.79296875, -5.405517578125, -5.01806640625, -4.630615234375, -4.2431640625, -3.855712890625, -3.46826171875, -3.080810546875, -2.693359375, -2.305908203125, -1.91845703125, -1.531005859375, -1.1435546875, -0.756103515625, -0.36865234375, 0.018798828125, 0.40625, 0.793701171875, 1.18115234375, 1.568603515625, 1.9560546875, 2.343505859375, 2.73095703125, 3.118408203125, 3.505859375, 3.893310546875, 4.28076171875, 4.668212890625, 5.0556640625, 5.443115234375, 5.83056640625, 6.218017578125, 6.60546875, 6.992919921875, 7.38037109375, 7.767822265625, 8.1552734375, 8.542724609375, 8.93017578125, 9.317626953125, 9.705078125, 10.092529296875, 10.47998046875, 10.867431640625, 11.2548828125, 11.642333984375, 12.02978515625, 12.417236328125, 12.8046875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 8.0, 6.0, 13.0, 20.0, 21.0, 20.0, 26.0, 34.0, 64.0, 78.0, 139.0, 218.0, 429.0, 935.0, 2282.0, 6164.0, 19801.0, 146059.0, 3074374.0, 883168.0, 42907.0, 10812.0, 3701.0, 1376.0, 688.0, 365.0, 181.0, 113.0, 62.0, 59.0, 40.0, 26.0, 14.0, 11.0, 13.0, 9.0, 6.0, 9.0, 7.0, 4.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.03125, -34.85986328125, -33.6884765625, -32.51708984375, -31.345703125, -30.17431640625, -29.0029296875, -27.83154296875, -26.66015625, -25.48876953125, -24.3173828125, -23.14599609375, -21.974609375, -20.80322265625, -19.6318359375, -18.46044921875, -17.2890625, -16.11767578125, -14.9462890625, -13.77490234375, -12.603515625, -11.43212890625, -10.2607421875, -9.08935546875, -7.91796875, -6.74658203125, -5.5751953125, -4.40380859375, -3.232421875, -2.06103515625, -0.8896484375, 0.28173828125, 1.453125, 2.62451171875, 3.7958984375, 4.96728515625, 6.138671875, 7.31005859375, 8.4814453125, 9.65283203125, 10.82421875, 11.99560546875, 13.1669921875, 14.33837890625, 15.509765625, 16.68115234375, 17.8525390625, 19.02392578125, 20.1953125, 21.36669921875, 22.5380859375, 23.70947265625, 24.880859375, 26.05224609375, 27.2236328125, 28.39501953125, 29.56640625, 30.73779296875, 31.9091796875, 33.08056640625, 34.251953125, 35.42333984375, 36.5947265625, 37.76611328125, 38.9375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 5.0, 5.0, 3.0, 7.0, 8.0, 17.0, 19.0, 15.0, 27.0, 30.0, 31.0, 53.0, 75.0, 101.0, 126.0, 261.0, 485.0, 740.0, 748.0, 520.0, 302.0, 144.0, 103.0, 65.0, 40.0, 37.0, 23.0, 21.0, 10.0, 15.0, 9.0, 9.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.78125, -25.001708984375, -24.22216796875, -23.442626953125, -22.6630859375, -21.883544921875, -21.10400390625, -20.324462890625, -19.544921875, -18.765380859375, -17.98583984375, -17.206298828125, -16.4267578125, -15.647216796875, -14.86767578125, -14.088134765625, -13.30859375, -12.529052734375, -11.74951171875, -10.969970703125, -10.1904296875, -9.410888671875, -8.63134765625, -7.851806640625, -7.072265625, -6.292724609375, -5.51318359375, -4.733642578125, -3.9541015625, -3.174560546875, -2.39501953125, -1.615478515625, -0.8359375, -0.056396484375, 0.72314453125, 1.502685546875, 2.2822265625, 3.061767578125, 3.84130859375, 4.620849609375, 5.400390625, 6.179931640625, 6.95947265625, 7.739013671875, 8.5185546875, 9.298095703125, 10.07763671875, 10.857177734375, 11.63671875, 12.416259765625, 13.19580078125, 13.975341796875, 14.7548828125, 15.534423828125, 16.31396484375, 17.093505859375, 17.873046875, 18.652587890625, 19.43212890625, 20.211669921875, 20.9912109375, 21.770751953125, 22.55029296875, 23.329833984375, 24.109375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 4.0, 11.0, 12.0, 13.0, 22.0, 25.0, 29.0, 51.0, 76.0, 142.0, 309.0, 1206.0, 13398.0, 3166538.0, 1001611.0, 9165.0, 966.0, 221.0, 145.0, 84.0, 56.0, 36.0, 29.0, 32.0, 19.0, 16.0, 15.0, 10.0, 8.0, 1.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-117.375, -113.5810546875, -109.787109375, -105.9931640625, -102.19921875, -98.4052734375, -94.611328125, -90.8173828125, -87.0234375, -83.2294921875, -79.435546875, -75.6416015625, -71.84765625, -68.0537109375, -64.259765625, -60.4658203125, -56.671875, -52.8779296875, -49.083984375, -45.2900390625, -41.49609375, -37.7021484375, -33.908203125, -30.1142578125, -26.3203125, -22.5263671875, -18.732421875, -14.9384765625, -11.14453125, -7.3505859375, -3.556640625, 0.2373046875, 4.03125, 7.8251953125, 11.619140625, 15.4130859375, 19.20703125, 23.0009765625, 26.794921875, 30.5888671875, 34.3828125, 38.1767578125, 41.970703125, 45.7646484375, 49.55859375, 53.3525390625, 57.146484375, 60.9404296875, 64.734375, 68.5283203125, 72.322265625, 76.1162109375, 79.91015625, 83.7041015625, 87.498046875, 91.2919921875, 95.0859375, 98.8798828125, 102.673828125, 106.4677734375, 110.26171875, 114.0556640625, 117.849609375, 121.6435546875, 125.4375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 11.0, 23.0, 57.0, 90.0, 157.0, 195.0, 201.0, 145.0, 75.0, 27.0, 19.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.41262817382812, -127.2995834350586, -122.1865463256836, -117.07350158691406, -111.96046447753906, -106.84741973876953, -101.734375, -96.621337890625, -91.50829315185547, -86.39524841308594, -81.28221130371094, -76.1691665649414, -71.05612182617188, -65.94308471679688, -60.830039978027344, -55.71699905395508, -50.60395812988281, -45.49091720581055, -40.37787628173828, -35.26483154296875, -30.151790618896484, -25.03874969482422, -19.92570686340332, -14.812664031982422, -9.699623107910156, -4.586581230163574, 0.5264606475830078, 5.63950252532959, 10.752544403076172, 15.865585327148438, 20.978628158569336, 26.091670989990234, 31.204696655273438, 36.3177375793457, 41.43077850341797, 46.5438232421875, 51.656864166259766, 56.76990509033203, 61.88294982910156, 66.99598693847656, 72.1090316772461, 77.22207641601562, 82.33511352539062, 87.44815826416016, 92.56120300292969, 97.67424011230469, 102.78728485107422, 107.90032958984375, 113.01336669921875, 118.12641143798828, 123.23944854736328, 128.3524932861328, 133.4655303955078, 138.57858276367188, 143.69161987304688, 148.80465698242188, 153.91769409179688, 159.03073120117188, 164.14378356933594, 169.25682067871094, 174.36985778808594, 179.48291015625, 184.595947265625, 189.708984375, 194.82203674316406]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 1.0, 3.0, 7.0, 8.0, 11.0, 12.0, 18.0, 14.0, 16.0, 24.0, 22.0, 29.0, 35.0, 32.0, 40.0, 27.0, 39.0, 41.0, 50.0, 49.0, 39.0, 57.0, 45.0, 37.0, 48.0, 38.0, 28.0, 38.0, 37.0, 29.0, 29.0, 21.0, 18.0, 12.0, 10.0, 10.0, 8.0, 7.0, 6.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-75.47439575195312, -73.06916046142578, -70.66392517089844, -68.25869750976562, -65.85346221923828, -63.44822692871094, -61.042991638183594, -58.63775634765625, -56.23252487182617, -53.82728958129883, -51.42205810546875, -49.016822814941406, -46.61158752441406, -44.206356048583984, -41.80112075805664, -39.39588928222656, -36.99065399169922, -34.585418701171875, -32.1801872253418, -29.774951934814453, -27.369718551635742, -24.96448516845703, -22.559249877929688, -20.154016494750977, -17.748783111572266, -15.343549728393555, -12.938315391540527, -10.5330810546875, -8.127847671508789, -5.722614288330078, -3.317379951477051, -0.9121456146240234, 1.4930877685546875, 3.8983216285705566, 6.303555488586426, 8.708789825439453, 11.114023208618164, 13.519256591796875, 15.924490928649902, 18.32972526550293, 20.73495864868164, 23.14019203186035, 25.545425415039062, 27.950660705566406, 30.355894088745117, 32.76112747192383, 35.16636276245117, 37.57159423828125, 39.976829528808594, 42.38206481933594, 44.787296295166016, 47.19253158569336, 49.59776306152344, 52.00299835205078, 54.408233642578125, 56.81346893310547, 59.21870040893555, 61.62393569946289, 64.02916717529297, 66.43440246582031, 68.83963775634766, 71.244873046875, 73.65010070800781, 76.05533599853516, 78.4605712890625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 6.0, 1.0, 5.0, 1.0, 8.0, 8.0, 8.0, 13.0, 20.0, 19.0, 18.0, 20.0, 29.0, 33.0, 34.0, 42.0, 34.0, 41.0, 40.0, 43.0, 42.0, 33.0, 49.0, 39.0, 44.0, 42.0, 35.0, 44.0, 26.0, 29.0, 35.0, 18.0, 22.0, 19.0, 17.0, 16.0, 12.0, 11.0, 7.0, 10.0, 5.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.0078125, -10.6531982421875, -10.298583984375, -9.9439697265625, -9.58935546875, -9.2347412109375, -8.880126953125, -8.5255126953125, -8.1708984375, -7.8162841796875, -7.461669921875, -7.1070556640625, -6.75244140625, -6.3978271484375, -6.043212890625, -5.6885986328125, -5.333984375, -4.9793701171875, -4.624755859375, -4.2701416015625, -3.91552734375, -3.5609130859375, -3.206298828125, -2.8516845703125, -2.4970703125, -2.1424560546875, -1.787841796875, -1.4332275390625, -1.07861328125, -0.7239990234375, -0.369384765625, -0.0147705078125, 0.33984375, 0.6944580078125, 1.049072265625, 1.4036865234375, 1.75830078125, 2.1129150390625, 2.467529296875, 2.8221435546875, 3.1767578125, 3.5313720703125, 3.885986328125, 4.2406005859375, 4.59521484375, 4.9498291015625, 5.304443359375, 5.6590576171875, 6.013671875, 6.3682861328125, 6.722900390625, 7.0775146484375, 7.43212890625, 7.7867431640625, 8.141357421875, 8.4959716796875, 8.8505859375, 9.2052001953125, 9.559814453125, 9.9144287109375, 10.26904296875, 10.6236572265625, 10.978271484375, 11.3328857421875, 11.6875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 5.0, 7.0, 6.0, 10.0, 21.0, 16.0, 24.0, 33.0, 53.0, 71.0, 95.0, 142.0, 201.0, 291.0, 405.0, 548.0, 774.0, 1119.0, 1524.0, 2302.0, 3233.0, 4731.0, 6505.0, 9760.0, 14520.0, 21567.0, 32333.0, 49374.0, 75475.0, 116719.0, 186003.0, 183837.0, 115538.0, 74450.0, 48511.0, 31814.0, 21155.0, 14196.0, 9511.0, 6533.0, 4583.0, 3167.0, 2176.0, 1509.0, 1064.0, 790.0, 559.0, 368.0, 272.0, 174.0, 151.0, 111.0, 68.0, 38.0, 41.0, 28.0, 19.0, 18.0, 9.0, 7.0, 5.0, 2.0], "bins": [-0.2447509765625, -0.23732948303222656, -0.22990798950195312, -0.2224864959716797, -0.21506500244140625, -0.2076435089111328, -0.20022201538085938, -0.19280052185058594, -0.1853790283203125, -0.17795753479003906, -0.17053604125976562, -0.1631145477294922, -0.15569305419921875, -0.1482715606689453, -0.14085006713867188, -0.13342857360839844, -0.126007080078125, -0.11858558654785156, -0.11116409301757812, -0.10374259948730469, -0.09632110595703125, -0.08889961242675781, -0.08147811889648438, -0.07405662536621094, -0.0666351318359375, -0.05921363830566406, -0.051792144775390625, -0.04437065124511719, -0.03694915771484375, -0.029527664184570312, -0.022106170654296875, -0.014684677124023438, -0.00726318359375, 0.0001583099365234375, 0.007579803466796875, 0.015001296997070312, 0.02242279052734375, 0.029844284057617188, 0.037265777587890625, 0.04468727111816406, 0.0521087646484375, 0.05953025817871094, 0.06695175170898438, 0.07437324523925781, 0.08179473876953125, 0.08921623229980469, 0.09663772583007812, 0.10405921936035156, 0.111480712890625, 0.11890220642089844, 0.12632369995117188, 0.1337451934814453, 0.14116668701171875, 0.1485881805419922, 0.15600967407226562, 0.16343116760253906, 0.1708526611328125, 0.17827415466308594, 0.18569564819335938, 0.1931171417236328, 0.20053863525390625, 0.2079601287841797, 0.21538162231445312, 0.22280311584472656, 0.230224609375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 8.0, 5.0, 7.0, 9.0, 13.0, 23.0, 20.0, 23.0, 36.0, 25.0, 29.0, 43.0, 30.0, 45.0, 29.0, 35.0, 45.0, 1067.0, 49.0, 52.0, 39.0, 46.0, 41.0, 35.0, 35.0, 22.0, 38.0, 18.0, 27.0, 27.0, 16.0, 20.0, 13.0, 14.0, 10.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.9605712890625, -7.671142578125, -7.3817138671875, -7.09228515625, -6.8028564453125, -6.513427734375, -6.2239990234375, -5.9345703125, -5.6451416015625, -5.355712890625, -5.0662841796875, -4.77685546875, -4.4874267578125, -4.197998046875, -3.9085693359375, -3.619140625, -3.3297119140625, -3.040283203125, -2.7508544921875, -2.46142578125, -2.1719970703125, -1.882568359375, -1.5931396484375, -1.3037109375, -1.0142822265625, -0.724853515625, -0.4354248046875, -0.14599609375, 0.1434326171875, 0.432861328125, 0.7222900390625, 1.01171875, 1.3011474609375, 1.590576171875, 1.8800048828125, 2.16943359375, 2.4588623046875, 2.748291015625, 3.0377197265625, 3.3271484375, 3.6165771484375, 3.906005859375, 4.1954345703125, 4.48486328125, 4.7742919921875, 5.063720703125, 5.3531494140625, 5.642578125, 5.9320068359375, 6.221435546875, 6.5108642578125, 6.80029296875, 7.0897216796875, 7.379150390625, 7.6685791015625, 7.9580078125, 8.2474365234375, 8.536865234375, 8.8262939453125, 9.11572265625, 9.4051513671875, 9.694580078125, 9.9840087890625, 10.2734375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 8.0, 9.0, 9.0, 23.0, 33.0, 70.0, 78.0, 118.0, 152.0, 250.0, 358.0, 491.0, 809.0, 1132.0, 1786.0, 2546.0, 3868.0, 6008.0, 9198.0, 14203.0, 21965.0, 34272.0, 53427.0, 84543.0, 139063.0, 1259097.0, 173519.0, 106158.0, 66261.0, 41833.0, 26542.0, 17115.0, 10950.0, 7101.0, 4689.0, 3031.0, 2082.0, 1374.0, 949.0, 629.0, 448.0, 294.0, 207.0, 146.0, 96.0, 64.0, 44.0, 34.0, 19.0, 11.0, 6.0, 5.0, 10.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1217041015625, -0.11761093139648438, -0.11351776123046875, -0.10942459106445312, -0.1053314208984375, -0.10123825073242188, -0.09714508056640625, -0.09305191040039062, -0.088958740234375, -0.08486557006835938, -0.08077239990234375, -0.07667922973632812, -0.0725860595703125, -0.06849288940429688, -0.06439971923828125, -0.060306549072265625, -0.05621337890625, -0.052120208740234375, -0.04802703857421875, -0.043933868408203125, -0.0398406982421875, -0.035747528076171875, -0.03165435791015625, -0.027561187744140625, -0.023468017578125, -0.019374847412109375, -0.01528167724609375, -0.011188507080078125, -0.0070953369140625, -0.003002166748046875, 0.00109100341796875, 0.005184173583984375, 0.00927734375, 0.013370513916015625, 0.01746368408203125, 0.021556854248046875, 0.0256500244140625, 0.029743194580078125, 0.03383636474609375, 0.037929534912109375, 0.042022705078125, 0.046115875244140625, 0.05020904541015625, 0.054302215576171875, 0.0583953857421875, 0.062488555908203125, 0.06658172607421875, 0.07067489624023438, 0.07476806640625, 0.07886123657226562, 0.08295440673828125, 0.08704757690429688, 0.0911407470703125, 0.09523391723632812, 0.09932708740234375, 0.10342025756835938, 0.107513427734375, 0.11160659790039062, 0.11569976806640625, 0.11979293823242188, 0.1238861083984375, 0.12797927856445312, 0.13207244873046875, 0.13616561889648438, 0.1402587890625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 3.0, 14.0, 12.0, 19.0, 13.0, 24.0, 31.0, 44.0, 45.0, 71.0, 96.0, 85.0, 100.0, 76.0, 70.0, 64.0, 33.0, 42.0, 28.0, 20.0, 23.0, 16.0, 12.0, 10.0, 9.0, 8.0, 4.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011749267578125, -0.0011394768953323364, -0.0011040270328521729, -0.0010685771703720093, -0.0010331273078918457, -0.0009976774454116821, -0.0009622275829315186, -0.000926777720451355, -0.0008913278579711914, -0.0008558779954910278, -0.0008204281330108643, -0.0007849782705307007, -0.0007495284080505371, -0.0007140785455703735, -0.00067862868309021, -0.0006431788206100464, -0.0006077289581298828, -0.0005722790956497192, -0.0005368292331695557, -0.0005013793706893921, -0.0004659295082092285, -0.00043047964572906494, -0.00039502978324890137, -0.0003595799207687378, -0.0003241300582885742, -0.00028868019580841064, -0.00025323033332824707, -0.0002177804708480835, -0.00018233060836791992, -0.00014688074588775635, -0.00011143088340759277, -7.59810209274292e-05, -4.0531158447265625e-05, -5.081295967102051e-06, 3.0368566513061523e-05, 6.58184289932251e-05, 0.00010126829147338867, 0.00013671815395355225, 0.00017216801643371582, 0.0002076178789138794, 0.00024306774139404297, 0.00027851760387420654, 0.0003139674663543701, 0.0003494173288345337, 0.00038486719131469727, 0.00042031705379486084, 0.0004557669162750244, 0.000491216778755188, 0.0005266666412353516, 0.0005621165037155151, 0.0005975663661956787, 0.0006330162286758423, 0.0006684660911560059, 0.0007039159536361694, 0.000739365816116333, 0.0007748156785964966, 0.0008102655410766602, 0.0008457154035568237, 0.0008811652660369873, 0.0009166151285171509, 0.0009520649909973145, 0.000987514853477478, 0.0010229647159576416, 0.0010584145784378052, 0.0010938644409179688]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 10.0, 7.0, 11.0, 12.0, 17.0, 21.0, 23.0, 29.0, 52.0, 54.0, 121.0, 276.0, 1337.0, 1016373.0, 29138.0, 600.0, 183.0, 79.0, 55.0, 36.0, 23.0, 16.0, 19.0, 11.0, 15.0, 2.0, 11.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0255584716796875, -0.02472853660583496, -0.023898601531982422, -0.023068666458129883, -0.022238731384277344, -0.021408796310424805, -0.020578861236572266, -0.019748926162719727, -0.018918991088867188, -0.01808905601501465, -0.01725912094116211, -0.01642918586730957, -0.015599250793457031, -0.014769315719604492, -0.013939380645751953, -0.013109445571899414, -0.012279510498046875, -0.011449575424194336, -0.010619640350341797, -0.009789705276489258, -0.008959770202636719, -0.00812983512878418, -0.007299900054931641, -0.0064699649810791016, -0.0056400299072265625, -0.0048100948333740234, -0.003980159759521484, -0.0031502246856689453, -0.0023202896118164062, -0.0014903545379638672, -0.0006604194641113281, 0.00016951560974121094, 0.00099945068359375, 0.001829385757446289, 0.002659320831298828, 0.003489255905151367, 0.004319190979003906, 0.005149126052856445, 0.005979061126708984, 0.0068089962005615234, 0.0076389312744140625, 0.008468866348266602, 0.00929880142211914, 0.01012873649597168, 0.010958671569824219, 0.011788606643676758, 0.012618541717529297, 0.013448476791381836, 0.014278411865234375, 0.015108346939086914, 0.015938282012939453, 0.016768217086791992, 0.01759815216064453, 0.01842808723449707, 0.01925802230834961, 0.02008795738220215, 0.020917892456054688, 0.021747827529907227, 0.022577762603759766, 0.023407697677612305, 0.024237632751464844, 0.025067567825317383, 0.025897502899169922, 0.02672743797302246, 0.027557373046875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 29.0, 973.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02001454494893551, -0.01960132271051407, -0.01918810047209263, -0.018774880096316338, -0.018361657857894897, -0.017948435619473457, -0.017535213381052017, -0.017121993005275726, -0.016708770766854286, -0.016295548528432846, -0.015882326290011406, -0.01546910498291254, -0.015055883675813675, -0.014642661437392235, -0.01422944013029337, -0.01381621789187193, -0.013402996584773064, -0.012989774346351624, -0.012576553039252758, -0.012163330800831318, -0.011750109493732452, -0.011336887255311012, -0.010923665948212147, -0.010510443709790707, -0.010097221471369267, -0.009683999232947826, -0.009270777925848961, -0.00885755568742752, -0.008444334380328655, -0.008031112141907215, -0.00761789083480835, -0.0072046685963869095, -0.006791446823626757, -0.006378225050866604, -0.005965003278106451, -0.005551781505346298, -0.005138559732586145, -0.004725337959825993, -0.0043121157214045525, -0.0038988941814750433, -0.0034856724087148905, -0.0030724506359547377, -0.002659228863194585, -0.0022460068576037884, -0.0018327852012589574, -0.0014195633120834827, -0.00100634153932333, -0.0005931197665631771, -0.0001798979938030243, 0.00023332380806095898, 0.0006465456099249423, 0.001059767440892756, 0.0014729892136529088, 0.0018862111028283834, 0.0022994328755885363, 0.002712654648348689, 0.003125876421108842, 0.0035390981938689947, 0.003952320199459791, 0.004365541972219944, 0.004778763744980097, 0.00519198551774025, 0.0056052072905004025, 0.006018429063260555, 0.006431650836020708]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 13.0, 13.0, 15.0, 18.0, 27.0, 27.0, 28.0, 45.0, 43.0, 45.0, 55.0, 43.0, 57.0, 52.0, 70.0, 61.0, 59.0, 53.0, 52.0, 38.0, 33.0, 38.0, 29.0, 22.0, 22.0, 13.0, 11.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008541345596313477, -0.000818164087831974, -0.0007821936160326004, -0.0007462231442332268, -0.0007102526724338531, -0.0006742822006344795, -0.0006383117288351059, -0.0006023412570357323, -0.0005663707852363586, -0.000530400313436985, -0.0004944298416376114, -0.00045845936983823776, -0.00042248889803886414, -0.0003865184262394905, -0.0003505479544401169, -0.00031457748264074326, -0.00027860701084136963, -0.000242636539041996, -0.00020666606724262238, -0.00017069559544324875, -0.00013472512364387512, -9.87546518445015e-05, -6.278418004512787e-05, -2.6813708245754242e-05, 9.156763553619385e-06, 4.512723535299301e-05, 8.109770715236664e-05, 0.00011706817895174026, 0.0001530386507511139, 0.00018900912255048752, 0.00022497959434986115, 0.00026095006614923477, 0.0002969205379486084, 0.000332891009747982, 0.00036886148154735565, 0.0004048319533467293, 0.0004408024251461029, 0.00047677289694547653, 0.0005127433687448502, 0.0005487138405442238, 0.0005846843123435974, 0.000620654784142971, 0.0006566252559423447, 0.0006925957277417183, 0.0007285661995410919, 0.0007645366713404655, 0.0008005071431398392, 0.0008364776149392128, 0.0008724480867385864, 0.00090841855853796, 0.0009443890303373337, 0.0009803595021367073, 0.001016329973936081, 0.0010523004457354546, 0.0010882709175348282, 0.0011242413893342018, 0.0011602118611335754, 0.001196182332932949, 0.0012321528047323227, 0.0012681232765316963, 0.00130409374833107, 0.0013400642201304436, 0.0013760346919298172, 0.0014120051637291908, 0.0014479756355285645]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 6.0, 1.0, 5.0, 1.0, 8.0, 8.0, 8.0, 13.0, 20.0, 19.0, 18.0, 20.0, 29.0, 33.0, 34.0, 42.0, 34.0, 41.0, 40.0, 43.0, 42.0, 33.0, 49.0, 39.0, 44.0, 42.0, 35.0, 44.0, 26.0, 29.0, 35.0, 18.0, 22.0, 19.0, 17.0, 16.0, 12.0, 11.0, 7.0, 10.0, 5.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.0078125, -10.6531982421875, -10.298583984375, -9.9439697265625, -9.58935546875, -9.2347412109375, -8.880126953125, -8.5255126953125, -8.1708984375, -7.8162841796875, -7.461669921875, -7.1070556640625, -6.75244140625, -6.3978271484375, -6.043212890625, -5.6885986328125, -5.333984375, -4.9793701171875, -4.624755859375, -4.2701416015625, -3.91552734375, -3.5609130859375, -3.206298828125, -2.8516845703125, -2.4970703125, -2.1424560546875, -1.787841796875, -1.4332275390625, -1.07861328125, -0.7239990234375, -0.369384765625, -0.0147705078125, 0.33984375, 0.6944580078125, 1.049072265625, 1.4036865234375, 1.75830078125, 2.1129150390625, 2.467529296875, 2.8221435546875, 3.1767578125, 3.5313720703125, 3.885986328125, 4.2406005859375, 4.59521484375, 4.9498291015625, 5.304443359375, 5.6590576171875, 6.013671875, 6.3682861328125, 6.722900390625, 7.0775146484375, 7.43212890625, 7.7867431640625, 8.141357421875, 8.4959716796875, 8.8505859375, 9.2052001953125, 9.559814453125, 9.9144287109375, 10.26904296875, 10.6236572265625, 10.978271484375, 11.3328857421875, 11.6875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 13.0, 24.0, 36.0, 32.0, 62.0, 83.0, 118.0, 162.0, 286.0, 381.0, 584.0, 940.0, 1550.0, 2575.0, 4714.0, 8813.0, 17360.0, 41374.0, 235358.0, 623616.0, 62569.0, 23148.0, 10850.0, 5678.0, 3063.0, 1905.0, 1146.0, 760.0, 433.0, 313.0, 183.0, 122.0, 89.0, 52.0, 57.0, 28.0, 28.0, 5.0, 13.0, 9.0, 11.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.8125, -16.170166015625, -15.52783203125, -14.885498046875, -14.2431640625, -13.600830078125, -12.95849609375, -12.316162109375, -11.673828125, -11.031494140625, -10.38916015625, -9.746826171875, -9.1044921875, -8.462158203125, -7.81982421875, -7.177490234375, -6.53515625, -5.892822265625, -5.25048828125, -4.608154296875, -3.9658203125, -3.323486328125, -2.68115234375, -2.038818359375, -1.396484375, -0.754150390625, -0.11181640625, 0.530517578125, 1.1728515625, 1.815185546875, 2.45751953125, 3.099853515625, 3.7421875, 4.384521484375, 5.02685546875, 5.669189453125, 6.3115234375, 6.953857421875, 7.59619140625, 8.238525390625, 8.880859375, 9.523193359375, 10.16552734375, 10.807861328125, 11.4501953125, 12.092529296875, 12.73486328125, 13.377197265625, 14.01953125, 14.661865234375, 15.30419921875, 15.946533203125, 16.5888671875, 17.231201171875, 17.87353515625, 18.515869140625, 19.158203125, 19.800537109375, 20.44287109375, 21.085205078125, 21.7275390625, 22.369873046875, 23.01220703125, 23.654541015625, 24.296875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 7.0, 7.0, 10.0, 9.0, 18.0, 14.0, 23.0, 24.0, 25.0, 24.0, 34.0, 37.0, 33.0, 45.0, 50.0, 61.0, 85.0, 192.0, 1723.0, 121.0, 81.0, 58.0, 56.0, 44.0, 32.0, 28.0, 26.0, 34.0, 25.0, 16.0, 25.0, 11.0, 5.0, 20.0, 10.0, 9.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.34375, -31.27734375, -30.2109375, -29.14453125, -28.078125, -27.01171875, -25.9453125, -24.87890625, -23.8125, -22.74609375, -21.6796875, -20.61328125, -19.546875, -18.48046875, -17.4140625, -16.34765625, -15.28125, -14.21484375, -13.1484375, -12.08203125, -11.015625, -9.94921875, -8.8828125, -7.81640625, -6.75, -5.68359375, -4.6171875, -3.55078125, -2.484375, -1.41796875, -0.3515625, 0.71484375, 1.78125, 2.84765625, 3.9140625, 4.98046875, 6.046875, 7.11328125, 8.1796875, 9.24609375, 10.3125, 11.37890625, 12.4453125, 13.51171875, 14.578125, 15.64453125, 16.7109375, 17.77734375, 18.84375, 19.91015625, 20.9765625, 22.04296875, 23.109375, 24.17578125, 25.2421875, 26.30859375, 27.375, 28.44140625, 29.5078125, 30.57421875, 31.640625, 32.70703125, 33.7734375, 34.83984375, 35.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 6.0, 7.0, 11.0, 13.0, 33.0, 35.0, 35.0, 51.0, 71.0, 93.0, 127.0, 216.0, 364.0, 1078.0, 4535.0, 36465.0, 2971330.0, 119285.0, 8852.0, 1730.0, 544.0, 243.0, 172.0, 103.0, 71.0, 59.0, 38.0, 34.0, 21.0, 20.0, 10.0, 11.0, 14.0, 7.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.8125, -64.4833984375, -62.154296875, -59.8251953125, -57.49609375, -55.1669921875, -52.837890625, -50.5087890625, -48.1796875, -45.8505859375, -43.521484375, -41.1923828125, -38.86328125, -36.5341796875, -34.205078125, -31.8759765625, -29.546875, -27.2177734375, -24.888671875, -22.5595703125, -20.23046875, -17.9013671875, -15.572265625, -13.2431640625, -10.9140625, -8.5849609375, -6.255859375, -3.9267578125, -1.59765625, 0.7314453125, 3.060546875, 5.3896484375, 7.71875, 10.0478515625, 12.376953125, 14.7060546875, 17.03515625, 19.3642578125, 21.693359375, 24.0224609375, 26.3515625, 28.6806640625, 31.009765625, 33.3388671875, 35.66796875, 37.9970703125, 40.326171875, 42.6552734375, 44.984375, 47.3134765625, 49.642578125, 51.9716796875, 54.30078125, 56.6298828125, 58.958984375, 61.2880859375, 63.6171875, 65.9462890625, 68.275390625, 70.6044921875, 72.93359375, 75.2626953125, 77.591796875, 79.9208984375, 82.25]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 122.0, 866.0, 27.0], "bins": [-1239.0430908203125, -1219.1612548828125, -1199.279296875, -1179.3974609375, -1159.515625, -1139.6337890625, -1119.7518310546875, -1099.8699951171875, -1079.9881591796875, -1060.1063232421875, -1040.224365234375, -1020.342529296875, -1000.460693359375, -980.5787963867188, -960.6968994140625, -940.8150634765625, -920.93310546875, -901.0512084960938, -881.1693725585938, -861.2874755859375, -841.4056396484375, -821.5237426757812, -801.641845703125, -781.760009765625, -761.878173828125, -741.9962768554688, -722.1144409179688, -702.2325439453125, -682.3507080078125, -662.4688110351562, -642.5869140625, -622.705078125, -602.8231811523438, -582.9412841796875, -563.0594482421875, -543.1775512695312, -523.2957153320312, -503.413818359375, -483.5319519042969, -463.65008544921875, -443.7681884765625, -423.8863220214844, -404.00445556640625, -384.12255859375, -364.2406921386719, -344.35882568359375, -324.4769592285156, -304.5950927734375, -284.71319580078125, -264.8313293457031, -244.94944763183594, -225.0675811767578, -205.18569946289062, -185.3038330078125, -165.42196655273438, -145.5400848388672, -125.65821838378906, -105.7763442993164, -85.89447021484375, -66.01260375976562, -46.13072967529297, -26.248855590820312, -6.3669891357421875, 13.514892578125, 33.39675521850586]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 7.0, 6.0, 10.0, 5.0, 6.0, 13.0, 14.0, 18.0, 23.0, 19.0, 21.0, 32.0, 28.0, 34.0, 34.0, 29.0, 35.0, 35.0, 31.0, 45.0, 38.0, 52.0, 36.0, 42.0, 38.0, 41.0, 35.0, 30.0, 29.0, 29.0, 30.0, 24.0, 13.0, 21.0, 12.0, 16.0, 13.0, 16.0, 10.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-78.21829223632812, -75.77754974365234, -73.33680725097656, -70.89607238769531, -68.45532989501953, -66.01458740234375, -63.57384490966797, -61.13310241699219, -58.69236373901367, -56.25162124633789, -53.810882568359375, -51.370140075683594, -48.92939758300781, -46.4886589050293, -44.047916412353516, -41.607177734375, -39.16643524169922, -36.72569274902344, -34.28495407104492, -31.84421157836914, -29.403470993041992, -26.962730407714844, -24.521987915039062, -22.081247329711914, -19.640506744384766, -17.199766159057617, -14.759024620056152, -12.318283081054688, -9.877542495727539, -7.436801910400391, -4.996060371398926, -2.555318832397461, -0.11458587646484375, 2.326155185699463, 4.7668962478637695, 7.207637310028076, 9.648378372192383, 12.089118957519531, 14.529860496520996, 16.97060203552246, 19.41134262084961, 21.852083206176758, 24.292823791503906, 26.733566284179688, 29.174306869506836, 31.615047454833984, 34.055789947509766, 36.49652862548828, 38.93727111816406, 41.378013610839844, 43.81875228881836, 46.25949478149414, 48.700233459472656, 51.14097595214844, 53.58171844482422, 56.0224609375, 58.463199615478516, 60.9039421081543, 63.34468078613281, 65.7854232788086, 68.22616577148438, 70.66690063476562, 73.1076431274414, 75.54838562011719, 77.98912811279297]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 3.0, 6.0, 7.0, 10.0, 9.0, 14.0, 9.0, 14.0, 19.0, 23.0, 31.0, 28.0, 34.0, 26.0, 38.0, 33.0, 30.0, 40.0, 40.0, 41.0, 31.0, 34.0, 35.0, 44.0, 38.0, 38.0, 31.0, 35.0, 32.0, 29.0, 25.0, 23.0, 26.0, 17.0, 12.0, 7.0, 17.0, 8.0, 9.0, 9.0, 5.0, 10.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-11.2421875, -10.89111328125, -10.5400390625, -10.18896484375, -9.837890625, -9.48681640625, -9.1357421875, -8.78466796875, -8.43359375, -8.08251953125, -7.7314453125, -7.38037109375, -7.029296875, -6.67822265625, -6.3271484375, -5.97607421875, -5.625, -5.27392578125, -4.9228515625, -4.57177734375, -4.220703125, -3.86962890625, -3.5185546875, -3.16748046875, -2.81640625, -2.46533203125, -2.1142578125, -1.76318359375, -1.412109375, -1.06103515625, -0.7099609375, -0.35888671875, -0.0078125, 0.34326171875, 0.6943359375, 1.04541015625, 1.396484375, 1.74755859375, 2.0986328125, 2.44970703125, 2.80078125, 3.15185546875, 3.5029296875, 3.85400390625, 4.205078125, 4.55615234375, 4.9072265625, 5.25830078125, 5.609375, 5.96044921875, 6.3115234375, 6.66259765625, 7.013671875, 7.36474609375, 7.7158203125, 8.06689453125, 8.41796875, 8.76904296875, 9.1201171875, 9.47119140625, 9.822265625, 10.17333984375, 10.5244140625, 10.87548828125, 11.2265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 8.0, 8.0, 12.0, 14.0, 18.0, 19.0, 20.0, 26.0, 46.0, 70.0, 124.0, 200.0, 383.0, 794.0, 2090.0, 6047.0, 21449.0, 234319.0, 3529361.0, 362935.0, 25184.0, 6684.0, 2394.0, 986.0, 445.0, 224.0, 110.0, 77.0, 53.0, 41.0, 19.0, 27.0, 15.0, 11.0, 8.0, 10.0, 11.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.5, -38.16357421875, -36.8271484375, -35.49072265625, -34.154296875, -32.81787109375, -31.4814453125, -30.14501953125, -28.80859375, -27.47216796875, -26.1357421875, -24.79931640625, -23.462890625, -22.12646484375, -20.7900390625, -19.45361328125, -18.1171875, -16.78076171875, -15.4443359375, -14.10791015625, -12.771484375, -11.43505859375, -10.0986328125, -8.76220703125, -7.42578125, -6.08935546875, -4.7529296875, -3.41650390625, -2.080078125, -0.74365234375, 0.5927734375, 1.92919921875, 3.265625, 4.60205078125, 5.9384765625, 7.27490234375, 8.611328125, 9.94775390625, 11.2841796875, 12.62060546875, 13.95703125, 15.29345703125, 16.6298828125, 17.96630859375, 19.302734375, 20.63916015625, 21.9755859375, 23.31201171875, 24.6484375, 25.98486328125, 27.3212890625, 28.65771484375, 29.994140625, 31.33056640625, 32.6669921875, 34.00341796875, 35.33984375, 36.67626953125, 38.0126953125, 39.34912109375, 40.685546875, 42.02197265625, 43.3583984375, 44.69482421875, 46.03125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 9.0, 13.0, 10.0, 16.0, 17.0, 24.0, 42.0, 43.0, 59.0, 70.0, 121.0, 205.0, 390.0, 726.0, 872.0, 573.0, 323.0, 185.0, 109.0, 71.0, 63.0, 28.0, 37.0, 11.0, 7.0, 9.0, 8.0, 3.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-32.28125, -31.438720703125, -30.59619140625, -29.753662109375, -28.9111328125, -28.068603515625, -27.22607421875, -26.383544921875, -25.541015625, -24.698486328125, -23.85595703125, -23.013427734375, -22.1708984375, -21.328369140625, -20.48583984375, -19.643310546875, -18.80078125, -17.958251953125, -17.11572265625, -16.273193359375, -15.4306640625, -14.588134765625, -13.74560546875, -12.903076171875, -12.060546875, -11.218017578125, -10.37548828125, -9.532958984375, -8.6904296875, -7.847900390625, -7.00537109375, -6.162841796875, -5.3203125, -4.477783203125, -3.63525390625, -2.792724609375, -1.9501953125, -1.107666015625, -0.26513671875, 0.577392578125, 1.419921875, 2.262451171875, 3.10498046875, 3.947509765625, 4.7900390625, 5.632568359375, 6.47509765625, 7.317626953125, 8.16015625, 9.002685546875, 9.84521484375, 10.687744140625, 11.5302734375, 12.372802734375, 13.21533203125, 14.057861328125, 14.900390625, 15.742919921875, 16.58544921875, 17.427978515625, 18.2705078125, 19.113037109375, 19.95556640625, 20.798095703125, 21.640625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 6.0, 7.0, 8.0, 2.0, 9.0, 15.0, 33.0, 36.0, 54.0, 76.0, 142.0, 292.0, 1007.0, 22037.0, 4091031.0, 76887.0, 1793.0, 362.0, 147.0, 82.0, 62.0, 42.0, 38.0, 24.0, 21.0, 12.0, 11.0, 15.0, 7.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.25, -125.359375, -120.46875, -115.578125, -110.6875, -105.796875, -100.90625, -96.015625, -91.125, -86.234375, -81.34375, -76.453125, -71.5625, -66.671875, -61.78125, -56.890625, -52.0, -47.109375, -42.21875, -37.328125, -32.4375, -27.546875, -22.65625, -17.765625, -12.875, -7.984375, -3.09375, 1.796875, 6.6875, 11.578125, 16.46875, 21.359375, 26.25, 31.140625, 36.03125, 40.921875, 45.8125, 50.703125, 55.59375, 60.484375, 65.375, 70.265625, 75.15625, 80.046875, 84.9375, 89.828125, 94.71875, 99.609375, 104.5, 109.390625, 114.28125, 119.171875, 124.0625, 128.953125, 133.84375, 138.734375, 143.625, 148.515625, 153.40625, 158.296875, 163.1875, 168.078125, 172.96875, 177.859375, 182.75]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 15.0, 39.0, 62.0, 133.0, 234.0, 234.0, 154.0, 82.0, 32.0, 11.0, 7.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-260.8446960449219, -255.1780548095703, -249.51141357421875, -243.8447723388672, -238.17813110351562, -232.51148986816406, -226.8448486328125, -221.17822265625, -215.51156616210938, -209.8449249267578, -204.17828369140625, -198.5116424560547, -192.84500122070312, -187.17835998535156, -181.51171875, -175.8450927734375, -170.17845153808594, -164.51181030273438, -158.8451690673828, -153.17852783203125, -147.5118865966797, -141.84524536132812, -136.17861938476562, -130.511962890625, -124.84532928466797, -119.1786880493164, -113.51204681396484, -107.84541320800781, -102.17877197265625, -96.51213073730469, -90.84548950195312, -85.17884826660156, -79.51219177246094, -73.84555053710938, -68.17890930175781, -62.512271881103516, -56.84563064575195, -51.17898941040039, -45.512351989746094, -39.84571075439453, -34.17906951904297, -28.512428283691406, -22.845788955688477, -17.179149627685547, -11.512508392333984, -5.845867156982422, -0.179229736328125, 5.4874114990234375, 11.154052734375, 16.820693969726562, 22.487333297729492, 28.153972625732422, 33.820613861083984, 39.48725509643555, 45.153892517089844, 50.820533752441406, 56.48717498779297, 62.15381622314453, 67.8204574584961, 73.48709106445312, 79.15373229980469, 84.82037353515625, 90.48701477050781, 96.15365600585938, 101.82029724121094]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 7.0, 8.0, 7.0, 7.0, 19.0, 17.0, 12.0, 21.0, 17.0, 25.0, 18.0, 24.0, 31.0, 35.0, 38.0, 39.0, 25.0, 31.0, 41.0, 36.0, 37.0, 41.0, 38.0, 38.0, 36.0, 34.0, 50.0, 34.0, 24.0, 33.0, 27.0, 28.0, 20.0, 19.0, 12.0, 17.0, 10.0, 5.0, 9.0, 8.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-68.22395324707031, -66.15882110595703, -64.09368133544922, -62.02854919433594, -59.96341323852539, -57.898277282714844, -55.8331413269043, -53.76800537109375, -51.70287322998047, -49.63773727416992, -47.572601318359375, -45.507469177246094, -43.44233322143555, -41.377197265625, -39.31206130981445, -37.246925354003906, -35.18178939819336, -33.11665344238281, -31.0515193939209, -28.98638343811035, -26.921249389648438, -24.85611343383789, -22.790977478027344, -20.725841522216797, -18.660707473754883, -16.595571517944336, -14.530437469482422, -12.465301513671875, -10.400166511535645, -8.335031509399414, -6.269895553588867, -4.204760551452637, -2.1396255493164062, -0.07449030876159668, 1.990644931793213, 4.055780410766602, 6.120915412902832, 8.186050415039062, 10.25118637084961, 12.31632137298584, 14.38145637512207, 16.446592330932617, 18.51172637939453, 20.576862335205078, 22.641998291015625, 24.70713233947754, 26.772268295288086, 28.83740234375, 30.902538299560547, 32.967674255371094, 35.03281021118164, 37.09794616699219, 39.16307830810547, 41.228214263916016, 43.29335021972656, 45.35848617553711, 47.423622131347656, 49.4887580871582, 51.55389404296875, 53.61902618408203, 55.68416213989258, 57.749298095703125, 59.81443405151367, 61.87957000732422, 63.9447021484375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 6.0, 6.0, 3.0, 9.0, 13.0, 12.0, 21.0, 19.0, 21.0, 25.0, 27.0, 25.0, 39.0, 28.0, 35.0, 41.0, 27.0, 26.0, 38.0, 48.0, 45.0, 52.0, 49.0, 38.0, 41.0, 34.0, 35.0, 36.0, 19.0, 29.0, 23.0, 16.0, 23.0, 11.0, 19.0, 18.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.4022216796875, -10.023193359375, -9.6441650390625, -9.26513671875, -8.8861083984375, -8.507080078125, -8.1280517578125, -7.7490234375, -7.3699951171875, -6.990966796875, -6.6119384765625, -6.23291015625, -5.8538818359375, -5.474853515625, -5.0958251953125, -4.716796875, -4.3377685546875, -3.958740234375, -3.5797119140625, -3.20068359375, -2.8216552734375, -2.442626953125, -2.0635986328125, -1.6845703125, -1.3055419921875, -0.926513671875, -0.5474853515625, -0.16845703125, 0.2105712890625, 0.589599609375, 0.9686279296875, 1.34765625, 1.7266845703125, 2.105712890625, 2.4847412109375, 2.86376953125, 3.2427978515625, 3.621826171875, 4.0008544921875, 4.3798828125, 4.7589111328125, 5.137939453125, 5.5169677734375, 5.89599609375, 6.2750244140625, 6.654052734375, 7.0330810546875, 7.412109375, 7.7911376953125, 8.170166015625, 8.5491943359375, 8.92822265625, 9.3072509765625, 9.686279296875, 10.0653076171875, 10.4443359375, 10.8233642578125, 11.202392578125, 11.5814208984375, 11.96044921875, 12.3394775390625, 12.718505859375, 13.0975341796875, 13.4765625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 13.0, 22.0, 25.0, 39.0, 62.0, 89.0, 139.0, 243.0, 269.0, 428.0, 691.0, 1003.0, 1454.0, 2269.0, 3409.0, 5156.0, 7910.0, 12275.0, 19321.0, 30183.0, 48509.0, 77044.0, 120369.0, 187091.0, 191843.0, 123560.0, 78273.0, 49288.0, 31043.0, 19817.0, 12621.0, 8215.0, 5449.0, 3404.0, 2350.0, 1565.0, 1011.0, 704.0, 469.0, 307.0, 198.0, 134.0, 91.0, 56.0, 41.0, 32.0, 25.0, 15.0, 2.0, 10.0, 7.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.270751953125, -0.2625541687011719, -0.25435638427734375, -0.24615859985351562, -0.2379608154296875, -0.22976303100585938, -0.22156524658203125, -0.21336746215820312, -0.205169677734375, -0.19697189331054688, -0.18877410888671875, -0.18057632446289062, -0.1723785400390625, -0.16418075561523438, -0.15598297119140625, -0.14778518676757812, -0.13958740234375, -0.13138961791992188, -0.12319183349609375, -0.11499404907226562, -0.1067962646484375, -0.09859848022460938, -0.09040069580078125, -0.08220291137695312, -0.074005126953125, -0.06580734252929688, -0.05760955810546875, -0.049411773681640625, -0.0412139892578125, -0.033016204833984375, -0.02481842041015625, -0.016620635986328125, -0.0084228515625, -0.000225067138671875, 0.00797271728515625, 0.016170501708984375, 0.0243682861328125, 0.032566070556640625, 0.04076385498046875, 0.048961639404296875, 0.057159423828125, 0.06535720825195312, 0.07355499267578125, 0.08175277709960938, 0.0899505615234375, 0.09814834594726562, 0.10634613037109375, 0.11454391479492188, 0.12274169921875, 0.13093948364257812, 0.13913726806640625, 0.14733505249023438, 0.1555328369140625, 0.16373062133789062, 0.17192840576171875, 0.18012619018554688, 0.188323974609375, 0.19652175903320312, 0.20471954345703125, 0.21291732788085938, 0.2211151123046875, 0.22931289672851562, 0.23751068115234375, 0.24570846557617188, 0.25390625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 4.0, 6.0, 4.0, 12.0, 15.0, 14.0, 15.0, 27.0, 15.0, 15.0, 20.0, 18.0, 29.0, 27.0, 28.0, 33.0, 26.0, 33.0, 49.0, 35.0, 38.0, 1068.0, 42.0, 35.0, 37.0, 35.0, 39.0, 38.0, 35.0, 19.0, 21.0, 28.0, 26.0, 21.0, 15.0, 15.0, 13.0, 18.0, 10.0, 9.0, 8.0, 5.0, 10.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.9609375, -7.701904296875, -7.44287109375, -7.183837890625, -6.9248046875, -6.665771484375, -6.40673828125, -6.147705078125, -5.888671875, -5.629638671875, -5.37060546875, -5.111572265625, -4.8525390625, -4.593505859375, -4.33447265625, -4.075439453125, -3.81640625, -3.557373046875, -3.29833984375, -3.039306640625, -2.7802734375, -2.521240234375, -2.26220703125, -2.003173828125, -1.744140625, -1.485107421875, -1.22607421875, -0.967041015625, -0.7080078125, -0.448974609375, -0.18994140625, 0.069091796875, 0.328125, 0.587158203125, 0.84619140625, 1.105224609375, 1.3642578125, 1.623291015625, 1.88232421875, 2.141357421875, 2.400390625, 2.659423828125, 2.91845703125, 3.177490234375, 3.4365234375, 3.695556640625, 3.95458984375, 4.213623046875, 4.47265625, 4.731689453125, 4.99072265625, 5.249755859375, 5.5087890625, 5.767822265625, 6.02685546875, 6.285888671875, 6.544921875, 6.803955078125, 7.06298828125, 7.322021484375, 7.5810546875, 7.840087890625, 8.09912109375, 8.358154296875, 8.6171875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 6.0, 7.0, 11.0, 11.0, 19.0, 23.0, 38.0, 57.0, 92.0, 115.0, 174.0, 254.0, 324.0, 432.0, 681.0, 977.0, 1270.0, 1721.0, 2336.0, 3249.0, 4757.0, 6824.0, 9663.0, 13874.0, 20319.0, 29646.0, 44018.0, 67707.0, 106036.0, 172016.0, 1244791.0, 125251.0, 78771.0, 50890.0, 34106.0, 22939.0, 15990.0, 11174.0, 7684.0, 5576.0, 3761.0, 2725.0, 1924.0, 1426.0, 1023.0, 732.0, 494.0, 372.0, 240.0, 200.0, 129.0, 100.0, 58.0, 47.0, 34.0, 26.0, 9.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0], "bins": [-0.11517333984375, -0.11147880554199219, -0.10778427124023438, -0.10408973693847656, -0.10039520263671875, -0.09670066833496094, -0.09300613403320312, -0.08931159973144531, -0.0856170654296875, -0.08192253112792969, -0.07822799682617188, -0.07453346252441406, -0.07083892822265625, -0.06714439392089844, -0.06344985961914062, -0.05975532531738281, -0.056060791015625, -0.05236625671386719, -0.048671722412109375, -0.04497718811035156, -0.04128265380859375, -0.03758811950683594, -0.033893585205078125, -0.030199050903320312, -0.0265045166015625, -0.022809982299804688, -0.019115447998046875, -0.015420913696289062, -0.01172637939453125, -0.008031845092773438, -0.004337310791015625, -0.0006427764892578125, 0.0030517578125, 0.0067462921142578125, 0.010440826416015625, 0.014135360717773438, 0.01782989501953125, 0.021524429321289062, 0.025218963623046875, 0.028913497924804688, 0.0326080322265625, 0.03630256652832031, 0.039997100830078125, 0.04369163513183594, 0.04738616943359375, 0.05108070373535156, 0.054775238037109375, 0.05846977233886719, 0.062164306640625, 0.06585884094238281, 0.06955337524414062, 0.07324790954589844, 0.07694244384765625, 0.08063697814941406, 0.08433151245117188, 0.08802604675292969, 0.0917205810546875, 0.09541511535644531, 0.09910964965820312, 0.10280418395996094, 0.10649871826171875, 0.11019325256347656, 0.11388778686523438, 0.11758232116699219, 0.12127685546875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 8.0, 7.0, 11.0, 12.0, 12.0, 15.0, 29.0, 32.0, 28.0, 39.0, 41.0, 46.0, 56.0, 61.0, 62.0, 53.0, 67.0, 65.0, 59.0, 40.0, 44.0, 24.0, 28.0, 21.0, 18.0, 15.0, 11.0, 4.0, 9.0, 17.0, 3.0, 7.0, 1.0, 7.0, 2.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0006089210510253906, -0.0005890354514122009, -0.0005691498517990112, -0.0005492642521858215, -0.0005293786525726318, -0.0005094930529594421, -0.0004896074533462524, -0.00046972185373306274, -0.00044983625411987305, -0.00042995065450668335, -0.00041006505489349365, -0.00039017945528030396, -0.00037029385566711426, -0.00035040825605392456, -0.00033052265644073486, -0.00031063705682754517, -0.00029075145721435547, -0.00027086585760116577, -0.0002509802579879761, -0.00023109465837478638, -0.00021120905876159668, -0.00019132345914840698, -0.00017143785953521729, -0.0001515522599220276, -0.0001316666603088379, -0.0001117810606956482, -9.18954610824585e-05, -7.20098614692688e-05, -5.21242618560791e-05, -3.2238662242889404e-05, -1.2353062629699707e-05, 7.53253698348999e-06, 2.7418136596679688e-05, 4.7303736209869385e-05, 6.718933582305908e-05, 8.707493543624878e-05, 0.00010696053504943848, 0.00012684613466262817, 0.00014673173427581787, 0.00016661733388900757, 0.00018650293350219727, 0.00020638853311538696, 0.00022627413272857666, 0.00024615973234176636, 0.00026604533195495605, 0.00028593093156814575, 0.00030581653118133545, 0.00032570213079452515, 0.00034558773040771484, 0.00036547333002090454, 0.00038535892963409424, 0.00040524452924728394, 0.00042513012886047363, 0.00044501572847366333, 0.00046490132808685303, 0.0004847869277000427, 0.0005046725273132324, 0.0005245581269264221, 0.0005444437265396118, 0.0005643293261528015, 0.0005842149257659912, 0.0006041005253791809, 0.0006239861249923706, 0.0006438717246055603, 0.00066375732421875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 2.0, 7.0, 2.0, 4.0, 3.0, 19.0, 9.0, 4.0, 11.0, 14.0, 19.0, 26.0, 29.0, 36.0, 56.0, 69.0, 125.0, 234.0, 660.0, 17312.0, 1021426.0, 7418.0, 494.0, 185.0, 93.0, 58.0, 43.0, 46.0, 34.0, 18.0, 11.0, 11.0, 12.0, 8.0, 10.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.015869140625, -0.015394210815429688, -0.014919281005859375, -0.014444351196289062, -0.01396942138671875, -0.013494491577148438, -0.013019561767578125, -0.012544631958007812, -0.0120697021484375, -0.011594772338867188, -0.011119842529296875, -0.010644912719726562, -0.01016998291015625, -0.009695053100585938, -0.009220123291015625, -0.008745193481445312, -0.008270263671875, -0.0077953338623046875, -0.007320404052734375, -0.0068454742431640625, -0.00637054443359375, -0.0058956146240234375, -0.005420684814453125, -0.0049457550048828125, -0.0044708251953125, -0.0039958953857421875, -0.003520965576171875, -0.0030460357666015625, -0.00257110595703125, -0.0020961761474609375, -0.001621246337890625, -0.0011463165283203125, -0.00067138671875, -0.0001964569091796875, 0.000278472900390625, 0.0007534027099609375, 0.00122833251953125, 0.0017032623291015625, 0.002178192138671875, 0.0026531219482421875, 0.0031280517578125, 0.0036029815673828125, 0.004077911376953125, 0.0045528411865234375, 0.00502777099609375, 0.0055027008056640625, 0.005977630615234375, 0.0064525604248046875, 0.006927490234375, 0.0074024200439453125, 0.007877349853515625, 0.008352279663085938, 0.00882720947265625, 0.009302139282226562, 0.009777069091796875, 0.010251998901367188, 0.0107269287109375, 0.011201858520507812, 0.011676788330078125, 0.012151718139648438, 0.01262664794921875, 0.013101577758789062, 0.013576507568359375, 0.014051437377929688, 0.0145263671875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 31.0, 982.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026336494833230972, -0.025868872180581093, -0.025401249527931213, -0.024933626875281334, -0.024466004222631454, -0.023998383432626724, -0.023530758917331696, -0.023063138127326965, -0.022595515474677086, -0.022127892822027206, -0.021660270169377327, -0.021192647516727448, -0.020725024864077568, -0.02025740221142769, -0.01978978142142296, -0.01932215876877308, -0.0188545361161232, -0.01838691346347332, -0.01791929081082344, -0.01745166815817356, -0.01698404550552368, -0.01651642471551895, -0.016048800200223923, -0.015581178478896618, -0.015113554894924164, -0.014645932242274284, -0.014178309589624405, -0.013710686936974525, -0.01324306521564722, -0.012775442562997341, -0.012307819910347462, -0.011840197257697582, -0.011372575536370277, -0.010904952883720398, -0.010437330231070518, -0.009969707578420639, -0.009502085857093334, -0.009034463204443455, -0.008566840551793575, -0.008099217899143696, -0.007631596177816391, -0.0071639735251665115, -0.006696351338177919, -0.00622872868552804, -0.005761106498539448, -0.005293483845889568, -0.004825861193239689, -0.004358238540589809, -0.0038906161207705736, -0.003422993700951338, -0.0029553710483014584, -0.0024877486284822226, -0.0020201262086629868, -0.001552503788843751, -0.0010848811361938715, -0.0006172587163746357, -0.0001496362965553999, 0.0003179861814714968, 0.0007856086594983935, 0.0012532311957329512, 0.001720853615552187, 0.0021884760353714228, 0.0026560986880213022, 0.003123721107840538, 0.003591343527659774]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 10.0, 11.0, 18.0, 15.0, 23.0, 34.0, 52.0, 49.0, 55.0, 49.0, 71.0, 72.0, 79.0, 77.0, 70.0, 58.0, 49.0, 39.0, 45.0, 35.0, 24.0, 18.0, 16.0, 9.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008350610733032227, -0.0008047772571444511, -0.0007744934409856796, -0.0007442096248269081, -0.0007139258086681366, -0.0006836419925093651, -0.0006533581763505936, -0.000623074360191822, -0.0005927905440330505, -0.000562506727874279, -0.0005322229117155075, -0.000501939095556736, -0.0004716552793979645, -0.00044137146323919296, -0.00041108764708042145, -0.00038080383092164993, -0.0003505200147628784, -0.0003202361986041069, -0.0002899523824453354, -0.0002596685662865639, -0.00022938475012779236, -0.00019910093396902084, -0.00016881711781024933, -0.00013853330165147781, -0.0001082494854927063, -7.796566933393478e-05, -4.768185317516327e-05, -1.7398037016391754e-05, 1.288577914237976e-05, 4.3169595301151276e-05, 7.345341145992279e-05, 0.0001037372276186943, 0.00013402104377746582, 0.00016430485993623734, 0.00019458867609500885, 0.00022487249225378036, 0.0002551563084125519, 0.0002854401245713234, 0.0003157239407300949, 0.0003460077568888664, 0.00037629157304763794, 0.00040657538920640945, 0.00043685920536518097, 0.0004671430215239525, 0.000497426837682724, 0.0005277106538414955, 0.000557994470000267, 0.0005882782861590385, 0.0006185621023178101, 0.0006488459184765816, 0.0006791297346353531, 0.0007094135507941246, 0.0007396973669528961, 0.0007699811831116676, 0.0008002649992704391, 0.0008305488154292107, 0.0008608326315879822, 0.0008911164477467537, 0.0009214002639055252, 0.0009516840800642967, 0.0009819678962230682, 0.0010122517123818398, 0.0010425355285406113, 0.0010728193446993828, 0.0011031031608581543]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 6.0, 6.0, 3.0, 9.0, 13.0, 12.0, 21.0, 19.0, 21.0, 25.0, 27.0, 25.0, 39.0, 28.0, 35.0, 41.0, 27.0, 26.0, 38.0, 48.0, 45.0, 52.0, 49.0, 38.0, 41.0, 34.0, 35.0, 36.0, 19.0, 29.0, 23.0, 16.0, 23.0, 11.0, 19.0, 18.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.4022216796875, -10.023193359375, -9.6441650390625, -9.26513671875, -8.8861083984375, -8.507080078125, -8.1280517578125, -7.7490234375, -7.3699951171875, -6.990966796875, -6.6119384765625, -6.23291015625, -5.8538818359375, -5.474853515625, -5.0958251953125, -4.716796875, -4.3377685546875, -3.958740234375, -3.5797119140625, -3.20068359375, -2.8216552734375, -2.442626953125, -2.0635986328125, -1.6845703125, -1.3055419921875, -0.926513671875, -0.5474853515625, -0.16845703125, 0.2105712890625, 0.589599609375, 0.9686279296875, 1.34765625, 1.7266845703125, 2.105712890625, 2.4847412109375, 2.86376953125, 3.2427978515625, 3.621826171875, 4.0008544921875, 4.3798828125, 4.7589111328125, 5.137939453125, 5.5169677734375, 5.89599609375, 6.2750244140625, 6.654052734375, 7.0330810546875, 7.412109375, 7.7911376953125, 8.170166015625, 8.5491943359375, 8.92822265625, 9.3072509765625, 9.686279296875, 10.0653076171875, 10.4443359375, 10.8233642578125, 11.202392578125, 11.5814208984375, 11.96044921875, 12.3394775390625, 12.718505859375, 13.0975341796875, 13.4765625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 5.0, 12.0, 14.0, 19.0, 23.0, 44.0, 65.0, 88.0, 115.0, 177.0, 276.0, 396.0, 575.0, 926.0, 1383.0, 2385.0, 4006.0, 7459.0, 15303.0, 41789.0, 288605.0, 585906.0, 59489.0, 18574.0, 8836.0, 4786.0, 2726.0, 1656.0, 983.0, 597.0, 409.0, 269.0, 198.0, 131.0, 113.0, 62.0, 32.0, 39.0, 28.0, 14.0, 10.0, 6.0, 3.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1953125, -13.7078857421875, -13.220458984375, -12.7330322265625, -12.24560546875, -11.7581787109375, -11.270751953125, -10.7833251953125, -10.2958984375, -9.8084716796875, -9.321044921875, -8.8336181640625, -8.34619140625, -7.8587646484375, -7.371337890625, -6.8839111328125, -6.396484375, -5.9090576171875, -5.421630859375, -4.9342041015625, -4.44677734375, -3.9593505859375, -3.471923828125, -2.9844970703125, -2.4970703125, -2.0096435546875, -1.522216796875, -1.0347900390625, -0.54736328125, -0.0599365234375, 0.427490234375, 0.9149169921875, 1.40234375, 1.8897705078125, 2.377197265625, 2.8646240234375, 3.35205078125, 3.8394775390625, 4.326904296875, 4.8143310546875, 5.3017578125, 5.7891845703125, 6.276611328125, 6.7640380859375, 7.25146484375, 7.7388916015625, 8.226318359375, 8.7137451171875, 9.201171875, 9.6885986328125, 10.176025390625, 10.6634521484375, 11.15087890625, 11.6383056640625, 12.125732421875, 12.6131591796875, 13.1005859375, 13.5880126953125, 14.075439453125, 14.5628662109375, 15.05029296875, 15.5377197265625, 16.025146484375, 16.5125732421875, 17.0]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 9.0, 10.0, 8.0, 11.0, 15.0, 22.0, 19.0, 18.0, 29.0, 37.0, 33.0, 30.0, 39.0, 45.0, 54.0, 82.0, 171.0, 1812.0, 114.0, 86.0, 55.0, 44.0, 41.0, 41.0, 31.0, 40.0, 26.0, 33.0, 17.0, 14.0, 10.0, 10.0, 7.0, 6.0, 4.0, 7.0, 4.0, 2.0, 5.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-40.375, -39.12646484375, -37.8779296875, -36.62939453125, -35.380859375, -34.13232421875, -32.8837890625, -31.63525390625, -30.38671875, -29.13818359375, -27.8896484375, -26.64111328125, -25.392578125, -24.14404296875, -22.8955078125, -21.64697265625, -20.3984375, -19.14990234375, -17.9013671875, -16.65283203125, -15.404296875, -14.15576171875, -12.9072265625, -11.65869140625, -10.41015625, -9.16162109375, -7.9130859375, -6.66455078125, -5.416015625, -4.16748046875, -2.9189453125, -1.67041015625, -0.421875, 0.82666015625, 2.0751953125, 3.32373046875, 4.572265625, 5.82080078125, 7.0693359375, 8.31787109375, 9.56640625, 10.81494140625, 12.0634765625, 13.31201171875, 14.560546875, 15.80908203125, 17.0576171875, 18.30615234375, 19.5546875, 20.80322265625, 22.0517578125, 23.30029296875, 24.548828125, 25.79736328125, 27.0458984375, 28.29443359375, 29.54296875, 30.79150390625, 32.0400390625, 33.28857421875, 34.537109375, 35.78564453125, 37.0341796875, 38.28271484375, 39.53125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 1.0, 7.0, 7.0, 5.0, 6.0, 6.0, 13.0, 14.0, 17.0, 27.0, 36.0, 46.0, 48.0, 71.0, 95.0, 136.0, 340.0, 1119.0, 10193.0, 2881240.0, 245333.0, 5405.0, 832.0, 221.0, 128.0, 70.0, 54.0, 51.0, 35.0, 33.0, 26.0, 22.0, 13.0, 11.0, 9.0, 6.0, 13.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-91.125, -88.2666015625, -85.408203125, -82.5498046875, -79.69140625, -76.8330078125, -73.974609375, -71.1162109375, -68.2578125, -65.3994140625, -62.541015625, -59.6826171875, -56.82421875, -53.9658203125, -51.107421875, -48.2490234375, -45.390625, -42.5322265625, -39.673828125, -36.8154296875, -33.95703125, -31.0986328125, -28.240234375, -25.3818359375, -22.5234375, -19.6650390625, -16.806640625, -13.9482421875, -11.08984375, -8.2314453125, -5.373046875, -2.5146484375, 0.34375, 3.2021484375, 6.060546875, 8.9189453125, 11.77734375, 14.6357421875, 17.494140625, 20.3525390625, 23.2109375, 26.0693359375, 28.927734375, 31.7861328125, 34.64453125, 37.5029296875, 40.361328125, 43.2197265625, 46.078125, 48.9365234375, 51.794921875, 54.6533203125, 57.51171875, 60.3701171875, 63.228515625, 66.0869140625, 68.9453125, 71.8037109375, 74.662109375, 77.5205078125, 80.37890625, 83.2373046875, 86.095703125, 88.9541015625, 91.8125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 16.0, 193.0, 543.0, 232.0, 24.0, 5.0, 0.0, 2.0], "bins": [-378.1009826660156, -371.63995361328125, -365.17889404296875, -358.7178649902344, -352.2568054199219, -345.7957763671875, -339.334716796875, -332.8736877441406, -326.41265869140625, -319.9516296386719, -313.4905700683594, -307.029541015625, -300.5684814453125, -294.1074523925781, -287.64642333984375, -281.18536376953125, -274.72430419921875, -268.2632751464844, -261.8022155761719, -255.3411865234375, -248.88014221191406, -242.41909790039062, -235.9580535888672, -229.49700927734375, -223.03598022460938, -216.57493591308594, -210.1138916015625, -203.65286254882812, -197.1918182373047, -190.73077392578125, -184.2697296142578, -177.80868530273438, -171.34765625, -164.88661193847656, -158.42556762695312, -151.96453857421875, -145.5034942626953, -139.04244995117188, -132.58140563964844, -126.120361328125, -119.65933227539062, -113.19828796386719, -106.73725128173828, -100.27620697021484, -93.81517028808594, -87.3541259765625, -80.89308166503906, -74.43203735351562, -67.97099304199219, -61.509952545166016, -55.048912048339844, -48.587867736816406, -42.126827239990234, -35.66578674316406, -29.204742431640625, -22.743701934814453, -16.282665252685547, -9.821623802185059, -3.3605823516845703, 3.1004600524902344, 9.561500549316406, 16.022541046142578, 22.483585357666016, 28.944625854492188, 35.40566635131836]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 4.0, 5.0, 11.0, 11.0, 7.0, 19.0, 15.0, 14.0, 22.0, 25.0, 24.0, 27.0, 26.0, 25.0, 32.0, 29.0, 38.0, 34.0, 39.0, 33.0, 40.0, 45.0, 38.0, 45.0, 38.0, 32.0, 26.0, 29.0, 25.0, 24.0, 24.0, 18.0, 23.0, 22.0, 16.0, 24.0, 16.0, 8.0, 15.0, 8.0, 5.0, 4.0, 10.0, 3.0, 6.0, 5.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-84.20744323730469, -81.36939239501953, -78.53133392333984, -75.69328308105469, -72.855224609375, -70.01717376708984, -67.17912292480469, -64.341064453125, -61.503013610839844, -58.66495895385742, -55.826904296875, -52.988853454589844, -50.15079879760742, -47.312744140625, -44.474693298339844, -41.63663864135742, -38.798583984375, -35.96052932739258, -33.122474670410156, -30.284423828125, -27.446369171142578, -24.608314514160156, -21.770261764526367, -18.932209014892578, -16.094154357910156, -13.25610065460205, -10.418046951293945, -7.57999324798584, -4.741939544677734, -1.903885841369629, 0.9341678619384766, 3.7722206115722656, 6.6102752685546875, 9.448328971862793, 12.286382675170898, 15.124436378479004, 17.96249008178711, 20.80054473876953, 23.63859748840332, 26.47665023803711, 29.31470489501953, 32.15275955200195, 34.990814208984375, 37.82886505126953, 40.66691970825195, 43.504974365234375, 46.34302520751953, 49.18107986450195, 52.019134521484375, 54.8571891784668, 57.69524383544922, 60.533294677734375, 63.3713493347168, 66.20940399169922, 69.04745483398438, 71.88551330566406, 74.72356414794922, 77.56161499023438, 80.39967346191406, 83.23772430419922, 86.07577514648438, 88.91383361816406, 91.75188446044922, 94.58993530273438, 97.42799377441406]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 8.0, 7.0, 13.0, 15.0, 18.0, 22.0, 23.0, 22.0, 27.0, 27.0, 37.0, 30.0, 31.0, 33.0, 31.0, 34.0, 40.0, 34.0, 48.0, 44.0, 47.0, 39.0, 31.0, 46.0, 38.0, 32.0, 23.0, 25.0, 19.0, 20.0, 20.0, 18.0, 13.0, 13.0, 7.0, 11.0, 12.0, 8.0, 4.0, 3.0, 2.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.6953125, -11.310546875, -10.92578125, -10.541015625, -10.15625, -9.771484375, -9.38671875, -9.001953125, -8.6171875, -8.232421875, -7.84765625, -7.462890625, -7.078125, -6.693359375, -6.30859375, -5.923828125, -5.5390625, -5.154296875, -4.76953125, -4.384765625, -4.0, -3.615234375, -3.23046875, -2.845703125, -2.4609375, -2.076171875, -1.69140625, -1.306640625, -0.921875, -0.537109375, -0.15234375, 0.232421875, 0.6171875, 1.001953125, 1.38671875, 1.771484375, 2.15625, 2.541015625, 2.92578125, 3.310546875, 3.6953125, 4.080078125, 4.46484375, 4.849609375, 5.234375, 5.619140625, 6.00390625, 6.388671875, 6.7734375, 7.158203125, 7.54296875, 7.927734375, 8.3125, 8.697265625, 9.08203125, 9.466796875, 9.8515625, 10.236328125, 10.62109375, 11.005859375, 11.390625, 11.775390625, 12.16015625, 12.544921875, 12.9296875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 14.0, 24.0, 26.0, 42.0, 50.0, 81.0, 123.0, 172.0, 232.0, 317.0, 463.0, 723.0, 1092.0, 1612.0, 2520.0, 3823.0, 6411.0, 10861.0, 20646.0, 49804.0, 157302.0, 576315.0, 1623025.0, 1191677.0, 378867.0, 97068.0, 32230.0, 15359.0, 8634.0, 5103.0, 3222.0, 2047.0, 1459.0, 915.0, 545.0, 407.0, 309.0, 211.0, 152.0, 122.0, 79.0, 56.0, 30.0, 26.0, 19.0, 18.0, 13.0, 9.0, 8.0, 6.0, 2.0, 6.0, 0.0, 3.0, 1.0], "bins": [-14.421875, -13.9686279296875, -13.515380859375, -13.0621337890625, -12.60888671875, -12.1556396484375, -11.702392578125, -11.2491455078125, -10.7958984375, -10.3426513671875, -9.889404296875, -9.4361572265625, -8.98291015625, -8.5296630859375, -8.076416015625, -7.6231689453125, -7.169921875, -6.7166748046875, -6.263427734375, -5.8101806640625, -5.35693359375, -4.9036865234375, -4.450439453125, -3.9971923828125, -3.5439453125, -3.0906982421875, -2.637451171875, -2.1842041015625, -1.73095703125, -1.2777099609375, -0.824462890625, -0.3712158203125, 0.08203125, 0.5352783203125, 0.988525390625, 1.4417724609375, 1.89501953125, 2.3482666015625, 2.801513671875, 3.2547607421875, 3.7080078125, 4.1612548828125, 4.614501953125, 5.0677490234375, 5.52099609375, 5.9742431640625, 6.427490234375, 6.8807373046875, 7.333984375, 7.7872314453125, 8.240478515625, 8.6937255859375, 9.14697265625, 9.6002197265625, 10.053466796875, 10.5067138671875, 10.9599609375, 11.4132080078125, 11.866455078125, 12.3197021484375, 12.77294921875, 13.2261962890625, 13.679443359375, 14.1326904296875, 14.5859375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 3.0, 5.0, 10.0, 9.0, 13.0, 22.0, 34.0, 35.0, 52.0, 64.0, 81.0, 154.0, 226.0, 411.0, 695.0, 823.0, 589.0, 311.0, 167.0, 104.0, 63.0, 57.0, 34.0, 23.0, 20.0, 20.0, 17.0, 10.0, 11.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.96875, -35.07568359375, -34.1826171875, -33.28955078125, -32.396484375, -31.50341796875, -30.6103515625, -29.71728515625, -28.82421875, -27.93115234375, -27.0380859375, -26.14501953125, -25.251953125, -24.35888671875, -23.4658203125, -22.57275390625, -21.6796875, -20.78662109375, -19.8935546875, -19.00048828125, -18.107421875, -17.21435546875, -16.3212890625, -15.42822265625, -14.53515625, -13.64208984375, -12.7490234375, -11.85595703125, -10.962890625, -10.06982421875, -9.1767578125, -8.28369140625, -7.390625, -6.49755859375, -5.6044921875, -4.71142578125, -3.818359375, -2.92529296875, -2.0322265625, -1.13916015625, -0.24609375, 0.64697265625, 1.5400390625, 2.43310546875, 3.326171875, 4.21923828125, 5.1123046875, 6.00537109375, 6.8984375, 7.79150390625, 8.6845703125, 9.57763671875, 10.470703125, 11.36376953125, 12.2568359375, 13.14990234375, 14.04296875, 14.93603515625, 15.8291015625, 16.72216796875, 17.615234375, 18.50830078125, 19.4013671875, 20.29443359375, 21.1875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 5.0, 7.0, 13.0, 19.0, 15.0, 23.0, 32.0, 29.0, 63.0, 97.0, 219.0, 536.0, 3075.0, 75594.0, 4028231.0, 82041.0, 3088.0, 594.0, 230.0, 106.0, 80.0, 48.0, 32.0, 35.0, 17.0, 12.0, 15.0, 4.0, 6.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.4375, -83.8701171875, -80.302734375, -76.7353515625, -73.16796875, -69.6005859375, -66.033203125, -62.4658203125, -58.8984375, -55.3310546875, -51.763671875, -48.1962890625, -44.62890625, -41.0615234375, -37.494140625, -33.9267578125, -30.359375, -26.7919921875, -23.224609375, -19.6572265625, -16.08984375, -12.5224609375, -8.955078125, -5.3876953125, -1.8203125, 1.7470703125, 5.314453125, 8.8818359375, 12.44921875, 16.0166015625, 19.583984375, 23.1513671875, 26.71875, 30.2861328125, 33.853515625, 37.4208984375, 40.98828125, 44.5556640625, 48.123046875, 51.6904296875, 55.2578125, 58.8251953125, 62.392578125, 65.9599609375, 69.52734375, 73.0947265625, 76.662109375, 80.2294921875, 83.796875, 87.3642578125, 90.931640625, 94.4990234375, 98.06640625, 101.6337890625, 105.201171875, 108.7685546875, 112.3359375, 115.9033203125, 119.470703125, 123.0380859375, 126.60546875, 130.1728515625, 133.740234375, 137.3076171875, 140.875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 21.0, 43.0, 104.0, 225.0, 298.0, 188.0, 87.0, 32.0, 12.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-356.9347229003906, -350.2441101074219, -343.5534973144531, -336.8628845214844, -330.1722717285156, -323.48162841796875, -316.791015625, -310.10040283203125, -303.4097900390625, -296.71917724609375, -290.028564453125, -283.33795166015625, -276.6473388671875, -269.95672607421875, -263.2660827636719, -256.5754699707031, -249.88485717773438, -243.19424438476562, -236.50363159179688, -229.81300354003906, -223.1223907470703, -216.43177795410156, -209.7411651611328, -203.050537109375, -196.3599395751953, -189.66932678222656, -182.9787139892578, -176.2880859375, -169.59747314453125, -162.9068603515625, -156.21624755859375, -149.525634765625, -142.8350067138672, -136.14439392089844, -129.4537811279297, -122.7631607055664, -116.07254028320312, -109.38192749023438, -102.69131469726562, -96.00069427490234, -89.31007385253906, -82.61946105957031, -75.92884063720703, -69.23822784423828, -62.547607421875, -55.85699462890625, -49.166378021240234, -42.47576141357422, -35.78514862060547, -29.094532012939453, -22.403915405273438, -15.713300704956055, -9.022684097290039, -2.3320693969726562, 4.358547210693359, 11.049163818359375, 17.73978042602539, 24.430397033691406, 31.121013641357422, 37.81163024902344, 44.50224304199219, 51.1928596496582, 57.88347625732422, 64.5740966796875, 71.26470947265625]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 1.0, 5.0, 11.0, 5.0, 11.0, 8.0, 9.0, 14.0, 8.0, 14.0, 12.0, 14.0, 17.0, 15.0, 24.0, 22.0, 24.0, 30.0, 30.0, 38.0, 25.0, 39.0, 39.0, 46.0, 25.0, 45.0, 43.0, 23.0, 39.0, 31.0, 29.0, 31.0, 34.0, 27.0, 33.0, 14.0, 31.0, 16.0, 11.0, 26.0, 10.0, 12.0, 12.0, 14.0, 7.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-61.083892822265625, -59.129764556884766, -57.175636291503906, -55.22150802612305, -53.26737976074219, -51.313255310058594, -49.359127044677734, -47.404998779296875, -45.450870513916016, -43.496742248535156, -41.5426139831543, -39.58848571777344, -37.634361267089844, -35.68022918701172, -33.726104736328125, -31.771976470947266, -29.817848205566406, -27.863719940185547, -25.909591674804688, -23.95546531677246, -22.0013370513916, -20.047208786010742, -18.093082427978516, -16.138954162597656, -14.184825897216797, -12.230697631835938, -10.276570320129395, -8.322443008422852, -6.368314743041992, -4.414186477661133, -2.46005916595459, -0.5059318542480469, 1.4481964111328125, 3.4023241996765137, 5.356451988220215, 7.310579776763916, 9.264707565307617, 11.218835830688477, 13.17296314239502, 15.127090454101562, 17.081218719482422, 19.03534698486328, 20.98947525024414, 22.943601608276367, 24.897729873657227, 26.851858139038086, 28.805984497070312, 30.760112762451172, 32.71424102783203, 34.66836929321289, 36.62249755859375, 38.57662582397461, 40.53075408935547, 42.48487854003906, 44.43900680541992, 46.39313507080078, 48.34726333618164, 50.3013916015625, 52.25551986694336, 54.20964813232422, 56.16377258300781, 58.11790466308594, 60.07202911376953, 62.02615737915039, 63.98028564453125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 8.0, 12.0, 9.0, 17.0, 14.0, 14.0, 22.0, 25.0, 27.0, 20.0, 30.0, 31.0, 34.0, 29.0, 38.0, 39.0, 45.0, 35.0, 22.0, 34.0, 45.0, 42.0, 41.0, 32.0, 44.0, 34.0, 41.0, 26.0, 21.0, 25.0, 19.0, 20.0, 16.0, 22.0, 15.0, 8.0, 6.0, 5.0, 7.0, 2.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.8018798828125, -10.431884765625, -10.0618896484375, -9.69189453125, -9.3218994140625, -8.951904296875, -8.5819091796875, -8.2119140625, -7.8419189453125, -7.471923828125, -7.1019287109375, -6.73193359375, -6.3619384765625, -5.991943359375, -5.6219482421875, -5.251953125, -4.8819580078125, -4.511962890625, -4.1419677734375, -3.77197265625, -3.4019775390625, -3.031982421875, -2.6619873046875, -2.2919921875, -1.9219970703125, -1.552001953125, -1.1820068359375, -0.81201171875, -0.4420166015625, -0.072021484375, 0.2979736328125, 0.66796875, 1.0379638671875, 1.407958984375, 1.7779541015625, 2.14794921875, 2.5179443359375, 2.887939453125, 3.2579345703125, 3.6279296875, 3.9979248046875, 4.367919921875, 4.7379150390625, 5.10791015625, 5.4779052734375, 5.847900390625, 6.2178955078125, 6.587890625, 6.9578857421875, 7.327880859375, 7.6978759765625, 8.06787109375, 8.4378662109375, 8.807861328125, 9.1778564453125, 9.5478515625, 9.9178466796875, 10.287841796875, 10.6578369140625, 11.02783203125, 11.3978271484375, 11.767822265625, 12.1378173828125, 12.5078125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 9.0, 12.0, 20.0, 34.0, 33.0, 58.0, 89.0, 116.0, 192.0, 279.0, 402.0, 584.0, 900.0, 1293.0, 1802.0, 2693.0, 4068.0, 6039.0, 9374.0, 14132.0, 21761.0, 34075.0, 52989.0, 82495.0, 129726.0, 193510.0, 175237.0, 113171.0, 71329.0, 46019.0, 29680.0, 19181.0, 12604.0, 8176.0, 5424.0, 3586.0, 2434.0, 1577.0, 1099.0, 730.0, 488.0, 339.0, 252.0, 172.0, 122.0, 60.0, 56.0, 47.0, 31.0, 24.0, 12.0, 5.0, 9.0, 5.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.251953125, -0.24404144287109375, -0.2361297607421875, -0.22821807861328125, -0.220306396484375, -0.21239471435546875, -0.2044830322265625, -0.19657135009765625, -0.18865966796875, -0.18074798583984375, -0.1728363037109375, -0.16492462158203125, -0.157012939453125, -0.14910125732421875, -0.1411895751953125, -0.13327789306640625, -0.1253662109375, -0.11745452880859375, -0.1095428466796875, -0.10163116455078125, -0.093719482421875, -0.08580780029296875, -0.0778961181640625, -0.06998443603515625, -0.06207275390625, -0.05416107177734375, -0.0462493896484375, -0.03833770751953125, -0.030426025390625, -0.02251434326171875, -0.0146026611328125, -0.00669097900390625, 0.001220703125, 0.00913238525390625, 0.0170440673828125, 0.02495574951171875, 0.032867431640625, 0.04077911376953125, 0.0486907958984375, 0.05660247802734375, 0.06451416015625, 0.07242584228515625, 0.0803375244140625, 0.08824920654296875, 0.096160888671875, 0.10407257080078125, 0.1119842529296875, 0.11989593505859375, 0.1278076171875, 0.13571929931640625, 0.1436309814453125, 0.15154266357421875, 0.159454345703125, 0.16736602783203125, 0.1752777099609375, 0.18318939208984375, 0.19110107421875, 0.19901275634765625, 0.2069244384765625, 0.21483612060546875, 0.222747802734375, 0.23065948486328125, 0.2385711669921875, 0.24648284912109375, 0.25439453125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 7.0, 6.0, 16.0, 10.0, 12.0, 18.0, 15.0, 14.0, 19.0, 27.0, 28.0, 28.0, 36.0, 36.0, 42.0, 28.0, 35.0, 26.0, 33.0, 34.0, 1055.0, 34.0, 32.0, 36.0, 30.0, 36.0, 30.0, 32.0, 28.0, 33.0, 24.0, 25.0, 27.0, 20.0, 29.0, 12.0, 11.0, 11.0, 13.0, 6.0, 3.0, 8.0, 3.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9921875, -7.7354736328125, -7.478759765625, -7.2220458984375, -6.96533203125, -6.7086181640625, -6.451904296875, -6.1951904296875, -5.9384765625, -5.6817626953125, -5.425048828125, -5.1683349609375, -4.91162109375, -4.6549072265625, -4.398193359375, -4.1414794921875, -3.884765625, -3.6280517578125, -3.371337890625, -3.1146240234375, -2.85791015625, -2.6011962890625, -2.344482421875, -2.0877685546875, -1.8310546875, -1.5743408203125, -1.317626953125, -1.0609130859375, -0.80419921875, -0.5474853515625, -0.290771484375, -0.0340576171875, 0.22265625, 0.4793701171875, 0.736083984375, 0.9927978515625, 1.24951171875, 1.5062255859375, 1.762939453125, 2.0196533203125, 2.2763671875, 2.5330810546875, 2.789794921875, 3.0465087890625, 3.30322265625, 3.5599365234375, 3.816650390625, 4.0733642578125, 4.330078125, 4.5867919921875, 4.843505859375, 5.1002197265625, 5.35693359375, 5.6136474609375, 5.870361328125, 6.1270751953125, 6.3837890625, 6.6405029296875, 6.897216796875, 7.1539306640625, 7.41064453125, 7.6673583984375, 7.924072265625, 8.1807861328125, 8.4375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 12.0, 12.0, 6.0, 29.0, 34.0, 55.0, 80.0, 92.0, 156.0, 206.0, 291.0, 398.0, 560.0, 764.0, 1138.0, 1611.0, 2183.0, 3201.0, 4589.0, 6509.0, 9522.0, 13725.0, 20087.0, 29447.0, 43131.0, 63589.0, 95331.0, 146462.0, 1235461.0, 138184.0, 90271.0, 60205.0, 40844.0, 27498.0, 18589.0, 12976.0, 8881.0, 6344.0, 4426.0, 2934.0, 2012.0, 1527.0, 1145.0, 754.0, 563.0, 392.0, 275.0, 184.0, 128.0, 101.0, 74.0, 57.0, 30.0, 24.0, 18.0, 11.0, 3.0, 3.0, 3.0, 1.0, 4.0], "bins": [-0.11627197265625, -0.11257266998291016, -0.10887336730957031, -0.10517406463623047, -0.10147476196289062, -0.09777545928955078, -0.09407615661621094, -0.0903768539428711, -0.08667755126953125, -0.0829782485961914, -0.07927894592285156, -0.07557964324951172, -0.07188034057617188, -0.06818103790283203, -0.06448173522949219, -0.060782432556152344, -0.0570831298828125, -0.053383827209472656, -0.04968452453613281, -0.04598522186279297, -0.042285919189453125, -0.03858661651611328, -0.03488731384277344, -0.031188011169433594, -0.02748870849609375, -0.023789405822753906, -0.020090103149414062, -0.01639080047607422, -0.012691497802734375, -0.008992195129394531, -0.0052928924560546875, -0.0015935897827148438, 0.002105712890625, 0.005805015563964844, 0.009504318237304688, 0.013203620910644531, 0.016902923583984375, 0.02060222625732422, 0.024301528930664062, 0.028000831604003906, 0.03170013427734375, 0.035399436950683594, 0.03909873962402344, 0.04279804229736328, 0.046497344970703125, 0.05019664764404297, 0.05389595031738281, 0.057595252990722656, 0.0612945556640625, 0.06499385833740234, 0.06869316101074219, 0.07239246368408203, 0.07609176635742188, 0.07979106903076172, 0.08349037170410156, 0.0871896743774414, 0.09088897705078125, 0.0945882797241211, 0.09828758239746094, 0.10198688507080078, 0.10568618774414062, 0.10938549041748047, 0.11308479309082031, 0.11678409576416016, 0.1204833984375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 9.0, 7.0, 10.0, 11.0, 14.0, 13.0, 17.0, 23.0, 33.0, 42.0, 36.0, 66.0, 42.0, 61.0, 47.0, 85.0, 61.0, 56.0, 56.0, 42.0, 48.0, 37.0, 36.0, 27.0, 21.0, 16.0, 14.0, 11.0, 5.0, 9.0, 6.0, 5.0, 8.0, 4.0, 3.0, 1.0, 3.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0006504058837890625, -0.0006269589066505432, -0.0006035119295120239, -0.0005800649523735046, -0.0005566179752349854, -0.0005331709980964661, -0.0005097240209579468, -0.0004862770438194275, -0.0004628300666809082, -0.0004393830895423889, -0.00041593611240386963, -0.00039248913526535034, -0.00036904215812683105, -0.00034559518098831177, -0.0003221482038497925, -0.0002987012267112732, -0.0002752542495727539, -0.0002518072724342346, -0.00022836029529571533, -0.00020491331815719604, -0.00018146634101867676, -0.00015801936388015747, -0.00013457238674163818, -0.0001111254096031189, -8.767843246459961e-05, -6.423145532608032e-05, -4.0784478187561035e-05, -1.7337501049041748e-05, 6.109476089477539e-06, 2.9556453227996826e-05, 5.300343036651611e-05, 7.64504075050354e-05, 9.989738464355469e-05, 0.00012334436178207397, 0.00014679133892059326, 0.00017023831605911255, 0.00019368529319763184, 0.00021713227033615112, 0.0002405792474746704, 0.0002640262246131897, 0.000287473201751709, 0.00031092017889022827, 0.00033436715602874756, 0.00035781413316726685, 0.00038126111030578613, 0.0004047080874443054, 0.0004281550645828247, 0.000451602041721344, 0.0004750490188598633, 0.0004984959959983826, 0.0005219429731369019, 0.0005453899502754211, 0.0005688369274139404, 0.0005922839045524597, 0.000615730881690979, 0.0006391778588294983, 0.0006626248359680176, 0.0006860718131065369, 0.0007095187902450562, 0.0007329657673835754, 0.0007564127445220947, 0.000779859721660614, 0.0008033066987991333, 0.0008267536759376526, 0.0008502006530761719]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 7.0, 7.0, 7.0, 8.0, 17.0, 17.0, 22.0, 31.0, 49.0, 40.0, 91.0, 91.0, 217.0, 580.0, 17410.0, 1026642.0, 2394.0, 377.0, 144.0, 115.0, 46.0, 56.0, 39.0, 26.0, 16.0, 16.0, 11.0, 13.0, 11.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.02056884765625, -0.020002365112304688, -0.019435882568359375, -0.018869400024414062, -0.01830291748046875, -0.017736434936523438, -0.017169952392578125, -0.016603469848632812, -0.0160369873046875, -0.015470504760742188, -0.014904022216796875, -0.014337539672851562, -0.01377105712890625, -0.013204574584960938, -0.012638092041015625, -0.012071609497070312, -0.011505126953125, -0.010938644409179688, -0.010372161865234375, -0.009805679321289062, -0.00923919677734375, -0.008672714233398438, -0.008106231689453125, -0.0075397491455078125, -0.0069732666015625, -0.0064067840576171875, -0.005840301513671875, -0.0052738189697265625, -0.00470733642578125, -0.0041408538818359375, -0.003574371337890625, -0.0030078887939453125, -0.00244140625, -0.0018749237060546875, -0.001308441162109375, -0.0007419586181640625, -0.00017547607421875, 0.0003910064697265625, 0.000957489013671875, 0.0015239715576171875, 0.0020904541015625, 0.0026569366455078125, 0.003223419189453125, 0.0037899017333984375, 0.00435638427734375, 0.0049228668212890625, 0.005489349365234375, 0.0060558319091796875, 0.006622314453125, 0.0071887969970703125, 0.007755279541015625, 0.008321762084960938, 0.00888824462890625, 0.009454727172851562, 0.010021209716796875, 0.010587692260742188, 0.0111541748046875, 0.011720657348632812, 0.012287139892578125, 0.012853622436523438, 0.01342010498046875, 0.013986587524414062, 0.014553070068359375, 0.015119552612304688, 0.01568603515625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 21.0, 964.0, 27.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013575304299592972, -0.013312075287103653, -0.013048846274614334, -0.01278561633080244, -0.012522387318313122, -0.012259158305823803, -0.011995929293334484, -0.01173269934952259, -0.011469470337033272, -0.011206241324543953, -0.010943012312054634, -0.01067978236824274, -0.010416553355753422, -0.010153324343264103, -0.009890095330774784, -0.00962686538696289, -0.009363636374473572, -0.009100407361984253, -0.008837178349494934, -0.00857394840568304, -0.008310719393193722, -0.008047490380704403, -0.007784261368215084, -0.007521031890064478, -0.007257803343236446, -0.0069945743307471275, -0.006731344852596521, -0.0064681158401072025, -0.006204886361956596, -0.0059416573494672775, -0.005678428336977959, -0.0054151988588273525, -0.005151968449354172, -0.004888739436864853, -0.004625509958714247, -0.004362280946224928, -0.004099051468074322, -0.003835822455585003, -0.0035725932102650404, -0.003309363964945078, -0.003046134952455759, -0.0027829057071357965, -0.002519676461815834, -0.002256447449326515, -0.001993217971175909, -0.0017299888422712684, -0.0014667597133666277, -0.0012035304680466652, -0.0009403012227267027, -0.0006770719774067402, -0.0004138427902944386, -0.000150613603182137, 0.00011261564213782549, 0.000375844887457788, 0.0006390740163624287, 0.0009023032616823912, 0.0011655325070023537, 0.0014287617523223162, 0.0016919909976422787, 0.0019552200101315975, 0.0022184494882822037, 0.0024816785007715225, 0.002744907746091485, 0.0030081369914114475, 0.00327136623673141]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 11.0, 11.0, 23.0, 25.0, 31.0, 31.0, 56.0, 52.0, 70.0, 73.0, 93.0, 68.0, 83.0, 67.0, 61.0, 46.0, 53.0, 45.0, 33.0, 26.0, 21.0, 5.0, 7.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000981152057647705, -0.0009465292096138, -0.000911906361579895, -0.00087728351354599, -0.000842660665512085, -0.0008080378174781799, -0.0007734149694442749, -0.0007387921214103699, -0.0007041692733764648, -0.0006695464253425598, -0.0006349235773086548, -0.0006003007292747498, -0.0005656778812408447, -0.0005310550332069397, -0.0004964321851730347, -0.00046180933713912964, -0.0004271864891052246, -0.0003925636410713196, -0.00035794079303741455, -0.0003233179450035095, -0.0002886950969696045, -0.00025407224893569946, -0.00021944940090179443, -0.0001848265528678894, -0.00015020370483398438, -0.00011558085680007935, -8.095800876617432e-05, -4.633516073226929e-05, -1.1712312698364258e-05, 2.291053533554077e-05, 5.75333833694458e-05, 9.215623140335083e-05, 0.00012677907943725586, 0.0001614019274711609, 0.00019602477550506592, 0.00023064762353897095, 0.000265270471572876, 0.000299893319606781, 0.00033451616764068604, 0.00036913901567459106, 0.0004037618637084961, 0.0004383847117424011, 0.00047300755977630615, 0.0005076304078102112, 0.0005422532558441162, 0.0005768761038780212, 0.0006114989519119263, 0.0006461217999458313, 0.0006807446479797363, 0.0007153674960136414, 0.0007499903440475464, 0.0007846131920814514, 0.0008192360401153564, 0.0008538588881492615, 0.0008884817361831665, 0.0009231045842170715, 0.0009577274322509766, 0.0009923502802848816, 0.0010269731283187866, 0.0010615959763526917, 0.0010962188243865967, 0.0011308416724205017, 0.0011654645204544067, 0.0012000873684883118, 0.0012347102165222168]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 8.0, 12.0, 9.0, 17.0, 14.0, 14.0, 22.0, 25.0, 27.0, 20.0, 30.0, 31.0, 34.0, 29.0, 38.0, 39.0, 45.0, 35.0, 22.0, 34.0, 45.0, 42.0, 41.0, 32.0, 44.0, 34.0, 41.0, 26.0, 21.0, 25.0, 19.0, 20.0, 16.0, 22.0, 15.0, 8.0, 6.0, 5.0, 7.0, 2.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.8018798828125, -10.431884765625, -10.0618896484375, -9.69189453125, -9.3218994140625, -8.951904296875, -8.5819091796875, -8.2119140625, -7.8419189453125, -7.471923828125, -7.1019287109375, -6.73193359375, -6.3619384765625, -5.991943359375, -5.6219482421875, -5.251953125, -4.8819580078125, -4.511962890625, -4.1419677734375, -3.77197265625, -3.4019775390625, -3.031982421875, -2.6619873046875, -2.2919921875, -1.9219970703125, -1.552001953125, -1.1820068359375, -0.81201171875, -0.4420166015625, -0.072021484375, 0.2979736328125, 0.66796875, 1.0379638671875, 1.407958984375, 1.7779541015625, 2.14794921875, 2.5179443359375, 2.887939453125, 3.2579345703125, 3.6279296875, 3.9979248046875, 4.367919921875, 4.7379150390625, 5.10791015625, 5.4779052734375, 5.847900390625, 6.2178955078125, 6.587890625, 6.9578857421875, 7.327880859375, 7.6978759765625, 8.06787109375, 8.4378662109375, 8.807861328125, 9.1778564453125, 9.5478515625, 9.9178466796875, 10.287841796875, 10.6578369140625, 11.02783203125, 11.3978271484375, 11.767822265625, 12.1378173828125, 12.5078125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 10.0, 13.0, 23.0, 27.0, 47.0, 64.0, 76.0, 114.0, 143.0, 217.0, 275.0, 389.0, 542.0, 839.0, 1216.0, 1710.0, 2669.0, 3970.0, 6194.0, 10212.0, 17637.0, 35771.0, 123558.0, 606771.0, 147948.0, 39043.0, 18968.0, 10721.0, 6557.0, 4097.0, 2784.0, 1787.0, 1241.0, 859.0, 604.0, 425.0, 294.0, 195.0, 144.0, 107.0, 85.0, 55.0, 40.0, 35.0, 22.0, 15.0, 10.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0], "bins": [-18.609375, -18.0546875, -17.5, -16.9453125, -16.390625, -15.8359375, -15.28125, -14.7265625, -14.171875, -13.6171875, -13.0625, -12.5078125, -11.953125, -11.3984375, -10.84375, -10.2890625, -9.734375, -9.1796875, -8.625, -8.0703125, -7.515625, -6.9609375, -6.40625, -5.8515625, -5.296875, -4.7421875, -4.1875, -3.6328125, -3.078125, -2.5234375, -1.96875, -1.4140625, -0.859375, -0.3046875, 0.25, 0.8046875, 1.359375, 1.9140625, 2.46875, 3.0234375, 3.578125, 4.1328125, 4.6875, 5.2421875, 5.796875, 6.3515625, 6.90625, 7.4609375, 8.015625, 8.5703125, 9.125, 9.6796875, 10.234375, 10.7890625, 11.34375, 11.8984375, 12.453125, 13.0078125, 13.5625, 14.1171875, 14.671875, 15.2265625, 15.78125, 16.3359375, 16.890625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 7.0, 12.0, 19.0, 13.0, 16.0, 19.0, 14.0, 20.0, 32.0, 30.0, 38.0, 33.0, 38.0, 46.0, 49.0, 68.0, 101.0, 422.0, 1452.0, 113.0, 73.0, 61.0, 41.0, 48.0, 30.0, 39.0, 35.0, 31.0, 17.0, 32.0, 13.0, 16.0, 14.0, 14.0, 5.0, 9.0, 4.0, 8.0, 0.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.5625, -38.36376953125, -37.1650390625, -35.96630859375, -34.767578125, -33.56884765625, -32.3701171875, -31.17138671875, -29.97265625, -28.77392578125, -27.5751953125, -26.37646484375, -25.177734375, -23.97900390625, -22.7802734375, -21.58154296875, -20.3828125, -19.18408203125, -17.9853515625, -16.78662109375, -15.587890625, -14.38916015625, -13.1904296875, -11.99169921875, -10.79296875, -9.59423828125, -8.3955078125, -7.19677734375, -5.998046875, -4.79931640625, -3.6005859375, -2.40185546875, -1.203125, -0.00439453125, 1.1943359375, 2.39306640625, 3.591796875, 4.79052734375, 5.9892578125, 7.18798828125, 8.38671875, 9.58544921875, 10.7841796875, 11.98291015625, 13.181640625, 14.38037109375, 15.5791015625, 16.77783203125, 17.9765625, 19.17529296875, 20.3740234375, 21.57275390625, 22.771484375, 23.97021484375, 25.1689453125, 26.36767578125, 27.56640625, 28.76513671875, 29.9638671875, 31.16259765625, 32.361328125, 33.56005859375, 34.7587890625, 35.95751953125, 37.15625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 9.0, 8.0, 10.0, 7.0, 21.0, 25.0, 24.0, 35.0, 56.0, 49.0, 78.0, 117.0, 189.0, 316.0, 627.0, 1569.0, 4319.0, 14289.0, 63878.0, 2662290.0, 349577.0, 34120.0, 8918.0, 2792.0, 1076.0, 481.0, 247.0, 159.0, 112.0, 80.0, 44.0, 39.0, 31.0, 28.0, 19.0, 17.0, 12.0, 11.0, 5.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.34375, -47.7421875, -46.140625, -44.5390625, -42.9375, -41.3359375, -39.734375, -38.1328125, -36.53125, -34.9296875, -33.328125, -31.7265625, -30.125, -28.5234375, -26.921875, -25.3203125, -23.71875, -22.1171875, -20.515625, -18.9140625, -17.3125, -15.7109375, -14.109375, -12.5078125, -10.90625, -9.3046875, -7.703125, -6.1015625, -4.5, -2.8984375, -1.296875, 0.3046875, 1.90625, 3.5078125, 5.109375, 6.7109375, 8.3125, 9.9140625, 11.515625, 13.1171875, 14.71875, 16.3203125, 17.921875, 19.5234375, 21.125, 22.7265625, 24.328125, 25.9296875, 27.53125, 29.1328125, 30.734375, 32.3359375, 33.9375, 35.5390625, 37.140625, 38.7421875, 40.34375, 41.9453125, 43.546875, 45.1484375, 46.75, 48.3515625, 49.953125, 51.5546875, 53.15625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 12.0, 29.0, 97.0, 230.0, 314.0, 219.0, 76.0, 22.0, 10.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.84812545776367, -47.24433898925781, -41.64055252075195, -36.036766052246094, -30.432979583740234, -24.829193115234375, -19.225406646728516, -13.621620178222656, -8.017833709716797, -2.4140472412109375, 3.189739227294922, 8.793525695800781, 14.39731216430664, 20.0010986328125, 25.60488510131836, 31.20867156982422, 36.81245803833008, 42.41624450683594, 48.0200309753418, 53.623817443847656, 59.227603912353516, 64.83139038085938, 70.4351806640625, 76.0389633178711, 81.64274597167969, 87.24653625488281, 92.8503189086914, 98.4541015625, 104.05789184570312, 109.66168212890625, 115.26546478271484, 120.86924743652344, 126.47305297851562, 132.07684326171875, 137.68063354492188, 143.28440856933594, 148.88819885253906, 154.4919891357422, 160.09576416015625, 165.69955444335938, 171.3033447265625, 176.90713500976562, 182.51092529296875, 188.1147003173828, 193.71849060058594, 199.32228088378906, 204.92605590820312, 210.52984619140625, 216.13363647460938, 221.7374267578125, 227.34121704101562, 232.9449920654297, 238.5487823486328, 244.15257263183594, 249.75634765625, 255.36013793945312, 260.96392822265625, 266.5677185058594, 272.1715087890625, 277.7752990722656, 283.37908935546875, 288.98284912109375, 294.5866394042969, 300.1904296875, 305.7942199707031]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 9.0, 2.0, 7.0, 11.0, 8.0, 14.0, 10.0, 18.0, 17.0, 19.0, 15.0, 25.0, 36.0, 33.0, 31.0, 35.0, 32.0, 46.0, 34.0, 43.0, 45.0, 47.0, 37.0, 34.0, 30.0, 38.0, 28.0, 36.0, 26.0, 32.0, 30.0, 19.0, 23.0, 20.0, 18.0, 17.0, 10.0, 9.0, 11.0, 10.0, 9.0, 4.0, 7.0, 2.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-104.2725830078125, -101.24817657470703, -98.22377014160156, -95.1993637084961, -92.17495727539062, -89.15054321289062, -86.12614440917969, -83.10173034667969, -80.07732391357422, -77.05291748046875, -74.02851104736328, -71.00410461425781, -67.97969818115234, -64.95529174804688, -61.93088150024414, -58.906471252441406, -55.8820686340332, -52.857662200927734, -49.833255767822266, -46.80884552001953, -43.78443908691406, -40.760032653808594, -37.735626220703125, -34.711219787597656, -31.686811447143555, -28.662405014038086, -25.637996673583984, -22.613590240478516, -19.589183807373047, -16.564775466918945, -13.540369033813477, -10.515960693359375, -7.491554260253906, -4.467146873474121, -1.4427399635314941, 1.5816669464111328, 4.606074333190918, 7.630481719970703, 10.654888153076172, 13.679296493530273, 16.703702926635742, 19.72810935974121, 22.752517700195312, 25.77692413330078, 28.80133056640625, 31.82573890686035, 34.85014343261719, 37.87455368041992, 40.89896011352539, 43.92336654663086, 46.94777297973633, 49.97218322753906, 52.99658966064453, 56.02099609375, 59.04540252685547, 62.06980895996094, 65.0942153930664, 68.11862182617188, 71.14302825927734, 74.16743469238281, 77.19184112548828, 80.21624755859375, 83.24066162109375, 86.26506805419922, 89.28947448730469]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 3.0, 11.0, 11.0, 15.0, 19.0, 19.0, 11.0, 27.0, 26.0, 39.0, 23.0, 18.0, 26.0, 32.0, 43.0, 40.0, 49.0, 33.0, 41.0, 49.0, 41.0, 47.0, 35.0, 50.0, 37.0, 30.0, 27.0, 37.0, 17.0, 24.0, 22.0, 13.0, 11.0, 14.0, 12.0, 12.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.8125, -13.4041748046875, -12.995849609375, -12.5875244140625, -12.17919921875, -11.7708740234375, -11.362548828125, -10.9542236328125, -10.5458984375, -10.1375732421875, -9.729248046875, -9.3209228515625, -8.91259765625, -8.5042724609375, -8.095947265625, -7.6876220703125, -7.279296875, -6.8709716796875, -6.462646484375, -6.0543212890625, -5.64599609375, -5.2376708984375, -4.829345703125, -4.4210205078125, -4.0126953125, -3.6043701171875, -3.196044921875, -2.7877197265625, -2.37939453125, -1.9710693359375, -1.562744140625, -1.1544189453125, -0.74609375, -0.3377685546875, 0.070556640625, 0.4788818359375, 0.88720703125, 1.2955322265625, 1.703857421875, 2.1121826171875, 2.5205078125, 2.9288330078125, 3.337158203125, 3.7454833984375, 4.15380859375, 4.5621337890625, 4.970458984375, 5.3787841796875, 5.787109375, 6.1954345703125, 6.603759765625, 7.0120849609375, 7.42041015625, 7.8287353515625, 8.237060546875, 8.6453857421875, 9.0537109375, 9.4620361328125, 9.870361328125, 10.2786865234375, 10.68701171875, 11.0953369140625, 11.503662109375, 11.9119873046875, 12.3203125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 0.0, 4.0, 7.0, 7.0, 9.0, 7.0, 9.0, 21.0, 22.0, 34.0, 34.0, 64.0, 100.0, 182.0, 286.0, 469.0, 953.0, 1783.0, 3376.0, 7161.0, 16217.0, 45591.0, 302019.0, 2766672.0, 920398.0, 85894.0, 23397.0, 9929.0, 4473.0, 2359.0, 1183.0, 636.0, 369.0, 220.0, 134.0, 76.0, 38.0, 47.0, 17.0, 21.0, 8.0, 13.0, 9.0, 4.0, 5.0, 9.0, 6.0, 3.0, 2.0, 2.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.546875, -26.64990234375, -25.7529296875, -24.85595703125, -23.958984375, -23.06201171875, -22.1650390625, -21.26806640625, -20.37109375, -19.47412109375, -18.5771484375, -17.68017578125, -16.783203125, -15.88623046875, -14.9892578125, -14.09228515625, -13.1953125, -12.29833984375, -11.4013671875, -10.50439453125, -9.607421875, -8.71044921875, -7.8134765625, -6.91650390625, -6.01953125, -5.12255859375, -4.2255859375, -3.32861328125, -2.431640625, -1.53466796875, -0.6376953125, 0.25927734375, 1.15625, 2.05322265625, 2.9501953125, 3.84716796875, 4.744140625, 5.64111328125, 6.5380859375, 7.43505859375, 8.33203125, 9.22900390625, 10.1259765625, 11.02294921875, 11.919921875, 12.81689453125, 13.7138671875, 14.61083984375, 15.5078125, 16.40478515625, 17.3017578125, 18.19873046875, 19.095703125, 19.99267578125, 20.8896484375, 21.78662109375, 22.68359375, 23.58056640625, 24.4775390625, 25.37451171875, 26.271484375, 27.16845703125, 28.0654296875, 28.96240234375, 29.859375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 7.0, 2.0, 8.0, 13.0, 13.0, 11.0, 15.0, 27.0, 36.0, 39.0, 59.0, 73.0, 108.0, 162.0, 317.0, 589.0, 842.0, 693.0, 383.0, 228.0, 129.0, 88.0, 61.0, 35.0, 25.0, 29.0, 21.0, 13.0, 12.0, 7.0, 13.0, 6.0, 6.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.453125, -23.60205078125, -22.7509765625, -21.89990234375, -21.048828125, -20.19775390625, -19.3466796875, -18.49560546875, -17.64453125, -16.79345703125, -15.9423828125, -15.09130859375, -14.240234375, -13.38916015625, -12.5380859375, -11.68701171875, -10.8359375, -9.98486328125, -9.1337890625, -8.28271484375, -7.431640625, -6.58056640625, -5.7294921875, -4.87841796875, -4.02734375, -3.17626953125, -2.3251953125, -1.47412109375, -0.623046875, 0.22802734375, 1.0791015625, 1.93017578125, 2.78125, 3.63232421875, 4.4833984375, 5.33447265625, 6.185546875, 7.03662109375, 7.8876953125, 8.73876953125, 9.58984375, 10.44091796875, 11.2919921875, 12.14306640625, 12.994140625, 13.84521484375, 14.6962890625, 15.54736328125, 16.3984375, 17.24951171875, 18.1005859375, 18.95166015625, 19.802734375, 20.65380859375, 21.5048828125, 22.35595703125, 23.20703125, 24.05810546875, 24.9091796875, 25.76025390625, 26.611328125, 27.46240234375, 28.3134765625, 29.16455078125, 30.015625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 11.0, 11.0, 16.0, 16.0, 24.0, 33.0, 35.0, 96.0, 138.0, 298.0, 955.0, 4823.0, 52995.0, 3789833.0, 327813.0, 14128.0, 2025.0, 508.0, 175.0, 125.0, 74.0, 35.0, 34.0, 15.0, 18.0, 9.0, 10.0, 12.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-119.25, -116.0048828125, -112.759765625, -109.5146484375, -106.26953125, -103.0244140625, -99.779296875, -96.5341796875, -93.2890625, -90.0439453125, -86.798828125, -83.5537109375, -80.30859375, -77.0634765625, -73.818359375, -70.5732421875, -67.328125, -64.0830078125, -60.837890625, -57.5927734375, -54.34765625, -51.1025390625, -47.857421875, -44.6123046875, -41.3671875, -38.1220703125, -34.876953125, -31.6318359375, -28.38671875, -25.1416015625, -21.896484375, -18.6513671875, -15.40625, -12.1611328125, -8.916015625, -5.6708984375, -2.42578125, 0.8193359375, 4.064453125, 7.3095703125, 10.5546875, 13.7998046875, 17.044921875, 20.2900390625, 23.53515625, 26.7802734375, 30.025390625, 33.2705078125, 36.515625, 39.7607421875, 43.005859375, 46.2509765625, 49.49609375, 52.7412109375, 55.986328125, 59.2314453125, 62.4765625, 65.7216796875, 68.966796875, 72.2119140625, 75.45703125, 78.7021484375, 81.947265625, 85.1923828125, 88.4375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 26.0, 61.0, 182.0, 300.0, 241.0, 135.0, 38.0, 18.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-394.0019226074219, -386.23809814453125, -378.4742431640625, -370.7104187011719, -362.94659423828125, -355.1827392578125, -347.4189147949219, -339.65509033203125, -331.8912353515625, -324.1274108886719, -316.3635559082031, -308.5997314453125, -300.8359069824219, -293.0720520019531, -285.3082275390625, -277.5444030761719, -269.78057861328125, -262.0167541503906, -254.25291442871094, -246.48907470703125, -238.72523498535156, -230.96139526367188, -223.19757080078125, -215.43373107910156, -207.66989135742188, -199.9060516357422, -192.14222717285156, -184.37838745117188, -176.6145477294922, -168.8507080078125, -161.08688354492188, -153.3230438232422, -145.5592041015625, -137.7953643798828, -130.0315399169922, -122.2677001953125, -114.50386047363281, -106.74002838134766, -98.9761962890625, -91.21235656738281, -83.44851684570312, -75.68468475341797, -67.92084503173828, -60.157012939453125, -52.3931770324707, -44.62934112548828, -36.865509033203125, -29.101673126220703, -21.33783721923828, -13.574002265930176, -5.81016731262207, 1.9536666870117188, 9.71750259399414, 17.481338500976562, 25.24517059326172, 33.00900650024414, 40.77284240722656, 48.536678314208984, 56.300514221191406, 64.06434631347656, 71.82818603515625, 79.5920181274414, 87.35585021972656, 95.11968994140625, 102.8835220336914]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 7.0, 6.0, 17.0, 6.0, 10.0, 16.0, 20.0, 15.0, 16.0, 22.0, 24.0, 16.0, 24.0, 25.0, 29.0, 26.0, 38.0, 34.0, 29.0, 39.0, 41.0, 54.0, 37.0, 36.0, 31.0, 43.0, 26.0, 31.0, 39.0, 23.0, 31.0, 19.0, 23.0, 25.0, 16.0, 11.0, 18.0, 16.0, 13.0, 13.0, 5.0, 4.0, 2.0, 6.0, 8.0, 4.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-63.54621124267578, -61.51509475708008, -59.48397445678711, -57.452857971191406, -55.42173767089844, -53.390621185302734, -51.35950469970703, -49.32838439941406, -47.29726791381836, -45.266151428222656, -43.23503112792969, -41.203914642333984, -39.17279815673828, -37.14167785644531, -35.11056137084961, -33.079444885253906, -31.048324584960938, -29.0172061920166, -26.986087799072266, -24.954971313476562, -22.923852920532227, -20.89273452758789, -18.861618041992188, -16.83049964904785, -14.799381256103516, -12.76826286315918, -10.73714542388916, -8.70602798461914, -6.674909591674805, -4.643791198730469, -2.612673759460449, -0.5815563201904297, 1.4495697021484375, 3.4806876182556152, 5.511805534362793, 7.542923450469971, 9.574041366577148, 11.605159759521484, 13.636277198791504, 15.667394638061523, 17.69851303100586, 19.729631423950195, 21.76074981689453, 23.791866302490234, 25.82298469543457, 27.854103088378906, 29.88521957397461, 31.916337966918945, 33.94745635986328, 35.978572845458984, 38.00969314575195, 40.040809631347656, 42.071929931640625, 44.10304641723633, 46.13416290283203, 48.165283203125, 50.1963996887207, 52.227516174316406, 54.258636474609375, 56.28975296020508, 58.32086944580078, 60.35198974609375, 62.38310623168945, 64.41422271728516, 66.44534301757812]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 8.0, 10.0, 16.0, 21.0, 17.0, 27.0, 27.0, 26.0, 36.0, 36.0, 35.0, 32.0, 36.0, 49.0, 41.0, 36.0, 48.0, 47.0, 40.0, 35.0, 40.0, 48.0, 39.0, 27.0, 30.0, 41.0, 26.0, 25.0, 11.0, 17.0, 13.0, 11.0, 6.0, 4.0, 6.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-15.6875, -15.247314453125, -14.80712890625, -14.366943359375, -13.9267578125, -13.486572265625, -13.04638671875, -12.606201171875, -12.166015625, -11.725830078125, -11.28564453125, -10.845458984375, -10.4052734375, -9.965087890625, -9.52490234375, -9.084716796875, -8.64453125, -8.204345703125, -7.76416015625, -7.323974609375, -6.8837890625, -6.443603515625, -6.00341796875, -5.563232421875, -5.123046875, -4.682861328125, -4.24267578125, -3.802490234375, -3.3623046875, -2.922119140625, -2.48193359375, -2.041748046875, -1.6015625, -1.161376953125, -0.72119140625, -0.281005859375, 0.1591796875, 0.599365234375, 1.03955078125, 1.479736328125, 1.919921875, 2.360107421875, 2.80029296875, 3.240478515625, 3.6806640625, 4.120849609375, 4.56103515625, 5.001220703125, 5.44140625, 5.881591796875, 6.32177734375, 6.761962890625, 7.2021484375, 7.642333984375, 8.08251953125, 8.522705078125, 8.962890625, 9.403076171875, 9.84326171875, 10.283447265625, 10.7236328125, 11.163818359375, 11.60400390625, 12.044189453125, 12.484375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 2.0, 11.0, 8.0, 13.0, 18.0, 31.0, 64.0, 78.0, 125.0, 171.0, 296.0, 453.0, 611.0, 1011.0, 1528.0, 2489.0, 3766.0, 6053.0, 9641.0, 15366.0, 25308.0, 41255.0, 67680.0, 109192.0, 170836.0, 216263.0, 142470.0, 89579.0, 55354.0, 33533.0, 20693.0, 12650.0, 8029.0, 5071.0, 3124.0, 2032.0, 1274.0, 840.0, 580.0, 352.0, 242.0, 155.0, 99.0, 65.0, 47.0, 31.0, 23.0, 18.0, 12.0, 8.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.31201171875, -0.3029136657714844, -0.29381561279296875, -0.2847175598144531, -0.2756195068359375, -0.2665214538574219, -0.25742340087890625, -0.24832534790039062, -0.239227294921875, -0.23012924194335938, -0.22103118896484375, -0.21193313598632812, -0.2028350830078125, -0.19373703002929688, -0.18463897705078125, -0.17554092407226562, -0.16644287109375, -0.15734481811523438, -0.14824676513671875, -0.13914871215820312, -0.1300506591796875, -0.12095260620117188, -0.11185455322265625, -0.10275650024414062, -0.093658447265625, -0.08456039428710938, -0.07546234130859375, -0.06636428833007812, -0.0572662353515625, -0.048168182373046875, -0.03907012939453125, -0.029972076416015625, -0.0208740234375, -0.011775970458984375, -0.00267791748046875, 0.006420135498046875, 0.0155181884765625, 0.024616241455078125, 0.03371429443359375, 0.042812347412109375, 0.051910400390625, 0.061008453369140625, 0.07010650634765625, 0.07920455932617188, 0.0883026123046875, 0.09740066528320312, 0.10649871826171875, 0.11559677124023438, 0.12469482421875, 0.13379287719726562, 0.14289093017578125, 0.15198898315429688, 0.1610870361328125, 0.17018508911132812, 0.17928314208984375, 0.18838119506835938, 0.197479248046875, 0.20657730102539062, 0.21567535400390625, 0.22477340698242188, 0.2338714599609375, 0.24296951293945312, 0.25206756591796875, 0.2611656188964844, 0.270263671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 12.0, 14.0, 14.0, 14.0, 18.0, 20.0, 18.0, 15.0, 28.0, 28.0, 28.0, 34.0, 28.0, 31.0, 46.0, 37.0, 35.0, 36.0, 43.0, 1063.0, 28.0, 34.0, 37.0, 25.0, 34.0, 39.0, 29.0, 25.0, 25.0, 30.0, 20.0, 19.0, 17.0, 17.0, 13.0, 15.0, 7.0, 2.0, 8.0, 5.0, 5.0, 3.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.6484375, -9.3492431640625, -9.050048828125, -8.7508544921875, -8.45166015625, -8.1524658203125, -7.853271484375, -7.5540771484375, -7.2548828125, -6.9556884765625, -6.656494140625, -6.3572998046875, -6.05810546875, -5.7589111328125, -5.459716796875, -5.1605224609375, -4.861328125, -4.5621337890625, -4.262939453125, -3.9637451171875, -3.66455078125, -3.3653564453125, -3.066162109375, -2.7669677734375, -2.4677734375, -2.1685791015625, -1.869384765625, -1.5701904296875, -1.27099609375, -0.9718017578125, -0.672607421875, -0.3734130859375, -0.07421875, 0.2249755859375, 0.524169921875, 0.8233642578125, 1.12255859375, 1.4217529296875, 1.720947265625, 2.0201416015625, 2.3193359375, 2.6185302734375, 2.917724609375, 3.2169189453125, 3.51611328125, 3.8153076171875, 4.114501953125, 4.4136962890625, 4.712890625, 5.0120849609375, 5.311279296875, 5.6104736328125, 5.90966796875, 6.2088623046875, 6.508056640625, 6.8072509765625, 7.1064453125, 7.4056396484375, 7.704833984375, 8.0040283203125, 8.30322265625, 8.6024169921875, 8.901611328125, 9.2008056640625, 9.5]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 9.0, 17.0, 26.0, 44.0, 60.0, 80.0, 121.0, 174.0, 222.0, 344.0, 459.0, 669.0, 979.0, 1348.0, 1968.0, 2793.0, 4209.0, 6275.0, 9380.0, 14070.0, 21643.0, 33014.0, 51496.0, 80813.0, 133304.0, 1252117.0, 177618.0, 109312.0, 67486.0, 43410.0, 27872.0, 18331.0, 12229.0, 8118.0, 5278.0, 3718.0, 2455.0, 1744.0, 1191.0, 863.0, 556.0, 379.0, 274.0, 203.0, 138.0, 104.0, 73.0, 56.0, 31.0, 15.0, 20.0, 11.0, 9.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.1551513671875, -0.150421142578125, -0.14569091796875, -0.140960693359375, -0.13623046875, -0.131500244140625, -0.12677001953125, -0.122039794921875, -0.1173095703125, -0.112579345703125, -0.10784912109375, -0.103118896484375, -0.098388671875, -0.093658447265625, -0.08892822265625, -0.084197998046875, -0.0794677734375, -0.074737548828125, -0.07000732421875, -0.065277099609375, -0.060546875, -0.055816650390625, -0.05108642578125, -0.046356201171875, -0.0416259765625, -0.036895751953125, -0.03216552734375, -0.027435302734375, -0.022705078125, -0.017974853515625, -0.01324462890625, -0.008514404296875, -0.0037841796875, 0.000946044921875, 0.00567626953125, 0.010406494140625, 0.01513671875, 0.019866943359375, 0.02459716796875, 0.029327392578125, 0.0340576171875, 0.038787841796875, 0.04351806640625, 0.048248291015625, 0.052978515625, 0.057708740234375, 0.06243896484375, 0.067169189453125, 0.0718994140625, 0.076629638671875, 0.08135986328125, 0.086090087890625, 0.0908203125, 0.095550537109375, 0.10028076171875, 0.105010986328125, 0.1097412109375, 0.114471435546875, 0.11920166015625, 0.123931884765625, 0.128662109375, 0.133392333984375, 0.13812255859375, 0.142852783203125, 0.1475830078125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 6.0, 14.0, 11.0, 10.0, 15.0, 18.0, 20.0, 27.0, 35.0, 43.0, 51.0, 70.0, 53.0, 62.0, 76.0, 72.0, 79.0, 65.0, 50.0, 42.0, 43.0, 28.0, 19.0, 23.0, 15.0, 17.0, 8.0, 3.0, 2.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010423660278320312, -0.0010128617286682129, -0.0009833574295043945, -0.0009538531303405762, -0.0009243488311767578, -0.0008948445320129395, -0.0008653402328491211, -0.0008358359336853027, -0.0008063316345214844, -0.000776827335357666, -0.0007473230361938477, -0.0007178187370300293, -0.0006883144378662109, -0.0006588101387023926, -0.0006293058395385742, -0.0005998015403747559, -0.0005702972412109375, -0.0005407929420471191, -0.0005112886428833008, -0.0004817843437194824, -0.00045228004455566406, -0.0004227757453918457, -0.00039327144622802734, -0.000363767147064209, -0.0003342628479003906, -0.00030475854873657227, -0.0002752542495727539, -0.00024574995040893555, -0.0002162456512451172, -0.00018674135208129883, -0.00015723705291748047, -0.0001277327537536621, -9.822845458984375e-05, -6.872415542602539e-05, -3.921985626220703e-05, -9.715557098388672e-06, 1.9788742065429688e-05, 4.929304122924805e-05, 7.87973403930664e-05, 0.00010830163955688477, 0.00013780593872070312, 0.00016731023788452148, 0.00019681453704833984, 0.0002263188362121582, 0.00025582313537597656, 0.0002853274345397949, 0.0003148317337036133, 0.00034433603286743164, 0.00037384033203125, 0.00040334463119506836, 0.0004328489303588867, 0.0004623532295227051, 0.0004918575286865234, 0.0005213618278503418, 0.0005508661270141602, 0.0005803704261779785, 0.0006098747253417969, 0.0006393790245056152, 0.0006688833236694336, 0.000698387622833252, 0.0007278919219970703, 0.0007573962211608887, 0.000786900520324707, 0.0008164048194885254, 0.0008459091186523438]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 16.0, 17.0, 23.0, 21.0, 39.0, 49.0, 55.0, 93.0, 169.0, 384.0, 2094.0, 1033817.0, 10620.0, 555.0, 196.0, 112.0, 71.0, 48.0, 32.0, 23.0, 21.0, 16.0, 8.0, 12.0, 13.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01959228515625, -0.018908977508544922, -0.018225669860839844, -0.017542362213134766, -0.016859054565429688, -0.01617574691772461, -0.015492439270019531, -0.014809131622314453, -0.014125823974609375, -0.013442516326904297, -0.012759208679199219, -0.01207590103149414, -0.011392593383789062, -0.010709285736083984, -0.010025978088378906, -0.009342670440673828, -0.00865936279296875, -0.007976055145263672, -0.007292747497558594, -0.006609439849853516, -0.0059261322021484375, -0.005242824554443359, -0.004559516906738281, -0.003876209259033203, -0.003192901611328125, -0.002509593963623047, -0.0018262863159179688, -0.0011429786682128906, -0.0004596710205078125, 0.00022363662719726562, 0.0009069442749023438, 0.0015902519226074219, 0.0022735595703125, 0.002956867218017578, 0.0036401748657226562, 0.004323482513427734, 0.0050067901611328125, 0.005690097808837891, 0.006373405456542969, 0.007056713104248047, 0.007740020751953125, 0.008423328399658203, 0.009106636047363281, 0.00978994369506836, 0.010473251342773438, 0.011156558990478516, 0.011839866638183594, 0.012523174285888672, 0.01320648193359375, 0.013889789581298828, 0.014573097229003906, 0.015256404876708984, 0.015939712524414062, 0.01662302017211914, 0.01730632781982422, 0.017989635467529297, 0.018672943115234375, 0.019356250762939453, 0.02003955841064453, 0.02072286605834961, 0.021406173706054688, 0.022089481353759766, 0.022772789001464844, 0.023456096649169922, 0.024139404296875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 21.0, 994.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027796540409326553, -0.02728552557528019, -0.026774512603878975, -0.02626349776983261, -0.025752484798431396, -0.025241469964385033, -0.024730456992983818, -0.024219442158937454, -0.02370842918753624, -0.023197414353489876, -0.02268640138208866, -0.022175386548042297, -0.021664373576641083, -0.02115335874259472, -0.020642345771193504, -0.02013133093714714, -0.019620317965745926, -0.019109303131699562, -0.018598290160298347, -0.018087275326251984, -0.01757626235485077, -0.017065247520804405, -0.01655423454940319, -0.016043219715356827, -0.015532204881310463, -0.015021190978586674, -0.014510177075862885, -0.013999163173139095, -0.013488149270415306, -0.012977135367691517, -0.012466121464967728, -0.011955106630921364, -0.011444094590842724, -0.010933080688118935, -0.010422066785395145, -0.009911052882671356, -0.009400038979947567, -0.008889025077223778, -0.008378010243177414, -0.0078669972717762, -0.007355982903391123, -0.006844969000667334, -0.006333955097943544, -0.005822940729558468, -0.005311926826834679, -0.0048009129241108894, -0.0042898990213871, -0.003778885118663311, -0.003267871215939522, -0.0027568573132157326, -0.0022458434104919434, -0.0017348292749375105, -0.0012238153722137213, -0.0007128014694899321, -0.0002017873339354992, 0.00030922656878829, 0.0008202404715120792, 0.0013312543742358685, 0.0018422683933749795, 0.0023532824125140905, 0.0028642963152378798, 0.003375310217961669, 0.003886324353516102, 0.004397338256239891, 0.00490835215896368]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 9.0, 20.0, 20.0, 48.0, 35.0, 46.0, 70.0, 59.0, 57.0, 97.0, 95.0, 87.0, 54.0, 69.0, 55.0, 51.0, 39.0, 20.0, 31.0, 17.0, 9.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010976195335388184, -0.0010590441524982452, -0.0010204687714576721, -0.000981893390417099, -0.0009433180093765259, -0.0009047426283359528, -0.0008661672472953796, -0.0008275918662548065, -0.0007890164852142334, -0.0007504411041736603, -0.0007118657231330872, -0.000673290342092514, -0.0006347149610519409, -0.0005961395800113678, -0.0005575641989707947, -0.0005189888179302216, -0.00048041343688964844, -0.0004418380558490753, -0.0004032626748085022, -0.0003646872937679291, -0.00032611191272735596, -0.00028753653168678284, -0.0002489611506462097, -0.0002103857696056366, -0.00017181038856506348, -0.00013323500752449036, -9.465962648391724e-05, -5.6084245443344116e-05, -1.7508864402770996e-05, 2.1066516637802124e-05, 5.9641897678375244e-05, 9.821727871894836e-05, 0.00013679265975952148, 0.0001753680408000946, 0.00021394342184066772, 0.00025251880288124084, 0.00029109418392181396, 0.0003296695649623871, 0.0003682449460029602, 0.0004068203270435333, 0.00044539570808410645, 0.00048397108912467957, 0.0005225464701652527, 0.0005611218512058258, 0.0005996972322463989, 0.000638272613286972, 0.0006768479943275452, 0.0007154233753681183, 0.0007539987564086914, 0.0007925741374492645, 0.0008311495184898376, 0.0008697248995304108, 0.0009083002805709839, 0.000946875661611557, 0.0009854510426521301, 0.0010240264236927032, 0.0010626018047332764, 0.0011011771857738495, 0.0011397525668144226, 0.0011783279478549957, 0.0012169033288955688, 0.001255478709936142, 0.001294054090976715, 0.0013326294720172882, 0.0013712048530578613]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 8.0, 10.0, 16.0, 21.0, 17.0, 27.0, 27.0, 26.0, 36.0, 36.0, 35.0, 32.0, 36.0, 49.0, 41.0, 36.0, 48.0, 47.0, 40.0, 35.0, 40.0, 48.0, 39.0, 27.0, 30.0, 41.0, 26.0, 25.0, 11.0, 17.0, 13.0, 11.0, 6.0, 4.0, 6.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-15.6875, -15.247314453125, -14.80712890625, -14.366943359375, -13.9267578125, -13.486572265625, -13.04638671875, -12.606201171875, -12.166015625, -11.725830078125, -11.28564453125, -10.845458984375, -10.4052734375, -9.965087890625, -9.52490234375, -9.084716796875, -8.64453125, -8.204345703125, -7.76416015625, -7.323974609375, -6.8837890625, -6.443603515625, -6.00341796875, -5.563232421875, -5.123046875, -4.682861328125, -4.24267578125, -3.802490234375, -3.3623046875, -2.922119140625, -2.48193359375, -2.041748046875, -1.6015625, -1.161376953125, -0.72119140625, -0.281005859375, 0.1591796875, 0.599365234375, 1.03955078125, 1.479736328125, 1.919921875, 2.360107421875, 2.80029296875, 3.240478515625, 3.6806640625, 4.120849609375, 4.56103515625, 5.001220703125, 5.44140625, 5.881591796875, 6.32177734375, 6.761962890625, 7.2021484375, 7.642333984375, 8.08251953125, 8.522705078125, 8.962890625, 9.403076171875, 9.84326171875, 10.283447265625, 10.7236328125, 11.163818359375, 11.60400390625, 12.044189453125, 12.484375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 12.0, 12.0, 8.0, 24.0, 21.0, 32.0, 56.0, 75.0, 100.0, 174.0, 268.0, 451.0, 760.0, 1283.0, 2078.0, 3496.0, 6501.0, 13329.0, 67869.0, 842644.0, 79158.0, 14402.0, 6640.0, 3655.0, 2162.0, 1283.0, 775.0, 482.0, 283.0, 171.0, 96.0, 73.0, 47.0, 39.0, 22.0, 18.0, 8.0, 12.0, 8.0, 7.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.875, -27.01806640625, -26.1611328125, -25.30419921875, -24.447265625, -23.59033203125, -22.7333984375, -21.87646484375, -21.01953125, -20.16259765625, -19.3056640625, -18.44873046875, -17.591796875, -16.73486328125, -15.8779296875, -15.02099609375, -14.1640625, -13.30712890625, -12.4501953125, -11.59326171875, -10.736328125, -9.87939453125, -9.0224609375, -8.16552734375, -7.30859375, -6.45166015625, -5.5947265625, -4.73779296875, -3.880859375, -3.02392578125, -2.1669921875, -1.31005859375, -0.453125, 0.40380859375, 1.2607421875, 2.11767578125, 2.974609375, 3.83154296875, 4.6884765625, 5.54541015625, 6.40234375, 7.25927734375, 8.1162109375, 8.97314453125, 9.830078125, 10.68701171875, 11.5439453125, 12.40087890625, 13.2578125, 14.11474609375, 14.9716796875, 15.82861328125, 16.685546875, 17.54248046875, 18.3994140625, 19.25634765625, 20.11328125, 20.97021484375, 21.8271484375, 22.68408203125, 23.541015625, 24.39794921875, 25.2548828125, 26.11181640625, 26.96875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 7.0, 3.0, 7.0, 12.0, 20.0, 14.0, 16.0, 17.0, 25.0, 24.0, 41.0, 28.0, 39.0, 48.0, 55.0, 69.0, 79.0, 487.0, 1585.0, 85.0, 58.0, 48.0, 42.0, 54.0, 33.0, 32.0, 27.0, 29.0, 13.0, 9.0, 14.0, 10.0, 8.0, 1.0, 7.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.5, -44.951171875, -43.40234375, -41.853515625, -40.3046875, -38.755859375, -37.20703125, -35.658203125, -34.109375, -32.560546875, -31.01171875, -29.462890625, -27.9140625, -26.365234375, -24.81640625, -23.267578125, -21.71875, -20.169921875, -18.62109375, -17.072265625, -15.5234375, -13.974609375, -12.42578125, -10.876953125, -9.328125, -7.779296875, -6.23046875, -4.681640625, -3.1328125, -1.583984375, -0.03515625, 1.513671875, 3.0625, 4.611328125, 6.16015625, 7.708984375, 9.2578125, 10.806640625, 12.35546875, 13.904296875, 15.453125, 17.001953125, 18.55078125, 20.099609375, 21.6484375, 23.197265625, 24.74609375, 26.294921875, 27.84375, 29.392578125, 30.94140625, 32.490234375, 34.0390625, 35.587890625, 37.13671875, 38.685546875, 40.234375, 41.783203125, 43.33203125, 44.880859375, 46.4296875, 47.978515625, 49.52734375, 51.076171875, 52.625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 8.0, 16.0, 13.0, 17.0, 17.0, 29.0, 39.0, 43.0, 73.0, 107.0, 155.0, 434.0, 1715.0, 8807.0, 339904.0, 2779294.0, 11713.0, 2169.0, 508.0, 195.0, 107.0, 67.0, 59.0, 43.0, 32.0, 33.0, 18.0, 14.0, 14.0, 21.0, 12.0, 5.0, 7.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-86.5, -83.884765625, -81.26953125, -78.654296875, -76.0390625, -73.423828125, -70.80859375, -68.193359375, -65.578125, -62.962890625, -60.34765625, -57.732421875, -55.1171875, -52.501953125, -49.88671875, -47.271484375, -44.65625, -42.041015625, -39.42578125, -36.810546875, -34.1953125, -31.580078125, -28.96484375, -26.349609375, -23.734375, -21.119140625, -18.50390625, -15.888671875, -13.2734375, -10.658203125, -8.04296875, -5.427734375, -2.8125, -0.197265625, 2.41796875, 5.033203125, 7.6484375, 10.263671875, 12.87890625, 15.494140625, 18.109375, 20.724609375, 23.33984375, 25.955078125, 28.5703125, 31.185546875, 33.80078125, 36.416015625, 39.03125, 41.646484375, 44.26171875, 46.876953125, 49.4921875, 52.107421875, 54.72265625, 57.337890625, 59.953125, 62.568359375, 65.18359375, 67.798828125, 70.4140625, 73.029296875, 75.64453125, 78.259765625, 80.875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 19.0, 228.0, 602.0, 151.0, 15.0, 0.0, 1.0, 0.0, 1.0], "bins": [-409.54376220703125, -402.4053955078125, -395.26702880859375, -388.128662109375, -380.99029541015625, -373.8519287109375, -366.71356201171875, -359.5751953125, -352.43682861328125, -345.2984619140625, -338.16009521484375, -331.021728515625, -323.88336181640625, -316.7449951171875, -309.60662841796875, -302.46826171875, -295.3298645019531, -288.1914978027344, -281.0531311035156, -273.9147644042969, -266.7763977050781, -259.6380310058594, -252.49964904785156, -245.3612823486328, -238.22291564941406, -231.0845489501953, -223.94618225097656, -216.8078155517578, -209.66943359375, -202.53106689453125, -195.3927001953125, -188.25433349609375, -181.115966796875, -173.97760009765625, -166.8392333984375, -159.70086669921875, -152.5625, -145.42413330078125, -138.28575134277344, -131.1473846435547, -124.00901794433594, -116.87065124511719, -109.73228454589844, -102.59391021728516, -95.4555435180664, -88.31717681884766, -81.17880249023438, -74.04043579101562, -66.90206909179688, -59.763702392578125, -52.62533187866211, -45.486961364746094, -38.348594665527344, -31.210227966308594, -24.071857452392578, -16.933486938476562, -9.795124053955078, -2.6567554473876953, 4.4816131591796875, 11.61998176574707, 18.758350372314453, 25.896717071533203, 33.03508758544922, 40.173458099365234, 47.311824798583984]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 4.0, 8.0, 4.0, 7.0, 15.0, 8.0, 9.0, 12.0, 17.0, 16.0, 25.0, 19.0, 31.0, 26.0, 30.0, 27.0, 38.0, 42.0, 36.0, 47.0, 52.0, 54.0, 52.0, 34.0, 44.0, 39.0, 39.0, 36.0, 24.0, 35.0, 22.0, 20.0, 18.0, 16.0, 25.0, 13.0, 17.0, 11.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-114.6417236328125, -111.21849822998047, -107.79527282714844, -104.37203979492188, -100.94881439208984, -97.52558898925781, -94.10236358642578, -90.67913818359375, -87.25590515136719, -83.83267974853516, -80.40945434570312, -76.98622131347656, -73.56299591064453, -70.1397705078125, -66.71654510498047, -63.29331970214844, -59.870094299316406, -56.446868896484375, -53.02363967895508, -49.60041427612305, -46.17718505859375, -42.75395965576172, -39.33073425292969, -35.907508850097656, -32.48427963256836, -29.061052322387695, -25.63782501220703, -22.214599609375, -18.791372299194336, -15.368144989013672, -11.94491958618164, -8.521692276000977, -5.098457336425781, -1.6752305030822754, 1.7479963302612305, 5.171222686767578, 8.594449996948242, 12.017677307128906, 15.440902709960938, 18.8641300201416, 22.287357330322266, 25.71058464050293, 29.133811950683594, 32.557037353515625, 35.980262756347656, 39.40349197387695, 42.826717376708984, 46.24994659423828, 49.67317199707031, 53.096397399902344, 56.51962661743164, 59.94285202026367, 63.36608123779297, 66.789306640625, 70.21253204345703, 73.63575744628906, 77.05899047851562, 80.48221588134766, 83.90544128417969, 87.32867431640625, 90.75189971923828, 94.17512512207031, 97.59835052490234, 101.02157592773438, 104.4448013305664]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 3.0, 4.0, 9.0, 19.0, 18.0, 25.0, 24.0, 22.0, 39.0, 29.0, 33.0, 30.0, 34.0, 32.0, 51.0, 44.0, 42.0, 46.0, 53.0, 42.0, 40.0, 33.0, 46.0, 36.0, 29.0, 38.0, 35.0, 29.0, 22.0, 15.0, 16.0, 7.0, 11.0, 5.0, 8.0, 4.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-16.25, -15.7802734375, -15.310546875, -14.8408203125, -14.37109375, -13.9013671875, -13.431640625, -12.9619140625, -12.4921875, -12.0224609375, -11.552734375, -11.0830078125, -10.61328125, -10.1435546875, -9.673828125, -9.2041015625, -8.734375, -8.2646484375, -7.794921875, -7.3251953125, -6.85546875, -6.3857421875, -5.916015625, -5.4462890625, -4.9765625, -4.5068359375, -4.037109375, -3.5673828125, -3.09765625, -2.6279296875, -2.158203125, -1.6884765625, -1.21875, -0.7490234375, -0.279296875, 0.1904296875, 0.66015625, 1.1298828125, 1.599609375, 2.0693359375, 2.5390625, 3.0087890625, 3.478515625, 3.9482421875, 4.41796875, 4.8876953125, 5.357421875, 5.8271484375, 6.296875, 6.7666015625, 7.236328125, 7.7060546875, 8.17578125, 8.6455078125, 9.115234375, 9.5849609375, 10.0546875, 10.5244140625, 10.994140625, 11.4638671875, 11.93359375, 12.4033203125, 12.873046875, 13.3427734375, 13.8125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 2.0, 8.0, 12.0, 22.0, 26.0, 35.0, 39.0, 79.0, 126.0, 196.0, 348.0, 666.0, 1457.0, 3202.0, 7336.0, 18503.0, 62129.0, 600904.0, 3030853.0, 391512.0, 49195.0, 15962.0, 6419.0, 2653.0, 1208.0, 554.0, 321.0, 195.0, 105.0, 73.0, 38.0, 26.0, 12.0, 18.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-35.4375, -34.407958984375, -33.37841796875, -32.348876953125, -31.3193359375, -30.289794921875, -29.26025390625, -28.230712890625, -27.201171875, -26.171630859375, -25.14208984375, -24.112548828125, -23.0830078125, -22.053466796875, -21.02392578125, -19.994384765625, -18.96484375, -17.935302734375, -16.90576171875, -15.876220703125, -14.8466796875, -13.817138671875, -12.78759765625, -11.758056640625, -10.728515625, -9.698974609375, -8.66943359375, -7.639892578125, -6.6103515625, -5.580810546875, -4.55126953125, -3.521728515625, -2.4921875, -1.462646484375, -0.43310546875, 0.596435546875, 1.6259765625, 2.655517578125, 3.68505859375, 4.714599609375, 5.744140625, 6.773681640625, 7.80322265625, 8.832763671875, 9.8623046875, 10.891845703125, 11.92138671875, 12.950927734375, 13.98046875, 15.010009765625, 16.03955078125, 17.069091796875, 18.0986328125, 19.128173828125, 20.15771484375, 21.187255859375, 22.216796875, 23.246337890625, 24.27587890625, 25.305419921875, 26.3349609375, 27.364501953125, 28.39404296875, 29.423583984375, 30.453125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 10.0, 6.0, 12.0, 19.0, 24.0, 44.0, 58.0, 87.0, 179.0, 357.0, 914.0, 1239.0, 578.0, 265.0, 121.0, 56.0, 28.0, 38.0, 14.0, 6.0, 12.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.40625, -51.07080078125, -49.7353515625, -48.39990234375, -47.064453125, -45.72900390625, -44.3935546875, -43.05810546875, -41.72265625, -40.38720703125, -39.0517578125, -37.71630859375, -36.380859375, -35.04541015625, -33.7099609375, -32.37451171875, -31.0390625, -29.70361328125, -28.3681640625, -27.03271484375, -25.697265625, -24.36181640625, -23.0263671875, -21.69091796875, -20.35546875, -19.02001953125, -17.6845703125, -16.34912109375, -15.013671875, -13.67822265625, -12.3427734375, -11.00732421875, -9.671875, -8.33642578125, -7.0009765625, -5.66552734375, -4.330078125, -2.99462890625, -1.6591796875, -0.32373046875, 1.01171875, 2.34716796875, 3.6826171875, 5.01806640625, 6.353515625, 7.68896484375, 9.0244140625, 10.35986328125, 11.6953125, 13.03076171875, 14.3662109375, 15.70166015625, 17.037109375, 18.37255859375, 19.7080078125, 21.04345703125, 22.37890625, 23.71435546875, 25.0498046875, 26.38525390625, 27.720703125, 29.05615234375, 30.3916015625, 31.72705078125, 33.0625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 5.0, 10.0, 10.0, 16.0, 28.0, 67.0, 96.0, 263.0, 568.0, 2158.0, 16275.0, 559943.0, 3571722.0, 38117.0, 3546.0, 806.0, 332.0, 142.0, 72.0, 37.0, 38.0, 15.0, 4.0, 9.0, 3.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.8125, -66.5126953125, -63.212890625, -59.9130859375, -56.61328125, -53.3134765625, -50.013671875, -46.7138671875, -43.4140625, -40.1142578125, -36.814453125, -33.5146484375, -30.21484375, -26.9150390625, -23.615234375, -20.3154296875, -17.015625, -13.7158203125, -10.416015625, -7.1162109375, -3.81640625, -0.5166015625, 2.783203125, 6.0830078125, 9.3828125, 12.6826171875, 15.982421875, 19.2822265625, 22.58203125, 25.8818359375, 29.181640625, 32.4814453125, 35.78125, 39.0810546875, 42.380859375, 45.6806640625, 48.98046875, 52.2802734375, 55.580078125, 58.8798828125, 62.1796875, 65.4794921875, 68.779296875, 72.0791015625, 75.37890625, 78.6787109375, 81.978515625, 85.2783203125, 88.578125, 91.8779296875, 95.177734375, 98.4775390625, 101.77734375, 105.0771484375, 108.376953125, 111.6767578125, 114.9765625, 118.2763671875, 121.576171875, 124.8759765625, 128.17578125, 131.4755859375, 134.775390625, 138.0751953125, 141.375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 14.0, 68.0, 183.0, 338.0, 259.0, 104.0, 23.0, 11.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.5100860595703, -227.67068481445312, -218.83128356933594, -209.99188232421875, -201.15248107910156, -192.31307983398438, -183.47369384765625, -174.63427734375, -165.79489135742188, -156.9554901123047, -148.1160888671875, -139.2766876220703, -130.43728637695312, -121.59788513183594, -112.75849151611328, -103.9190902709961, -95.07968139648438, -86.24028015136719, -77.40087890625, -68.56147766113281, -59.72208023071289, -50.8826789855957, -42.04328155517578, -33.203880310058594, -24.364479064941406, -15.525078773498535, -6.685678482055664, 2.1537208557128906, 10.993122100830078, 19.832523345947266, 28.671920776367188, 37.511322021484375, 46.350738525390625, 55.19013977050781, 64.029541015625, 72.86894226074219, 81.70834350585938, 90.54774475097656, 99.38713836669922, 108.2265396118164, 117.0659408569336, 125.90534210205078, 134.74473571777344, 143.58413696289062, 152.4235382080078, 161.262939453125, 170.1023406982422, 178.94174194335938, 187.78114318847656, 196.62054443359375, 205.45994567871094, 214.29934692382812, 223.1387481689453, 231.9781494140625, 240.81753540039062, 249.65695190429688, 258.496337890625, 267.3357238769531, 276.1751403808594, 285.0145263671875, 293.85394287109375, 302.6933288574219, 311.5327453613281, 320.37213134765625, 329.2115478515625]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 9.0, 7.0, 15.0, 16.0, 24.0, 23.0, 29.0, 32.0, 32.0, 26.0, 39.0, 33.0, 45.0, 36.0, 44.0, 64.0, 47.0, 53.0, 44.0, 44.0, 46.0, 42.0, 38.0, 27.0, 23.0, 21.0, 23.0, 13.0, 9.0, 13.0, 11.0, 13.0, 6.0, 8.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.86015319824219, -84.16903686523438, -81.47792053222656, -78.78680419921875, -76.09568786621094, -73.40457153320312, -70.71345520019531, -68.02234649658203, -65.33123016357422, -62.640113830566406, -59.948997497558594, -57.25788116455078, -54.566768646240234, -51.87565231323242, -49.18453598022461, -46.49342346191406, -43.802303314208984, -41.11118698120117, -38.42007064819336, -35.72895812988281, -33.037841796875, -30.346725463867188, -27.655609130859375, -24.964494705200195, -22.273378372192383, -19.58226203918457, -16.89114761352539, -14.200031280517578, -11.508915901184082, -8.817800521850586, -6.126684188842773, -3.4355697631835938, -0.7444534301757812, 1.946662187576294, 4.637777805328369, 7.328893661499023, 10.02000904083252, 12.711124420166016, 15.402240753173828, 18.093355178833008, 20.78447151184082, 23.475587844848633, 26.166702270507812, 28.857818603515625, 31.548934936523438, 34.24005126953125, 36.93116760253906, 39.62228012084961, 42.31339645385742, 45.004512786865234, 47.69562911987305, 50.386741638183594, 53.077857971191406, 55.76897430419922, 58.46009063720703, 61.151206970214844, 63.842323303222656, 66.53343963623047, 69.22455596923828, 71.9156723022461, 74.6067886352539, 77.29789733886719, 79.989013671875, 82.68013000488281, 85.37124633789062]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 3.0, 8.0, 7.0, 9.0, 7.0, 18.0, 20.0, 12.0, 26.0, 15.0, 28.0, 23.0, 28.0, 41.0, 48.0, 36.0, 46.0, 44.0, 40.0, 51.0, 47.0, 47.0, 41.0, 38.0, 24.0, 31.0, 32.0, 37.0, 22.0, 31.0, 23.0, 28.0, 14.0, 15.0, 12.0, 7.0, 8.0, 8.0, 5.0, 6.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.6171875, -15.142333984375, -14.66748046875, -14.192626953125, -13.7177734375, -13.242919921875, -12.76806640625, -12.293212890625, -11.818359375, -11.343505859375, -10.86865234375, -10.393798828125, -9.9189453125, -9.444091796875, -8.96923828125, -8.494384765625, -8.01953125, -7.544677734375, -7.06982421875, -6.594970703125, -6.1201171875, -5.645263671875, -5.17041015625, -4.695556640625, -4.220703125, -3.745849609375, -3.27099609375, -2.796142578125, -2.3212890625, -1.846435546875, -1.37158203125, -0.896728515625, -0.421875, 0.052978515625, 0.52783203125, 1.002685546875, 1.4775390625, 1.952392578125, 2.42724609375, 2.902099609375, 3.376953125, 3.851806640625, 4.32666015625, 4.801513671875, 5.2763671875, 5.751220703125, 6.22607421875, 6.700927734375, 7.17578125, 7.650634765625, 8.12548828125, 8.600341796875, 9.0751953125, 9.550048828125, 10.02490234375, 10.499755859375, 10.974609375, 11.449462890625, 11.92431640625, 12.399169921875, 12.8740234375, 13.348876953125, 13.82373046875, 14.298583984375, 14.7734375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 14.0, 26.0, 34.0, 49.0, 81.0, 90.0, 144.0, 205.0, 301.0, 392.0, 578.0, 774.0, 1100.0, 1631.0, 2299.0, 3372.0, 4837.0, 7355.0, 10752.0, 15642.0, 22850.0, 34038.0, 49726.0, 72827.0, 108253.0, 162610.0, 178455.0, 118871.0, 79991.0, 54474.0, 37246.0, 25333.0, 17239.0, 11485.0, 7981.0, 5412.0, 3644.0, 2532.0, 1692.0, 1283.0, 881.0, 677.0, 424.0, 299.0, 194.0, 137.0, 103.0, 62.0, 52.0, 28.0, 35.0, 17.0, 8.0, 6.0, 3.0, 5.0, 3.0, 3.0], "bins": [-0.247802734375, -0.24008750915527344, -0.23237228393554688, -0.2246570587158203, -0.21694183349609375, -0.2092266082763672, -0.20151138305664062, -0.19379615783691406, -0.1860809326171875, -0.17836570739746094, -0.17065048217773438, -0.1629352569580078, -0.15522003173828125, -0.1475048065185547, -0.13978958129882812, -0.13207435607910156, -0.124359130859375, -0.11664390563964844, -0.10892868041992188, -0.10121345520019531, -0.09349822998046875, -0.08578300476074219, -0.07806777954101562, -0.07035255432128906, -0.0626373291015625, -0.05492210388183594, -0.047206878662109375, -0.03949165344238281, -0.03177642822265625, -0.024061203002929688, -0.016345977783203125, -0.008630752563476562, -0.00091552734375, 0.0067996978759765625, 0.014514923095703125, 0.022230148315429688, 0.02994537353515625, 0.03766059875488281, 0.045375823974609375, 0.05309104919433594, 0.0608062744140625, 0.06852149963378906, 0.07623672485351562, 0.08395195007324219, 0.09166717529296875, 0.09938240051269531, 0.10709762573242188, 0.11481285095214844, 0.122528076171875, 0.13024330139160156, 0.13795852661132812, 0.1456737518310547, 0.15338897705078125, 0.1611042022705078, 0.16881942749023438, 0.17653465270996094, 0.1842498779296875, 0.19196510314941406, 0.19968032836914062, 0.2073955535888672, 0.21511077880859375, 0.2228260040283203, 0.23054122924804688, 0.23825645446777344, 0.2459716796875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 11.0, 8.0, 11.0, 12.0, 17.0, 25.0, 20.0, 23.0, 31.0, 26.0, 32.0, 46.0, 38.0, 48.0, 51.0, 37.0, 34.0, 1070.0, 41.0, 54.0, 40.0, 37.0, 40.0, 42.0, 33.0, 31.0, 21.0, 31.0, 19.0, 13.0, 21.0, 8.0, 12.0, 7.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-14.1328125, -13.7530517578125, -13.373291015625, -12.9935302734375, -12.61376953125, -12.2340087890625, -11.854248046875, -11.4744873046875, -11.0947265625, -10.7149658203125, -10.335205078125, -9.9554443359375, -9.57568359375, -9.1959228515625, -8.816162109375, -8.4364013671875, -8.056640625, -7.6768798828125, -7.297119140625, -6.9173583984375, -6.53759765625, -6.1578369140625, -5.778076171875, -5.3983154296875, -5.0185546875, -4.6387939453125, -4.259033203125, -3.8792724609375, -3.49951171875, -3.1197509765625, -2.739990234375, -2.3602294921875, -1.98046875, -1.6007080078125, -1.220947265625, -0.8411865234375, -0.46142578125, -0.0816650390625, 0.298095703125, 0.6778564453125, 1.0576171875, 1.4373779296875, 1.817138671875, 2.1968994140625, 2.57666015625, 2.9564208984375, 3.336181640625, 3.7159423828125, 4.095703125, 4.4754638671875, 4.855224609375, 5.2349853515625, 5.61474609375, 5.9945068359375, 6.374267578125, 6.7540283203125, 7.1337890625, 7.5135498046875, 7.893310546875, 8.2730712890625, 8.65283203125, 9.0325927734375, 9.412353515625, 9.7921142578125, 10.171875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 7.0, 7.0, 15.0, 15.0, 35.0, 45.0, 83.0, 130.0, 238.0, 346.0, 573.0, 1062.0, 1704.0, 2788.0, 4731.0, 7675.0, 13309.0, 22927.0, 40266.0, 73250.0, 143613.0, 1320608.0, 219563.0, 109297.0, 57836.0, 32055.0, 18261.0, 10751.0, 6283.0, 3841.0, 2210.0, 1425.0, 859.0, 492.0, 319.0, 182.0, 101.0, 75.0, 51.0, 30.0, 18.0, 16.0, 8.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2265625, -0.21965599060058594, -0.21274948120117188, -0.2058429718017578, -0.19893646240234375, -0.1920299530029297, -0.18512344360351562, -0.17821693420410156, -0.1713104248046875, -0.16440391540527344, -0.15749740600585938, -0.1505908966064453, -0.14368438720703125, -0.1367778778076172, -0.12987136840820312, -0.12296485900878906, -0.116058349609375, -0.10915184020996094, -0.10224533081054688, -0.09533882141113281, -0.08843231201171875, -0.08152580261230469, -0.07461929321289062, -0.06771278381347656, -0.0608062744140625, -0.05389976501464844, -0.046993255615234375, -0.04008674621582031, -0.03318023681640625, -0.026273727416992188, -0.019367218017578125, -0.012460708618164062, -0.00555419921875, 0.0013523101806640625, 0.008258819580078125, 0.015165328979492188, 0.02207183837890625, 0.028978347778320312, 0.035884857177734375, 0.04279136657714844, 0.0496978759765625, 0.05660438537597656, 0.06351089477539062, 0.07041740417480469, 0.07732391357421875, 0.08423042297363281, 0.09113693237304688, 0.09804344177246094, 0.104949951171875, 0.11185646057128906, 0.11876296997070312, 0.1256694793701172, 0.13257598876953125, 0.1394824981689453, 0.14638900756835938, 0.15329551696777344, 0.1602020263671875, 0.16710853576660156, 0.17401504516601562, 0.1809215545654297, 0.18782806396484375, 0.1947345733642578, 0.20164108276367188, 0.20854759216308594, 0.2154541015625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 14.0, 14.0, 6.0, 20.0, 11.0, 20.0, 16.0, 17.0, 25.0, 30.0, 35.0, 44.0, 26.0, 27.0, 45.0, 42.0, 58.0, 51.0, 53.0, 46.0, 39.0, 52.0, 36.0, 30.0, 24.0, 30.0, 28.0, 18.0, 22.0, 21.0, 10.0, 18.0, 16.0, 7.0, 5.0, 8.0, 4.0, 3.0, 5.0, 3.0, 6.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003867149353027344, -0.00037195533514022827, -0.00035719573497772217, -0.00034243613481521606, -0.00032767653465270996, -0.00031291693449020386, -0.00029815733432769775, -0.00028339773416519165, -0.00026863813400268555, -0.00025387853384017944, -0.00023911893367767334, -0.00022435933351516724, -0.00020959973335266113, -0.00019484013319015503, -0.00018008053302764893, -0.00016532093286514282, -0.00015056133270263672, -0.00013580173254013062, -0.00012104213237762451, -0.00010628253221511841, -9.15229320526123e-05, -7.67633318901062e-05, -6.20037317276001e-05, -4.7244131565093994e-05, -3.248453140258789e-05, -1.7724931240081787e-05, -2.9653310775756836e-06, 1.179426908493042e-05, 2.6553869247436523e-05, 4.131346940994263e-05, 5.607306957244873e-05, 7.083266973495483e-05, 8.559226989746094e-05, 0.00010035187005996704, 0.00011511147022247314, 0.00012987107038497925, 0.00014463067054748535, 0.00015939027070999146, 0.00017414987087249756, 0.00018890947103500366, 0.00020366907119750977, 0.00021842867136001587, 0.00023318827152252197, 0.0002479478716850281, 0.0002627074718475342, 0.0002774670720100403, 0.0002922266721725464, 0.0003069862723350525, 0.0003217458724975586, 0.0003365054726600647, 0.0003512650728225708, 0.0003660246729850769, 0.000380784273147583, 0.0003955438733100891, 0.0004103034734725952, 0.0004250630736351013, 0.0004398226737976074, 0.0004545822739601135, 0.00046934187412261963, 0.00048410147428512573, 0.0004988610744476318, 0.0005136206746101379, 0.000528380274772644, 0.0005431398749351501, 0.0005578994750976562]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 0.0, 6.0, 4.0, 4.0, 6.0, 7.0, 9.0, 11.0, 15.0, 18.0, 22.0, 17.0, 26.0, 34.0, 33.0, 41.0, 68.0, 102.0, 181.0, 303.0, 863.0, 20004.0, 1019707.0, 5481.0, 678.0, 315.0, 130.0, 87.0, 69.0, 68.0, 40.0, 43.0, 28.0, 15.0, 21.0, 15.0, 14.0, 15.0, 6.0, 10.0, 16.0, 4.0, 4.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0], "bins": [-0.0124359130859375, -0.01210319995880127, -0.011770486831665039, -0.011437773704528809, -0.011105060577392578, -0.010772347450256348, -0.010439634323120117, -0.010106921195983887, -0.009774208068847656, -0.009441494941711426, -0.009108781814575195, -0.008776068687438965, -0.008443355560302734, -0.008110642433166504, -0.0077779293060302734, -0.007445216178894043, -0.0071125030517578125, -0.006779789924621582, -0.0064470767974853516, -0.006114363670349121, -0.005781650543212891, -0.00544893741607666, -0.00511622428894043, -0.004783511161804199, -0.004450798034667969, -0.004118084907531738, -0.003785371780395508, -0.0034526586532592773, -0.003119945526123047, -0.0027872323989868164, -0.002454519271850586, -0.0021218061447143555, -0.001789093017578125, -0.0014563798904418945, -0.001123666763305664, -0.0007909536361694336, -0.0004582405090332031, -0.00012552738189697266, 0.0002071857452392578, 0.0005398988723754883, 0.0008726119995117188, 0.0012053251266479492, 0.0015380382537841797, 0.0018707513809204102, 0.0022034645080566406, 0.002536177635192871, 0.0028688907623291016, 0.003201603889465332, 0.0035343170166015625, 0.003867030143737793, 0.0041997432708740234, 0.004532456398010254, 0.004865169525146484, 0.005197882652282715, 0.005530595779418945, 0.005863308906555176, 0.006196022033691406, 0.006528735160827637, 0.006861448287963867, 0.007194161415100098, 0.007526874542236328, 0.007859587669372559, 0.008192300796508789, 0.00852501392364502, 0.00885772705078125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 371.0, 641.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011258742772042751, -0.011014152318239212, -0.010769560933113098, -0.010524969547986984, -0.010280379094183445, -0.010035788640379906, -0.009791197255253792, -0.009546605870127678, -0.009302015416324139, -0.0090574249625206, -0.008812833577394485, -0.008568242192268372, -0.008323651738464832, -0.008079061284661293, -0.00783446989953518, -0.0075898789800703526, -0.007345288060605526, -0.007100697141140699, -0.006856106221675873, -0.006611515302211046, -0.00636692438274622, -0.006122333463281393, -0.0058777425438165665, -0.00563315162435174, -0.005388560704886913, -0.005143969785422087, -0.00489937886595726, -0.0046547879464924335, -0.004410197027027607, -0.00416560610756278, -0.003921015188097954, -0.003676424268633127, -0.0034318342804908752, -0.0031872433610260487, -0.002942652441561222, -0.0026980615220963955, -0.002453470602631569, -0.0022088796831667423, -0.0019642887637019157, -0.0017196978442370892, -0.0014751069247722626, -0.001230516005307436, -0.0009859250858426094, -0.0007413341663777828, -0.0004967432469129562, -0.00025215232744812965, -7.56140798330307e-06, 0.00023702951148152351, 0.0004816204309463501, 0.0007262113504111767, 0.0009708022698760033, 0.0012153931893408298, 0.0014599841088056564, 0.001704575028270483, 0.0019491659477353096, 0.002193756867200136, 0.0024383477866649628, 0.0026829387061297894, 0.002927529625594616, 0.0031721205450594425, 0.003416711464524269, 0.0036613023839890957, 0.0039058933034539223, 0.004150484222918749, 0.0043950751423835754]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 17.0, 32.0, 35.0, 48.0, 63.0, 81.0, 103.0, 116.0, 107.0, 86.0, 84.0, 74.0, 44.0, 36.0, 28.0, 22.0, 11.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000894010066986084, -0.00086224265396595, -0.000830475240945816, -0.0007987078279256821, -0.0007669404149055481, -0.0007351730018854141, -0.0007034055888652802, -0.0006716381758451462, -0.0006398707628250122, -0.0006081033498048782, -0.0005763359367847443, -0.0005445685237646103, -0.0005128011107444763, -0.00048103369772434235, -0.0004492662847042084, -0.0004174988716840744, -0.00038573145866394043, -0.00035396404564380646, -0.0003221966326236725, -0.0002904292196035385, -0.00025866180658340454, -0.00022689439356327057, -0.0001951269805431366, -0.00016335956752300262, -0.00013159215450286865, -9.982474148273468e-05, -6.805732846260071e-05, -3.6289915442466736e-05, -4.522502422332764e-06, 2.724491059780121e-05, 5.901232361793518e-05, 9.077973663806915e-05, 0.00012254714965820312, 0.0001543145626783371, 0.00018608197569847107, 0.00021784938871860504, 0.000249616801738739, 0.000281384214758873, 0.00031315162777900696, 0.00034491904079914093, 0.0003766864538192749, 0.0004084538668394089, 0.00044022127985954285, 0.0004719886928796768, 0.0005037561058998108, 0.0005355235189199448, 0.0005672909319400787, 0.0005990583449602127, 0.0006308257579803467, 0.0006625931710004807, 0.0006943605840206146, 0.0007261279970407486, 0.0007578954100608826, 0.0007896628230810165, 0.0008214302361011505, 0.0008531976491212845, 0.0008849650621414185, 0.0009167324751615524, 0.0009484998881816864, 0.0009802673012018204, 0.0010120347142219543, 0.0010438021272420883, 0.0010755695402622223, 0.0011073369532823563, 0.0011391043663024902]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 3.0, 8.0, 7.0, 9.0, 7.0, 18.0, 20.0, 12.0, 26.0, 15.0, 28.0, 23.0, 28.0, 41.0, 48.0, 36.0, 46.0, 44.0, 40.0, 51.0, 47.0, 47.0, 41.0, 38.0, 24.0, 31.0, 32.0, 37.0, 22.0, 31.0, 23.0, 28.0, 14.0, 15.0, 12.0, 7.0, 8.0, 8.0, 5.0, 6.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.6171875, -15.142333984375, -14.66748046875, -14.192626953125, -13.7177734375, -13.242919921875, -12.76806640625, -12.293212890625, -11.818359375, -11.343505859375, -10.86865234375, -10.393798828125, -9.9189453125, -9.444091796875, -8.96923828125, -8.494384765625, -8.01953125, -7.544677734375, -7.06982421875, -6.594970703125, -6.1201171875, -5.645263671875, -5.17041015625, -4.695556640625, -4.220703125, -3.745849609375, -3.27099609375, -2.796142578125, -2.3212890625, -1.846435546875, -1.37158203125, -0.896728515625, -0.421875, 0.052978515625, 0.52783203125, 1.002685546875, 1.4775390625, 1.952392578125, 2.42724609375, 2.902099609375, 3.376953125, 3.851806640625, 4.32666015625, 4.801513671875, 5.2763671875, 5.751220703125, 6.22607421875, 6.700927734375, 7.17578125, 7.650634765625, 8.12548828125, 8.600341796875, 9.0751953125, 9.550048828125, 10.02490234375, 10.499755859375, 10.974609375, 11.449462890625, 11.92431640625, 12.399169921875, 12.8740234375, 13.348876953125, 13.82373046875, 14.298583984375, 14.7734375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 14.0, 21.0, 16.0, 32.0, 31.0, 53.0, 78.0, 100.0, 136.0, 187.0, 293.0, 444.0, 683.0, 1071.0, 1834.0, 3074.0, 5362.0, 9188.0, 17119.0, 46504.0, 736559.0, 168389.0, 27006.0, 12746.0, 7052.0, 4042.0, 2417.0, 1438.0, 879.0, 542.0, 387.0, 227.0, 150.0, 117.0, 72.0, 67.0, 52.0, 31.0, 20.0, 21.0, 19.0, 16.0, 15.0, 13.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-28.234375, -27.372802734375, -26.51123046875, -25.649658203125, -24.7880859375, -23.926513671875, -23.06494140625, -22.203369140625, -21.341796875, -20.480224609375, -19.61865234375, -18.757080078125, -17.8955078125, -17.033935546875, -16.17236328125, -15.310791015625, -14.44921875, -13.587646484375, -12.72607421875, -11.864501953125, -11.0029296875, -10.141357421875, -9.27978515625, -8.418212890625, -7.556640625, -6.695068359375, -5.83349609375, -4.971923828125, -4.1103515625, -3.248779296875, -2.38720703125, -1.525634765625, -0.6640625, 0.197509765625, 1.05908203125, 1.920654296875, 2.7822265625, 3.643798828125, 4.50537109375, 5.366943359375, 6.228515625, 7.090087890625, 7.95166015625, 8.813232421875, 9.6748046875, 10.536376953125, 11.39794921875, 12.259521484375, 13.12109375, 13.982666015625, 14.84423828125, 15.705810546875, 16.5673828125, 17.428955078125, 18.29052734375, 19.152099609375, 20.013671875, 20.875244140625, 21.73681640625, 22.598388671875, 23.4599609375, 24.321533203125, 25.18310546875, 26.044677734375, 26.90625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 5.0, 4.0, 9.0, 17.0, 19.0, 21.0, 31.0, 24.0, 29.0, 38.0, 35.0, 44.0, 36.0, 46.0, 67.0, 103.0, 1743.0, 264.0, 80.0, 59.0, 43.0, 46.0, 37.0, 35.0, 28.0, 28.0, 18.0, 23.0, 10.0, 15.0, 16.0, 9.0, 11.0, 10.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.34375, -36.04638671875, -34.7490234375, -33.45166015625, -32.154296875, -30.85693359375, -29.5595703125, -28.26220703125, -26.96484375, -25.66748046875, -24.3701171875, -23.07275390625, -21.775390625, -20.47802734375, -19.1806640625, -17.88330078125, -16.5859375, -15.28857421875, -13.9912109375, -12.69384765625, -11.396484375, -10.09912109375, -8.8017578125, -7.50439453125, -6.20703125, -4.90966796875, -3.6123046875, -2.31494140625, -1.017578125, 0.27978515625, 1.5771484375, 2.87451171875, 4.171875, 5.46923828125, 6.7666015625, 8.06396484375, 9.361328125, 10.65869140625, 11.9560546875, 13.25341796875, 14.55078125, 15.84814453125, 17.1455078125, 18.44287109375, 19.740234375, 21.03759765625, 22.3349609375, 23.63232421875, 24.9296875, 26.22705078125, 27.5244140625, 28.82177734375, 30.119140625, 31.41650390625, 32.7138671875, 34.01123046875, 35.30859375, 36.60595703125, 37.9033203125, 39.20068359375, 40.498046875, 41.79541015625, 43.0927734375, 44.39013671875, 45.6875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 9.0, 5.0, 9.0, 14.0, 14.0, 22.0, 16.0, 29.0, 22.0, 47.0, 83.0, 103.0, 179.0, 376.0, 1167.0, 4473.0, 25157.0, 2948441.0, 149995.0, 11471.0, 2518.0, 724.0, 316.0, 149.0, 94.0, 56.0, 41.0, 40.0, 26.0, 29.0, 19.0, 10.0, 9.0, 8.0, 8.0, 6.0, 1.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.0, -78.5302734375, -76.060546875, -73.5908203125, -71.12109375, -68.6513671875, -66.181640625, -63.7119140625, -61.2421875, -58.7724609375, -56.302734375, -53.8330078125, -51.36328125, -48.8935546875, -46.423828125, -43.9541015625, -41.484375, -39.0146484375, -36.544921875, -34.0751953125, -31.60546875, -29.1357421875, -26.666015625, -24.1962890625, -21.7265625, -19.2568359375, -16.787109375, -14.3173828125, -11.84765625, -9.3779296875, -6.908203125, -4.4384765625, -1.96875, 0.5009765625, 2.970703125, 5.4404296875, 7.91015625, 10.3798828125, 12.849609375, 15.3193359375, 17.7890625, 20.2587890625, 22.728515625, 25.1982421875, 27.66796875, 30.1376953125, 32.607421875, 35.0771484375, 37.546875, 40.0166015625, 42.486328125, 44.9560546875, 47.42578125, 49.8955078125, 52.365234375, 54.8349609375, 57.3046875, 59.7744140625, 62.244140625, 64.7138671875, 67.18359375, 69.6533203125, 72.123046875, 74.5927734375, 77.0625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 13.0, 59.0, 187.0, 363.0, 280.0, 71.0, 30.0, 6.0, 0.0, 2.0], "bins": [-248.97499084472656, -244.65927124023438, -240.34356689453125, -236.02784729003906, -231.71212768554688, -227.3964080810547, -223.0806884765625, -218.76498413085938, -214.4492645263672, -210.133544921875, -205.81784057617188, -201.5021209716797, -197.1864013671875, -192.8706817626953, -188.55496215820312, -184.2392578125, -179.9235382080078, -175.60781860351562, -171.2921142578125, -166.9763946533203, -162.66067504882812, -158.34495544433594, -154.02923583984375, -149.71353149414062, -145.39781188964844, -141.08209228515625, -136.76638793945312, -132.45066833496094, -128.13494873046875, -123.81922912597656, -119.5035171508789, -115.18780517578125, -110.87207794189453, -106.55636596679688, -102.24064636230469, -97.9249267578125, -93.60921478271484, -89.29350280761719, -84.977783203125, -80.66206359863281, -76.34635162353516, -72.0306396484375, -67.71492004394531, -63.39920425415039, -59.08348846435547, -54.76777267456055, -50.452056884765625, -46.1363410949707, -41.82062530517578, -37.50490951538086, -33.18919372558594, -28.873477935791016, -24.557762145996094, -20.242046356201172, -15.92633056640625, -11.610614776611328, -7.294897079467773, -2.9791812896728516, 1.3365345001220703, 5.652250289916992, 9.967966079711914, 14.283681869506836, 18.599397659301758, 22.91511344909668, 27.2308292388916]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 10.0, 9.0, 10.0, 7.0, 9.0, 19.0, 20.0, 27.0, 21.0, 34.0, 23.0, 26.0, 34.0, 30.0, 26.0, 34.0, 33.0, 34.0, 21.0, 40.0, 46.0, 32.0, 42.0, 37.0, 39.0, 37.0, 42.0, 20.0, 37.0, 20.0, 22.0, 13.0, 25.0, 22.0, 19.0, 19.0, 8.0, 8.0, 7.0, 12.0, 3.0, 4.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-95.50756072998047, -92.47132110595703, -89.43508911132812, -86.39884948730469, -83.36260986328125, -80.32637786865234, -77.2901382446289, -74.25390625, -71.21766662597656, -68.18142700195312, -65.14519500732422, -62.10895538330078, -59.07271957397461, -56.03648376464844, -53.000244140625, -49.96400833129883, -46.927772521972656, -43.891536712646484, -40.85530090332031, -37.819061279296875, -34.7828254699707, -31.74658966064453, -28.710351943969727, -25.674114227294922, -22.63787841796875, -19.601642608642578, -16.565404891967773, -13.529168128967285, -10.492931365966797, -7.456694602966309, -4.42045783996582, -1.3842201232910156, 1.6520156860351562, 4.6882524490356445, 7.724489212036133, 10.760725975036621, 13.79696273803711, 16.83319854736328, 19.869436264038086, 22.90567398071289, 25.941909790039062, 28.978145599365234, 32.014381408691406, 35.050621032714844, 38.086856842041016, 41.12309265136719, 44.159332275390625, 47.1955680847168, 50.23180389404297, 53.26803970336914, 56.30427551269531, 59.34051513671875, 62.37675094604492, 65.4129867553711, 68.44922637939453, 71.48545837402344, 74.52169799804688, 77.55793762207031, 80.59416961669922, 83.63040924072266, 86.66664123535156, 89.702880859375, 92.73912048339844, 95.77536010742188, 98.81159210205078]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 6.0, 10.0, 7.0, 5.0, 15.0, 14.0, 13.0, 17.0, 20.0, 21.0, 23.0, 25.0, 33.0, 36.0, 43.0, 36.0, 44.0, 39.0, 39.0, 50.0, 43.0, 35.0, 47.0, 31.0, 46.0, 28.0, 34.0, 23.0, 26.0, 30.0, 28.0, 19.0, 16.0, 21.0, 12.0, 12.0, 17.0, 5.0, 5.0, 1.0, 4.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.5625, -15.1065673828125, -14.650634765625, -14.1947021484375, -13.73876953125, -13.2828369140625, -12.826904296875, -12.3709716796875, -11.9150390625, -11.4591064453125, -11.003173828125, -10.5472412109375, -10.09130859375, -9.6353759765625, -9.179443359375, -8.7235107421875, -8.267578125, -7.8116455078125, -7.355712890625, -6.8997802734375, -6.44384765625, -5.9879150390625, -5.531982421875, -5.0760498046875, -4.6201171875, -4.1641845703125, -3.708251953125, -3.2523193359375, -2.79638671875, -2.3404541015625, -1.884521484375, -1.4285888671875, -0.97265625, -0.5167236328125, -0.060791015625, 0.3951416015625, 0.85107421875, 1.3070068359375, 1.762939453125, 2.2188720703125, 2.6748046875, 3.1307373046875, 3.586669921875, 4.0426025390625, 4.49853515625, 4.9544677734375, 5.410400390625, 5.8663330078125, 6.322265625, 6.7781982421875, 7.234130859375, 7.6900634765625, 8.14599609375, 8.6019287109375, 9.057861328125, 9.5137939453125, 9.9697265625, 10.4256591796875, 10.881591796875, 11.3375244140625, 11.79345703125, 12.2493896484375, 12.705322265625, 13.1612548828125, 13.6171875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 9.0, 12.0, 11.0, 25.0, 23.0, 56.0, 88.0, 106.0, 184.0, 233.0, 360.0, 572.0, 912.0, 1450.0, 2511.0, 4019.0, 7185.0, 13519.0, 28219.0, 84484.0, 560835.0, 2619622.0, 704915.0, 100268.0, 31359.0, 14406.0, 7567.0, 4508.0, 2574.0, 1593.0, 988.0, 589.0, 365.0, 250.0, 145.0, 102.0, 59.0, 45.0, 32.0, 24.0, 10.0, 10.0, 13.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-27.65625, -26.83203125, -26.0078125, -25.18359375, -24.359375, -23.53515625, -22.7109375, -21.88671875, -21.0625, -20.23828125, -19.4140625, -18.58984375, -17.765625, -16.94140625, -16.1171875, -15.29296875, -14.46875, -13.64453125, -12.8203125, -11.99609375, -11.171875, -10.34765625, -9.5234375, -8.69921875, -7.875, -7.05078125, -6.2265625, -5.40234375, -4.578125, -3.75390625, -2.9296875, -2.10546875, -1.28125, -0.45703125, 0.3671875, 1.19140625, 2.015625, 2.83984375, 3.6640625, 4.48828125, 5.3125, 6.13671875, 6.9609375, 7.78515625, 8.609375, 9.43359375, 10.2578125, 11.08203125, 11.90625, 12.73046875, 13.5546875, 14.37890625, 15.203125, 16.02734375, 16.8515625, 17.67578125, 18.5, 19.32421875, 20.1484375, 20.97265625, 21.796875, 22.62109375, 23.4453125, 24.26953125, 25.09375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 11.0, 10.0, 14.0, 10.0, 16.0, 26.0, 46.0, 50.0, 76.0, 124.0, 160.0, 316.0, 633.0, 957.0, 694.0, 372.0, 176.0, 109.0, 80.0, 55.0, 40.0, 20.0, 21.0, 14.0, 19.0, 10.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.0, -35.98876953125, -34.9775390625, -33.96630859375, -32.955078125, -31.94384765625, -30.9326171875, -29.92138671875, -28.91015625, -27.89892578125, -26.8876953125, -25.87646484375, -24.865234375, -23.85400390625, -22.8427734375, -21.83154296875, -20.8203125, -19.80908203125, -18.7978515625, -17.78662109375, -16.775390625, -15.76416015625, -14.7529296875, -13.74169921875, -12.73046875, -11.71923828125, -10.7080078125, -9.69677734375, -8.685546875, -7.67431640625, -6.6630859375, -5.65185546875, -4.640625, -3.62939453125, -2.6181640625, -1.60693359375, -0.595703125, 0.41552734375, 1.4267578125, 2.43798828125, 3.44921875, 4.46044921875, 5.4716796875, 6.48291015625, 7.494140625, 8.50537109375, 9.5166015625, 10.52783203125, 11.5390625, 12.55029296875, 13.5615234375, 14.57275390625, 15.583984375, 16.59521484375, 17.6064453125, 18.61767578125, 19.62890625, 20.64013671875, 21.6513671875, 22.66259765625, 23.673828125, 24.68505859375, 25.6962890625, 26.70751953125, 27.71875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 4.0, 13.0, 16.0, 19.0, 19.0, 35.0, 58.0, 103.0, 171.0, 317.0, 790.0, 2730.0, 13124.0, 99106.0, 3537007.0, 497216.0, 35176.0, 5812.0, 1429.0, 522.0, 244.0, 134.0, 91.0, 43.0, 26.0, 20.0, 14.0, 16.0, 8.0, 10.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.4375, -62.9921875, -60.546875, -58.1015625, -55.65625, -53.2109375, -50.765625, -48.3203125, -45.875, -43.4296875, -40.984375, -38.5390625, -36.09375, -33.6484375, -31.203125, -28.7578125, -26.3125, -23.8671875, -21.421875, -18.9765625, -16.53125, -14.0859375, -11.640625, -9.1953125, -6.75, -4.3046875, -1.859375, 0.5859375, 3.03125, 5.4765625, 7.921875, 10.3671875, 12.8125, 15.2578125, 17.703125, 20.1484375, 22.59375, 25.0390625, 27.484375, 29.9296875, 32.375, 34.8203125, 37.265625, 39.7109375, 42.15625, 44.6015625, 47.046875, 49.4921875, 51.9375, 54.3828125, 56.828125, 59.2734375, 61.71875, 64.1640625, 66.609375, 69.0546875, 71.5, 73.9453125, 76.390625, 78.8359375, 81.28125, 83.7265625, 86.171875, 88.6171875, 91.0625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 32.0, 64.0, 168.0, 274.0, 247.0, 149.0, 43.0, 20.0, 8.0, 1.0], "bins": [-459.6931457519531, -451.7401428222656, -443.7871398925781, -435.8341064453125, -427.881103515625, -419.9281005859375, -411.97509765625, -404.0220947265625, -396.0690612792969, -388.1160583496094, -380.1630554199219, -372.21002197265625, -364.25701904296875, -356.30401611328125, -348.35101318359375, -340.39801025390625, -332.44500732421875, -324.49200439453125, -316.53900146484375, -308.5859680175781, -300.6329650878906, -292.6799621582031, -284.7269592285156, -276.7739562988281, -268.8209228515625, -260.867919921875, -252.91490173339844, -244.96189880371094, -237.00888061523438, -229.05587768554688, -221.10287475585938, -213.1498565673828, -205.1968536376953, -197.2438507080078, -189.29083251953125, -181.33782958984375, -173.3848114013672, -165.4318084716797, -157.47879028320312, -149.52578735351562, -141.57278442382812, -133.61978149414062, -125.66676330566406, -117.71376037597656, -109.76074981689453, -101.8077392578125, -93.85472869873047, -85.90171813964844, -77.9487075805664, -69.99569702148438, -62.04269027709961, -54.08967971801758, -46.13667297363281, -38.18366241455078, -30.23065185546875, -22.277645111083984, -14.324634552001953, -6.3716254234313965, 1.5813837051391602, 9.534393310546875, 17.487401962280273, 25.440410614013672, 33.3934211730957, 41.34642791748047, 49.2994384765625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 9.0, 5.0, 7.0, 6.0, 15.0, 16.0, 8.0, 14.0, 17.0, 12.0, 25.0, 19.0, 20.0, 27.0, 36.0, 27.0, 44.0, 44.0, 36.0, 29.0, 35.0, 35.0, 45.0, 42.0, 37.0, 36.0, 37.0, 39.0, 27.0, 34.0, 36.0, 19.0, 21.0, 24.0, 23.0, 17.0, 10.0, 9.0, 15.0, 11.0, 7.0, 6.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.98035430908203, -59.78236389160156, -57.58437728881836, -55.386390686035156, -53.18840026855469, -50.99040985107422, -48.792423248291016, -46.59443664550781, -44.396446228027344, -42.198455810546875, -40.00046920776367, -37.80248260498047, -35.6044921875, -33.40650177001953, -31.208515167236328, -29.010526657104492, -26.812538146972656, -24.61454963684082, -22.416561126708984, -20.21857261657715, -18.020584106445312, -15.822595596313477, -13.62460708618164, -11.426618576049805, -9.228630065917969, -7.030641555786133, -4.832653045654297, -2.634664535522461, -0.436676025390625, 1.761312484741211, 3.959300994873047, 6.157289505004883, 8.355270385742188, 10.553258895874023, 12.75124740600586, 14.949235916137695, 17.14722442626953, 19.345212936401367, 21.543201446533203, 23.74118995666504, 25.939178466796875, 28.13716697692871, 30.335155487060547, 32.53314208984375, 34.73113250732422, 36.92912292480469, 39.12710952758789, 41.325096130371094, 43.52308654785156, 45.72107696533203, 47.919063568115234, 50.11705017089844, 52.315040588378906, 54.513031005859375, 56.71101760864258, 58.90900421142578, 61.10699462890625, 63.30498504638672, 65.50297546386719, 67.70095825195312, 69.8989486694336, 72.09693908691406, 74.294921875, 76.49291229248047, 78.69090270996094]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 3.0, 5.0, 10.0, 9.0, 21.0, 19.0, 22.0, 25.0, 39.0, 27.0, 38.0, 41.0, 33.0, 45.0, 50.0, 38.0, 45.0, 46.0, 31.0, 49.0, 44.0, 39.0, 42.0, 44.0, 38.0, 32.0, 18.0, 27.0, 24.0, 24.0, 21.0, 13.0, 6.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.357666015625, -16.82470703125, -16.291748046875, -15.7587890625, -15.225830078125, -14.69287109375, -14.159912109375, -13.626953125, -13.093994140625, -12.56103515625, -12.028076171875, -11.4951171875, -10.962158203125, -10.42919921875, -9.896240234375, -9.36328125, -8.830322265625, -8.29736328125, -7.764404296875, -7.2314453125, -6.698486328125, -6.16552734375, -5.632568359375, -5.099609375, -4.566650390625, -4.03369140625, -3.500732421875, -2.9677734375, -2.434814453125, -1.90185546875, -1.368896484375, -0.8359375, -0.302978515625, 0.22998046875, 0.762939453125, 1.2958984375, 1.828857421875, 2.36181640625, 2.894775390625, 3.427734375, 3.960693359375, 4.49365234375, 5.026611328125, 5.5595703125, 6.092529296875, 6.62548828125, 7.158447265625, 7.69140625, 8.224365234375, 8.75732421875, 9.290283203125, 9.8232421875, 10.356201171875, 10.88916015625, 11.422119140625, 11.955078125, 12.488037109375, 13.02099609375, 13.553955078125, 14.0869140625, 14.619873046875, 15.15283203125, 15.685791015625, 16.21875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 6.0, 11.0, 14.0, 18.0, 30.0, 41.0, 62.0, 115.0, 124.0, 197.0, 306.0, 438.0, 763.0, 1102.0, 1712.0, 2750.0, 4217.0, 6936.0, 11561.0, 19547.0, 32750.0, 55292.0, 94128.0, 163121.0, 242546.0, 169810.0, 98035.0, 57296.0, 33903.0, 20146.0, 11893.0, 7337.0, 4472.0, 2816.0, 1733.0, 1166.0, 754.0, 473.0, 297.0, 202.0, 148.0, 104.0, 63.0, 37.0, 40.0, 17.0, 10.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.339599609375, -0.3288307189941406, -0.31806182861328125, -0.3072929382324219, -0.2965240478515625, -0.2857551574707031, -0.27498626708984375, -0.2642173767089844, -0.253448486328125, -0.24267959594726562, -0.23191070556640625, -0.22114181518554688, -0.2103729248046875, -0.19960403442382812, -0.18883514404296875, -0.17806625366210938, -0.16729736328125, -0.15652847290039062, -0.14575958251953125, -0.13499069213867188, -0.1242218017578125, -0.11345291137695312, -0.10268402099609375, -0.09191513061523438, -0.081146240234375, -0.07037734985351562, -0.05960845947265625, -0.048839569091796875, -0.0380706787109375, -0.027301788330078125, -0.01653289794921875, -0.005764007568359375, 0.0050048828125, 0.015773773193359375, 0.02654266357421875, 0.037311553955078125, 0.0480804443359375, 0.058849334716796875, 0.06961822509765625, 0.08038711547851562, 0.091156005859375, 0.10192489624023438, 0.11269378662109375, 0.12346267700195312, 0.1342315673828125, 0.14500045776367188, 0.15576934814453125, 0.16653823852539062, 0.17730712890625, 0.18807601928710938, 0.19884490966796875, 0.20961380004882812, 0.2203826904296875, 0.23115158081054688, 0.24192047119140625, 0.2526893615722656, 0.263458251953125, 0.2742271423339844, 0.28499603271484375, 0.2957649230957031, 0.3065338134765625, 0.3173027038574219, 0.32807159423828125, 0.3388404846191406, 0.349609375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 7.0, 10.0, 11.0, 7.0, 8.0, 17.0, 18.0, 19.0, 18.0, 24.0, 24.0, 30.0, 25.0, 41.0, 41.0, 33.0, 45.0, 48.0, 41.0, 38.0, 1072.0, 37.0, 33.0, 30.0, 36.0, 44.0, 35.0, 39.0, 22.0, 25.0, 13.0, 16.0, 19.0, 18.0, 15.0, 16.0, 13.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.859375, -9.533447265625, -9.20751953125, -8.881591796875, -8.5556640625, -8.229736328125, -7.90380859375, -7.577880859375, -7.251953125, -6.926025390625, -6.60009765625, -6.274169921875, -5.9482421875, -5.622314453125, -5.29638671875, -4.970458984375, -4.64453125, -4.318603515625, -3.99267578125, -3.666748046875, -3.3408203125, -3.014892578125, -2.68896484375, -2.363037109375, -2.037109375, -1.711181640625, -1.38525390625, -1.059326171875, -0.7333984375, -0.407470703125, -0.08154296875, 0.244384765625, 0.5703125, 0.896240234375, 1.22216796875, 1.548095703125, 1.8740234375, 2.199951171875, 2.52587890625, 2.851806640625, 3.177734375, 3.503662109375, 3.82958984375, 4.155517578125, 4.4814453125, 4.807373046875, 5.13330078125, 5.459228515625, 5.78515625, 6.111083984375, 6.43701171875, 6.762939453125, 7.0888671875, 7.414794921875, 7.74072265625, 8.066650390625, 8.392578125, 8.718505859375, 9.04443359375, 9.370361328125, 9.6962890625, 10.022216796875, 10.34814453125, 10.674072265625, 11.0]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 5.0, 13.0, 13.0, 21.0, 44.0, 60.0, 77.0, 101.0, 141.0, 238.0, 289.0, 391.0, 609.0, 824.0, 1074.0, 1643.0, 2182.0, 3242.0, 4465.0, 6428.0, 9313.0, 13572.0, 20327.0, 30282.0, 46080.0, 70816.0, 112494.0, 178663.0, 1238250.0, 123815.0, 77883.0, 50114.0, 33284.0, 22322.0, 14934.0, 9996.0, 6986.0, 4788.0, 3273.0, 2278.0, 1626.0, 1162.0, 900.0, 608.0, 423.0, 325.0, 219.0, 165.0, 107.0, 98.0, 52.0, 43.0, 22.0, 20.0, 14.0, 11.0, 5.0, 2.0, 5.0, 2.0, 3.0], "bins": [-0.143310546875, -0.138702392578125, -0.13409423828125, -0.129486083984375, -0.1248779296875, -0.120269775390625, -0.11566162109375, -0.111053466796875, -0.1064453125, -0.101837158203125, -0.09722900390625, -0.092620849609375, -0.0880126953125, -0.083404541015625, -0.07879638671875, -0.074188232421875, -0.069580078125, -0.064971923828125, -0.06036376953125, -0.055755615234375, -0.0511474609375, -0.046539306640625, -0.04193115234375, -0.037322998046875, -0.03271484375, -0.028106689453125, -0.02349853515625, -0.018890380859375, -0.0142822265625, -0.009674072265625, -0.00506591796875, -0.000457763671875, 0.004150390625, 0.008758544921875, 0.01336669921875, 0.017974853515625, 0.0225830078125, 0.027191162109375, 0.03179931640625, 0.036407470703125, 0.041015625, 0.045623779296875, 0.05023193359375, 0.054840087890625, 0.0594482421875, 0.064056396484375, 0.06866455078125, 0.073272705078125, 0.077880859375, 0.082489013671875, 0.08709716796875, 0.091705322265625, 0.0963134765625, 0.100921630859375, 0.10552978515625, 0.110137939453125, 0.11474609375, 0.119354248046875, 0.12396240234375, 0.128570556640625, 0.1331787109375, 0.137786865234375, 0.14239501953125, 0.147003173828125, 0.151611328125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 8.0, 9.0, 4.0, 5.0, 11.0, 17.0, 13.0, 14.0, 13.0, 20.0, 27.0, 34.0, 43.0, 49.0, 50.0, 55.0, 60.0, 70.0, 66.0, 52.0, 66.0, 48.0, 51.0, 35.0, 36.0, 27.0, 25.0, 21.0, 18.0, 6.0, 12.0, 7.0, 7.0, 4.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0005297660827636719, -0.0005147233605384827, -0.0004996806383132935, -0.00048463791608810425, -0.00046959519386291504, -0.00045455247163772583, -0.0004395097494125366, -0.0004244670271873474, -0.0004094243049621582, -0.000394381582736969, -0.0003793388605117798, -0.0003642961382865906, -0.00034925341606140137, -0.00033421069383621216, -0.00031916797161102295, -0.00030412524938583374, -0.00028908252716064453, -0.0002740398049354553, -0.0002589970827102661, -0.0002439543604850769, -0.0002289116382598877, -0.00021386891603469849, -0.00019882619380950928, -0.00018378347158432007, -0.00016874074935913086, -0.00015369802713394165, -0.00013865530490875244, -0.00012361258268356323, -0.00010856986045837402, -9.352713823318481e-05, -7.84844160079956e-05, -6.34416937828064e-05, -4.839897155761719e-05, -3.335624933242798e-05, -1.831352710723877e-05, -3.2708048820495605e-06, 1.1771917343139648e-05, 2.6814639568328857e-05, 4.1857361793518066e-05, 5.6900084018707275e-05, 7.194280624389648e-05, 8.69855284690857e-05, 0.0001020282506942749, 0.00011707097291946411, 0.00013211369514465332, 0.00014715641736984253, 0.00016219913959503174, 0.00017724186182022095, 0.00019228458404541016, 0.00020732730627059937, 0.00022237002849578857, 0.00023741275072097778, 0.000252455472946167, 0.0002674981951713562, 0.0002825409173965454, 0.0002975836396217346, 0.00031262636184692383, 0.00032766908407211304, 0.00034271180629730225, 0.00035775452852249146, 0.00037279725074768066, 0.0003878399729728699, 0.0004028826951980591, 0.0004179254174232483, 0.0004329681396484375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 3.0, 3.0, 7.0, 9.0, 13.0, 9.0, 21.0, 27.0, 28.0, 34.0, 61.0, 65.0, 125.0, 209.0, 420.0, 1800.0, 981799.0, 62103.0, 870.0, 349.0, 175.0, 100.0, 77.0, 51.0, 45.0, 26.0, 19.0, 14.0, 16.0, 19.0, 10.0, 8.0, 5.0, 9.0, 7.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0097198486328125, -0.00938260555267334, -0.00904536247253418, -0.00870811939239502, -0.00837087631225586, -0.0080336332321167, -0.007696390151977539, -0.007359147071838379, -0.007021903991699219, -0.006684660911560059, -0.0063474178314208984, -0.006010174751281738, -0.005672931671142578, -0.005335688591003418, -0.004998445510864258, -0.004661202430725098, -0.0043239593505859375, -0.003986716270446777, -0.003649473190307617, -0.003312230110168457, -0.002974987030029297, -0.0026377439498901367, -0.0023005008697509766, -0.0019632577896118164, -0.0016260147094726562, -0.001288771629333496, -0.0009515285491943359, -0.0006142854690551758, -0.0002770423889160156, 6.020069122314453e-05, 0.0003974437713623047, 0.0007346868515014648, 0.001071929931640625, 0.0014091730117797852, 0.0017464160919189453, 0.0020836591720581055, 0.0024209022521972656, 0.0027581453323364258, 0.003095388412475586, 0.003432631492614746, 0.0037698745727539062, 0.004107117652893066, 0.0044443607330322266, 0.004781603813171387, 0.005118846893310547, 0.005456089973449707, 0.005793333053588867, 0.006130576133728027, 0.0064678192138671875, 0.006805062294006348, 0.007142305374145508, 0.007479548454284668, 0.007816791534423828, 0.008154034614562988, 0.008491277694702148, 0.008828520774841309, 0.009165763854980469, 0.009503006935119629, 0.009840250015258789, 0.01017749309539795, 0.01051473617553711, 0.01085197925567627, 0.01118922233581543, 0.01152646541595459, 0.01186370849609375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 912.0, 88.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0028254054486751556, -0.0027009393088519573, -0.0025764729361981153, -0.002452006796374917, -0.0023275406565517187, -0.0022030742838978767, -0.0020786081440746784, -0.00195414200425148, -0.00182967574801296, -0.0017052094917744398, -0.0015807433519512415, -0.0014562770957127213, -0.0013318108394742012, -0.0012073446996510029, -0.0010828784434124827, -0.0009584122453816235, -0.0008339460473507643, -0.000709479849319905, -0.0005850136512890458, -0.00046054739505052567, -0.00033608119701966643, -0.0002116149989888072, -8.714874275028706e-05, 3.7317455280572176e-05, 0.0001617836533114314, 0.00028624985134229064, 0.00041071607847698033, 0.00053518230561167, 0.0006596485036425292, 0.0007841147016733885, 0.0009085809579119086, 0.0010330472141504288, 0.001157513353973627, 0.0012819796102121472, 0.0014064457500353456, 0.0015309120062738657, 0.001655378146097064, 0.0017798444023355842, 0.0019043106585741043, 0.0020287767983973026, 0.002153242938220501, 0.0022777090780436993, 0.0024021754506975412, 0.0025266415905207396, 0.002651107730343938, 0.00277557410299778, 0.002900040242820978, 0.0030245063826441765, 0.0031489727552980185, 0.0032734388951212168, 0.0033979052677750587, 0.003522371407598257, 0.0036468375474214554, 0.0037713036872446537, 0.0038957700598984957, 0.004020236432552338, 0.004144702572375536, 0.004269168712198734, 0.004393634852021933, 0.004518100991845131, 0.0046425675973296165, 0.004767033737152815, 0.004891499876976013, 0.0050159660167992115, 0.00514043215662241]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 25.0, 27.0, 47.0, 45.0, 91.0, 110.0, 95.0, 119.0, 111.0, 108.0, 58.0, 72.0, 36.0, 25.0, 16.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000614464282989502, -0.0005881385877728462, -0.0005618128925561905, -0.0005354871973395348, -0.000509161502122879, -0.0004828358069062233, -0.00045651011168956757, -0.00043018441647291183, -0.0004038587212562561, -0.00037753302603960037, -0.00035120733082294464, -0.0003248816356062889, -0.0002985559403896332, -0.00027223024517297745, -0.0002459045499563217, -0.00021957885473966599, -0.00019325315952301025, -0.00016692746430635452, -0.0001406017690896988, -0.00011427607387304306, -8.795037865638733e-05, -6.16246834397316e-05, -3.529898822307587e-05, -8.973293006420135e-06, 1.7352402210235596e-05, 4.367809742689133e-05, 7.000379264354706e-05, 9.632948786020279e-05, 0.00012265518307685852, 0.00014898087829351425, 0.00017530657351016998, 0.00020163226872682571, 0.00022795796394348145, 0.0002542836591601372, 0.0002806093543767929, 0.00030693504959344864, 0.00033326074481010437, 0.0003595864400267601, 0.00038591213524341583, 0.00041223783046007156, 0.0004385635256767273, 0.000464889220893383, 0.0004912149161100388, 0.0005175406113266945, 0.0005438663065433502, 0.000570192001760006, 0.0005965176969766617, 0.0006228433921933174, 0.0006491690874099731, 0.0006754947826266289, 0.0007018204778432846, 0.0007281461730599403, 0.0007544718682765961, 0.0007807975634932518, 0.0008071232587099075, 0.0008334489539265633, 0.000859774649143219, 0.0008861003443598747, 0.0009124260395765305, 0.0009387517347931862, 0.0009650774300098419, 0.0009914031252264977, 0.0010177288204431534, 0.0010440545156598091, 0.0010703802108764648]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 3.0, 5.0, 10.0, 9.0, 21.0, 19.0, 22.0, 25.0, 39.0, 27.0, 38.0, 41.0, 33.0, 45.0, 50.0, 38.0, 45.0, 46.0, 31.0, 49.0, 44.0, 39.0, 42.0, 44.0, 38.0, 32.0, 18.0, 27.0, 24.0, 24.0, 21.0, 13.0, 6.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.357666015625, -16.82470703125, -16.291748046875, -15.7587890625, -15.225830078125, -14.69287109375, -14.159912109375, -13.626953125, -13.093994140625, -12.56103515625, -12.028076171875, -11.4951171875, -10.962158203125, -10.42919921875, -9.896240234375, -9.36328125, -8.830322265625, -8.29736328125, -7.764404296875, -7.2314453125, -6.698486328125, -6.16552734375, -5.632568359375, -5.099609375, -4.566650390625, -4.03369140625, -3.500732421875, -2.9677734375, -2.434814453125, -1.90185546875, -1.368896484375, -0.8359375, -0.302978515625, 0.22998046875, 0.762939453125, 1.2958984375, 1.828857421875, 2.36181640625, 2.894775390625, 3.427734375, 3.960693359375, 4.49365234375, 5.026611328125, 5.5595703125, 6.092529296875, 6.62548828125, 7.158447265625, 7.69140625, 8.224365234375, 8.75732421875, 9.290283203125, 9.8232421875, 10.356201171875, 10.88916015625, 11.422119140625, 11.955078125, 12.488037109375, 13.02099609375, 13.553955078125, 14.0869140625, 14.619873046875, 15.15283203125, 15.685791015625, 16.21875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 7.0, 10.0, 26.0, 26.0, 39.0, 60.0, 87.0, 112.0, 183.0, 286.0, 442.0, 713.0, 1110.0, 1725.0, 2808.0, 4499.0, 7322.0, 12758.0, 22015.0, 39626.0, 77505.0, 212852.0, 411952.0, 123761.0, 55892.0, 30201.0, 16921.0, 9912.0, 5858.0, 3646.0, 2276.0, 1395.0, 858.0, 539.0, 381.0, 256.0, 147.0, 110.0, 87.0, 44.0, 29.0, 26.0, 12.0, 16.0, 7.0, 4.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.6875, -18.049072265625, -17.41064453125, -16.772216796875, -16.1337890625, -15.495361328125, -14.85693359375, -14.218505859375, -13.580078125, -12.941650390625, -12.30322265625, -11.664794921875, -11.0263671875, -10.387939453125, -9.74951171875, -9.111083984375, -8.47265625, -7.834228515625, -7.19580078125, -6.557373046875, -5.9189453125, -5.280517578125, -4.64208984375, -4.003662109375, -3.365234375, -2.726806640625, -2.08837890625, -1.449951171875, -0.8115234375, -0.173095703125, 0.46533203125, 1.103759765625, 1.7421875, 2.380615234375, 3.01904296875, 3.657470703125, 4.2958984375, 4.934326171875, 5.57275390625, 6.211181640625, 6.849609375, 7.488037109375, 8.12646484375, 8.764892578125, 9.4033203125, 10.041748046875, 10.68017578125, 11.318603515625, 11.95703125, 12.595458984375, 13.23388671875, 13.872314453125, 14.5107421875, 15.149169921875, 15.78759765625, 16.426025390625, 17.064453125, 17.702880859375, 18.34130859375, 18.979736328125, 19.6181640625, 20.256591796875, 20.89501953125, 21.533447265625, 22.171875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 14.0, 4.0, 9.0, 6.0, 8.0, 11.0, 11.0, 17.0, 20.0, 23.0, 29.0, 28.0, 38.0, 25.0, 30.0, 44.0, 50.0, 90.0, 110.0, 225.0, 1526.0, 184.0, 95.0, 70.0, 41.0, 42.0, 42.0, 36.0, 33.0, 24.0, 23.0, 16.0, 23.0, 22.0, 22.0, 11.0, 8.0, 10.0, 8.0, 9.0, 0.0, 4.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.53125, -37.34033203125, -36.1494140625, -34.95849609375, -33.767578125, -32.57666015625, -31.3857421875, -30.19482421875, -29.00390625, -27.81298828125, -26.6220703125, -25.43115234375, -24.240234375, -23.04931640625, -21.8583984375, -20.66748046875, -19.4765625, -18.28564453125, -17.0947265625, -15.90380859375, -14.712890625, -13.52197265625, -12.3310546875, -11.14013671875, -9.94921875, -8.75830078125, -7.5673828125, -6.37646484375, -5.185546875, -3.99462890625, -2.8037109375, -1.61279296875, -0.421875, 0.76904296875, 1.9599609375, 3.15087890625, 4.341796875, 5.53271484375, 6.7236328125, 7.91455078125, 9.10546875, 10.29638671875, 11.4873046875, 12.67822265625, 13.869140625, 15.06005859375, 16.2509765625, 17.44189453125, 18.6328125, 19.82373046875, 21.0146484375, 22.20556640625, 23.396484375, 24.58740234375, 25.7783203125, 26.96923828125, 28.16015625, 29.35107421875, 30.5419921875, 31.73291015625, 32.923828125, 34.11474609375, 35.3056640625, 36.49658203125, 37.6875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 9.0, 6.0, 7.0, 7.0, 13.0, 14.0, 21.0, 35.0, 47.0, 50.0, 92.0, 114.0, 199.0, 436.0, 932.0, 2114.0, 5822.0, 17492.0, 64994.0, 479842.0, 2391760.0, 135233.0, 30905.0, 9548.0, 3353.0, 1312.0, 604.0, 268.0, 157.0, 100.0, 57.0, 40.0, 34.0, 21.0, 22.0, 7.0, 15.0, 11.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-46.0625, -44.716796875, -43.37109375, -42.025390625, -40.6796875, -39.333984375, -37.98828125, -36.642578125, -35.296875, -33.951171875, -32.60546875, -31.259765625, -29.9140625, -28.568359375, -27.22265625, -25.876953125, -24.53125, -23.185546875, -21.83984375, -20.494140625, -19.1484375, -17.802734375, -16.45703125, -15.111328125, -13.765625, -12.419921875, -11.07421875, -9.728515625, -8.3828125, -7.037109375, -5.69140625, -4.345703125, -3.0, -1.654296875, -0.30859375, 1.037109375, 2.3828125, 3.728515625, 5.07421875, 6.419921875, 7.765625, 9.111328125, 10.45703125, 11.802734375, 13.1484375, 14.494140625, 15.83984375, 17.185546875, 18.53125, 19.876953125, 21.22265625, 22.568359375, 23.9140625, 25.259765625, 26.60546875, 27.951171875, 29.296875, 30.642578125, 31.98828125, 33.333984375, 34.6796875, 36.025390625, 37.37109375, 38.716796875, 40.0625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 10.0, 37.0, 117.0, 233.0, 297.0, 210.0, 69.0, 29.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.21734619140625, -40.668174743652344, -35.11900329589844, -29.569833755493164, -24.020662307739258, -18.47149085998535, -12.922321319580078, -7.373149871826172, -1.8239784240722656, 3.7251925468444824, 9.27436351776123, 14.82353401184082, 20.372705459594727, 25.921876907348633, 31.471046447753906, 37.02021789550781, 42.56938934326172, 48.118560791015625, 53.66773223876953, 59.21690368652344, 64.76607513427734, 70.31524658203125, 75.86441040039062, 81.41358947753906, 86.96275329589844, 92.51192474365234, 98.06109619140625, 103.61026763916016, 109.15943908691406, 114.70861053466797, 120.25778198242188, 125.80694580078125, 131.3561248779297, 136.90528869628906, 142.4544677734375, 148.00363159179688, 153.5528106689453, 159.1019744873047, 164.65115356445312, 170.2003173828125, 175.74949645996094, 181.2986602783203, 186.84783935546875, 192.39700317382812, 197.94618225097656, 203.49534606933594, 209.04452514648438, 214.59368896484375, 220.14285278320312, 225.6920166015625, 231.24119567871094, 236.7903594970703, 242.33953857421875, 247.88870239257812, 253.43788146972656, 258.987060546875, 264.5362243652344, 270.08538818359375, 275.6345520019531, 281.1837463378906, 286.73291015625, 292.2820739746094, 297.83123779296875, 303.38043212890625, 308.9295959472656]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 8.0, 9.0, 4.0, 13.0, 11.0, 13.0, 14.0, 20.0, 19.0, 21.0, 20.0, 26.0, 27.0, 36.0, 26.0, 28.0, 41.0, 42.0, 39.0, 40.0, 39.0, 40.0, 38.0, 40.0, 44.0, 39.0, 37.0, 39.0, 34.0, 27.0, 25.0, 19.0, 13.0, 23.0, 12.0, 11.0, 10.0, 9.0, 13.0, 6.0, 7.0, 6.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-83.2530746459961, -80.60598754882812, -77.95890045166016, -75.31180572509766, -72.66471862792969, -70.01763153076172, -67.37054443359375, -64.72345733642578, -62.07636642456055, -59.42927932739258, -56.782188415527344, -54.135101318359375, -51.488014221191406, -48.84092330932617, -46.1938362121582, -43.54674530029297, -40.899658203125, -38.25257110595703, -35.6054801940918, -32.95839309692383, -30.311304092407227, -27.664215087890625, -25.017127990722656, -22.370038986206055, -19.722949981689453, -17.07586097717285, -14.428772926330566, -11.781684875488281, -9.13459587097168, -6.487506866455078, -3.840418815612793, -1.1933307647705078, 1.4537506103515625, 4.100839138031006, 6.747927665710449, 9.395015716552734, 12.042104721069336, 14.689193725585938, 17.336280822753906, 19.983369827270508, 22.63045883178711, 25.27754783630371, 27.924636840820312, 30.57172393798828, 33.21881103515625, 35.865901947021484, 38.51298904418945, 41.16007995605469, 43.807167053222656, 46.454254150390625, 49.10134506225586, 51.74843215942383, 54.39552307128906, 57.04261016845703, 59.689697265625, 62.33678436279297, 64.98387145996094, 67.6309585571289, 70.27804565429688, 72.92514038085938, 75.57222747802734, 78.21931457519531, 80.86640167236328, 83.51348876953125, 86.16058349609375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 3.0, 7.0, 7.0, 9.0, 17.0, 15.0, 19.0, 23.0, 26.0, 38.0, 35.0, 34.0, 42.0, 48.0, 28.0, 48.0, 31.0, 46.0, 46.0, 42.0, 38.0, 41.0, 40.0, 34.0, 41.0, 25.0, 34.0, 37.0, 21.0, 22.0, 18.0, 18.0, 18.0, 12.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.46875, -16.945068359375, -16.42138671875, -15.897705078125, -15.3740234375, -14.850341796875, -14.32666015625, -13.802978515625, -13.279296875, -12.755615234375, -12.23193359375, -11.708251953125, -11.1845703125, -10.660888671875, -10.13720703125, -9.613525390625, -9.08984375, -8.566162109375, -8.04248046875, -7.518798828125, -6.9951171875, -6.471435546875, -5.94775390625, -5.424072265625, -4.900390625, -4.376708984375, -3.85302734375, -3.329345703125, -2.8056640625, -2.281982421875, -1.75830078125, -1.234619140625, -0.7109375, -0.187255859375, 0.33642578125, 0.860107421875, 1.3837890625, 1.907470703125, 2.43115234375, 2.954833984375, 3.478515625, 4.002197265625, 4.52587890625, 5.049560546875, 5.5732421875, 6.096923828125, 6.62060546875, 7.144287109375, 7.66796875, 8.191650390625, 8.71533203125, 9.239013671875, 9.7626953125, 10.286376953125, 10.81005859375, 11.333740234375, 11.857421875, 12.381103515625, 12.90478515625, 13.428466796875, 13.9521484375, 14.475830078125, 14.99951171875, 15.523193359375, 16.046875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 7.0, 3.0, 6.0, 16.0, 14.0, 15.0, 31.0, 34.0, 52.0, 85.0, 94.0, 152.0, 227.0, 280.0, 475.0, 666.0, 974.0, 1382.0, 2244.0, 3529.0, 5793.0, 9683.0, 18152.0, 41369.0, 158389.0, 1085371.0, 2332195.0, 399417.0, 73431.0, 26566.0, 12915.0, 7614.0, 4514.0, 2865.0, 1859.0, 1236.0, 837.0, 584.0, 374.0, 261.0, 204.0, 98.0, 85.0, 59.0, 33.0, 25.0, 16.0, 21.0, 6.0, 11.0, 5.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.75, -22.96484375, -22.1796875, -21.39453125, -20.609375, -19.82421875, -19.0390625, -18.25390625, -17.46875, -16.68359375, -15.8984375, -15.11328125, -14.328125, -13.54296875, -12.7578125, -11.97265625, -11.1875, -10.40234375, -9.6171875, -8.83203125, -8.046875, -7.26171875, -6.4765625, -5.69140625, -4.90625, -4.12109375, -3.3359375, -2.55078125, -1.765625, -0.98046875, -0.1953125, 0.58984375, 1.375, 2.16015625, 2.9453125, 3.73046875, 4.515625, 5.30078125, 6.0859375, 6.87109375, 7.65625, 8.44140625, 9.2265625, 10.01171875, 10.796875, 11.58203125, 12.3671875, 13.15234375, 13.9375, 14.72265625, 15.5078125, 16.29296875, 17.078125, 17.86328125, 18.6484375, 19.43359375, 20.21875, 21.00390625, 21.7890625, 22.57421875, 23.359375, 24.14453125, 24.9296875, 25.71484375, 26.5]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 5.0, 11.0, 12.0, 11.0, 18.0, 16.0, 19.0, 29.0, 37.0, 45.0, 52.0, 71.0, 93.0, 158.0, 238.0, 476.0, 724.0, 734.0, 485.0, 273.0, 161.0, 97.0, 58.0, 43.0, 41.0, 29.0, 31.0, 14.0, 16.0, 8.0, 13.0, 6.0, 6.0, 5.0, 3.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.59375, -26.8056640625, -26.017578125, -25.2294921875, -24.44140625, -23.6533203125, -22.865234375, -22.0771484375, -21.2890625, -20.5009765625, -19.712890625, -18.9248046875, -18.13671875, -17.3486328125, -16.560546875, -15.7724609375, -14.984375, -14.1962890625, -13.408203125, -12.6201171875, -11.83203125, -11.0439453125, -10.255859375, -9.4677734375, -8.6796875, -7.8916015625, -7.103515625, -6.3154296875, -5.52734375, -4.7392578125, -3.951171875, -3.1630859375, -2.375, -1.5869140625, -0.798828125, -0.0107421875, 0.77734375, 1.5654296875, 2.353515625, 3.1416015625, 3.9296875, 4.7177734375, 5.505859375, 6.2939453125, 7.08203125, 7.8701171875, 8.658203125, 9.4462890625, 10.234375, 11.0224609375, 11.810546875, 12.5986328125, 13.38671875, 14.1748046875, 14.962890625, 15.7509765625, 16.5390625, 17.3271484375, 18.115234375, 18.9033203125, 19.69140625, 20.4794921875, 21.267578125, 22.0556640625, 22.84375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 8.0, 12.0, 20.0, 19.0, 35.0, 54.0, 79.0, 98.0, 193.0, 336.0, 635.0, 1264.0, 2925.0, 6538.0, 16146.0, 47167.0, 193817.0, 2996149.0, 786148.0, 95417.0, 28165.0, 10486.0, 4446.0, 1969.0, 918.0, 500.0, 275.0, 141.0, 99.0, 65.0, 35.0, 35.0, 20.0, 13.0, 14.0, 9.0, 5.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-48.125, -46.7412109375, -45.357421875, -43.9736328125, -42.58984375, -41.2060546875, -39.822265625, -38.4384765625, -37.0546875, -35.6708984375, -34.287109375, -32.9033203125, -31.51953125, -30.1357421875, -28.751953125, -27.3681640625, -25.984375, -24.6005859375, -23.216796875, -21.8330078125, -20.44921875, -19.0654296875, -17.681640625, -16.2978515625, -14.9140625, -13.5302734375, -12.146484375, -10.7626953125, -9.37890625, -7.9951171875, -6.611328125, -5.2275390625, -3.84375, -2.4599609375, -1.076171875, 0.3076171875, 1.69140625, 3.0751953125, 4.458984375, 5.8427734375, 7.2265625, 8.6103515625, 9.994140625, 11.3779296875, 12.76171875, 14.1455078125, 15.529296875, 16.9130859375, 18.296875, 19.6806640625, 21.064453125, 22.4482421875, 23.83203125, 25.2158203125, 26.599609375, 27.9833984375, 29.3671875, 30.7509765625, 32.134765625, 33.5185546875, 34.90234375, 36.2861328125, 37.669921875, 39.0537109375, 40.4375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 46.0, 220.0, 510.0, 196.0, 34.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.16114807128906, -196.59690856933594, -182.0326690673828, -167.4684295654297, -152.90419006347656, -138.33995056152344, -123.77571105957031, -109.21147155761719, -94.64723205566406, -80.08299255371094, -65.51875305175781, -50.95451354980469, -36.39027404785156, -21.826034545898438, -7.2617950439453125, 7.3024444580078125, 21.866683959960938, 36.43092346191406, 50.99516296386719, 65.55940246582031, 80.12364196777344, 94.68788146972656, 109.25212097167969, 123.81636047363281, 138.38059997558594, 152.94483947753906, 167.5090789794922, 182.0733184814453, 196.63755798339844, 211.20179748535156, 225.7660369873047, 240.3302764892578, 254.89453125, 269.4587707519531, 284.02301025390625, 298.5872497558594, 313.1514892578125, 327.7157287597656, 342.27996826171875, 356.8442077636719, 371.408447265625, 385.9726867675781, 400.53692626953125, 415.1011657714844, 429.6654052734375, 444.2296447753906, 458.79388427734375, 473.3581237792969, 487.92236328125, 502.4866027832031, 517.0508422851562, 531.6151123046875, 546.1793212890625, 560.7435302734375, 575.3078002929688, 589.8720703125, 604.436279296875, 619.00048828125, 633.5647583007812, 648.1290283203125, 662.6932373046875, 677.2574462890625, 691.8217163085938, 706.385986328125, 720.9501953125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 3.0, 6.0, 10.0, 9.0, 9.0, 19.0, 25.0, 16.0, 17.0, 22.0, 32.0, 30.0, 38.0, 32.0, 38.0, 38.0, 36.0, 33.0, 51.0, 45.0, 54.0, 55.0, 34.0, 32.0, 28.0, 26.0, 30.0, 29.0, 37.0, 29.0, 25.0, 19.0, 17.0, 15.0, 4.0, 6.0, 12.0, 8.0, 4.0, 5.0, 6.0, 1.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.73143005371094, -70.1810302734375, -67.6306381225586, -65.08023834228516, -62.52984619140625, -59.97944641113281, -57.42905044555664, -54.87865447998047, -52.3282585144043, -49.777862548828125, -47.22746658325195, -44.67707061767578, -42.126670837402344, -39.57627868652344, -37.02587890625, -34.47548294067383, -31.925086975097656, -29.374691009521484, -26.824295043945312, -24.273897171020508, -21.723501205444336, -19.173105239868164, -16.62270736694336, -14.072311401367188, -11.521915435791016, -8.971519470214844, -6.4211225509643555, -3.8707261085510254, -1.3203296661376953, 1.2300662994384766, 3.780463218688965, 6.330860137939453, 8.881248474121094, 11.431644439697266, 13.982041358947754, 16.532438278198242, 19.082834243774414, 21.633230209350586, 24.18362808227539, 26.734024047851562, 29.284420013427734, 31.834815979003906, 34.38521194458008, 36.93560791015625, 39.48600769042969, 42.036399841308594, 44.58679962158203, 47.1371955871582, 49.687591552734375, 52.23798751831055, 54.78838348388672, 57.33877944946289, 59.88917541503906, 62.4395751953125, 64.9899673461914, 67.54036712646484, 70.09075927734375, 72.64115905761719, 75.1915512084961, 77.74195098876953, 80.29234313964844, 82.84274291992188, 85.39313507080078, 87.94353485107422, 90.49393463134766]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 8.0, 9.0, 12.0, 17.0, 25.0, 16.0, 18.0, 25.0, 32.0, 33.0, 37.0, 30.0, 37.0, 31.0, 41.0, 44.0, 45.0, 48.0, 38.0, 33.0, 48.0, 44.0, 48.0, 37.0, 34.0, 25.0, 31.0, 37.0, 21.0, 19.0, 14.0, 11.0, 10.0, 10.0, 10.0, 3.0, 3.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.921875, -16.368896484375, -15.81591796875, -15.262939453125, -14.7099609375, -14.156982421875, -13.60400390625, -13.051025390625, -12.498046875, -11.945068359375, -11.39208984375, -10.839111328125, -10.2861328125, -9.733154296875, -9.18017578125, -8.627197265625, -8.07421875, -7.521240234375, -6.96826171875, -6.415283203125, -5.8623046875, -5.309326171875, -4.75634765625, -4.203369140625, -3.650390625, -3.097412109375, -2.54443359375, -1.991455078125, -1.4384765625, -0.885498046875, -0.33251953125, 0.220458984375, 0.7734375, 1.326416015625, 1.87939453125, 2.432373046875, 2.9853515625, 3.538330078125, 4.09130859375, 4.644287109375, 5.197265625, 5.750244140625, 6.30322265625, 6.856201171875, 7.4091796875, 7.962158203125, 8.51513671875, 9.068115234375, 9.62109375, 10.174072265625, 10.72705078125, 11.280029296875, 11.8330078125, 12.385986328125, 12.93896484375, 13.491943359375, 14.044921875, 14.597900390625, 15.15087890625, 15.703857421875, 16.2568359375, 16.809814453125, 17.36279296875, 17.915771484375, 18.46875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 21.0, 29.0, 39.0, 74.0, 100.0, 149.0, 211.0, 340.0, 492.0, 771.0, 1154.0, 1817.0, 2835.0, 4372.0, 6932.0, 11198.0, 17951.0, 29288.0, 47068.0, 76274.0, 123972.0, 214771.0, 201477.0, 117173.0, 71960.0, 44676.0, 27318.0, 17029.0, 10563.0, 6684.0, 4183.0, 2715.0, 1728.0, 1104.0, 712.0, 503.0, 291.0, 178.0, 154.0, 78.0, 42.0, 33.0, 27.0, 17.0, 9.0, 14.0, 4.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.331787109375, -0.3213996887207031, -0.31101226806640625, -0.3006248474121094, -0.2902374267578125, -0.2798500061035156, -0.26946258544921875, -0.2590751647949219, -0.248687744140625, -0.23830032348632812, -0.22791290283203125, -0.21752548217773438, -0.2071380615234375, -0.19675064086914062, -0.18636322021484375, -0.17597579956054688, -0.16558837890625, -0.15520095825195312, -0.14481353759765625, -0.13442611694335938, -0.1240386962890625, -0.11365127563476562, -0.10326385498046875, -0.09287643432617188, -0.082489013671875, -0.07210159301757812, -0.06171417236328125, -0.051326751708984375, -0.0409393310546875, -0.030551910400390625, -0.02016448974609375, -0.009777069091796875, 0.0006103515625, 0.010997772216796875, 0.02138519287109375, 0.031772613525390625, 0.0421600341796875, 0.052547454833984375, 0.06293487548828125, 0.07332229614257812, 0.083709716796875, 0.09409713745117188, 0.10448455810546875, 0.11487197875976562, 0.1252593994140625, 0.13564682006835938, 0.14603424072265625, 0.15642166137695312, 0.16680908203125, 0.17719650268554688, 0.18758392333984375, 0.19797134399414062, 0.2083587646484375, 0.21874618530273438, 0.22913360595703125, 0.23952102661132812, 0.249908447265625, 0.2602958679199219, 0.27068328857421875, 0.2810707092285156, 0.2914581298828125, 0.3018455505371094, 0.31223297119140625, 0.3226203918457031, 0.3330078125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 10.0, 15.0, 10.0, 12.0, 17.0, 12.0, 19.0, 28.0, 24.0, 25.0, 33.0, 31.0, 39.0, 36.0, 40.0, 31.0, 46.0, 40.0, 1081.0, 39.0, 37.0, 45.0, 34.0, 26.0, 44.0, 35.0, 18.0, 32.0, 24.0, 28.0, 19.0, 16.0, 16.0, 10.0, 7.0, 8.0, 8.0, 7.0, 3.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.2523193359375, -10.879638671875, -10.5069580078125, -10.13427734375, -9.7615966796875, -9.388916015625, -9.0162353515625, -8.6435546875, -8.2708740234375, -7.898193359375, -7.5255126953125, -7.15283203125, -6.7801513671875, -6.407470703125, -6.0347900390625, -5.662109375, -5.2894287109375, -4.916748046875, -4.5440673828125, -4.17138671875, -3.7987060546875, -3.426025390625, -3.0533447265625, -2.6806640625, -2.3079833984375, -1.935302734375, -1.5626220703125, -1.18994140625, -0.8172607421875, -0.444580078125, -0.0718994140625, 0.30078125, 0.6734619140625, 1.046142578125, 1.4188232421875, 1.79150390625, 2.1641845703125, 2.536865234375, 2.9095458984375, 3.2822265625, 3.6549072265625, 4.027587890625, 4.4002685546875, 4.77294921875, 5.1456298828125, 5.518310546875, 5.8909912109375, 6.263671875, 6.6363525390625, 7.009033203125, 7.3817138671875, 7.75439453125, 8.1270751953125, 8.499755859375, 8.8724365234375, 9.2451171875, 9.6177978515625, 9.990478515625, 10.3631591796875, 10.73583984375, 11.1085205078125, 11.481201171875, 11.8538818359375, 12.2265625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 10.0, 20.0, 27.0, 34.0, 35.0, 77.0, 93.0, 161.0, 244.0, 315.0, 476.0, 749.0, 1088.0, 1545.0, 2277.0, 3284.0, 4856.0, 7444.0, 11406.0, 17423.0, 27365.0, 44119.0, 71367.0, 119476.0, 257228.0, 1206894.0, 121969.0, 71938.0, 44924.0, 28021.0, 17832.0, 11426.0, 7538.0, 4988.0, 3250.0, 2252.0, 1566.0, 1068.0, 752.0, 504.0, 349.0, 246.0, 165.0, 120.0, 72.0, 47.0, 34.0, 20.0, 9.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0], "bins": [-0.192138671875, -0.18631935119628906, -0.18050003051757812, -0.1746807098388672, -0.16886138916015625, -0.1630420684814453, -0.15722274780273438, -0.15140342712402344, -0.1455841064453125, -0.13976478576660156, -0.13394546508789062, -0.1281261444091797, -0.12230682373046875, -0.11648750305175781, -0.11066818237304688, -0.10484886169433594, -0.099029541015625, -0.09321022033691406, -0.08739089965820312, -0.08157157897949219, -0.07575225830078125, -0.06993293762207031, -0.06411361694335938, -0.05829429626464844, -0.0524749755859375, -0.04665565490722656, -0.040836334228515625, -0.03501701354980469, -0.02919769287109375, -0.023378372192382812, -0.017559051513671875, -0.011739730834960938, -0.00592041015625, -0.0001010894775390625, 0.005718231201171875, 0.011537551879882812, 0.01735687255859375, 0.023176193237304688, 0.028995513916015625, 0.03481483459472656, 0.0406341552734375, 0.04645347595214844, 0.052272796630859375, 0.05809211730957031, 0.06391143798828125, 0.06973075866699219, 0.07555007934570312, 0.08136940002441406, 0.087188720703125, 0.09300804138183594, 0.09882736206054688, 0.10464668273925781, 0.11046600341796875, 0.11628532409667969, 0.12210464477539062, 0.12792396545410156, 0.1337432861328125, 0.13956260681152344, 0.14538192749023438, 0.1512012481689453, 0.15702056884765625, 0.1628398895263672, 0.16865921020507812, 0.17447853088378906, 0.1802978515625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 9.0, 10.0, 7.0, 3.0, 4.0, 11.0, 18.0, 16.0, 22.0, 23.0, 29.0, 20.0, 28.0, 40.0, 43.0, 39.0, 66.0, 102.0, 111.0, 67.0, 55.0, 35.0, 42.0, 31.0, 20.0, 29.0, 16.0, 14.0, 13.0, 11.0, 12.0, 9.0, 9.0, 6.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004000663757324219, -0.0003871992230415344, -0.00037433207035064697, -0.0003614649176597595, -0.00034859776496887207, -0.0003357306122779846, -0.00032286345958709717, -0.0003099963068962097, -0.00029712915420532227, -0.0002842620015144348, -0.00027139484882354736, -0.0002585276961326599, -0.00024566054344177246, -0.000232793390750885, -0.00021992623805999756, -0.0002070590853691101, -0.00019419193267822266, -0.0001813247799873352, -0.00016845762729644775, -0.0001555904746055603, -0.00014272332191467285, -0.0001298561692237854, -0.00011698901653289795, -0.0001041218638420105, -9.125471115112305e-05, -7.83875584602356e-05, -6.552040576934814e-05, -5.265325307846069e-05, -3.978610038757324e-05, -2.691894769668579e-05, -1.405179500579834e-05, -1.1846423149108887e-06, 1.1682510375976562e-05, 2.4549663066864014e-05, 3.7416815757751465e-05, 5.0283968448638916e-05, 6.315112113952637e-05, 7.601827383041382e-05, 8.888542652130127e-05, 0.00010175257921218872, 0.00011461973190307617, 0.00012748688459396362, 0.00014035403728485107, 0.00015322118997573853, 0.00016608834266662598, 0.00017895549535751343, 0.00019182264804840088, 0.00020468980073928833, 0.00021755695343017578, 0.00023042410612106323, 0.00024329125881195068, 0.00025615841150283813, 0.0002690255641937256, 0.00028189271688461304, 0.0002947598695755005, 0.00030762702226638794, 0.0003204941749572754, 0.00033336132764816284, 0.0003462284803390503, 0.00035909563302993774, 0.0003719627857208252, 0.00038482993841171265, 0.0003976970911026001, 0.00041056424379348755, 0.000423431396484375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 10.0, 12.0, 7.0, 14.0, 20.0, 14.0, 22.0, 37.0, 43.0, 59.0, 81.0, 133.0, 232.0, 540.0, 3175.0, 1023569.0, 18884.0, 799.0, 293.0, 172.0, 100.0, 69.0, 36.0, 43.0, 35.0, 25.0, 22.0, 19.0, 18.0, 2.0, 7.0, 5.0, 12.0, 6.0, 7.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00942230224609375, -0.00913381576538086, -0.008845329284667969, -0.008556842803955078, -0.008268356323242188, -0.007979869842529297, -0.007691383361816406, -0.007402896881103516, -0.007114410400390625, -0.006825923919677734, -0.006537437438964844, -0.006248950958251953, -0.0059604644775390625, -0.005671977996826172, -0.005383491516113281, -0.005095005035400391, -0.0048065185546875, -0.004518032073974609, -0.004229545593261719, -0.003941059112548828, -0.0036525726318359375, -0.003364086151123047, -0.0030755996704101562, -0.0027871131896972656, -0.002498626708984375, -0.0022101402282714844, -0.0019216537475585938, -0.0016331672668457031, -0.0013446807861328125, -0.0010561943054199219, -0.0007677078247070312, -0.0004792213439941406, -0.00019073486328125, 9.775161743164062e-05, 0.00038623809814453125, 0.0006747245788574219, 0.0009632110595703125, 0.0012516975402832031, 0.0015401840209960938, 0.0018286705017089844, 0.002117156982421875, 0.0024056434631347656, 0.0026941299438476562, 0.002982616424560547, 0.0032711029052734375, 0.003559589385986328, 0.0038480758666992188, 0.004136562347412109, 0.004425048828125, 0.004713535308837891, 0.005002021789550781, 0.005290508270263672, 0.0055789947509765625, 0.005867481231689453, 0.006155967712402344, 0.006444454193115234, 0.006732940673828125, 0.007021427154541016, 0.007309913635253906, 0.007598400115966797, 0.007886886596679688, 0.008175373077392578, 0.008463859558105469, 0.00875234603881836, 0.00904083251953125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 262.0, 748.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024615549482405186, -0.0023176034446805716, -0.0021736519411206245, -0.0020297004375606775, -0.0018857489340007305, -0.0017417974304407835, -0.0015978459268808365, -0.0014538944233208895, -0.0013099429197609425, -0.0011659914162009954, -0.0010220399126410484, -0.0008780884090811014, -0.0007341369055211544, -0.0005901854019612074, -0.0004462338984012604, -0.00030228239484131336, -0.00015833089128136635, -1.4379387721419334e-05, 0.00012957211583852768, 0.0002735236193984747, 0.0004174751229584217, 0.0005614266265183687, 0.0007053781300783157, 0.0008493296336382627, 0.0009932811371982098, 0.0011372326407581568, 0.0012811841443181038, 0.0014251356478780508, 0.0015690871514379978, 0.0017130386549979448, 0.0018569901585578918, 0.002000941662117839, 0.0021448927000164986, 0.0022888442035764456, 0.0024327957071363926, 0.0025767472106963396, 0.0027206987142562866, 0.0028646502178162336, 0.0030086017213761806, 0.0031525532249361277, 0.0032965047284960747, 0.0034404562320560217, 0.0035844077356159687, 0.0037283592391759157, 0.0038723107427358627, 0.004016262479126453, 0.004160213749855757, 0.00430416502058506, 0.004448116756975651, 0.0045920684933662415, 0.004736019764095545, 0.004879971034824848, 0.005023922771215439, 0.0051678745076060295, 0.005311825778335333, 0.005455777049064636, 0.005599728785455227, 0.0057436805218458176, 0.005887631792575121, 0.006031583063304424, 0.006175534799695015, 0.006319486536085606, 0.006463437806814909, 0.006607389077544212, 0.006751340813934803]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 10.0, 21.0, 30.0, 40.0, 63.0, 69.0, 77.0, 107.0, 106.0, 94.0, 83.0, 85.0, 64.0, 61.0, 29.0, 22.0, 16.0, 11.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043714046478271484, -0.0004170164465904236, -0.0003968924283981323, -0.00037676841020584106, -0.0003566443920135498, -0.00033652037382125854, -0.0003163963556289673, -0.000296272337436676, -0.00027614831924438477, -0.0002560243010520935, -0.00023590028285980225, -0.00021577626466751099, -0.00019565224647521973, -0.00017552822828292847, -0.0001554042100906372, -0.00013528019189834595, -0.00011515617370605469, -9.503215551376343e-05, -7.490813732147217e-05, -5.478411912918091e-05, -3.466010093688965e-05, -1.4536082744598389e-05, 5.587935447692871e-06, 2.571195363998413e-05, 4.583597183227539e-05, 6.595999002456665e-05, 8.608400821685791e-05, 0.00010620802640914917, 0.00012633204460144043, 0.0001464560627937317, 0.00016658008098602295, 0.0001867040991783142, 0.00020682811737060547, 0.00022695213556289673, 0.000247076153755188, 0.00026720017194747925, 0.0002873241901397705, 0.00030744820833206177, 0.00032757222652435303, 0.0003476962447166443, 0.00036782026290893555, 0.0003879442811012268, 0.00040806829929351807, 0.0004281923174858093, 0.0004483163356781006, 0.00046844035387039185, 0.0004885643720626831, 0.0005086883902549744, 0.0005288124084472656, 0.0005489364266395569, 0.0005690604448318481, 0.0005891844630241394, 0.0006093084812164307, 0.0006294324994087219, 0.0006495565176010132, 0.0006696805357933044, 0.0006898045539855957, 0.000709928572177887, 0.0007300525903701782, 0.0007501766085624695, 0.0007703006267547607, 0.000790424644947052, 0.0008105486631393433, 0.0008306726813316345, 0.0008507966995239258]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 8.0, 9.0, 12.0, 17.0, 25.0, 16.0, 18.0, 25.0, 32.0, 33.0, 37.0, 30.0, 37.0, 31.0, 41.0, 44.0, 45.0, 48.0, 38.0, 33.0, 48.0, 44.0, 48.0, 37.0, 34.0, 25.0, 31.0, 37.0, 21.0, 19.0, 14.0, 11.0, 10.0, 10.0, 10.0, 3.0, 3.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.921875, -16.368896484375, -15.81591796875, -15.262939453125, -14.7099609375, -14.156982421875, -13.60400390625, -13.051025390625, -12.498046875, -11.945068359375, -11.39208984375, -10.839111328125, -10.2861328125, -9.733154296875, -9.18017578125, -8.627197265625, -8.07421875, -7.521240234375, -6.96826171875, -6.415283203125, -5.8623046875, -5.309326171875, -4.75634765625, -4.203369140625, -3.650390625, -3.097412109375, -2.54443359375, -1.991455078125, -1.4384765625, -0.885498046875, -0.33251953125, 0.220458984375, 0.7734375, 1.326416015625, 1.87939453125, 2.432373046875, 2.9853515625, 3.538330078125, 4.09130859375, 4.644287109375, 5.197265625, 5.750244140625, 6.30322265625, 6.856201171875, 7.4091796875, 7.962158203125, 8.51513671875, 9.068115234375, 9.62109375, 10.174072265625, 10.72705078125, 11.280029296875, 11.8330078125, 12.385986328125, 12.93896484375, 13.491943359375, 14.044921875, 14.597900390625, 15.15087890625, 15.703857421875, 16.2568359375, 16.809814453125, 17.36279296875, 17.915771484375, 18.46875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 11.0, 6.0, 13.0, 17.0, 20.0, 36.0, 53.0, 73.0, 110.0, 156.0, 238.0, 395.0, 572.0, 949.0, 1464.0, 2347.0, 3611.0, 5898.0, 9482.0, 16701.0, 31602.0, 72078.0, 239854.0, 445265.0, 118102.0, 45072.0, 22132.0, 12451.0, 7325.0, 4499.0, 2908.0, 1779.0, 1214.0, 682.0, 471.0, 324.0, 188.0, 156.0, 103.0, 64.0, 36.0, 32.0, 18.0, 16.0, 8.0, 7.0, 5.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.59375, -19.97412109375, -19.3544921875, -18.73486328125, -18.115234375, -17.49560546875, -16.8759765625, -16.25634765625, -15.63671875, -15.01708984375, -14.3974609375, -13.77783203125, -13.158203125, -12.53857421875, -11.9189453125, -11.29931640625, -10.6796875, -10.06005859375, -9.4404296875, -8.82080078125, -8.201171875, -7.58154296875, -6.9619140625, -6.34228515625, -5.72265625, -5.10302734375, -4.4833984375, -3.86376953125, -3.244140625, -2.62451171875, -2.0048828125, -1.38525390625, -0.765625, -0.14599609375, 0.4736328125, 1.09326171875, 1.712890625, 2.33251953125, 2.9521484375, 3.57177734375, 4.19140625, 4.81103515625, 5.4306640625, 6.05029296875, 6.669921875, 7.28955078125, 7.9091796875, 8.52880859375, 9.1484375, 9.76806640625, 10.3876953125, 11.00732421875, 11.626953125, 12.24658203125, 12.8662109375, 13.48583984375, 14.10546875, 14.72509765625, 15.3447265625, 15.96435546875, 16.583984375, 17.20361328125, 17.8232421875, 18.44287109375, 19.0625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 11.0, 5.0, 3.0, 8.0, 16.0, 26.0, 28.0, 17.0, 35.0, 27.0, 44.0, 30.0, 30.0, 55.0, 76.0, 108.0, 205.0, 1585.0, 207.0, 92.0, 68.0, 56.0, 51.0, 40.0, 33.0, 37.0, 20.0, 27.0, 24.0, 21.0, 19.0, 7.0, 9.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.59375, -47.14599609375, -45.6982421875, -44.25048828125, -42.802734375, -41.35498046875, -39.9072265625, -38.45947265625, -37.01171875, -35.56396484375, -34.1162109375, -32.66845703125, -31.220703125, -29.77294921875, -28.3251953125, -26.87744140625, -25.4296875, -23.98193359375, -22.5341796875, -21.08642578125, -19.638671875, -18.19091796875, -16.7431640625, -15.29541015625, -13.84765625, -12.39990234375, -10.9521484375, -9.50439453125, -8.056640625, -6.60888671875, -5.1611328125, -3.71337890625, -2.265625, -0.81787109375, 0.6298828125, 2.07763671875, 3.525390625, 4.97314453125, 6.4208984375, 7.86865234375, 9.31640625, 10.76416015625, 12.2119140625, 13.65966796875, 15.107421875, 16.55517578125, 18.0029296875, 19.45068359375, 20.8984375, 22.34619140625, 23.7939453125, 25.24169921875, 26.689453125, 28.13720703125, 29.5849609375, 31.03271484375, 32.48046875, 33.92822265625, 35.3759765625, 36.82373046875, 38.271484375, 39.71923828125, 41.1669921875, 42.61474609375, 44.0625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 4.0, 7.0, 13.0, 3.0, 7.0, 16.0, 26.0, 31.0, 28.0, 40.0, 64.0, 92.0, 133.0, 219.0, 364.0, 941.0, 2336.0, 7172.0, 24958.0, 150872.0, 2749073.0, 170117.0, 26890.0, 7786.0, 2452.0, 953.0, 362.0, 246.0, 119.0, 108.0, 54.0, 36.0, 41.0, 33.0, 15.0, 16.0, 19.0, 13.0, 5.0, 7.0, 5.0, 6.0, 7.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-52.34375, -50.734375, -49.125, -47.515625, -45.90625, -44.296875, -42.6875, -41.078125, -39.46875, -37.859375, -36.25, -34.640625, -33.03125, -31.421875, -29.8125, -28.203125, -26.59375, -24.984375, -23.375, -21.765625, -20.15625, -18.546875, -16.9375, -15.328125, -13.71875, -12.109375, -10.5, -8.890625, -7.28125, -5.671875, -4.0625, -2.453125, -0.84375, 0.765625, 2.375, 3.984375, 5.59375, 7.203125, 8.8125, 10.421875, 12.03125, 13.640625, 15.25, 16.859375, 18.46875, 20.078125, 21.6875, 23.296875, 24.90625, 26.515625, 28.125, 29.734375, 31.34375, 32.953125, 34.5625, 36.171875, 37.78125, 39.390625, 41.0, 42.609375, 44.21875, 45.828125, 47.4375, 49.046875, 50.65625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 47.0, 390.0, 494.0, 71.0, 10.0, 1.0, 1.0, 1.0], "bins": [-779.1015625, -765.6905517578125, -752.279541015625, -738.8685302734375, -725.4574584960938, -712.0464477539062, -698.6354370117188, -685.2244262695312, -671.8134155273438, -658.4024047851562, -644.9913940429688, -631.580322265625, -618.1693115234375, -604.75830078125, -591.3472900390625, -577.936279296875, -564.5252685546875, -551.1142578125, -537.7032470703125, -524.292236328125, -510.8811950683594, -497.47015380859375, -484.05914306640625, -470.64813232421875, -457.237060546875, -443.8260498046875, -430.4150085449219, -417.0039978027344, -403.5929870605469, -390.18194580078125, -376.77093505859375, -363.35992431640625, -349.9489440917969, -336.5379333496094, -323.12689208984375, -309.71588134765625, -296.30487060546875, -282.89385986328125, -269.4828186035156, -256.0718078613281, -242.66078186035156, -229.249755859375, -215.8387451171875, -202.42771911621094, -189.01669311523438, -175.60568237304688, -162.1946563720703, -148.78363037109375, -135.37261962890625, -121.96160125732422, -108.55058288574219, -95.13955688476562, -81.7285385131836, -68.31752014160156, -54.906494140625, -41.49547576904297, -28.084457397460938, -14.673437118530273, -1.2624168395996094, 12.148605346679688, 25.55962371826172, 38.97064208984375, 52.38166809082031, 65.79268646240234, 79.20370483398438]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 6.0, 5.0, 4.0, 8.0, 6.0, 8.0, 16.0, 12.0, 11.0, 19.0, 19.0, 17.0, 16.0, 24.0, 24.0, 27.0, 29.0, 34.0, 26.0, 36.0, 40.0, 25.0, 37.0, 45.0, 37.0, 34.0, 38.0, 43.0, 41.0, 41.0, 33.0, 22.0, 34.0, 21.0, 15.0, 22.0, 23.0, 18.0, 19.0, 8.0, 9.0, 11.0, 10.0, 6.0, 6.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-85.95767211914062, -83.10855102539062, -80.25942993164062, -77.41031646728516, -74.56119537353516, -71.71207427978516, -68.86296081542969, -66.01383972167969, -63.16471862792969, -60.31559753417969, -57.46648025512695, -54.61736297607422, -51.76824188232422, -48.91912078857422, -46.070003509521484, -43.22088623046875, -40.37176513671875, -37.52264404296875, -34.673526763916016, -31.82440757751465, -28.97528839111328, -26.126169204711914, -23.277050018310547, -20.42793083190918, -17.578811645507812, -14.729692459106445, -11.880573272705078, -9.031454086303711, -6.182334899902344, -3.3332157135009766, -0.4840965270996094, 2.365022659301758, 5.214134216308594, 8.063253402709961, 10.912372589111328, 13.761491775512695, 16.610610961914062, 19.45973014831543, 22.308849334716797, 25.157968521118164, 28.00708770751953, 30.8562068939209, 33.705326080322266, 36.554443359375, 39.403564453125, 42.252685546875, 45.101802825927734, 47.95092010498047, 50.80004119873047, 53.64916229248047, 56.4982795715332, 59.34739685058594, 62.19651794433594, 65.04563903808594, 67.89476013183594, 70.7438735961914, 73.5929946899414, 76.4421157836914, 79.29122924804688, 82.14035034179688, 84.98947143554688, 87.83859252929688, 90.68771362304688, 93.53682708740234, 96.38594818115234]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 8.0, 3.0, 11.0, 10.0, 18.0, 22.0, 23.0, 24.0, 28.0, 33.0, 38.0, 29.0, 40.0, 35.0, 41.0, 42.0, 42.0, 49.0, 39.0, 48.0, 39.0, 62.0, 46.0, 40.0, 33.0, 18.0, 32.0, 26.0, 24.0, 27.0, 18.0, 14.0, 11.0, 5.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.453125, -19.849853515625, -19.24658203125, -18.643310546875, -18.0400390625, -17.436767578125, -16.83349609375, -16.230224609375, -15.626953125, -15.023681640625, -14.42041015625, -13.817138671875, -13.2138671875, -12.610595703125, -12.00732421875, -11.404052734375, -10.80078125, -10.197509765625, -9.59423828125, -8.990966796875, -8.3876953125, -7.784423828125, -7.18115234375, -6.577880859375, -5.974609375, -5.371337890625, -4.76806640625, -4.164794921875, -3.5615234375, -2.958251953125, -2.35498046875, -1.751708984375, -1.1484375, -0.545166015625, 0.05810546875, 0.661376953125, 1.2646484375, 1.867919921875, 2.47119140625, 3.074462890625, 3.677734375, 4.281005859375, 4.88427734375, 5.487548828125, 6.0908203125, 6.694091796875, 7.29736328125, 7.900634765625, 8.50390625, 9.107177734375, 9.71044921875, 10.313720703125, 10.9169921875, 11.520263671875, 12.12353515625, 12.726806640625, 13.330078125, 13.933349609375, 14.53662109375, 15.139892578125, 15.7431640625, 16.346435546875, 16.94970703125, 17.552978515625, 18.15625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 2.0, 4.0, 1.0, 4.0, 6.0, 11.0, 10.0, 10.0, 18.0, 14.0, 22.0, 28.0, 30.0, 35.0, 48.0, 58.0, 75.0, 85.0, 116.0, 183.0, 283.0, 652.0, 2020.0, 13444.0, 2764806.0, 1397797.0, 11174.0, 1758.0, 542.0, 298.0, 171.0, 133.0, 85.0, 64.0, 56.0, 47.0, 33.0, 24.0, 18.0, 19.0, 20.0, 16.0, 15.0, 14.0, 8.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-128.875, -124.96484375, -121.0546875, -117.14453125, -113.234375, -109.32421875, -105.4140625, -101.50390625, -97.59375, -93.68359375, -89.7734375, -85.86328125, -81.953125, -78.04296875, -74.1328125, -70.22265625, -66.3125, -62.40234375, -58.4921875, -54.58203125, -50.671875, -46.76171875, -42.8515625, -38.94140625, -35.03125, -31.12109375, -27.2109375, -23.30078125, -19.390625, -15.48046875, -11.5703125, -7.66015625, -3.75, 0.16015625, 4.0703125, 7.98046875, 11.890625, 15.80078125, 19.7109375, 23.62109375, 27.53125, 31.44140625, 35.3515625, 39.26171875, 43.171875, 47.08203125, 50.9921875, 54.90234375, 58.8125, 62.72265625, 66.6328125, 70.54296875, 74.453125, 78.36328125, 82.2734375, 86.18359375, 90.09375, 94.00390625, 97.9140625, 101.82421875, 105.734375, 109.64453125, 113.5546875, 117.46484375, 121.375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 4.0, 5.0, 8.0, 5.0, 8.0, 12.0, 16.0, 15.0, 22.0, 20.0, 20.0, 38.0, 31.0, 50.0, 93.0, 133.0, 221.0, 306.0, 554.0, 756.0, 642.0, 361.0, 231.0, 128.0, 84.0, 65.0, 54.0, 35.0, 29.0, 27.0, 20.0, 14.0, 9.0, 9.0, 7.0, 6.0, 6.0, 4.0, 6.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-24.640625, -23.908935546875, -23.17724609375, -22.445556640625, -21.7138671875, -20.982177734375, -20.25048828125, -19.518798828125, -18.787109375, -18.055419921875, -17.32373046875, -16.592041015625, -15.8603515625, -15.128662109375, -14.39697265625, -13.665283203125, -12.93359375, -12.201904296875, -11.47021484375, -10.738525390625, -10.0068359375, -9.275146484375, -8.54345703125, -7.811767578125, -7.080078125, -6.348388671875, -5.61669921875, -4.885009765625, -4.1533203125, -3.421630859375, -2.68994140625, -1.958251953125, -1.2265625, -0.494873046875, 0.23681640625, 0.968505859375, 1.7001953125, 2.431884765625, 3.16357421875, 3.895263671875, 4.626953125, 5.358642578125, 6.09033203125, 6.822021484375, 7.5537109375, 8.285400390625, 9.01708984375, 9.748779296875, 10.48046875, 11.212158203125, 11.94384765625, 12.675537109375, 13.4072265625, 14.138916015625, 14.87060546875, 15.602294921875, 16.333984375, 17.065673828125, 17.79736328125, 18.529052734375, 19.2607421875, 19.992431640625, 20.72412109375, 21.455810546875, 22.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 11.0, 20.0, 24.0, 27.0, 31.0, 59.0, 86.0, 129.0, 224.0, 614.0, 1987.0, 7831.0, 43538.0, 983151.0, 3077974.0, 64004.0, 10664.0, 2467.0, 710.0, 309.0, 118.0, 89.0, 52.0, 37.0, 45.0, 19.0, 15.0, 11.0, 6.0, 5.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.1875, -70.833984375, -68.48046875, -66.126953125, -63.7734375, -61.419921875, -59.06640625, -56.712890625, -54.359375, -52.005859375, -49.65234375, -47.298828125, -44.9453125, -42.591796875, -40.23828125, -37.884765625, -35.53125, -33.177734375, -30.82421875, -28.470703125, -26.1171875, -23.763671875, -21.41015625, -19.056640625, -16.703125, -14.349609375, -11.99609375, -9.642578125, -7.2890625, -4.935546875, -2.58203125, -0.228515625, 2.125, 4.478515625, 6.83203125, 9.185546875, 11.5390625, 13.892578125, 16.24609375, 18.599609375, 20.953125, 23.306640625, 25.66015625, 28.013671875, 30.3671875, 32.720703125, 35.07421875, 37.427734375, 39.78125, 42.134765625, 44.48828125, 46.841796875, 49.1953125, 51.548828125, 53.90234375, 56.255859375, 58.609375, 60.962890625, 63.31640625, 65.669921875, 68.0234375, 70.376953125, 72.73046875, 75.083984375, 77.4375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 3.0, 30.0, 318.0, 575.0, 81.0, 12.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.22539520263672, -56.66133117675781, -39.09726333618164, -21.53319549560547, -3.9691314697265625, 13.594932556152344, 31.15900421142578, 48.72306823730469, 66.2871322631836, 83.8511962890625, 101.41526794433594, 118.97933197021484, 136.54339599609375, 154.10745239257812, 171.67153930664062, 189.235595703125, 206.79965209960938, 224.3637237548828, 241.9277801513672, 259.4918518066406, 277.055908203125, 294.6199951171875, 312.1840515136719, 329.74810791015625, 347.31219482421875, 364.8762512207031, 382.4403381347656, 400.00439453125, 417.5684509277344, 435.13250732421875, 452.69659423828125, 470.2606506347656, 487.82476806640625, 505.3888244628906, 522.952880859375, 540.5169677734375, 558.0810546875, 575.6450805664062, 593.2091674804688, 610.7732543945312, 628.3372802734375, 645.9013671875, 663.4653930664062, 681.0294799804688, 698.5935668945312, 716.1575927734375, 733.7216796875, 751.2857666015625, 768.849853515625, 786.4139404296875, 803.9779663085938, 821.5420532226562, 839.1061401367188, 856.670166015625, 874.2342529296875, 891.79833984375, 909.3623657226562, 926.9264526367188, 944.490478515625, 962.0545654296875, 979.61865234375, 997.1826782226562, 1014.7467651367188, 1032.310791015625, 1049.8748779296875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 3.0, 3.0, 7.0, 12.0, 12.0, 18.0, 23.0, 19.0, 24.0, 28.0, 19.0, 31.0, 34.0, 46.0, 27.0, 42.0, 44.0, 35.0, 45.0, 51.0, 31.0, 45.0, 46.0, 36.0, 41.0, 44.0, 34.0, 30.0, 26.0, 20.0, 25.0, 28.0, 19.0, 10.0, 11.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-89.94453430175781, -87.46626281738281, -84.98799133300781, -82.50971221923828, -80.03144073486328, -77.55316925048828, -75.07489776611328, -72.59661865234375, -70.11834716796875, -67.64007568359375, -65.16180419921875, -62.683528900146484, -60.20525360107422, -57.72698211669922, -55.24871063232422, -52.77043533325195, -50.29216384887695, -47.81389236450195, -45.33561706542969, -42.85734558105469, -40.37907028198242, -37.90079879760742, -35.422523498535156, -32.944252014160156, -30.465978622436523, -27.98770523071289, -25.509431838989258, -23.031158447265625, -20.552886962890625, -18.07461166381836, -15.59634017944336, -13.118066787719727, -10.639793395996094, -8.161520004272461, -5.683247089385986, -3.2049741744995117, -0.7267007827758789, 1.751572608947754, 4.22984504699707, 6.708118438720703, 9.186391830444336, 11.664665222167969, 14.142938613891602, 16.621212005615234, 19.099483489990234, 21.5777587890625, 24.0560302734375, 26.534303665161133, 29.012577056884766, 31.4908504486084, 33.96912384033203, 36.44739532470703, 38.9256706237793, 41.4039421081543, 43.88221740722656, 46.36048889160156, 48.83876037597656, 51.31703186035156, 53.79530715942383, 56.27357864379883, 58.751853942871094, 61.230125427246094, 63.708396911621094, 66.18667602539062, 68.66494750976562]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 15.0, 14.0, 11.0, 20.0, 16.0, 26.0, 37.0, 29.0, 25.0, 32.0, 41.0, 46.0, 48.0, 44.0, 48.0, 45.0, 46.0, 55.0, 44.0, 53.0, 37.0, 45.0, 33.0, 22.0, 32.0, 30.0, 26.0, 16.0, 13.0, 12.0, 9.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.897705078125, -18.29541015625, -17.693115234375, -17.0908203125, -16.488525390625, -15.88623046875, -15.283935546875, -14.681640625, -14.079345703125, -13.47705078125, -12.874755859375, -12.2724609375, -11.670166015625, -11.06787109375, -10.465576171875, -9.86328125, -9.260986328125, -8.65869140625, -8.056396484375, -7.4541015625, -6.851806640625, -6.24951171875, -5.647216796875, -5.044921875, -4.442626953125, -3.84033203125, -3.238037109375, -2.6357421875, -2.033447265625, -1.43115234375, -0.828857421875, -0.2265625, 0.375732421875, 0.97802734375, 1.580322265625, 2.1826171875, 2.784912109375, 3.38720703125, 3.989501953125, 4.591796875, 5.194091796875, 5.79638671875, 6.398681640625, 7.0009765625, 7.603271484375, 8.20556640625, 8.807861328125, 9.41015625, 10.012451171875, 10.61474609375, 11.217041015625, 11.8193359375, 12.421630859375, 13.02392578125, 13.626220703125, 14.228515625, 14.830810546875, 15.43310546875, 16.035400390625, 16.6376953125, 17.239990234375, 17.84228515625, 18.444580078125, 19.046875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 7.0, 8.0, 23.0, 22.0, 46.0, 67.0, 81.0, 127.0, 194.0, 319.0, 484.0, 747.0, 1242.0, 2112.0, 3394.0, 5707.0, 9716.0, 17037.0, 30133.0, 53334.0, 95703.0, 174369.0, 263436.0, 172646.0, 94221.0, 52546.0, 29770.0, 17031.0, 9626.0, 5690.0, 3331.0, 2030.0, 1271.0, 722.0, 484.0, 306.0, 198.0, 138.0, 82.0, 50.0, 29.0, 28.0, 12.0, 17.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.384033203125, -0.3718376159667969, -0.35964202880859375, -0.3474464416503906, -0.3352508544921875, -0.3230552673339844, -0.31085968017578125, -0.2986640930175781, -0.286468505859375, -0.2742729187011719, -0.26207733154296875, -0.24988174438476562, -0.2376861572265625, -0.22549057006835938, -0.21329498291015625, -0.20109939575195312, -0.18890380859375, -0.17670822143554688, -0.16451263427734375, -0.15231704711914062, -0.1401214599609375, -0.12792587280273438, -0.11573028564453125, -0.10353469848632812, -0.091339111328125, -0.07914352416992188, -0.06694793701171875, -0.054752349853515625, -0.0425567626953125, -0.030361175537109375, -0.01816558837890625, -0.005970001220703125, 0.0062255859375, 0.018421173095703125, 0.03061676025390625, 0.042812347412109375, 0.0550079345703125, 0.06720352172851562, 0.07939910888671875, 0.09159469604492188, 0.103790283203125, 0.11598587036132812, 0.12818145751953125, 0.14037704467773438, 0.1525726318359375, 0.16476821899414062, 0.17696380615234375, 0.18915939331054688, 0.20135498046875, 0.21355056762695312, 0.22574615478515625, 0.23794174194335938, 0.2501373291015625, 0.2623329162597656, 0.27452850341796875, 0.2867240905761719, 0.298919677734375, 0.3111152648925781, 0.32331085205078125, 0.3355064392089844, 0.3477020263671875, 0.3598976135253906, 0.37209320068359375, 0.3842887878417969, 0.396484375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 6.0, 3.0, 5.0, 8.0, 15.0, 10.0, 16.0, 17.0, 17.0, 28.0, 28.0, 28.0, 28.0, 33.0, 28.0, 44.0, 31.0, 35.0, 41.0, 41.0, 1058.0, 36.0, 51.0, 48.0, 38.0, 29.0, 32.0, 24.0, 34.0, 29.0, 25.0, 33.0, 16.0, 16.0, 20.0, 8.0, 12.0, 12.0, 10.0, 4.0, 5.0, 7.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.359375, -10.01171875, -9.6640625, -9.31640625, -8.96875, -8.62109375, -8.2734375, -7.92578125, -7.578125, -7.23046875, -6.8828125, -6.53515625, -6.1875, -5.83984375, -5.4921875, -5.14453125, -4.796875, -4.44921875, -4.1015625, -3.75390625, -3.40625, -3.05859375, -2.7109375, -2.36328125, -2.015625, -1.66796875, -1.3203125, -0.97265625, -0.625, -0.27734375, 0.0703125, 0.41796875, 0.765625, 1.11328125, 1.4609375, 1.80859375, 2.15625, 2.50390625, 2.8515625, 3.19921875, 3.546875, 3.89453125, 4.2421875, 4.58984375, 4.9375, 5.28515625, 5.6328125, 5.98046875, 6.328125, 6.67578125, 7.0234375, 7.37109375, 7.71875, 8.06640625, 8.4140625, 8.76171875, 9.109375, 9.45703125, 9.8046875, 10.15234375, 10.5, 10.84765625, 11.1953125, 11.54296875, 11.890625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 12.0, 14.0, 35.0, 50.0, 91.0, 138.0, 204.0, 400.0, 595.0, 882.0, 1357.0, 2019.0, 3322.0, 5350.0, 8697.0, 14370.0, 23701.0, 39814.0, 67846.0, 120329.0, 233289.0, 1275200.0, 125342.0, 70060.0, 41203.0, 24498.0, 14439.0, 8934.0, 5454.0, 3475.0, 2125.0, 1397.0, 920.0, 613.0, 372.0, 235.0, 139.0, 84.0, 45.0, 18.0, 13.0, 11.0, 12.0, 4.0, 5.0, 4.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2047119140625, -0.19811439514160156, -0.19151687622070312, -0.1849193572998047, -0.17832183837890625, -0.1717243194580078, -0.16512680053710938, -0.15852928161621094, -0.1519317626953125, -0.14533424377441406, -0.13873672485351562, -0.1321392059326172, -0.12554168701171875, -0.11894416809082031, -0.11234664916992188, -0.10574913024902344, -0.099151611328125, -0.09255409240722656, -0.08595657348632812, -0.07935905456542969, -0.07276153564453125, -0.06616401672363281, -0.059566497802734375, -0.05296897888183594, -0.0463714599609375, -0.03977394104003906, -0.033176422119140625, -0.026578903198242188, -0.01998138427734375, -0.013383865356445312, -0.006786346435546875, -0.0001888275146484375, 0.00640869140625, 0.013006210327148438, 0.019603729248046875, 0.026201248168945312, 0.03279876708984375, 0.03939628601074219, 0.045993804931640625, 0.05259132385253906, 0.0591888427734375, 0.06578636169433594, 0.07238388061523438, 0.07898139953613281, 0.08557891845703125, 0.09217643737792969, 0.09877395629882812, 0.10537147521972656, 0.111968994140625, 0.11856651306152344, 0.12516403198242188, 0.1317615509033203, 0.13835906982421875, 0.1449565887451172, 0.15155410766601562, 0.15815162658691406, 0.1647491455078125, 0.17134666442871094, 0.17794418334960938, 0.1845417022705078, 0.19113922119140625, 0.1977367401123047, 0.20433425903320312, 0.21093177795410156, 0.217529296875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 7.0, 4.0, 6.0, 14.0, 16.0, 18.0, 36.0, 50.0, 54.0, 82.0, 141.0, 147.0, 107.0, 81.0, 59.0, 45.0, 28.0, 19.0, 20.0, 13.0, 7.0, 7.0, 8.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003809928894042969, -0.0003670230507850647, -0.0003530532121658325, -0.00033908337354660034, -0.00032511353492736816, -0.000311143696308136, -0.0002971738576889038, -0.00028320401906967163, -0.00026923418045043945, -0.0002552643418312073, -0.0002412945032119751, -0.00022732466459274292, -0.00021335482597351074, -0.00019938498735427856, -0.0001854151487350464, -0.0001714453101158142, -0.00015747547149658203, -0.00014350563287734985, -0.00012953579425811768, -0.0001155659556388855, -0.00010159611701965332, -8.762627840042114e-05, -7.365643978118896e-05, -5.968660116195679e-05, -4.571676254272461e-05, -3.174692392349243e-05, -1.7777085304260254e-05, -3.807246685028076e-06, 1.0162591934204102e-05, 2.413243055343628e-05, 3.810226917266846e-05, 5.2072107791900635e-05, 6.604194641113281e-05, 8.001178503036499e-05, 9.398162364959717e-05, 0.00010795146226882935, 0.00012192130088806152, 0.0001358911395072937, 0.00014986097812652588, 0.00016383081674575806, 0.00017780065536499023, 0.0001917704939842224, 0.0002057403326034546, 0.00021971017122268677, 0.00023368000984191895, 0.0002476498484611511, 0.0002616196870803833, 0.0002755895256996155, 0.00028955936431884766, 0.00030352920293807983, 0.000317499041557312, 0.0003314688801765442, 0.00034543871879577637, 0.00035940855741500854, 0.0003733783960342407, 0.0003873482346534729, 0.0004013180732727051, 0.00041528791189193726, 0.00042925775051116943, 0.0004432275891304016, 0.0004571974277496338, 0.00047116726636886597, 0.00048513710498809814, 0.0004991069436073303, 0.0005130767822265625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 7.0, 11.0, 20.0, 33.0, 38.0, 57.0, 94.0, 166.0, 358.0, 1598.0, 1023800.0, 21245.0, 555.0, 227.0, 108.0, 71.0, 38.0, 19.0, 24.0, 12.0, 8.0, 11.0, 5.0, 4.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0111846923828125, -0.010880231857299805, -0.01057577133178711, -0.010271310806274414, -0.009966850280761719, -0.009662389755249023, -0.009357929229736328, -0.009053468704223633, -0.008749008178710938, -0.008444547653198242, -0.008140087127685547, -0.007835626602172852, -0.007531166076660156, -0.007226705551147461, -0.006922245025634766, -0.00661778450012207, -0.006313323974609375, -0.00600886344909668, -0.005704402923583984, -0.005399942398071289, -0.005095481872558594, -0.0047910213470458984, -0.004486560821533203, -0.004182100296020508, -0.0038776397705078125, -0.003573179244995117, -0.003268718719482422, -0.0029642581939697266, -0.0026597976684570312, -0.002355337142944336, -0.0020508766174316406, -0.0017464160919189453, -0.00144195556640625, -0.0011374950408935547, -0.0008330345153808594, -0.0005285739898681641, -0.00022411346435546875, 8.034706115722656e-05, 0.0003848075866699219, 0.0006892681121826172, 0.0009937286376953125, 0.0012981891632080078, 0.0016026496887207031, 0.0019071102142333984, 0.0022115707397460938, 0.002516031265258789, 0.0028204917907714844, 0.0031249523162841797, 0.003429412841796875, 0.0037338733673095703, 0.004038333892822266, 0.004342794418334961, 0.004647254943847656, 0.0049517154693603516, 0.005256175994873047, 0.005560636520385742, 0.0058650970458984375, 0.006169557571411133, 0.006474018096923828, 0.0067784786224365234, 0.007082939147949219, 0.007387399673461914, 0.007691860198974609, 0.007996320724487305, 0.00830078125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 17.0, 251.0, 689.0, 45.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0012884201714769006, -0.001239330624230206, -0.0011902411933988333, -0.0011411516461521387, -0.0010920620989054441, -0.0010429726680740714, -0.0009938831208273768, -0.0009447936317883432, -0.0008957041427493095, -0.0008466146537102759, -0.0007975251646712422, -0.0007484356174245477, -0.000699346128385514, -0.0006502566393464804, -0.0006011670920997858, -0.0005520776030607522, -0.0005029881140217185, -0.00045389862498268485, -0.00040480910683982074, -0.00035571958869695663, -0.000306630099657923, -0.00025754061061888933, -0.00020845109247602522, -0.00015936157433316112, -0.00011027208529412746, -6.118258170317858e-05, -1.2093078112229705e-05, 3.6996425478719175e-05, 8.608592906966805e-05, 0.0001351754181087017, 0.00018426493625156581, 0.00023335445439442992, 0.0002824440598487854, 0.00033153354888781905, 0.00038062306703068316, 0.00042971258517354727, 0.0004788020742125809, 0.0005278915632516146, 0.0005769811104983091, 0.0006260705995373428, 0.0006751600885763764, 0.0007242495776154101, 0.0007733390666544437, 0.0008224286139011383, 0.000871518102940172, 0.0009206075919792056, 0.0009696971392259002, 0.001018786570057273, 0.0010678761173039675, 0.001116965664550662, 0.0011660550953820348, 0.0012151446426287293, 0.001264234073460102, 0.0013133236207067966, 0.0013624131679534912, 0.0014115027152001858, 0.0014605921460315585, 0.001509681693278253, 0.0015587711241096258, 0.0016078606713563204, 0.001656950218603015, 0.0017060396494343877, 0.0017551291966810822, 0.001804218627512455, 0.0018533081747591496]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 10.0, 15.0, 27.0, 39.0, 52.0, 62.0, 63.0, 61.0, 92.0, 79.0, 67.0, 89.0, 69.0, 62.0, 53.0, 46.0, 37.0, 28.0, 16.0, 12.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00040787458419799805, -0.000395849347114563, -0.00038382411003112793, -0.00037179887294769287, -0.0003597736358642578, -0.00034774839878082275, -0.0003357231616973877, -0.00032369792461395264, -0.0003116726875305176, -0.0002996474504470825, -0.00028762221336364746, -0.0002755969762802124, -0.00026357173919677734, -0.0002515465021133423, -0.00023952126502990723, -0.00022749602794647217, -0.0002154707908630371, -0.00020344555377960205, -0.000191420316696167, -0.00017939507961273193, -0.00016736984252929688, -0.00015534460544586182, -0.00014331936836242676, -0.0001312941312789917, -0.00011926889419555664, -0.00010724365711212158, -9.521842002868652e-05, -8.319318294525146e-05, -7.11679458618164e-05, -5.914270877838135e-05, -4.711747169494629e-05, -3.509223461151123e-05, -2.3066997528076172e-05, -1.1041760444641113e-05, 9.834766387939453e-07, 1.3008713722229004e-05, 2.5033950805664062e-05, 3.705918788909912e-05, 4.908442497253418e-05, 6.110966205596924e-05, 7.31348991394043e-05, 8.516013622283936e-05, 9.718537330627441e-05, 0.00010921061038970947, 0.00012123584747314453, 0.0001332610845565796, 0.00014528632164001465, 0.0001573115587234497, 0.00016933679580688477, 0.00018136203289031982, 0.00019338726997375488, 0.00020541250705718994, 0.000217437744140625, 0.00022946298122406006, 0.00024148821830749512, 0.0002535134553909302, 0.00026553869247436523, 0.0002775639295578003, 0.00028958916664123535, 0.0003016144037246704, 0.00031363964080810547, 0.00032566487789154053, 0.0003376901149749756, 0.00034971535205841064, 0.0003617405891418457]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 15.0, 14.0, 11.0, 20.0, 16.0, 26.0, 37.0, 29.0, 25.0, 32.0, 41.0, 46.0, 48.0, 44.0, 48.0, 45.0, 46.0, 55.0, 44.0, 53.0, 37.0, 45.0, 33.0, 22.0, 32.0, 30.0, 26.0, 16.0, 13.0, 12.0, 9.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.897705078125, -18.29541015625, -17.693115234375, -17.0908203125, -16.488525390625, -15.88623046875, -15.283935546875, -14.681640625, -14.079345703125, -13.47705078125, -12.874755859375, -12.2724609375, -11.670166015625, -11.06787109375, -10.465576171875, -9.86328125, -9.260986328125, -8.65869140625, -8.056396484375, -7.4541015625, -6.851806640625, -6.24951171875, -5.647216796875, -5.044921875, -4.442626953125, -3.84033203125, -3.238037109375, -2.6357421875, -2.033447265625, -1.43115234375, -0.828857421875, -0.2265625, 0.375732421875, 0.97802734375, 1.580322265625, 2.1826171875, 2.784912109375, 3.38720703125, 3.989501953125, 4.591796875, 5.194091796875, 5.79638671875, 6.398681640625, 7.0009765625, 7.603271484375, 8.20556640625, 8.807861328125, 9.41015625, 10.012451171875, 10.61474609375, 11.217041015625, 11.8193359375, 12.421630859375, 13.02392578125, 13.626220703125, 14.228515625, 14.830810546875, 15.43310546875, 16.035400390625, 16.6376953125, 17.239990234375, 17.84228515625, 18.444580078125, 19.046875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 1.0, 8.0, 4.0, 8.0, 10.0, 20.0, 25.0, 40.0, 44.0, 70.0, 107.0, 157.0, 263.0, 368.0, 580.0, 847.0, 1306.0, 2170.0, 3275.0, 5781.0, 10134.0, 19279.0, 41619.0, 104142.0, 313633.0, 339631.0, 113461.0, 44762.0, 20934.0, 10408.0, 5877.0, 3441.0, 2190.0, 1381.0, 833.0, 566.0, 372.0, 253.0, 177.0, 132.0, 72.0, 50.0, 51.0, 19.0, 19.0, 10.0, 12.0, 9.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.390625, -20.654052734375, -19.91748046875, -19.180908203125, -18.4443359375, -17.707763671875, -16.97119140625, -16.234619140625, -15.498046875, -14.761474609375, -14.02490234375, -13.288330078125, -12.5517578125, -11.815185546875, -11.07861328125, -10.342041015625, -9.60546875, -8.868896484375, -8.13232421875, -7.395751953125, -6.6591796875, -5.922607421875, -5.18603515625, -4.449462890625, -3.712890625, -2.976318359375, -2.23974609375, -1.503173828125, -0.7666015625, -0.030029296875, 0.70654296875, 1.443115234375, 2.1796875, 2.916259765625, 3.65283203125, 4.389404296875, 5.1259765625, 5.862548828125, 6.59912109375, 7.335693359375, 8.072265625, 8.808837890625, 9.54541015625, 10.281982421875, 11.0185546875, 11.755126953125, 12.49169921875, 13.228271484375, 13.96484375, 14.701416015625, 15.43798828125, 16.174560546875, 16.9111328125, 17.647705078125, 18.38427734375, 19.120849609375, 19.857421875, 20.593994140625, 21.33056640625, 22.067138671875, 22.8037109375, 23.540283203125, 24.27685546875, 25.013427734375, 25.75]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 7.0, 10.0, 13.0, 16.0, 25.0, 21.0, 26.0, 38.0, 37.0, 40.0, 54.0, 55.0, 89.0, 138.0, 1510.0, 390.0, 140.0, 72.0, 71.0, 47.0, 46.0, 37.0, 26.0, 29.0, 21.0, 18.0, 14.0, 14.0, 9.0, 4.0, 3.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.8125, -47.37158203125, -45.9306640625, -44.48974609375, -43.048828125, -41.60791015625, -40.1669921875, -38.72607421875, -37.28515625, -35.84423828125, -34.4033203125, -32.96240234375, -31.521484375, -30.08056640625, -28.6396484375, -27.19873046875, -25.7578125, -24.31689453125, -22.8759765625, -21.43505859375, -19.994140625, -18.55322265625, -17.1123046875, -15.67138671875, -14.23046875, -12.78955078125, -11.3486328125, -9.90771484375, -8.466796875, -7.02587890625, -5.5849609375, -4.14404296875, -2.703125, -1.26220703125, 0.1787109375, 1.61962890625, 3.060546875, 4.50146484375, 5.9423828125, 7.38330078125, 8.82421875, 10.26513671875, 11.7060546875, 13.14697265625, 14.587890625, 16.02880859375, 17.4697265625, 18.91064453125, 20.3515625, 21.79248046875, 23.2333984375, 24.67431640625, 26.115234375, 27.55615234375, 28.9970703125, 30.43798828125, 31.87890625, 33.31982421875, 34.7607421875, 36.20166015625, 37.642578125, 39.08349609375, 40.5244140625, 41.96533203125, 43.40625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 6.0, 13.0, 14.0, 15.0, 24.0, 22.0, 29.0, 68.0, 121.0, 173.0, 350.0, 952.0, 8855.0, 3044388.0, 87297.0, 2198.0, 548.0, 254.0, 107.0, 75.0, 60.0, 32.0, 28.0, 20.0, 9.0, 14.0, 7.0, 4.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-185.875, -181.1982421875, -176.521484375, -171.8447265625, -167.16796875, -162.4912109375, -157.814453125, -153.1376953125, -148.4609375, -143.7841796875, -139.107421875, -134.4306640625, -129.75390625, -125.0771484375, -120.400390625, -115.7236328125, -111.046875, -106.3701171875, -101.693359375, -97.0166015625, -92.33984375, -87.6630859375, -82.986328125, -78.3095703125, -73.6328125, -68.9560546875, -64.279296875, -59.6025390625, -54.92578125, -50.2490234375, -45.572265625, -40.8955078125, -36.21875, -31.5419921875, -26.865234375, -22.1884765625, -17.51171875, -12.8349609375, -8.158203125, -3.4814453125, 1.1953125, 5.8720703125, 10.548828125, 15.2255859375, 19.90234375, 24.5791015625, 29.255859375, 33.9326171875, 38.609375, 43.2861328125, 47.962890625, 52.6396484375, 57.31640625, 61.9931640625, 66.669921875, 71.3466796875, 76.0234375, 80.7001953125, 85.376953125, 90.0537109375, 94.73046875, 99.4072265625, 104.083984375, 108.7607421875, 113.4375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 19.0, 679.0, 311.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-445.6768493652344, -420.7241516113281, -395.771484375, -370.81878662109375, -345.8660888671875, -320.9134216308594, -295.9607238769531, -271.008056640625, -246.05535888671875, -221.10267639160156, -196.14999389648438, -171.19729614257812, -146.24461364746094, -121.29193115234375, -96.3392333984375, -71.38655090332031, -46.433868408203125, -21.481182098388672, 3.4715042114257812, 28.4241943359375, 53.37687683105469, 78.32955932617188, 103.28225708007812, 128.2349395751953, 153.1876220703125, 178.1403045654297, 203.09298706054688, 228.04568481445312, 252.9983673095703, 277.9510498046875, 302.90374755859375, 327.8564453125, 352.80908203125, 377.76177978515625, 402.7144470214844, 427.6671447753906, 452.61981201171875, 477.572509765625, 502.52520751953125, 527.4779052734375, 552.4305419921875, 577.3832397460938, 602.3359375, 627.28857421875, 652.2412719726562, 677.1939697265625, 702.1466674804688, 727.099365234375, 752.0520629882812, 777.0047607421875, 801.9574584960938, 826.91015625, 851.86279296875, 876.8154907226562, 901.7681884765625, 926.7208862304688, 951.673583984375, 976.6262817382812, 1001.5789794921875, 1026.5316162109375, 1051.484375, 1076.43701171875, 1101.3896484375, 1126.3424072265625, 1151.2950439453125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 4.0, 8.0, 10.0, 10.0, 26.0, 24.0, 16.0, 27.0, 38.0, 21.0, 34.0, 44.0, 43.0, 30.0, 36.0, 43.0, 43.0, 53.0, 51.0, 27.0, 52.0, 38.0, 23.0, 46.0, 38.0, 30.0, 28.0, 31.0, 20.0, 20.0, 9.0, 13.0, 14.0, 8.0, 8.0, 3.0, 4.0, 12.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.79092407226562, -101.34465789794922, -97.89839172363281, -94.4521255493164, -91.005859375, -87.5595932006836, -84.11332702636719, -80.66705322265625, -77.22079467773438, -73.77452850341797, -70.32826232910156, -66.88199615478516, -63.43572998046875, -59.989463806152344, -56.54319381713867, -53.096927642822266, -49.650657653808594, -46.20439147949219, -42.75812530517578, -39.311859130859375, -35.86559295654297, -32.41932678222656, -28.97305679321289, -25.526790618896484, -22.080524444580078, -18.634258270263672, -15.18799114227295, -11.741724014282227, -8.29545783996582, -4.849191665649414, -1.402923583984375, 2.0433425903320312, 5.4896087646484375, 8.935874938964844, 12.382142066955566, 15.828409194946289, 19.274675369262695, 22.7209415435791, 26.16720962524414, 29.613475799560547, 33.05974197387695, 36.50600814819336, 39.952274322509766, 43.39854431152344, 46.844810485839844, 50.29107666015625, 53.737342834472656, 57.18360900878906, 60.62987518310547, 64.07614135742188, 67.52240753173828, 70.96867370605469, 74.4149398803711, 77.8612060546875, 81.30747985839844, 84.75373840332031, 88.20001220703125, 91.64627838134766, 95.09254455566406, 98.53881072998047, 101.98507690429688, 105.43134307861328, 108.87760925292969, 112.32388305664062, 115.7701416015625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 16.0, 10.0, 15.0, 13.0, 27.0, 27.0, 25.0, 28.0, 48.0, 43.0, 39.0, 36.0, 43.0, 40.0, 47.0, 42.0, 62.0, 47.0, 47.0, 40.0, 49.0, 37.0, 31.0, 24.0, 19.0, 21.0, 19.0, 15.0, 27.0, 14.0, 10.0, 5.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.546875, -18.940185546875, -18.33349609375, -17.726806640625, -17.1201171875, -16.513427734375, -15.90673828125, -15.300048828125, -14.693359375, -14.086669921875, -13.47998046875, -12.873291015625, -12.2666015625, -11.659912109375, -11.05322265625, -10.446533203125, -9.83984375, -9.233154296875, -8.62646484375, -8.019775390625, -7.4130859375, -6.806396484375, -6.19970703125, -5.593017578125, -4.986328125, -4.379638671875, -3.77294921875, -3.166259765625, -2.5595703125, -1.952880859375, -1.34619140625, -0.739501953125, -0.1328125, 0.473876953125, 1.08056640625, 1.687255859375, 2.2939453125, 2.900634765625, 3.50732421875, 4.114013671875, 4.720703125, 5.327392578125, 5.93408203125, 6.540771484375, 7.1474609375, 7.754150390625, 8.36083984375, 8.967529296875, 9.57421875, 10.180908203125, 10.78759765625, 11.394287109375, 12.0009765625, 12.607666015625, 13.21435546875, 13.821044921875, 14.427734375, 15.034423828125, 15.64111328125, 16.247802734375, 16.8544921875, 17.461181640625, 18.06787109375, 18.674560546875, 19.28125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 10.0, 10.0, 12.0, 21.0, 19.0, 27.0, 41.0, 44.0, 64.0, 82.0, 135.0, 178.0, 229.0, 385.0, 609.0, 1057.0, 1811.0, 3547.0, 8579.0, 35584.0, 420803.0, 2603901.0, 1001839.0, 90254.0, 14431.0, 4797.0, 2366.0, 1258.0, 763.0, 445.0, 280.0, 206.0, 151.0, 94.0, 54.0, 48.0, 32.0, 22.0, 21.0, 19.0, 16.0, 14.0, 3.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.25, -32.23291015625, -31.2158203125, -30.19873046875, -29.181640625, -28.16455078125, -27.1474609375, -26.13037109375, -25.11328125, -24.09619140625, -23.0791015625, -22.06201171875, -21.044921875, -20.02783203125, -19.0107421875, -17.99365234375, -16.9765625, -15.95947265625, -14.9423828125, -13.92529296875, -12.908203125, -11.89111328125, -10.8740234375, -9.85693359375, -8.83984375, -7.82275390625, -6.8056640625, -5.78857421875, -4.771484375, -3.75439453125, -2.7373046875, -1.72021484375, -0.703125, 0.31396484375, 1.3310546875, 2.34814453125, 3.365234375, 4.38232421875, 5.3994140625, 6.41650390625, 7.43359375, 8.45068359375, 9.4677734375, 10.48486328125, 11.501953125, 12.51904296875, 13.5361328125, 14.55322265625, 15.5703125, 16.58740234375, 17.6044921875, 18.62158203125, 19.638671875, 20.65576171875, 21.6728515625, 22.68994140625, 23.70703125, 24.72412109375, 25.7412109375, 26.75830078125, 27.775390625, 28.79248046875, 29.8095703125, 30.82666015625, 31.84375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 4.0, 19.0, 11.0, 18.0, 15.0, 32.0, 38.0, 56.0, 58.0, 101.0, 140.0, 252.0, 344.0, 559.0, 680.0, 556.0, 360.0, 217.0, 171.0, 107.0, 80.0, 61.0, 49.0, 28.0, 30.0, 26.0, 14.0, 8.0, 11.0, 4.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.484375, -25.587890625, -24.69140625, -23.794921875, -22.8984375, -22.001953125, -21.10546875, -20.208984375, -19.3125, -18.416015625, -17.51953125, -16.623046875, -15.7265625, -14.830078125, -13.93359375, -13.037109375, -12.140625, -11.244140625, -10.34765625, -9.451171875, -8.5546875, -7.658203125, -6.76171875, -5.865234375, -4.96875, -4.072265625, -3.17578125, -2.279296875, -1.3828125, -0.486328125, 0.41015625, 1.306640625, 2.203125, 3.099609375, 3.99609375, 4.892578125, 5.7890625, 6.685546875, 7.58203125, 8.478515625, 9.375, 10.271484375, 11.16796875, 12.064453125, 12.9609375, 13.857421875, 14.75390625, 15.650390625, 16.546875, 17.443359375, 18.33984375, 19.236328125, 20.1328125, 21.029296875, 21.92578125, 22.822265625, 23.71875, 24.615234375, 25.51171875, 26.408203125, 27.3046875, 28.201171875, 29.09765625, 29.994140625, 30.890625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 12.0, 27.0, 28.0, 42.0, 76.0, 93.0, 147.0, 253.0, 466.0, 841.0, 1858.0, 4249.0, 11680.0, 40257.0, 203027.0, 2722548.0, 1058032.0, 110509.0, 25680.0, 8228.0, 3176.0, 1335.0, 707.0, 368.0, 238.0, 138.0, 73.0, 56.0, 46.0, 25.0, 17.0, 11.0, 5.0, 11.0, 3.0, 7.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8125, -36.69482421875, -35.5771484375, -34.45947265625, -33.341796875, -32.22412109375, -31.1064453125, -29.98876953125, -28.87109375, -27.75341796875, -26.6357421875, -25.51806640625, -24.400390625, -23.28271484375, -22.1650390625, -21.04736328125, -19.9296875, -18.81201171875, -17.6943359375, -16.57666015625, -15.458984375, -14.34130859375, -13.2236328125, -12.10595703125, -10.98828125, -9.87060546875, -8.7529296875, -7.63525390625, -6.517578125, -5.39990234375, -4.2822265625, -3.16455078125, -2.046875, -0.92919921875, 0.1884765625, 1.30615234375, 2.423828125, 3.54150390625, 4.6591796875, 5.77685546875, 6.89453125, 8.01220703125, 9.1298828125, 10.24755859375, 11.365234375, 12.48291015625, 13.6005859375, 14.71826171875, 15.8359375, 16.95361328125, 18.0712890625, 19.18896484375, 20.306640625, 21.42431640625, 22.5419921875, 23.65966796875, 24.77734375, 25.89501953125, 27.0126953125, 28.13037109375, 29.248046875, 30.36572265625, 31.4833984375, 32.60107421875, 33.71875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 17.0, 76.0, 195.0, 324.0, 264.0, 88.0, 33.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.43685913085938, -109.78137969970703, -101.12590026855469, -92.47042083740234, -83.81494140625, -75.15946197509766, -66.50398254394531, -57.84850311279297, -49.193023681640625, -40.53754425048828, -31.882064819335938, -23.226585388183594, -14.57110595703125, -5.915626525878906, 2.7398529052734375, 11.395332336425781, 20.050811767578125, 28.70629119873047, 37.36177062988281, 46.017250061035156, 54.6727294921875, 63.328208923339844, 71.98368835449219, 80.63916778564453, 89.29464721679688, 97.95012664794922, 106.60560607910156, 115.2610855102539, 123.91656494140625, 132.57205200195312, 141.22752380371094, 149.88299560546875, 158.53848266601562, 167.1939697265625, 175.8494415283203, 184.50491333007812, 193.160400390625, 201.81588745117188, 210.4713592529297, 219.1268310546875, 227.78231811523438, 236.43780517578125, 245.09327697753906, 253.74874877929688, 262.40423583984375, 271.0597229003906, 279.7152099609375, 288.37066650390625, 297.0261535644531, 305.681640625, 314.33709716796875, 322.9925842285156, 331.6480712890625, 340.3035583496094, 348.95904541015625, 357.614501953125, 366.2699890136719, 374.92547607421875, 383.5809326171875, 392.2364196777344, 400.89190673828125, 409.5473937988281, 418.202880859375, 426.85833740234375, 435.5138244628906]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 5.0, 6.0, 12.0, 9.0, 12.0, 9.0, 18.0, 25.0, 27.0, 24.0, 29.0, 39.0, 35.0, 30.0, 25.0, 46.0, 37.0, 52.0, 48.0, 47.0, 28.0, 43.0, 48.0, 41.0, 41.0, 34.0, 38.0, 26.0, 27.0, 27.0, 24.0, 12.0, 11.0, 11.0, 14.0, 9.0, 6.0, 5.0, 3.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-101.22217559814453, -98.37931060791016, -95.53643798828125, -92.69357299804688, -89.8507080078125, -87.0078353881836, -84.16497039794922, -81.32209777832031, -78.47923278808594, -75.63636779785156, -72.79349517822266, -69.95063018798828, -67.10775756835938, -64.264892578125, -61.422027587890625, -58.579158782958984, -55.736289978027344, -52.8934211730957, -50.05055236816406, -47.20768737792969, -44.36481857299805, -41.521949768066406, -38.67908477783203, -35.83621597290039, -32.99334716796875, -30.15047836303711, -27.3076114654541, -24.464744567871094, -21.621875762939453, -18.779006958007812, -15.936140060424805, -13.093273162841797, -10.250411987304688, -7.407544136047363, -4.564676284790039, -1.7218084335327148, 1.1210594177246094, 3.9639272689819336, 6.806795120239258, 9.649662017822266, 12.492530822753906, 15.33539867401123, 18.178266525268555, 21.021133422851562, 23.864002227783203, 26.706871032714844, 29.54973793029785, 32.39260482788086, 35.2354736328125, 38.07834243774414, 40.92121124267578, 43.764076232910156, 46.6069450378418, 49.44981384277344, 52.29267883300781, 55.13554763793945, 57.978416442871094, 60.821285247802734, 63.664154052734375, 66.50701904296875, 69.34988403320312, 72.19275665283203, 75.0356216430664, 77.87849426269531, 80.72135925292969]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 9.0, 3.0, 8.0, 10.0, 14.0, 11.0, 13.0, 21.0, 23.0, 24.0, 23.0, 31.0, 29.0, 47.0, 44.0, 47.0, 26.0, 41.0, 61.0, 45.0, 42.0, 45.0, 42.0, 30.0, 40.0, 39.0, 45.0, 28.0, 30.0, 25.0, 16.0, 18.0, 11.0, 13.0, 11.0, 9.0, 6.0, 7.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.4093017578125, -11.935791015625, -11.4622802734375, -10.98876953125, -10.5152587890625, -10.041748046875, -9.5682373046875, -9.0947265625, -8.6212158203125, -8.147705078125, -7.6741943359375, -7.20068359375, -6.7271728515625, -6.253662109375, -5.7801513671875, -5.306640625, -4.8331298828125, -4.359619140625, -3.8861083984375, -3.41259765625, -2.9390869140625, -2.465576171875, -1.9920654296875, -1.5185546875, -1.0450439453125, -0.571533203125, -0.0980224609375, 0.37548828125, 0.8489990234375, 1.322509765625, 1.7960205078125, 2.26953125, 2.7430419921875, 3.216552734375, 3.6900634765625, 4.16357421875, 4.6370849609375, 5.110595703125, 5.5841064453125, 6.0576171875, 6.5311279296875, 7.004638671875, 7.4781494140625, 7.95166015625, 8.4251708984375, 8.898681640625, 9.3721923828125, 9.845703125, 10.3192138671875, 10.792724609375, 11.2662353515625, 11.73974609375, 12.2132568359375, 12.686767578125, 13.1602783203125, 13.6337890625, 14.1072998046875, 14.580810546875, 15.0543212890625, 15.52783203125, 16.0013427734375, 16.474853515625, 16.9483642578125, 17.421875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 8.0, 16.0, 29.0, 30.0, 56.0, 84.0, 125.0, 224.0, 343.0, 479.0, 799.0, 1317.0, 2047.0, 3425.0, 5521.0, 9574.0, 16255.0, 28500.0, 50813.0, 93144.0, 173349.0, 270769.0, 175473.0, 94733.0, 51388.0, 28861.0, 16646.0, 9700.0, 5720.0, 3547.0, 2072.0, 1312.0, 800.0, 498.0, 303.0, 218.0, 139.0, 73.0, 53.0, 32.0, 23.0, 22.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.309814453125, -0.30028533935546875, -0.2907562255859375, -0.28122711181640625, -0.271697998046875, -0.26216888427734375, -0.2526397705078125, -0.24311065673828125, -0.23358154296875, -0.22405242919921875, -0.2145233154296875, -0.20499420166015625, -0.195465087890625, -0.18593597412109375, -0.1764068603515625, -0.16687774658203125, -0.1573486328125, -0.14781951904296875, -0.1382904052734375, -0.12876129150390625, -0.119232177734375, -0.10970306396484375, -0.1001739501953125, -0.09064483642578125, -0.08111572265625, -0.07158660888671875, -0.0620574951171875, -0.05252838134765625, -0.042999267578125, -0.03347015380859375, -0.0239410400390625, -0.01441192626953125, -0.0048828125, 0.00464630126953125, 0.0141754150390625, 0.02370452880859375, 0.033233642578125, 0.04276275634765625, 0.0522918701171875, 0.06182098388671875, 0.07135009765625, 0.08087921142578125, 0.0904083251953125, 0.09993743896484375, 0.109466552734375, 0.11899566650390625, 0.1285247802734375, 0.13805389404296875, 0.1475830078125, 0.15711212158203125, 0.1666412353515625, 0.17617034912109375, 0.185699462890625, 0.19522857666015625, 0.2047576904296875, 0.21428680419921875, 0.22381591796875, 0.23334503173828125, 0.2428741455078125, 0.25240325927734375, 0.261932373046875, 0.27146148681640625, 0.2809906005859375, 0.29051971435546875, 0.300048828125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 10.0, 11.0, 10.0, 14.0, 10.0, 18.0, 22.0, 19.0, 20.0, 38.0, 37.0, 34.0, 34.0, 34.0, 34.0, 35.0, 35.0, 44.0, 1070.0, 45.0, 46.0, 44.0, 55.0, 37.0, 36.0, 24.0, 22.0, 30.0, 31.0, 13.0, 21.0, 13.0, 18.0, 18.0, 15.0, 6.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3046875, -7.998291015625, -7.69189453125, -7.385498046875, -7.0791015625, -6.772705078125, -6.46630859375, -6.159912109375, -5.853515625, -5.547119140625, -5.24072265625, -4.934326171875, -4.6279296875, -4.321533203125, -4.01513671875, -3.708740234375, -3.40234375, -3.095947265625, -2.78955078125, -2.483154296875, -2.1767578125, -1.870361328125, -1.56396484375, -1.257568359375, -0.951171875, -0.644775390625, -0.33837890625, -0.031982421875, 0.2744140625, 0.580810546875, 0.88720703125, 1.193603515625, 1.5, 1.806396484375, 2.11279296875, 2.419189453125, 2.7255859375, 3.031982421875, 3.33837890625, 3.644775390625, 3.951171875, 4.257568359375, 4.56396484375, 4.870361328125, 5.1767578125, 5.483154296875, 5.78955078125, 6.095947265625, 6.40234375, 6.708740234375, 7.01513671875, 7.321533203125, 7.6279296875, 7.934326171875, 8.24072265625, 8.547119140625, 8.853515625, 9.159912109375, 9.46630859375, 9.772705078125, 10.0791015625, 10.385498046875, 10.69189453125, 10.998291015625, 11.3046875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 6.0, 16.0, 24.0, 25.0, 50.0, 64.0, 104.0, 145.0, 231.0, 342.0, 564.0, 772.0, 1160.0, 1711.0, 2705.0, 4252.0, 6413.0, 9911.0, 15485.0, 24226.0, 38638.0, 62463.0, 104673.0, 183509.0, 1280242.0, 140935.0, 81960.0, 49974.0, 31659.0, 19523.0, 12292.0, 7853.0, 5103.0, 3490.0, 2197.0, 1482.0, 947.0, 650.0, 437.0, 316.0, 180.0, 123.0, 97.0, 58.0, 44.0, 30.0, 15.0, 15.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.149658203125, -0.14487266540527344, -0.14008712768554688, -0.1353015899658203, -0.13051605224609375, -0.1257305145263672, -0.12094497680664062, -0.11615943908691406, -0.1113739013671875, -0.10658836364746094, -0.10180282592773438, -0.09701728820800781, -0.09223175048828125, -0.08744621276855469, -0.08266067504882812, -0.07787513732910156, -0.073089599609375, -0.06830406188964844, -0.06351852416992188, -0.05873298645019531, -0.05394744873046875, -0.04916191101074219, -0.044376373291015625, -0.03959083557128906, -0.0348052978515625, -0.030019760131835938, -0.025234222412109375, -0.020448684692382812, -0.01566314697265625, -0.010877609252929688, -0.006092071533203125, -0.0013065338134765625, 0.00347900390625, 0.008264541625976562, 0.013050079345703125, 0.017835617065429688, 0.02262115478515625, 0.027406692504882812, 0.032192230224609375, 0.03697776794433594, 0.0417633056640625, 0.04654884338378906, 0.051334381103515625, 0.05611991882324219, 0.06090545654296875, 0.06569099426269531, 0.07047653198242188, 0.07526206970214844, 0.080047607421875, 0.08483314514160156, 0.08961868286132812, 0.09440422058105469, 0.09918975830078125, 0.10397529602050781, 0.10876083374023438, 0.11354637145996094, 0.1183319091796875, 0.12311744689941406, 0.12790298461914062, 0.1326885223388672, 0.13747406005859375, 0.1422595977783203, 0.14704513549804688, 0.15183067321777344, 0.1566162109375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 7.0, 6.0, 3.0, 9.0, 4.0, 9.0, 16.0, 17.0, 22.0, 31.0, 18.0, 25.0, 29.0, 36.0, 33.0, 40.0, 51.0, 80.0, 87.0, 91.0, 63.0, 54.0, 36.0, 25.0, 37.0, 27.0, 28.0, 19.0, 21.0, 10.0, 5.0, 5.0, 5.0, 9.0, 6.0, 6.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00025081634521484375, -0.00024335645139217377, -0.00023589655756950378, -0.0002284366637468338, -0.00022097676992416382, -0.00021351687610149384, -0.00020605698227882385, -0.00019859708845615387, -0.0001911371946334839, -0.0001836773008108139, -0.00017621740698814392, -0.00016875751316547394, -0.00016129761934280396, -0.00015383772552013397, -0.000146377831697464, -0.000138917937874794, -0.00013145804405212402, -0.00012399815022945404, -0.00011653825640678406, -0.00010907836258411407, -0.00010161846876144409, -9.415857493877411e-05, -8.669868111610413e-05, -7.923878729343414e-05, -7.177889347076416e-05, -6.431899964809418e-05, -5.6859105825424194e-05, -4.939921200275421e-05, -4.193931818008423e-05, -3.4479424357414246e-05, -2.7019530534744263e-05, -1.955963671207428e-05, -1.2099742889404297e-05, -4.639849066734314e-06, 2.820044755935669e-06, 1.0279938578605652e-05, 1.7739832401275635e-05, 2.5199726223945618e-05, 3.26596200466156e-05, 4.0119513869285583e-05, 4.7579407691955566e-05, 5.503930151462555e-05, 6.249919533729553e-05, 6.995908915996552e-05, 7.74189829826355e-05, 8.487887680530548e-05, 9.233877062797546e-05, 9.979866445064545e-05, 0.00010725855827331543, 0.00011471845209598541, 0.0001221783459186554, 0.00012963823974132538, 0.00013709813356399536, 0.00014455802738666534, 0.00015201792120933533, 0.0001594778150320053, 0.0001669377088546753, 0.00017439760267734528, 0.00018185749650001526, 0.00018931739032268524, 0.00019677728414535522, 0.0002042371779680252, 0.0002116970717906952, 0.00021915696561336517, 0.00022661685943603516]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 11.0, 7.0, 11.0, 7.0, 12.0, 18.0, 28.0, 41.0, 38.0, 42.0, 96.0, 121.0, 180.0, 361.0, 854.0, 59077.0, 984710.0, 1652.0, 479.0, 230.0, 133.0, 99.0, 81.0, 39.0, 36.0, 34.0, 33.0, 24.0, 18.0, 9.0, 9.0, 9.0, 5.0, 5.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0054473876953125, -0.00527268648147583, -0.00509798526763916, -0.00492328405380249, -0.00474858283996582, -0.00457388162612915, -0.0043991804122924805, -0.0042244791984558105, -0.004049777984619141, -0.0038750767707824707, -0.0037003755569458008, -0.003525674343109131, -0.003350973129272461, -0.003176271915435791, -0.003001570701599121, -0.002826869487762451, -0.0026521682739257812, -0.0024774670600891113, -0.0023027658462524414, -0.0021280646324157715, -0.0019533634185791016, -0.0017786622047424316, -0.0016039609909057617, -0.0014292597770690918, -0.0012545585632324219, -0.001079857349395752, -0.000905156135559082, -0.0007304549217224121, -0.0005557537078857422, -0.00038105249404907227, -0.00020635128021240234, -3.165006637573242e-05, 0.0001430511474609375, 0.0003177523612976074, 0.0004924535751342773, 0.0006671547889709473, 0.0008418560028076172, 0.0010165572166442871, 0.001191258430480957, 0.001365959644317627, 0.0015406608581542969, 0.0017153620719909668, 0.0018900632858276367, 0.0020647644996643066, 0.0022394657135009766, 0.0024141669273376465, 0.0025888681411743164, 0.0027635693550109863, 0.0029382705688476562, 0.003112971782684326, 0.003287672996520996, 0.003462374210357666, 0.003637075424194336, 0.003811776638031006, 0.003986477851867676, 0.004161179065704346, 0.004335880279541016, 0.0045105814933776855, 0.0046852827072143555, 0.004859983921051025, 0.005034685134887695, 0.005209386348724365, 0.005384087562561035, 0.005558788776397705, 0.005733489990234375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 762.0, 253.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008890714962035418, -0.0006648646667599678, -0.00044065777910873294, -0.00021645089145749807, 7.755937986075878e-06, 0.00023196276742964983, 0.0004561697132885456, 0.0006803765427321196, 0.0009045833721756935, 0.0011287902016192675, 0.0013529970310628414, 0.0015772039769217372, 0.0018014108063653111, 0.002025617752224207, 0.002249824581667781, 0.002474031411111355, 0.0026982382405549288, 0.0029224450699985027, 0.0031466518994420767, 0.0033708587288856506, 0.0035950657911598682, 0.0038192723877727985, 0.004043479450047016, 0.0042676860466599464, 0.004491893108934164, 0.004716100171208382, 0.004940306767821312, 0.0051645138300955296, 0.00538872042670846, 0.0056129274889826775, 0.005837134085595608, 0.006061341147869825, 0.006285548210144043, 0.006509755272418261, 0.006733961869031191, 0.0069581689313054085, 0.007182375527918339, 0.007406582590192556, 0.007630789652466774, 0.007854996249079704, 0.008079202845692635, 0.008303409442305565, 0.00852761697024107, 0.008751823566854, 0.00897603016346693, 0.00920023676007986, 0.009424444288015366, 0.009648650884628296, 0.009872857481241226, 0.010097064077854156, 0.010321271605789661, 0.010545478202402592, 0.010769684799015522, 0.010993891395628452, 0.011218098923563957, 0.011442305520176888, 0.011666513048112392, 0.011890719644725323, 0.012114927172660828, 0.012339133769273758, 0.012563340365886688, 0.012787546962499619, 0.013011754490435123, 0.013235961087048054, 0.013460167683660984]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 9.0, 8.0, 36.0, 55.0, 79.0, 122.0, 148.0, 142.0, 129.0, 116.0, 69.0, 51.0, 32.0, 13.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005792379379272461, -0.0005623642355203629, -0.0005454905331134796, -0.0005286168307065964, -0.0005117431282997131, -0.0004948694258928299, -0.00047799572348594666, -0.0004611220210790634, -0.0004442483186721802, -0.00042737461626529694, -0.0004105009138584137, -0.00039362721145153046, -0.0003767535090446472, -0.000359879806637764, -0.00034300610423088074, -0.0003261324018239975, -0.00030925869941711426, -0.000292384997010231, -0.0002755112946033478, -0.00025863759219646454, -0.0002417638897895813, -0.00022489018738269806, -0.00020801648497581482, -0.00019114278256893158, -0.00017426908016204834, -0.0001573953777551651, -0.00014052167534828186, -0.00012364797294139862, -0.00010677427053451538, -8.990056812763214e-05, -7.30268657207489e-05, -5.615316331386566e-05, -3.927946090698242e-05, -2.2405758500099182e-05, -5.532056093215942e-06, 1.1341646313667297e-05, 2.8215348720550537e-05, 4.508905112743378e-05, 6.196275353431702e-05, 7.883645594120026e-05, 9.57101583480835e-05, 0.00011258386075496674, 0.00012945756316184998, 0.00014633126556873322, 0.00016320496797561646, 0.0001800786703824997, 0.00019695237278938293, 0.00021382607519626617, 0.00023069977760314941, 0.00024757348001003265, 0.0002644471824169159, 0.00028132088482379913, 0.0002981945872306824, 0.0003150682896375656, 0.00033194199204444885, 0.0003488156944513321, 0.00036568939685821533, 0.00038256309926509857, 0.0003994368016719818, 0.00041631050407886505, 0.0004331842064857483, 0.00045005790889263153, 0.00046693161129951477, 0.000483805313706398, 0.0005006790161132812]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 9.0, 3.0, 8.0, 10.0, 14.0, 11.0, 13.0, 21.0, 23.0, 24.0, 23.0, 31.0, 29.0, 47.0, 44.0, 47.0, 26.0, 41.0, 61.0, 45.0, 42.0, 45.0, 42.0, 30.0, 40.0, 39.0, 45.0, 28.0, 30.0, 25.0, 16.0, 18.0, 11.0, 13.0, 11.0, 9.0, 6.0, 7.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.4093017578125, -11.935791015625, -11.4622802734375, -10.98876953125, -10.5152587890625, -10.041748046875, -9.5682373046875, -9.0947265625, -8.6212158203125, -8.147705078125, -7.6741943359375, -7.20068359375, -6.7271728515625, -6.253662109375, -5.7801513671875, -5.306640625, -4.8331298828125, -4.359619140625, -3.8861083984375, -3.41259765625, -2.9390869140625, -2.465576171875, -1.9920654296875, -1.5185546875, -1.0450439453125, -0.571533203125, -0.0980224609375, 0.37548828125, 0.8489990234375, 1.322509765625, 1.7960205078125, 2.26953125, 2.7430419921875, 3.216552734375, 3.6900634765625, 4.16357421875, 4.6370849609375, 5.110595703125, 5.5841064453125, 6.0576171875, 6.5311279296875, 7.004638671875, 7.4781494140625, 7.95166015625, 8.4251708984375, 8.898681640625, 9.3721923828125, 9.845703125, 10.3192138671875, 10.792724609375, 11.2662353515625, 11.73974609375, 12.2132568359375, 12.686767578125, 13.1602783203125, 13.6337890625, 14.1072998046875, 14.580810546875, 15.0543212890625, 15.52783203125, 16.0013427734375, 16.474853515625, 16.9483642578125, 17.421875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 4.0, 12.0, 3.0, 27.0, 24.0, 40.0, 42.0, 73.0, 108.0, 157.0, 227.0, 346.0, 516.0, 763.0, 1288.0, 2206.0, 3845.0, 7485.0, 16790.0, 50815.0, 253627.0, 555553.0, 103706.0, 27556.0, 10792.0, 5174.0, 2746.0, 1621.0, 1021.0, 640.0, 457.0, 274.0, 187.0, 133.0, 85.0, 73.0, 45.0, 30.0, 19.0, 14.0, 6.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.09375, -25.308837890625, -24.52392578125, -23.739013671875, -22.9541015625, -22.169189453125, -21.38427734375, -20.599365234375, -19.814453125, -19.029541015625, -18.24462890625, -17.459716796875, -16.6748046875, -15.889892578125, -15.10498046875, -14.320068359375, -13.53515625, -12.750244140625, -11.96533203125, -11.180419921875, -10.3955078125, -9.610595703125, -8.82568359375, -8.040771484375, -7.255859375, -6.470947265625, -5.68603515625, -4.901123046875, -4.1162109375, -3.331298828125, -2.54638671875, -1.761474609375, -0.9765625, -0.191650390625, 0.59326171875, 1.378173828125, 2.1630859375, 2.947998046875, 3.73291015625, 4.517822265625, 5.302734375, 6.087646484375, 6.87255859375, 7.657470703125, 8.4423828125, 9.227294921875, 10.01220703125, 10.797119140625, 11.58203125, 12.366943359375, 13.15185546875, 13.936767578125, 14.7216796875, 15.506591796875, 16.29150390625, 17.076416015625, 17.861328125, 18.646240234375, 19.43115234375, 20.216064453125, 21.0009765625, 21.785888671875, 22.57080078125, 23.355712890625, 24.140625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 6.0, 6.0, 6.0, 11.0, 8.0, 13.0, 16.0, 23.0, 15.0, 23.0, 33.0, 23.0, 40.0, 42.0, 43.0, 78.0, 71.0, 204.0, 1592.0, 278.0, 96.0, 64.0, 50.0, 41.0, 33.0, 38.0, 32.0, 37.0, 22.0, 12.0, 20.0, 12.0, 11.0, 13.0, 5.0, 4.0, 5.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0], "bins": [-42.125, -41.035400390625, -39.94580078125, -38.856201171875, -37.7666015625, -36.677001953125, -35.58740234375, -34.497802734375, -33.408203125, -32.318603515625, -31.22900390625, -30.139404296875, -29.0498046875, -27.960205078125, -26.87060546875, -25.781005859375, -24.69140625, -23.601806640625, -22.51220703125, -21.422607421875, -20.3330078125, -19.243408203125, -18.15380859375, -17.064208984375, -15.974609375, -14.885009765625, -13.79541015625, -12.705810546875, -11.6162109375, -10.526611328125, -9.43701171875, -8.347412109375, -7.2578125, -6.168212890625, -5.07861328125, -3.989013671875, -2.8994140625, -1.809814453125, -0.72021484375, 0.369384765625, 1.458984375, 2.548583984375, 3.63818359375, 4.727783203125, 5.8173828125, 6.906982421875, 7.99658203125, 9.086181640625, 10.17578125, 11.265380859375, 12.35498046875, 13.444580078125, 14.5341796875, 15.623779296875, 16.71337890625, 17.802978515625, 18.892578125, 19.982177734375, 21.07177734375, 22.161376953125, 23.2509765625, 24.340576171875, 25.43017578125, 26.519775390625, 27.609375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 12.0, 12.0, 13.0, 15.0, 29.0, 36.0, 57.0, 66.0, 108.0, 147.0, 261.0, 468.0, 1336.0, 13897.0, 3086227.0, 39530.0, 2045.0, 553.0, 316.0, 168.0, 113.0, 88.0, 55.0, 38.0, 26.0, 16.0, 14.0, 16.0, 12.0, 10.0, 2.0, 6.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-100.25, -97.3544921875, -94.458984375, -91.5634765625, -88.66796875, -85.7724609375, -82.876953125, -79.9814453125, -77.0859375, -74.1904296875, -71.294921875, -68.3994140625, -65.50390625, -62.6083984375, -59.712890625, -56.8173828125, -53.921875, -51.0263671875, -48.130859375, -45.2353515625, -42.33984375, -39.4443359375, -36.548828125, -33.6533203125, -30.7578125, -27.8623046875, -24.966796875, -22.0712890625, -19.17578125, -16.2802734375, -13.384765625, -10.4892578125, -7.59375, -4.6982421875, -1.802734375, 1.0927734375, 3.98828125, 6.8837890625, 9.779296875, 12.6748046875, 15.5703125, 18.4658203125, 21.361328125, 24.2568359375, 27.15234375, 30.0478515625, 32.943359375, 35.8388671875, 38.734375, 41.6298828125, 44.525390625, 47.4208984375, 50.31640625, 53.2119140625, 56.107421875, 59.0029296875, 61.8984375, 64.7939453125, 67.689453125, 70.5849609375, 73.48046875, 76.3759765625, 79.271484375, 82.1669921875, 85.0625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 8.0, 33.0, 63.0, 120.0, 201.0, 241.0, 152.0, 85.0, 51.0, 19.0, 13.0, 10.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.17568969726562, -95.25472259521484, -91.33375549316406, -87.41278839111328, -83.4918212890625, -79.57085418701172, -75.64988708496094, -71.72892761230469, -67.80795288085938, -63.886985778808594, -59.96601867675781, -56.04505157470703, -52.12408447265625, -48.20311737060547, -44.28215408325195, -40.36118698120117, -36.440223693847656, -32.519256591796875, -28.598289489746094, -24.677324295043945, -20.756357192993164, -16.835390090942383, -12.914424896240234, -8.993457794189453, -5.072490692138672, -1.1515240669250488, 2.769442558288574, 6.690408706665039, 10.61137580871582, 14.532342910766602, 18.45330810546875, 22.37427520751953, 26.295242309570312, 30.216209411621094, 34.137176513671875, 38.058143615722656, 41.97911071777344, 45.90007781982422, 49.821041107177734, 53.742008209228516, 57.6629753112793, 61.58394241333008, 65.5049057006836, 69.42587280273438, 73.34683990478516, 77.26780700683594, 81.18877410888672, 85.1097412109375, 89.03070831298828, 92.95167541503906, 96.87264251708984, 100.79360961914062, 104.7145767211914, 108.63554382324219, 112.55650329589844, 116.47747802734375, 120.3984375, 124.31940460205078, 128.24037170410156, 132.1613311767578, 136.08230590820312, 140.00326538085938, 143.9242401123047, 147.84519958496094, 151.76617431640625]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 10.0, 9.0, 8.0, 10.0, 7.0, 13.0, 6.0, 24.0, 22.0, 20.0, 37.0, 43.0, 33.0, 38.0, 34.0, 33.0, 47.0, 56.0, 41.0, 48.0, 44.0, 44.0, 39.0, 48.0, 41.0, 28.0, 24.0, 30.0, 27.0, 18.0, 18.0, 15.0, 15.0, 11.0, 12.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-102.04652404785156, -98.91427612304688, -95.78202819824219, -92.6497802734375, -89.51753234863281, -86.38528442382812, -83.25303649902344, -80.12078094482422, -76.98853302001953, -73.85628509521484, -70.72403717041016, -67.59178924560547, -64.45954132080078, -61.32728958129883, -58.19504165649414, -55.06278991699219, -51.930545806884766, -48.79829788208008, -45.66604995727539, -42.53379821777344, -39.40155029296875, -36.26930236816406, -33.137054443359375, -30.004804611206055, -26.872556686401367, -23.74030876159668, -20.60805892944336, -17.475811004638672, -14.343562126159668, -11.211313247680664, -8.079065322875977, -4.946815490722656, -1.8145675659179688, 1.317681074142456, 4.449929714202881, 7.582178115844727, 10.71442699432373, 13.846675872802734, 16.978923797607422, 20.111173629760742, 23.24342155456543, 26.375669479370117, 29.507919311523438, 32.640167236328125, 35.77241516113281, 38.9046630859375, 42.03691101074219, 45.16916275024414, 48.30141067504883, 51.433658599853516, 54.5659065246582, 57.698158264160156, 60.830406188964844, 63.96265411376953, 67.09490203857422, 70.2271499633789, 73.3593978881836, 76.49164581298828, 79.62389373779297, 82.75614166259766, 85.88838958740234, 89.02064514160156, 92.15289306640625, 95.28514099121094, 98.41738891601562]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 7.0, 2.0, 14.0, 11.0, 11.0, 24.0, 29.0, 23.0, 23.0, 23.0, 41.0, 31.0, 38.0, 39.0, 35.0, 42.0, 61.0, 34.0, 46.0, 57.0, 51.0, 40.0, 39.0, 45.0, 34.0, 37.0, 29.0, 16.0, 27.0, 19.0, 17.0, 7.0, 9.0, 7.0, 4.0, 12.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7890625, -14.2735595703125, -13.758056640625, -13.2425537109375, -12.72705078125, -12.2115478515625, -11.696044921875, -11.1805419921875, -10.6650390625, -10.1495361328125, -9.634033203125, -9.1185302734375, -8.60302734375, -8.0875244140625, -7.572021484375, -7.0565185546875, -6.541015625, -6.0255126953125, -5.510009765625, -4.9945068359375, -4.47900390625, -3.9635009765625, -3.447998046875, -2.9324951171875, -2.4169921875, -1.9014892578125, -1.385986328125, -0.8704833984375, -0.35498046875, 0.1605224609375, 0.676025390625, 1.1915283203125, 1.70703125, 2.2225341796875, 2.738037109375, 3.2535400390625, 3.76904296875, 4.2845458984375, 4.800048828125, 5.3155517578125, 5.8310546875, 6.3465576171875, 6.862060546875, 7.3775634765625, 7.89306640625, 8.4085693359375, 8.924072265625, 9.4395751953125, 9.955078125, 10.4705810546875, 10.986083984375, 11.5015869140625, 12.01708984375, 12.5325927734375, 13.048095703125, 13.5635986328125, 14.0791015625, 14.5946044921875, 15.110107421875, 15.6256103515625, 16.14111328125, 16.6566162109375, 17.172119140625, 17.6876220703125, 18.203125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 5.0, 9.0, 15.0, 31.0, 21.0, 46.0, 68.0, 83.0, 107.0, 141.0, 226.0, 314.0, 407.0, 634.0, 917.0, 1403.0, 2312.0, 4623.0, 14202.0, 134669.0, 1975508.0, 1892413.0, 140661.0, 14063.0, 4569.0, 2373.0, 1411.0, 961.0, 622.0, 435.0, 321.0, 217.0, 134.0, 105.0, 75.0, 39.0, 44.0, 24.0, 23.0, 16.0, 8.0, 7.0, 7.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-35.53125, -34.544189453125, -33.55712890625, -32.570068359375, -31.5830078125, -30.595947265625, -29.60888671875, -28.621826171875, -27.634765625, -26.647705078125, -25.66064453125, -24.673583984375, -23.6865234375, -22.699462890625, -21.71240234375, -20.725341796875, -19.73828125, -18.751220703125, -17.76416015625, -16.777099609375, -15.7900390625, -14.802978515625, -13.81591796875, -12.828857421875, -11.841796875, -10.854736328125, -9.86767578125, -8.880615234375, -7.8935546875, -6.906494140625, -5.91943359375, -4.932373046875, -3.9453125, -2.958251953125, -1.97119140625, -0.984130859375, 0.0029296875, 0.989990234375, 1.97705078125, 2.964111328125, 3.951171875, 4.938232421875, 5.92529296875, 6.912353515625, 7.8994140625, 8.886474609375, 9.87353515625, 10.860595703125, 11.84765625, 12.834716796875, 13.82177734375, 14.808837890625, 15.7958984375, 16.782958984375, 17.77001953125, 18.757080078125, 19.744140625, 20.731201171875, 21.71826171875, 22.705322265625, 23.6923828125, 24.679443359375, 25.66650390625, 26.653564453125, 27.640625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 5.0, 3.0, 12.0, 14.0, 27.0, 29.0, 52.0, 92.0, 102.0, 197.0, 311.0, 586.0, 864.0, 771.0, 417.0, 226.0, 140.0, 77.0, 46.0, 35.0, 22.0, 24.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.828125, -22.825927734375, -21.82373046875, -20.821533203125, -19.8193359375, -18.817138671875, -17.81494140625, -16.812744140625, -15.810546875, -14.808349609375, -13.80615234375, -12.803955078125, -11.8017578125, -10.799560546875, -9.79736328125, -8.795166015625, -7.79296875, -6.790771484375, -5.78857421875, -4.786376953125, -3.7841796875, -2.781982421875, -1.77978515625, -0.777587890625, 0.224609375, 1.226806640625, 2.22900390625, 3.231201171875, 4.2333984375, 5.235595703125, 6.23779296875, 7.239990234375, 8.2421875, 9.244384765625, 10.24658203125, 11.248779296875, 12.2509765625, 13.253173828125, 14.25537109375, 15.257568359375, 16.259765625, 17.261962890625, 18.26416015625, 19.266357421875, 20.2685546875, 21.270751953125, 22.27294921875, 23.275146484375, 24.27734375, 25.279541015625, 26.28173828125, 27.283935546875, 28.2861328125, 29.288330078125, 30.29052734375, 31.292724609375, 32.294921875, 33.297119140625, 34.29931640625, 35.301513671875, 36.3037109375, 37.305908203125, 38.30810546875, 39.310302734375, 40.3125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 6.0, 24.0, 29.0, 42.0, 65.0, 136.0, 271.0, 754.0, 3018.0, 25459.0, 2422307.0, 1715122.0, 22746.0, 2814.0, 803.0, 314.0, 150.0, 80.0, 47.0, 32.0, 21.0, 8.0, 13.0, 10.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-78.3125, -76.4013671875, -74.490234375, -72.5791015625, -70.66796875, -68.7568359375, -66.845703125, -64.9345703125, -63.0234375, -61.1123046875, -59.201171875, -57.2900390625, -55.37890625, -53.4677734375, -51.556640625, -49.6455078125, -47.734375, -45.8232421875, -43.912109375, -42.0009765625, -40.08984375, -38.1787109375, -36.267578125, -34.3564453125, -32.4453125, -30.5341796875, -28.623046875, -26.7119140625, -24.80078125, -22.8896484375, -20.978515625, -19.0673828125, -17.15625, -15.2451171875, -13.333984375, -11.4228515625, -9.51171875, -7.6005859375, -5.689453125, -3.7783203125, -1.8671875, 0.0439453125, 1.955078125, 3.8662109375, 5.77734375, 7.6884765625, 9.599609375, 11.5107421875, 13.421875, 15.3330078125, 17.244140625, 19.1552734375, 21.06640625, 22.9775390625, 24.888671875, 26.7998046875, 28.7109375, 30.6220703125, 32.533203125, 34.4443359375, 36.35546875, 38.2666015625, 40.177734375, 42.0888671875, 44.0]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 109.0, 420.0, 402.0, 61.0, 7.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-218.65985107421875, -206.4739227294922, -194.28799438476562, -182.10208129882812, -169.91615295410156, -157.730224609375, -145.5443115234375, -133.35838317871094, -121.17245483398438, -108.98652648925781, -96.80060577392578, -84.61468505859375, -72.42875671386719, -60.24283218383789, -48.056907653808594, -35.87098693847656, -23.68505859375, -11.499134063720703, 0.6867904663085938, 12.87271499633789, 25.058639526367188, 37.244564056396484, 49.43048858642578, 61.61640930175781, 73.80233764648438, 85.98826599121094, 98.17418670654297, 110.360107421875, 122.54603576660156, 134.73196411132812, 146.91787719726562, 159.1038055419922, 171.28973388671875, 183.4756622314453, 195.66159057617188, 207.84750366210938, 220.03343200683594, 232.2193603515625, 244.4052734375, 256.5911865234375, 268.7771301269531, 280.9630432128906, 293.14898681640625, 305.33489990234375, 317.52081298828125, 329.7067565917969, 341.8926696777344, 354.07861328125, 366.2645263671875, 378.450439453125, 390.6363830566406, 402.8222961425781, 415.00823974609375, 427.19415283203125, 439.38006591796875, 451.56597900390625, 463.7519226074219, 475.9378356933594, 488.123779296875, 500.3096923828125, 512.49560546875, 524.6815185546875, 536.8674926757812, 549.0534057617188, 561.2393188476562]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 6.0, 7.0, 7.0, 12.0, 16.0, 8.0, 23.0, 20.0, 26.0, 15.0, 32.0, 29.0, 40.0, 35.0, 43.0, 44.0, 35.0, 38.0, 39.0, 46.0, 44.0, 42.0, 46.0, 46.0, 37.0, 32.0, 34.0, 33.0, 23.0, 23.0, 16.0, 8.0, 13.0, 15.0, 9.0, 14.0, 10.0, 7.0, 3.0, 5.0, 5.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.37522888183594, -77.98039245605469, -75.58555603027344, -73.19071960449219, -70.79588317871094, -68.40104675292969, -66.00621032714844, -63.61137008666992, -61.21653366088867, -58.82169723510742, -56.42686080932617, -54.03202438354492, -51.637184143066406, -49.242347717285156, -46.847511291503906, -44.452674865722656, -42.057838439941406, -39.663002014160156, -37.268165588378906, -34.873329162597656, -32.478492736816406, -30.083654403686523, -27.68881607055664, -25.29397964477539, -22.89914321899414, -20.50430679321289, -18.10947036743164, -15.714632034301758, -13.319795608520508, -10.924959182739258, -8.530121803283691, -6.135284423828125, -3.740447998046875, -1.3456110954284668, 1.0492258071899414, 3.4440627098083496, 5.838899612426758, 8.233736038208008, 10.628573417663574, 13.02341079711914, 15.41824722290039, 17.81308364868164, 20.20792007446289, 22.602758407592773, 24.997594833374023, 27.392431259155273, 29.787269592285156, 32.182106018066406, 34.576942443847656, 36.971778869628906, 39.366615295410156, 41.761451721191406, 44.156288146972656, 46.551124572753906, 48.94596481323242, 51.34080123901367, 53.73563766479492, 56.13047409057617, 58.52531051635742, 60.92014694213867, 63.31498718261719, 65.70982360839844, 68.10466003417969, 70.49949645996094, 72.89433288574219]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 8.0, 4.0, 6.0, 10.0, 18.0, 11.0, 12.0, 13.0, 21.0, 25.0, 13.0, 32.0, 26.0, 37.0, 49.0, 45.0, 42.0, 44.0, 36.0, 50.0, 41.0, 34.0, 53.0, 53.0, 43.0, 51.0, 25.0, 37.0, 22.0, 21.0, 25.0, 23.0, 9.0, 18.0, 13.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5625, -12.1400146484375, -11.717529296875, -11.2950439453125, -10.87255859375, -10.4500732421875, -10.027587890625, -9.6051025390625, -9.1826171875, -8.7601318359375, -8.337646484375, -7.9151611328125, -7.49267578125, -7.0701904296875, -6.647705078125, -6.2252197265625, -5.802734375, -5.3802490234375, -4.957763671875, -4.5352783203125, -4.11279296875, -3.6903076171875, -3.267822265625, -2.8453369140625, -2.4228515625, -2.0003662109375, -1.577880859375, -1.1553955078125, -0.73291015625, -0.3104248046875, 0.112060546875, 0.5345458984375, 0.95703125, 1.3795166015625, 1.802001953125, 2.2244873046875, 2.64697265625, 3.0694580078125, 3.491943359375, 3.9144287109375, 4.3369140625, 4.7593994140625, 5.181884765625, 5.6043701171875, 6.02685546875, 6.4493408203125, 6.871826171875, 7.2943115234375, 7.716796875, 8.1392822265625, 8.561767578125, 8.9842529296875, 9.40673828125, 9.8292236328125, 10.251708984375, 10.6741943359375, 11.0966796875, 11.5191650390625, 11.941650390625, 12.3641357421875, 12.78662109375, 13.2091064453125, 13.631591796875, 14.0540771484375, 14.4765625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 1.0, 11.0, 14.0, 18.0, 28.0, 33.0, 67.0, 93.0, 124.0, 225.0, 296.0, 469.0, 732.0, 1040.0, 1721.0, 2670.0, 4078.0, 6698.0, 10578.0, 17010.0, 26867.0, 44593.0, 73476.0, 124750.0, 223719.0, 211548.0, 117223.0, 69563.0, 41593.0, 25664.0, 16172.0, 10011.0, 6222.0, 3993.0, 2496.0, 1600.0, 1077.0, 708.0, 461.0, 297.0, 221.0, 130.0, 84.0, 51.0, 56.0, 22.0, 17.0, 14.0, 9.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2110595703125, -0.2042388916015625, -0.197418212890625, -0.1905975341796875, -0.18377685546875, -0.1769561767578125, -0.170135498046875, -0.1633148193359375, -0.156494140625, -0.1496734619140625, -0.142852783203125, -0.1360321044921875, -0.12921142578125, -0.1223907470703125, -0.115570068359375, -0.1087493896484375, -0.1019287109375, -0.0951080322265625, -0.088287353515625, -0.0814666748046875, -0.07464599609375, -0.0678253173828125, -0.061004638671875, -0.0541839599609375, -0.04736328125, -0.0405426025390625, -0.033721923828125, -0.0269012451171875, -0.02008056640625, -0.0132598876953125, -0.006439208984375, 0.0003814697265625, 0.0072021484375, 0.0140228271484375, 0.020843505859375, 0.0276641845703125, 0.03448486328125, 0.0413055419921875, 0.048126220703125, 0.0549468994140625, 0.061767578125, 0.0685882568359375, 0.075408935546875, 0.0822296142578125, 0.08905029296875, 0.0958709716796875, 0.102691650390625, 0.1095123291015625, 0.1163330078125, 0.1231536865234375, 0.129974365234375, 0.1367950439453125, 0.14361572265625, 0.1504364013671875, 0.157257080078125, 0.1640777587890625, 0.1708984375, 0.1777191162109375, 0.184539794921875, 0.1913604736328125, 0.19818115234375, 0.2050018310546875, 0.211822509765625, 0.2186431884765625, 0.2254638671875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 17.0, 15.0, 14.0, 22.0, 27.0, 23.0, 23.0, 31.0, 34.0, 35.0, 38.0, 43.0, 52.0, 41.0, 47.0, 1072.0, 44.0, 39.0, 42.0, 36.0, 33.0, 35.0, 31.0, 28.0, 27.0, 30.0, 22.0, 10.0, 20.0, 12.0, 21.0, 10.0, 3.0, 9.0, 8.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.671875, -8.3912353515625, -8.110595703125, -7.8299560546875, -7.54931640625, -7.2686767578125, -6.988037109375, -6.7073974609375, -6.4267578125, -6.1461181640625, -5.865478515625, -5.5848388671875, -5.30419921875, -5.0235595703125, -4.742919921875, -4.4622802734375, -4.181640625, -3.9010009765625, -3.620361328125, -3.3397216796875, -3.05908203125, -2.7784423828125, -2.497802734375, -2.2171630859375, -1.9365234375, -1.6558837890625, -1.375244140625, -1.0946044921875, -0.81396484375, -0.5333251953125, -0.252685546875, 0.0279541015625, 0.30859375, 0.5892333984375, 0.869873046875, 1.1505126953125, 1.43115234375, 1.7117919921875, 1.992431640625, 2.2730712890625, 2.5537109375, 2.8343505859375, 3.114990234375, 3.3956298828125, 3.67626953125, 3.9569091796875, 4.237548828125, 4.5181884765625, 4.798828125, 5.0794677734375, 5.360107421875, 5.6407470703125, 5.92138671875, 6.2020263671875, 6.482666015625, 6.7633056640625, 7.0439453125, 7.3245849609375, 7.605224609375, 7.8858642578125, 8.16650390625, 8.4471435546875, 8.727783203125, 9.0084228515625, 9.2890625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 6.0, 7.0, 14.0, 25.0, 40.0, 46.0, 75.0, 107.0, 155.0, 228.0, 364.0, 508.0, 776.0, 1308.0, 1840.0, 2731.0, 4153.0, 6305.0, 9780.0, 15446.0, 24691.0, 40232.0, 65637.0, 112469.0, 201314.0, 1277942.0, 131531.0, 75656.0, 45967.0, 28421.0, 17429.0, 11158.0, 7146.0, 4595.0, 3034.0, 2013.0, 1256.0, 851.0, 585.0, 443.0, 310.0, 211.0, 97.0, 68.0, 48.0, 35.0, 25.0, 21.0, 14.0, 8.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.13818359375, -0.1337451934814453, -0.12930679321289062, -0.12486839294433594, -0.12042999267578125, -0.11599159240722656, -0.11155319213867188, -0.10711479187011719, -0.1026763916015625, -0.09823799133300781, -0.09379959106445312, -0.08936119079589844, -0.08492279052734375, -0.08048439025878906, -0.07604598999023438, -0.07160758972167969, -0.067169189453125, -0.06273078918457031, -0.058292388916015625, -0.05385398864746094, -0.04941558837890625, -0.04497718811035156, -0.040538787841796875, -0.03610038757324219, -0.0316619873046875, -0.027223587036132812, -0.022785186767578125, -0.018346786499023438, -0.01390838623046875, -0.009469985961914062, -0.005031585693359375, -0.0005931854248046875, 0.00384521484375, 0.008283615112304688, 0.012722015380859375, 0.017160415649414062, 0.02159881591796875, 0.026037216186523438, 0.030475616455078125, 0.03491401672363281, 0.0393524169921875, 0.04379081726074219, 0.048229217529296875, 0.05266761779785156, 0.05710601806640625, 0.06154441833496094, 0.06598281860351562, 0.07042121887207031, 0.074859619140625, 0.07929801940917969, 0.08373641967773438, 0.08817481994628906, 0.09261322021484375, 0.09705162048339844, 0.10149002075195312, 0.10592842102050781, 0.1103668212890625, 0.11480522155761719, 0.11924362182617188, 0.12368202209472656, 0.12812042236328125, 0.13255882263183594, 0.13699722290039062, 0.1414356231689453, 0.1458740234375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 6.0, 5.0, 12.0, 5.0, 17.0, 16.0, 19.0, 24.0, 31.0, 33.0, 49.0, 42.0, 66.0, 62.0, 70.0, 86.0, 63.0, 46.0, 55.0, 39.0, 50.0, 41.0, 21.0, 22.0, 24.0, 27.0, 13.0, 4.0, 4.0, 9.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001347064971923828, -0.0001301206648349762, -0.00012553483247756958, -0.00012094900012016296, -0.00011636316776275635, -0.00011177733540534973, -0.00010719150304794312, -0.0001026056706905365, -9.801983833312988e-05, -9.343400597572327e-05, -8.884817361831665e-05, -8.426234126091003e-05, -7.967650890350342e-05, -7.50906765460968e-05, -7.050484418869019e-05, -6.591901183128357e-05, -6.133317947387695e-05, -5.674734711647034e-05, -5.216151475906372e-05, -4.7575682401657104e-05, -4.298985004425049e-05, -3.840401768684387e-05, -3.3818185329437256e-05, -2.923235297203064e-05, -2.4646520614624023e-05, -2.0060688257217407e-05, -1.547485589981079e-05, -1.0889023542404175e-05, -6.303191184997559e-06, -1.7173588275909424e-06, 2.868473529815674e-06, 7.45430588722229e-06, 1.2040138244628906e-05, 1.6625970602035522e-05, 2.121180295944214e-05, 2.5797635316848755e-05, 3.038346767425537e-05, 3.496930003166199e-05, 3.9555132389068604e-05, 4.414096474647522e-05, 4.8726797103881836e-05, 5.331262946128845e-05, 5.789846181869507e-05, 6.248429417610168e-05, 6.70701265335083e-05, 7.165595889091492e-05, 7.624179124832153e-05, 8.082762360572815e-05, 8.541345596313477e-05, 8.999928832054138e-05, 9.4585120677948e-05, 9.917095303535461e-05, 0.00010375678539276123, 0.00010834261775016785, 0.00011292845010757446, 0.00011751428246498108, 0.0001221001148223877, 0.0001266859471797943, 0.00013127177953720093, 0.00013585761189460754, 0.00014044344425201416, 0.00014502927660942078, 0.0001496151089668274, 0.000154200941324234, 0.00015878677368164062]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 6.0, 3.0, 6.0, 7.0, 11.0, 6.0, 12.0, 21.0, 39.0, 27.0, 40.0, 72.0, 104.0, 139.0, 233.0, 446.0, 1320.0, 152831.0, 889387.0, 2443.0, 537.0, 282.0, 170.0, 113.0, 76.0, 43.0, 39.0, 32.0, 24.0, 13.0, 12.0, 10.0, 10.0, 8.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0034618377685546875, -0.003360360860824585, -0.0032588839530944824, -0.00315740704536438, -0.0030559301376342773, -0.002954453229904175, -0.0028529763221740723, -0.0027514994144439697, -0.002650022506713867, -0.0025485455989837646, -0.002447068691253662, -0.0023455917835235596, -0.002244114875793457, -0.0021426379680633545, -0.002041161060333252, -0.0019396841526031494, -0.0018382072448730469, -0.0017367303371429443, -0.0016352534294128418, -0.0015337765216827393, -0.0014322996139526367, -0.0013308227062225342, -0.0012293457984924316, -0.001127868890762329, -0.0010263919830322266, -0.000924915075302124, -0.0008234381675720215, -0.0007219612598419189, -0.0006204843521118164, -0.0005190074443817139, -0.00041753053665161133, -0.0003160536289215088, -0.00021457672119140625, -0.00011309981346130371, -1.1622905731201172e-05, 8.985400199890137e-05, 0.0001913309097290039, 0.00029280781745910645, 0.000394284725189209, 0.0004957616329193115, 0.0005972385406494141, 0.0006987154483795166, 0.0008001923561096191, 0.0009016692638397217, 0.0010031461715698242, 0.0011046230792999268, 0.0012060999870300293, 0.0013075768947601318, 0.0014090538024902344, 0.001510530710220337, 0.0016120076179504395, 0.001713484525680542, 0.0018149614334106445, 0.001916438341140747, 0.0020179152488708496, 0.002119392156600952, 0.0022208690643310547, 0.0023223459720611572, 0.0024238228797912598, 0.0025252997875213623, 0.002626776695251465, 0.0027282536029815674, 0.00282973051071167, 0.0029312074184417725, 0.003032684326171875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 106.0, 909.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00045334320748224854, -0.0003064321062993258, -0.0001595210051164031, -1.2609903933480382e-05, 0.00013430119724944234, 0.0002812123275361955, 0.0004281233996152878, 0.00057503447169438, 0.0007219456019811332, 0.0008688566740602255, 0.0010157678043469787, 0.0011626789346337318, 0.0013095899485051632, 0.0014565011952072382, 0.0016034122090786695, 0.001750323222950101, 0.001897234469652176, 0.0020441454835236073, 0.0021910567302256823, 0.0023379677440971136, 0.0024848789907991886, 0.00263179000467062, 0.0027787010185420513, 0.0029256120324134827, 0.0030725232791155577, 0.003219434292986989, 0.003366345539689064, 0.0035132565535604954, 0.0036601675674319267, 0.0038070788141340017, 0.003953990060836077, 0.004100901074707508, 0.004247811622917652, 0.0043947226367890835, 0.004541633650660515, 0.0046885451301932335, 0.004835456144064665, 0.004982367157936096, 0.0051292781718075275, 0.005276189185678959, 0.0054231006652116776, 0.005570011679083109, 0.00571692269295454, 0.005863834172487259, 0.00601074518635869, 0.006157656200230122, 0.006304567214101553, 0.006451478227972984, 0.006598389241844416, 0.006745300255715847, 0.006892211269587278, 0.007039122749119997, 0.007186033762991428, 0.00733294477686286, 0.007479855790734291, 0.007626766804605722, 0.007773677818477154, 0.007920589298009872, 0.008067499846220016, 0.008214411325752735, 0.00836132187396288, 0.008508233353495598, 0.008655144833028316, 0.00880205538123846, 0.00894896686077118]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 17.0, 21.0, 56.0, 89.0, 147.0, 174.0, 178.0, 133.0, 100.0, 51.0, 24.0, 17.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040650367736816406, -0.0003951890394091606, -0.00038387440145015717, -0.0003725597634911537, -0.00036124512553215027, -0.0003499304875731468, -0.00033861584961414337, -0.0003273012116551399, -0.0003159865736961365, -0.000304671935737133, -0.0002933572977781296, -0.00028204265981912613, -0.0002707280218601227, -0.00025941338390111923, -0.0002480987459421158, -0.00023678410798311234, -0.0002254694700241089, -0.00021415483206510544, -0.000202840194106102, -0.00019152555614709854, -0.0001802109181880951, -0.00016889628022909164, -0.0001575816422700882, -0.00014626700431108475, -0.0001349523663520813, -0.00012363772839307785, -0.0001123230904340744, -0.00010100845247507095, -8.96938145160675e-05, -7.837917655706406e-05, -6.706453859806061e-05, -5.574990063905716e-05, -4.443526268005371e-05, -3.312062472105026e-05, -2.1805986762046814e-05, -1.0491348803043365e-05, 8.23289155960083e-07, 1.2137927114963531e-05, 2.345256507396698e-05, 3.476720303297043e-05, 4.608184099197388e-05, 5.7396478950977325e-05, 6.871111690998077e-05, 8.002575486898422e-05, 9.134039282798767e-05, 0.00010265503078699112, 0.00011396966874599457, 0.00012528430670499802, 0.00013659894466400146, 0.0001479135826230049, 0.00015922822058200836, 0.0001705428585410118, 0.00018185749650001526, 0.0001931721344590187, 0.00020448677241802216, 0.0002158014103770256, 0.00022711604833602905, 0.0002384306862950325, 0.00024974532425403595, 0.0002610599622130394, 0.00027237460017204285, 0.0002836892381310463, 0.00029500387609004974, 0.0003063185140490532, 0.00031763315200805664]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 8.0, 4.0, 6.0, 10.0, 18.0, 11.0, 12.0, 13.0, 21.0, 25.0, 13.0, 32.0, 26.0, 37.0, 49.0, 45.0, 42.0, 44.0, 36.0, 50.0, 41.0, 34.0, 53.0, 53.0, 43.0, 51.0, 25.0, 37.0, 22.0, 21.0, 25.0, 23.0, 9.0, 18.0, 13.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5625, -12.1400146484375, -11.717529296875, -11.2950439453125, -10.87255859375, -10.4500732421875, -10.027587890625, -9.6051025390625, -9.1826171875, -8.7601318359375, -8.337646484375, -7.9151611328125, -7.49267578125, -7.0701904296875, -6.647705078125, -6.2252197265625, -5.802734375, -5.3802490234375, -4.957763671875, -4.5352783203125, -4.11279296875, -3.6903076171875, -3.267822265625, -2.8453369140625, -2.4228515625, -2.0003662109375, -1.577880859375, -1.1553955078125, -0.73291015625, -0.3104248046875, 0.112060546875, 0.5345458984375, 0.95703125, 1.3795166015625, 1.802001953125, 2.2244873046875, 2.64697265625, 3.0694580078125, 3.491943359375, 3.9144287109375, 4.3369140625, 4.7593994140625, 5.181884765625, 5.6043701171875, 6.02685546875, 6.4493408203125, 6.871826171875, 7.2943115234375, 7.716796875, 8.1392822265625, 8.561767578125, 8.9842529296875, 9.40673828125, 9.8292236328125, 10.251708984375, 10.6741943359375, 11.0966796875, 11.5191650390625, 11.941650390625, 12.3641357421875, 12.78662109375, 13.2091064453125, 13.631591796875, 14.0540771484375, 14.4765625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 16.0, 13.0, 12.0, 29.0, 30.0, 42.0, 55.0, 84.0, 132.0, 187.0, 338.0, 606.0, 1086.0, 2269.0, 5365.0, 16682.0, 92460.0, 696774.0, 192545.0, 26369.0, 7386.0, 2857.0, 1376.0, 731.0, 425.0, 228.0, 137.0, 97.0, 64.0, 46.0, 33.0, 18.0, 22.0, 11.0, 9.0, 7.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.265625, -21.539306640625, -20.81298828125, -20.086669921875, -19.3603515625, -18.634033203125, -17.90771484375, -17.181396484375, -16.455078125, -15.728759765625, -15.00244140625, -14.276123046875, -13.5498046875, -12.823486328125, -12.09716796875, -11.370849609375, -10.64453125, -9.918212890625, -9.19189453125, -8.465576171875, -7.7392578125, -7.012939453125, -6.28662109375, -5.560302734375, -4.833984375, -4.107666015625, -3.38134765625, -2.655029296875, -1.9287109375, -1.202392578125, -0.47607421875, 0.250244140625, 0.9765625, 1.702880859375, 2.42919921875, 3.155517578125, 3.8818359375, 4.608154296875, 5.33447265625, 6.060791015625, 6.787109375, 7.513427734375, 8.23974609375, 8.966064453125, 9.6923828125, 10.418701171875, 11.14501953125, 11.871337890625, 12.59765625, 13.323974609375, 14.05029296875, 14.776611328125, 15.5029296875, 16.229248046875, 16.95556640625, 17.681884765625, 18.408203125, 19.134521484375, 19.86083984375, 20.587158203125, 21.3134765625, 22.039794921875, 22.76611328125, 23.492431640625, 24.21875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 7.0, 1.0, 9.0, 14.0, 12.0, 15.0, 26.0, 19.0, 30.0, 18.0, 30.0, 42.0, 51.0, 75.0, 88.0, 185.0, 1560.0, 322.0, 120.0, 81.0, 53.0, 51.0, 43.0, 28.0, 29.0, 18.0, 23.0, 17.0, 17.0, 14.0, 20.0, 6.0, 5.0, 4.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.125, -29.146484375, -28.16796875, -27.189453125, -26.2109375, -25.232421875, -24.25390625, -23.275390625, -22.296875, -21.318359375, -20.33984375, -19.361328125, -18.3828125, -17.404296875, -16.42578125, -15.447265625, -14.46875, -13.490234375, -12.51171875, -11.533203125, -10.5546875, -9.576171875, -8.59765625, -7.619140625, -6.640625, -5.662109375, -4.68359375, -3.705078125, -2.7265625, -1.748046875, -0.76953125, 0.208984375, 1.1875, 2.166015625, 3.14453125, 4.123046875, 5.1015625, 6.080078125, 7.05859375, 8.037109375, 9.015625, 9.994140625, 10.97265625, 11.951171875, 12.9296875, 13.908203125, 14.88671875, 15.865234375, 16.84375, 17.822265625, 18.80078125, 19.779296875, 20.7578125, 21.736328125, 22.71484375, 23.693359375, 24.671875, 25.650390625, 26.62890625, 27.607421875, 28.5859375, 29.564453125, 30.54296875, 31.521484375, 32.5]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 7.0, 10.0, 7.0, 21.0, 18.0, 25.0, 25.0, 27.0, 46.0, 75.0, 134.0, 245.0, 470.0, 1249.0, 62772.0, 3076171.0, 2940.0, 695.0, 309.0, 157.0, 81.0, 56.0, 39.0, 31.0, 28.0, 19.0, 12.0, 6.0, 5.0, 7.0, 5.0, 4.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.9375, -83.3505859375, -80.763671875, -78.1767578125, -75.58984375, -73.0029296875, -70.416015625, -67.8291015625, -65.2421875, -62.6552734375, -60.068359375, -57.4814453125, -54.89453125, -52.3076171875, -49.720703125, -47.1337890625, -44.546875, -41.9599609375, -39.373046875, -36.7861328125, -34.19921875, -31.6123046875, -29.025390625, -26.4384765625, -23.8515625, -21.2646484375, -18.677734375, -16.0908203125, -13.50390625, -10.9169921875, -8.330078125, -5.7431640625, -3.15625, -0.5693359375, 2.017578125, 4.6044921875, 7.19140625, 9.7783203125, 12.365234375, 14.9521484375, 17.5390625, 20.1259765625, 22.712890625, 25.2998046875, 27.88671875, 30.4736328125, 33.060546875, 35.6474609375, 38.234375, 40.8212890625, 43.408203125, 45.9951171875, 48.58203125, 51.1689453125, 53.755859375, 56.3427734375, 58.9296875, 61.5166015625, 64.103515625, 66.6904296875, 69.27734375, 71.8642578125, 74.451171875, 77.0380859375, 79.625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 9.0, 198.0, 711.0, 88.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.34883117675781, -27.304141998291016, -19.259450912475586, -11.214759826660156, -3.1700706481933594, 4.8746185302734375, 12.9193115234375, 20.964000701904297, 29.008689880371094, 37.05337905883789, 45.09806823730469, 53.14276123046875, 61.18745040893555, 69.23213958740234, 77.2768325805664, 85.32151794433594, 93.3662109375, 101.41090393066406, 109.4555892944336, 117.50028228759766, 125.54496765136719, 133.58966064453125, 141.6343536376953, 149.67904663085938, 157.72372436523438, 165.76841735839844, 173.8131103515625, 181.8577880859375, 189.90248107910156, 197.94717407226562, 205.9918670654297, 214.03656005859375, 222.08126831054688, 230.12596130371094, 238.170654296875, 246.21533203125, 254.26002502441406, 262.3047180175781, 270.34942626953125, 278.39410400390625, 286.43878173828125, 294.48345947265625, 302.5281677246094, 310.5728454589844, 318.6175537109375, 326.6622314453125, 334.7069091796875, 342.7516174316406, 350.79632568359375, 358.84100341796875, 366.8857116699219, 374.9303894042969, 382.97509765625, 391.019775390625, 399.064453125, 407.1091613769531, 415.1538391113281, 423.1985168457031, 431.24322509765625, 439.28790283203125, 447.3326110839844, 455.3772888183594, 463.4219970703125, 471.4666748046875, 479.5113525390625]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 5.0, 7.0, 11.0, 14.0, 11.0, 19.0, 26.0, 19.0, 28.0, 27.0, 31.0, 30.0, 37.0, 44.0, 34.0, 44.0, 45.0, 48.0, 46.0, 42.0, 39.0, 37.0, 38.0, 46.0, 23.0, 42.0, 42.0, 25.0, 26.0, 22.0, 24.0, 12.0, 17.0, 9.0, 7.0, 4.0, 5.0, 2.0, 7.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-81.09115600585938, -78.91677856445312, -76.74239349365234, -74.5680160522461, -72.39363098144531, -70.21925354003906, -68.04486846923828, -65.87049102783203, -63.69610595703125, -61.521724700927734, -59.34734344482422, -57.1729621887207, -54.99858093261719, -52.82419967651367, -50.649818420410156, -48.475440979003906, -46.30105972290039, -44.126678466796875, -41.95229721069336, -39.777915954589844, -37.60353469848633, -35.42915344238281, -33.25477600097656, -31.080392837524414, -28.9060115814209, -26.731630325317383, -24.557249069213867, -22.382869720458984, -20.20848846435547, -18.034107208251953, -15.859725952148438, -13.685344696044922, -11.510963439941406, -9.33658218383789, -7.162201404571533, -4.987820625305176, -2.81343936920166, -0.6390581130981445, 1.5353221893310547, 3.7097034454345703, 5.884084701538086, 8.058465957641602, 10.232847213745117, 12.407227516174316, 14.581608772277832, 16.75598907470703, 18.930370330810547, 21.104751586914062, 23.279132843017578, 25.453514099121094, 27.62789535522461, 29.802276611328125, 31.97665786743164, 34.151039123535156, 36.325416564941406, 38.49980163574219, 40.67417907714844, 42.84856033325195, 45.02294158935547, 47.197322845458984, 49.3717041015625, 51.546085357666016, 53.72046661376953, 55.89484405517578, 58.06922912597656]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 12.0, 14.0, 18.0, 11.0, 23.0, 19.0, 14.0, 26.0, 29.0, 40.0, 41.0, 38.0, 57.0, 36.0, 49.0, 45.0, 42.0, 40.0, 47.0, 54.0, 40.0, 43.0, 40.0, 30.0, 33.0, 24.0, 19.0, 24.0, 15.0, 12.0, 13.0, 14.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.34375, -13.8814697265625, -13.419189453125, -12.9569091796875, -12.49462890625, -12.0323486328125, -11.570068359375, -11.1077880859375, -10.6455078125, -10.1832275390625, -9.720947265625, -9.2586669921875, -8.79638671875, -8.3341064453125, -7.871826171875, -7.4095458984375, -6.947265625, -6.4849853515625, -6.022705078125, -5.5604248046875, -5.09814453125, -4.6358642578125, -4.173583984375, -3.7113037109375, -3.2490234375, -2.7867431640625, -2.324462890625, -1.8621826171875, -1.39990234375, -0.9376220703125, -0.475341796875, -0.0130615234375, 0.44921875, 0.9114990234375, 1.373779296875, 1.8360595703125, 2.29833984375, 2.7606201171875, 3.222900390625, 3.6851806640625, 4.1474609375, 4.6097412109375, 5.072021484375, 5.5343017578125, 5.99658203125, 6.4588623046875, 6.921142578125, 7.3834228515625, 7.845703125, 8.3079833984375, 8.770263671875, 9.2325439453125, 9.69482421875, 10.1571044921875, 10.619384765625, 11.0816650390625, 11.5439453125, 12.0062255859375, 12.468505859375, 12.9307861328125, 13.39306640625, 13.8553466796875, 14.317626953125, 14.7799072265625, 15.2421875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 1.0, 5.0, 5.0, 6.0, 10.0, 24.0, 24.0, 38.0, 38.0, 46.0, 83.0, 120.0, 143.0, 190.0, 312.0, 422.0, 744.0, 1362.0, 2850.0, 7877.0, 32414.0, 1099880.0, 2970339.0, 57973.0, 11410.0, 3876.0, 1641.0, 837.0, 510.0, 334.0, 226.0, 146.0, 108.0, 89.0, 61.0, 41.0, 34.0, 25.0, 17.0, 12.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.6875, -64.4755859375, -62.263671875, -60.0517578125, -57.83984375, -55.6279296875, -53.416015625, -51.2041015625, -48.9921875, -46.7802734375, -44.568359375, -42.3564453125, -40.14453125, -37.9326171875, -35.720703125, -33.5087890625, -31.296875, -29.0849609375, -26.873046875, -24.6611328125, -22.44921875, -20.2373046875, -18.025390625, -15.8134765625, -13.6015625, -11.3896484375, -9.177734375, -6.9658203125, -4.75390625, -2.5419921875, -0.330078125, 1.8818359375, 4.09375, 6.3056640625, 8.517578125, 10.7294921875, 12.94140625, 15.1533203125, 17.365234375, 19.5771484375, 21.7890625, 24.0009765625, 26.212890625, 28.4248046875, 30.63671875, 32.8486328125, 35.060546875, 37.2724609375, 39.484375, 41.6962890625, 43.908203125, 46.1201171875, 48.33203125, 50.5439453125, 52.755859375, 54.9677734375, 57.1796875, 59.3916015625, 61.603515625, 63.8154296875, 66.02734375, 68.2392578125, 70.451171875, 72.6630859375, 74.875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 12.0, 7.0, 17.0, 25.0, 28.0, 37.0, 44.0, 55.0, 86.0, 111.0, 190.0, 236.0, 433.0, 630.0, 655.0, 510.0, 327.0, 183.0, 148.0, 90.0, 63.0, 40.0, 38.0, 26.0, 23.0, 21.0, 7.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-33.53125, -32.65478515625, -31.7783203125, -30.90185546875, -30.025390625, -29.14892578125, -28.2724609375, -27.39599609375, -26.51953125, -25.64306640625, -24.7666015625, -23.89013671875, -23.013671875, -22.13720703125, -21.2607421875, -20.38427734375, -19.5078125, -18.63134765625, -17.7548828125, -16.87841796875, -16.001953125, -15.12548828125, -14.2490234375, -13.37255859375, -12.49609375, -11.61962890625, -10.7431640625, -9.86669921875, -8.990234375, -8.11376953125, -7.2373046875, -6.36083984375, -5.484375, -4.60791015625, -3.7314453125, -2.85498046875, -1.978515625, -1.10205078125, -0.2255859375, 0.65087890625, 1.52734375, 2.40380859375, 3.2802734375, 4.15673828125, 5.033203125, 5.90966796875, 6.7861328125, 7.66259765625, 8.5390625, 9.41552734375, 10.2919921875, 11.16845703125, 12.044921875, 12.92138671875, 13.7978515625, 14.67431640625, 15.55078125, 16.42724609375, 17.3037109375, 18.18017578125, 19.056640625, 19.93310546875, 20.8095703125, 21.68603515625, 22.5625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 9.0, 19.0, 37.0, 62.0, 152.0, 331.0, 969.0, 2963.0, 9701.0, 38964.0, 253093.0, 3273127.0, 534690.0, 60286.0, 13874.0, 3844.0, 1303.0, 455.0, 200.0, 100.0, 47.0, 25.0, 17.0, 6.0, 0.0, 1.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.6875, -32.4228515625, -31.158203125, -29.8935546875, -28.62890625, -27.3642578125, -26.099609375, -24.8349609375, -23.5703125, -22.3056640625, -21.041015625, -19.7763671875, -18.51171875, -17.2470703125, -15.982421875, -14.7177734375, -13.453125, -12.1884765625, -10.923828125, -9.6591796875, -8.39453125, -7.1298828125, -5.865234375, -4.6005859375, -3.3359375, -2.0712890625, -0.806640625, 0.4580078125, 1.72265625, 2.9873046875, 4.251953125, 5.5166015625, 6.78125, 8.0458984375, 9.310546875, 10.5751953125, 11.83984375, 13.1044921875, 14.369140625, 15.6337890625, 16.8984375, 18.1630859375, 19.427734375, 20.6923828125, 21.95703125, 23.2216796875, 24.486328125, 25.7509765625, 27.015625, 28.2802734375, 29.544921875, 30.8095703125, 32.07421875, 33.3388671875, 34.603515625, 35.8681640625, 37.1328125, 38.3974609375, 39.662109375, 40.9267578125, 42.19140625, 43.4560546875, 44.720703125, 45.9853515625, 47.25]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 0.0, 5.0, 3.0, 6.0, 1.0, 5.0, 6.0, 16.0, 7.0, 9.0, 17.0, 16.0, 35.0, 39.0, 35.0, 39.0, 55.0, 53.0, 57.0, 75.0, 70.0, 68.0, 66.0, 62.0, 47.0, 38.0, 37.0, 28.0, 24.0, 22.0, 14.0, 13.0, 13.0, 12.0, 3.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.01224517822266, -100.30632781982422, -96.60041809082031, -92.89450073242188, -89.18858337402344, -85.482666015625, -81.7767562866211, -78.07083892822266, -74.36492919921875, -70.65901184082031, -66.9531021118164, -63.24718475341797, -59.54126739501953, -55.83535385131836, -52.12944030761719, -48.42352294921875, -44.71760559082031, -41.01169204711914, -37.3057746887207, -33.59986114501953, -29.893945693969727, -26.188030242919922, -22.48211669921875, -18.776201248168945, -15.07028579711914, -11.364370346069336, -7.658455848693848, -3.9525413513183594, -0.2466259002685547, 3.45928955078125, 7.165203094482422, 10.871118545532227, 14.577041625976562, 18.282957077026367, 21.988872528076172, 25.694786071777344, 29.40070152282715, 33.10661697387695, 36.812530517578125, 40.51844787597656, 44.224361419677734, 47.930274963378906, 51.636192321777344, 55.342105865478516, 59.04801940917969, 62.753936767578125, 66.45985412597656, 70.16576385498047, 73.8716812133789, 77.57759857177734, 81.28350830078125, 84.98942565917969, 88.69534301757812, 92.40126037597656, 96.10717010498047, 99.8130874633789, 103.51899719238281, 107.22491455078125, 110.93082427978516, 114.6367416381836, 118.34265899658203, 122.04856872558594, 125.75448608398438, 129.4604034423828, 133.16632080078125]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 7.0, 5.0, 8.0, 12.0, 15.0, 17.0, 13.0, 23.0, 21.0, 22.0, 41.0, 25.0, 42.0, 32.0, 37.0, 35.0, 32.0, 27.0, 46.0, 44.0, 32.0, 28.0, 36.0, 48.0, 27.0, 37.0, 27.0, 30.0, 42.0, 26.0, 27.0, 21.0, 20.0, 17.0, 8.0, 6.0, 5.0, 9.0, 10.0, 5.0, 8.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-107.6094970703125, -104.57537841796875, -101.541259765625, -98.50714111328125, -95.47303009033203, -92.43891143798828, -89.40479278564453, -86.37067413330078, -83.33656311035156, -80.30244445800781, -77.26832580566406, -74.23420715332031, -71.2000961303711, -68.16597747802734, -65.1318588256836, -62.097740173339844, -59.063621520996094, -56.029502868652344, -52.99538803100586, -49.96126937866211, -46.927154541015625, -43.893035888671875, -40.858917236328125, -37.824798583984375, -34.79068374633789, -31.756567001342773, -28.722450256347656, -25.688331604003906, -22.65421485900879, -19.620098114013672, -16.585979461669922, -13.551862716674805, -10.517738342285156, -7.483621120452881, -4.4495038986206055, -1.4153861999511719, 1.6187305450439453, 4.6528472900390625, 7.6869659423828125, 10.72108268737793, 13.755199432373047, 16.789316177368164, 19.82343292236328, 22.85755157470703, 25.89166831970215, 28.925785064697266, 31.959903717041016, 34.9940185546875, 38.02813720703125, 41.062255859375, 44.096370697021484, 47.130489349365234, 50.16460418701172, 53.19872283935547, 56.23284149169922, 59.26696014404297, 62.30107498168945, 65.33518981933594, 68.36930847167969, 71.40342712402344, 74.43754577636719, 77.47166442871094, 80.50578308105469, 83.5398941040039, 86.57401275634766]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 4.0, 7.0, 4.0, 17.0, 17.0, 11.0, 10.0, 21.0, 22.0, 22.0, 30.0, 30.0, 34.0, 36.0, 40.0, 33.0, 35.0, 38.0, 43.0, 41.0, 36.0, 27.0, 40.0, 47.0, 34.0, 29.0, 37.0, 34.0, 32.0, 32.0, 27.0, 22.0, 17.0, 9.0, 11.0, 13.0, 6.0, 10.0, 9.0, 6.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-175.5, -169.81640625, -164.1328125, -158.44921875, -152.765625, -147.08203125, -141.3984375, -135.71484375, -130.03125, -124.34765625, -118.6640625, -112.98046875, -107.296875, -101.61328125, -95.9296875, -90.24609375, -84.5625, -78.87890625, -73.1953125, -67.51171875, -61.828125, -56.14453125, -50.4609375, -44.77734375, -39.09375, -33.41015625, -27.7265625, -22.04296875, -16.359375, -10.67578125, -4.9921875, 0.69140625, 6.375, 12.05859375, 17.7421875, 23.42578125, 29.109375, 34.79296875, 40.4765625, 46.16015625, 51.84375, 57.52734375, 63.2109375, 68.89453125, 74.578125, 80.26171875, 85.9453125, 91.62890625, 97.3125, 102.99609375, 108.6796875, 114.36328125, 120.046875, 125.73046875, 131.4140625, 137.09765625, 142.78125, 148.46484375, 154.1484375, 159.83203125, 165.515625, 171.19921875, 176.8828125, 182.56640625, 188.25]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 10.0, 17.0, 18.0, 25.0, 31.0, 61.0, 101.0, 113.0, 156.0, 229.0, 361.0, 498.0, 717.0, 1035.0, 1420.0, 2037.0, 3037.0, 4314.0, 6322.0, 9506.0, 14239.0, 22002.0, 34786.0, 55485.0, 90977.0, 154749.0, 234883.0, 158348.0, 93587.0, 56694.0, 34991.0, 22459.0, 14764.0, 9735.0, 6562.0, 4386.0, 2934.0, 2110.0, 1494.0, 1014.0, 718.0, 523.0, 340.0, 232.0, 155.0, 120.0, 86.0, 55.0, 34.0, 30.0, 21.0, 15.0, 12.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.03125, -2.935089111328125, -2.83892822265625, -2.742767333984375, -2.6466064453125, -2.550445556640625, -2.45428466796875, -2.358123779296875, -2.261962890625, -2.165802001953125, -2.06964111328125, -1.973480224609375, -1.8773193359375, -1.781158447265625, -1.68499755859375, -1.588836669921875, -1.49267578125, -1.396514892578125, -1.30035400390625, -1.204193115234375, -1.1080322265625, -1.011871337890625, -0.91571044921875, -0.819549560546875, -0.723388671875, -0.627227783203125, -0.53106689453125, -0.434906005859375, -0.3387451171875, -0.242584228515625, -0.14642333984375, -0.050262451171875, 0.0458984375, 0.142059326171875, 0.23822021484375, 0.334381103515625, 0.4305419921875, 0.526702880859375, 0.62286376953125, 0.719024658203125, 0.815185546875, 0.911346435546875, 1.00750732421875, 1.103668212890625, 1.1998291015625, 1.295989990234375, 1.39215087890625, 1.488311767578125, 1.58447265625, 1.680633544921875, 1.77679443359375, 1.872955322265625, 1.9691162109375, 2.065277099609375, 2.16143798828125, 2.257598876953125, 2.353759765625, 2.449920654296875, 2.54608154296875, 2.642242431640625, 2.7384033203125, 2.834564208984375, 2.93072509765625, 3.026885986328125, 3.123046875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 8.0, 5.0, 8.0, 12.0, 11.0, 15.0, 15.0, 20.0, 19.0, 19.0, 20.0, 26.0, 33.0, 41.0, 27.0, 30.0, 34.0, 20.0, 43.0, 38.0, 40.0, 1066.0, 36.0, 37.0, 37.0, 39.0, 35.0, 31.0, 31.0, 31.0, 21.0, 27.0, 20.0, 17.0, 11.0, 17.0, 6.0, 16.0, 9.0, 6.0, 3.0, 12.0, 7.0, 6.0, 5.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.5, -101.90625, -98.3125, -94.71875, -91.125, -87.53125, -83.9375, -80.34375, -76.75, -73.15625, -69.5625, -65.96875, -62.375, -58.78125, -55.1875, -51.59375, -48.0, -44.40625, -40.8125, -37.21875, -33.625, -30.03125, -26.4375, -22.84375, -19.25, -15.65625, -12.0625, -8.46875, -4.875, -1.28125, 2.3125, 5.90625, 9.5, 13.09375, 16.6875, 20.28125, 23.875, 27.46875, 31.0625, 34.65625, 38.25, 41.84375, 45.4375, 49.03125, 52.625, 56.21875, 59.8125, 63.40625, 67.0, 70.59375, 74.1875, 77.78125, 81.375, 84.96875, 88.5625, 92.15625, 95.75, 99.34375, 102.9375, 106.53125, 110.125, 113.71875, 117.3125, 120.90625, 124.5]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 10.0, 13.0, 18.0, 33.0, 58.0, 78.0, 105.0, 162.0, 237.0, 317.0, 447.0, 632.0, 927.0, 1233.0, 1803.0, 2566.0, 3621.0, 5185.0, 7602.0, 11328.0, 16940.0, 26139.0, 39986.0, 63882.0, 102945.0, 172299.0, 1261305.0, 139008.0, 84260.0, 53068.0, 33758.0, 21715.0, 14265.0, 9726.0, 6539.0, 4498.0, 3014.0, 2131.0, 1498.0, 1057.0, 808.0, 590.0, 443.0, 299.0, 197.0, 148.0, 80.0, 57.0, 35.0, 28.0, 21.0, 10.0, 5.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.859375, -1.799957275390625, -1.74053955078125, -1.681121826171875, -1.6217041015625, -1.562286376953125, -1.50286865234375, -1.443450927734375, -1.384033203125, -1.324615478515625, -1.26519775390625, -1.205780029296875, -1.1463623046875, -1.086944580078125, -1.02752685546875, -0.968109130859375, -0.90869140625, -0.849273681640625, -0.78985595703125, -0.730438232421875, -0.6710205078125, -0.611602783203125, -0.55218505859375, -0.492767333984375, -0.433349609375, -0.373931884765625, -0.31451416015625, -0.255096435546875, -0.1956787109375, -0.136260986328125, -0.07684326171875, -0.017425537109375, 0.0419921875, 0.101409912109375, 0.16082763671875, 0.220245361328125, 0.2796630859375, 0.339080810546875, 0.39849853515625, 0.457916259765625, 0.517333984375, 0.576751708984375, 0.63616943359375, 0.695587158203125, 0.7550048828125, 0.814422607421875, 0.87384033203125, 0.933258056640625, 0.99267578125, 1.052093505859375, 1.11151123046875, 1.170928955078125, 1.2303466796875, 1.289764404296875, 1.34918212890625, 1.408599853515625, 1.468017578125, 1.527435302734375, 1.58685302734375, 1.646270751953125, 1.7056884765625, 1.765106201171875, 1.82452392578125, 1.883941650390625, 1.943359375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 4.0, 2.0, 6.0, 6.0, 17.0, 16.0, 17.0, 22.0, 28.0, 41.0, 42.0, 48.0, 101.0, 213.0, 146.0, 55.0, 54.0, 40.0, 21.0, 30.0, 25.0, 12.0, 6.0, 11.0, 7.0, 3.0, 9.0, 3.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005252838134765625, -0.005087316036224365, -0.0049217939376831055, -0.004756271839141846, -0.004590749740600586, -0.004425227642059326, -0.004259705543518066, -0.004094183444976807, -0.003928661346435547, -0.003763139247894287, -0.0035976171493530273, -0.0034320950508117676, -0.003266572952270508, -0.003101050853729248, -0.0029355287551879883, -0.0027700066566467285, -0.0026044845581054688, -0.002438962459564209, -0.0022734403610229492, -0.0021079182624816895, -0.0019423961639404297, -0.00177687406539917, -0.0016113519668579102, -0.0014458298683166504, -0.0012803077697753906, -0.0011147856712341309, -0.0009492635726928711, -0.0007837414741516113, -0.0006182193756103516, -0.0004526972770690918, -0.00028717517852783203, -0.00012165307998657227, 4.38690185546875e-05, 0.00020939111709594727, 0.00037491321563720703, 0.0005404353141784668, 0.0007059574127197266, 0.0008714795112609863, 0.001037001609802246, 0.0012025237083435059, 0.0013680458068847656, 0.0015335679054260254, 0.0016990900039672852, 0.001864612102508545, 0.0020301342010498047, 0.0021956562995910645, 0.0023611783981323242, 0.002526700496673584, 0.0026922225952148438, 0.0028577446937561035, 0.0030232667922973633, 0.003188788890838623, 0.003354310989379883, 0.0035198330879211426, 0.0036853551864624023, 0.003850877285003662, 0.004016399383544922, 0.004181921482086182, 0.004347443580627441, 0.004512965679168701, 0.004678487777709961, 0.004844009876251221, 0.0050095319747924805, 0.00517505407333374, 0.005340576171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 7.0, 2.0, 7.0, 11.0, 8.0, 25.0, 33.0, 58.0, 76.0, 116.0, 221.0, 343.0, 623.0, 1192.0, 2526.0, 5754.0, 15538.0, 50181.0, 214599.0, 602950.0, 107064.0, 29495.0, 9909.0, 3881.0, 1832.0, 902.0, 490.0, 273.0, 167.0, 97.0, 68.0, 43.0, 17.0, 16.0, 13.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0269622802734375, -0.026127099990844727, -0.025291919708251953, -0.02445673942565918, -0.023621559143066406, -0.022786378860473633, -0.02195119857788086, -0.021116018295288086, -0.020280838012695312, -0.01944565773010254, -0.018610477447509766, -0.017775297164916992, -0.01694011688232422, -0.016104936599731445, -0.015269756317138672, -0.014434576034545898, -0.013599395751953125, -0.012764215469360352, -0.011929035186767578, -0.011093854904174805, -0.010258674621582031, -0.009423494338989258, -0.008588314056396484, -0.007753133773803711, -0.0069179534912109375, -0.006082773208618164, -0.005247592926025391, -0.004412412643432617, -0.0035772323608398438, -0.0027420520782470703, -0.0019068717956542969, -0.0010716915130615234, -0.00023651123046875, 0.0005986690521240234, 0.0014338493347167969, 0.0022690296173095703, 0.0031042098999023438, 0.003939390182495117, 0.004774570465087891, 0.005609750747680664, 0.0064449310302734375, 0.007280111312866211, 0.008115291595458984, 0.008950471878051758, 0.009785652160644531, 0.010620832443237305, 0.011456012725830078, 0.012291193008422852, 0.013126373291015625, 0.013961553573608398, 0.014796733856201172, 0.015631914138793945, 0.01646709442138672, 0.017302274703979492, 0.018137454986572266, 0.01897263526916504, 0.019807815551757812, 0.020642995834350586, 0.02147817611694336, 0.022313356399536133, 0.023148536682128906, 0.02398371696472168, 0.024818897247314453, 0.025654077529907227, 0.0264892578125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 10.0, 17.0, 23.0, 37.0, 78.0, 93.0, 191.0, 177.0, 118.0, 68.0, 41.0, 30.0, 28.0, 22.0, 15.0, 11.0, 8.0, 8.0, 4.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0074348836205899715, -0.007020418532192707, -0.006605953443795443, -0.006191488355398178, -0.005777023732662201, -0.005362558178603649, -0.004948093555867672, -0.0045336284674704075, -0.004119163379073143, -0.0037046982906758785, -0.003290233202278614, -0.0028757683467119932, -0.0024613032583147287, -0.0020468381699174643, -0.0016323733143508434, -0.001217908225953579, -0.0008034431375563145, -0.0003889781073667109, 2.5486922822892666e-05, 0.0004399518948048353, 0.0008544169832020998, 0.0012688820715993643, 0.001683346927165985, 0.0020978120155632496, 0.002512277103960514, 0.0029267421923577785, 0.003341207280755043, 0.003755672136321664, 0.004170137457549572, 0.004584602080285549, 0.004999067168682814, 0.005413532257080078, 0.005827996879816055, 0.00624246196821332, 0.006656927056610584, 0.007071391679346561, 0.007485857233405113, 0.00790032185614109, 0.008314786478877068, 0.00872925203293562, 0.009143717586994171, 0.009558182209730148, 0.0099726477637887, 0.010387112386524677, 0.010801577940583229, 0.011216042563319206, 0.011630507186055183, 0.012044972740113735, 0.012459437362849712, 0.01287390198558569, 0.013288367539644241, 0.013702832162380219, 0.01411729771643877, 0.014531762339174747, 0.0149462278932333, 0.015360692515969276, 0.015775157138705254, 0.01618962176144123, 0.016604086384177208, 0.017018552869558334, 0.01743301749229431, 0.01784748211503029, 0.018261946737766266, 0.018676411360502243, 0.01909087784588337]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 8.0, 7.0, 6.0, 4.0, 11.0, 11.0, 8.0, 9.0, 17.0, 17.0, 16.0, 16.0, 27.0, 24.0, 22.0, 25.0, 29.0, 28.0, 30.0, 36.0, 31.0, 40.0, 34.0, 35.0, 42.0, 24.0, 33.0, 44.0, 26.0, 24.0, 37.0, 35.0, 31.0, 18.0, 24.0, 20.0, 17.0, 21.0, 19.0, 12.0, 10.0, 11.0, 15.0, 11.0, 10.0, 9.0, 4.0, 5.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.004262208938598633, -0.004122590646147728, -0.003982972353696823, -0.0038433540612459183, -0.0037037357687950134, -0.0035641174763441086, -0.0034244991838932037, -0.003284880891442299, -0.003145262598991394, -0.003005644306540489, -0.0028660260140895844, -0.0027264077216386795, -0.0025867894291877747, -0.00244717113673687, -0.002307552844285965, -0.00216793455183506, -0.0020283162593841553, -0.0018886979669332504, -0.0017490796744823456, -0.0016094613820314407, -0.0014698430895805359, -0.001330224797129631, -0.0011906065046787262, -0.0010509882122278214, -0.0009113699197769165, -0.0007717516273260117, -0.0006321333348751068, -0.000492515042424202, -0.0003528967499732971, -0.00021327845752239227, -7.366016507148743e-05, 6.595812737941742e-05, 0.00020557641983032227, 0.0003451947122812271, 0.00048481300473213196, 0.0006244312971830368, 0.0007640495896339417, 0.0009036678820848465, 0.0010432861745357513, 0.0011829044669866562, 0.001322522759437561, 0.0014621410518884659, 0.0016017593443393707, 0.0017413776367902756, 0.0018809959292411804, 0.0020206142216920853, 0.00216023251414299, 0.002299850806593895, 0.0024394690990448, 0.0025790873914957047, 0.0027187056839466095, 0.0028583239763975143, 0.002997942268848419, 0.003137560561299324, 0.003277178853750229, 0.0034167971462011337, 0.0035564154386520386, 0.0036960337311029434, 0.0038356520235538483, 0.003975270316004753, 0.004114888608455658, 0.004254506900906563, 0.004394125193357468, 0.0045337434858083725, 0.004673361778259277]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 3.0, 8.0, 3.0, 18.0, 17.0, 11.0, 10.0, 20.0, 22.0, 23.0, 30.0, 30.0, 34.0, 35.0, 39.0, 34.0, 35.0, 39.0, 43.0, 40.0, 37.0, 27.0, 38.0, 49.0, 33.0, 30.0, 37.0, 32.0, 34.0, 32.0, 26.0, 23.0, 17.0, 9.0, 11.0, 13.0, 6.0, 10.0, 9.0, 6.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-175.625, -169.939453125, -164.25390625, -158.568359375, -152.8828125, -147.197265625, -141.51171875, -135.826171875, -130.140625, -124.455078125, -118.76953125, -113.083984375, -107.3984375, -101.712890625, -96.02734375, -90.341796875, -84.65625, -78.970703125, -73.28515625, -67.599609375, -61.9140625, -56.228515625, -50.54296875, -44.857421875, -39.171875, -33.486328125, -27.80078125, -22.115234375, -16.4296875, -10.744140625, -5.05859375, 0.626953125, 6.3125, 11.998046875, 17.68359375, 23.369140625, 29.0546875, 34.740234375, 40.42578125, 46.111328125, 51.796875, 57.482421875, 63.16796875, 68.853515625, 74.5390625, 80.224609375, 85.91015625, 91.595703125, 97.28125, 102.966796875, 108.65234375, 114.337890625, 120.0234375, 125.708984375, 131.39453125, 137.080078125, 142.765625, 148.451171875, 154.13671875, 159.822265625, 165.5078125, 171.193359375, 176.87890625, 182.564453125, 188.25]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 3.0, 3.0, 8.0, 3.0, 7.0, 3.0, 14.0, 15.0, 13.0, 18.0, 22.0, 38.0, 65.0, 69.0, 116.0, 208.0, 430.0, 790.0, 1873.0, 5245.0, 16726.0, 66401.0, 332885.0, 483447.0, 103482.0, 24694.0, 7224.0, 2540.0, 1065.0, 456.0, 253.0, 125.0, 79.0, 63.0, 50.0, 28.0, 18.0, 12.0, 18.0, 4.0, 13.0, 10.0, 5.0, 7.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.90625, -28.946044921875, -27.98583984375, -27.025634765625, -26.0654296875, -25.105224609375, -24.14501953125, -23.184814453125, -22.224609375, -21.264404296875, -20.30419921875, -19.343994140625, -18.3837890625, -17.423583984375, -16.46337890625, -15.503173828125, -14.54296875, -13.582763671875, -12.62255859375, -11.662353515625, -10.7021484375, -9.741943359375, -8.78173828125, -7.821533203125, -6.861328125, -5.901123046875, -4.94091796875, -3.980712890625, -3.0205078125, -2.060302734375, -1.10009765625, -0.139892578125, 0.8203125, 1.780517578125, 2.74072265625, 3.700927734375, 4.6611328125, 5.621337890625, 6.58154296875, 7.541748046875, 8.501953125, 9.462158203125, 10.42236328125, 11.382568359375, 12.3427734375, 13.302978515625, 14.26318359375, 15.223388671875, 16.18359375, 17.143798828125, 18.10400390625, 19.064208984375, 20.0244140625, 20.984619140625, 21.94482421875, 22.905029296875, 23.865234375, 24.825439453125, 25.78564453125, 26.745849609375, 27.7060546875, 28.666259765625, 29.62646484375, 30.586669921875, 31.546875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 11.0, 15.0, 24.0, 34.0, 51.0, 78.0, 94.0, 107.0, 148.0, 2085.0, 76.0, 88.0, 73.0, 55.0, 36.0, 30.0, 16.0, 11.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-510.5, -494.0703125, -477.640625, -461.2109375, -444.78125, -428.3515625, -411.921875, -395.4921875, -379.0625, -362.6328125, -346.203125, -329.7734375, -313.34375, -296.9140625, -280.484375, -264.0546875, -247.625, -231.1953125, -214.765625, -198.3359375, -181.90625, -165.4765625, -149.046875, -132.6171875, -116.1875, -99.7578125, -83.328125, -66.8984375, -50.46875, -34.0390625, -17.609375, -1.1796875, 15.25, 31.6796875, 48.109375, 64.5390625, 80.96875, 97.3984375, 113.828125, 130.2578125, 146.6875, 163.1171875, 179.546875, 195.9765625, 212.40625, 228.8359375, 245.265625, 261.6953125, 278.125, 294.5546875, 310.984375, 327.4140625, 343.84375, 360.2734375, 376.703125, 393.1328125, 409.5625, 425.9921875, 442.421875, 458.8515625, 475.28125, 491.7109375, 508.140625, 524.5703125, 541.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 9.0, 12.0, 11.0, 15.0, 18.0, 43.0, 43.0, 63.0, 170.0, 205.0, 404.0, 831.0, 2601.0, 27793.0, 2947763.0, 156884.0, 6291.0, 1237.0, 525.0, 303.0, 178.0, 108.0, 66.0, 45.0, 26.0, 18.0, 8.0, 10.0, 6.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.9375, -53.8447265625, -51.751953125, -49.6591796875, -47.56640625, -45.4736328125, -43.380859375, -41.2880859375, -39.1953125, -37.1025390625, -35.009765625, -32.9169921875, -30.82421875, -28.7314453125, -26.638671875, -24.5458984375, -22.453125, -20.3603515625, -18.267578125, -16.1748046875, -14.08203125, -11.9892578125, -9.896484375, -7.8037109375, -5.7109375, -3.6181640625, -1.525390625, 0.5673828125, 2.66015625, 4.7529296875, 6.845703125, 8.9384765625, 11.03125, 13.1240234375, 15.216796875, 17.3095703125, 19.40234375, 21.4951171875, 23.587890625, 25.6806640625, 27.7734375, 29.8662109375, 31.958984375, 34.0517578125, 36.14453125, 38.2373046875, 40.330078125, 42.4228515625, 44.515625, 46.6083984375, 48.701171875, 50.7939453125, 52.88671875, 54.9794921875, 57.072265625, 59.1650390625, 61.2578125, 63.3505859375, 65.443359375, 67.5361328125, 69.62890625, 71.7216796875, 73.814453125, 75.9072265625, 78.0]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 7.0, 11.0, 16.0, 22.0, 33.0, 77.0, 131.0, 167.0, 186.0, 146.0, 74.0, 36.0, 31.0, 21.0, 11.0, 5.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-427.74658203125, -414.37811279296875, -401.0096435546875, -387.64117431640625, -374.272705078125, -360.90423583984375, -347.5357971191406, -334.1673278808594, -320.7988586425781, -307.4303894042969, -294.0619201660156, -280.6934509277344, -267.32501220703125, -253.95652770996094, -240.58807373046875, -227.2196044921875, -213.85113525390625, -200.482666015625, -187.11419677734375, -173.74574279785156, -160.3772735595703, -147.00880432128906, -133.64035034179688, -120.27188110351562, -106.90341186523438, -93.53494262695312, -80.1664810180664, -66.79801940917969, -53.42955017089844, -40.06108093261719, -26.69261932373047, -13.32415771484375, 0.044281005859375, 13.41274642944336, 26.781211853027344, 40.14967727661133, 53.51814270019531, 66.88661193847656, 80.25507354736328, 93.62353515625, 106.99200439453125, 120.3604736328125, 133.72894287109375, 147.09739685058594, 160.4658660888672, 173.83433532714844, 187.20278930664062, 200.57125854492188, 213.93972778320312, 227.30819702148438, 240.67666625976562, 254.0451202392578, 267.41357421875, 280.78204345703125, 294.1505126953125, 307.51898193359375, 320.887451171875, 334.25592041015625, 347.6243896484375, 360.99285888671875, 374.361328125, 387.72979736328125, 401.0982360839844, 414.4667053222656, 427.8351745605469]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 12.0, 12.0, 16.0, 14.0, 17.0, 12.0, 19.0, 18.0, 23.0, 35.0, 22.0, 38.0, 46.0, 43.0, 41.0, 38.0, 42.0, 43.0, 43.0, 44.0, 43.0, 37.0, 31.0, 36.0, 28.0, 33.0, 22.0, 24.0, 26.0, 24.0, 18.0, 15.0, 16.0, 12.0, 8.0, 2.0, 8.0, 9.0, 8.0, 5.0, 4.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-322.82275390625, -311.8260192871094, -300.8292541503906, -289.83251953125, -278.83575439453125, -267.8390197753906, -256.84228515625, -245.8455352783203, -234.84878540039062, -223.85203552246094, -212.85528564453125, -201.85855102539062, -190.86180114746094, -179.86505126953125, -168.86831665039062, -157.87156677246094, -146.87481689453125, -135.87806701660156, -124.8813247680664, -113.88458251953125, -102.88783264160156, -91.89108276367188, -80.89434051513672, -69.89759826660156, -58.900848388671875, -47.90410232543945, -36.90735626220703, -25.91061019897461, -14.913864135742188, -3.9171180725097656, 7.079627990722656, 18.076370239257812, 29.0731201171875, 40.06986618041992, 51.066612243652344, 62.063358306884766, 73.06010437011719, 84.05685424804688, 95.05359649658203, 106.05033874511719, 117.04708862304688, 128.04383850097656, 139.04058837890625, 150.03732299804688, 161.03407287597656, 172.03082275390625, 183.02755737304688, 194.02430725097656, 205.02105712890625, 216.01780700683594, 227.01455688476562, 238.01129150390625, 249.00804138183594, 260.0047912597656, 271.00152587890625, 281.998291015625, 292.9950256347656, 303.99176025390625, 314.988525390625, 325.9852600097656, 336.98199462890625, 347.978759765625, 358.9754943847656, 369.97222900390625, 380.968994140625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 5.0, 2.0, 6.0, 11.0, 10.0, 14.0, 22.0, 23.0, 27.0, 33.0, 37.0, 58.0, 68.0, 77.0, 87.0, 131.0, 155.0, 203.0, 282.0, 391.0, 562.0, 895.0, 1041470.0, 1215.0, 714.0, 509.0, 391.0, 265.0, 195.0, 135.0, 109.0, 82.0, 80.0, 61.0, 46.0, 40.0, 29.0, 25.0, 23.0, 14.0, 11.0, 13.0, 7.0, 6.0, 6.0, 4.0, 7.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-129.21395874023438, -125.506103515625, -121.79825592041016, -118.09040069580078, -114.38255310058594, -110.67469787597656, -106.96684265136719, -103.25899505615234, -99.55113983154297, -95.8432846069336, -92.13543701171875, -88.42758178710938, -84.71973419189453, -81.01187896728516, -77.30403137207031, -73.59617614746094, -69.88832092285156, -66.18046569824219, -62.472618103027344, -58.76476287841797, -55.05691146850586, -51.34906005859375, -47.64120864868164, -43.93335723876953, -40.22550964355469, -36.51765823364258, -32.80980682373047, -29.101953506469727, -25.394100189208984, -21.686248779296875, -17.978397369384766, -14.270544052124023, -10.562690734863281, -6.8548383712768555, -3.146986484527588, 0.5608654022216797, 4.2687177658081055, 7.976570129394531, 11.68442153930664, 15.392274856567383, 19.100126266479492, 22.8079776763916, 26.515830993652344, 30.223682403564453, 33.93153381347656, 37.63938903808594, 41.34723663330078, 45.055091857910156, 48.762943267822266, 52.470794677734375, 56.178646087646484, 59.886497497558594, 63.59435272216797, 67.30220031738281, 71.01005554199219, 74.71791076660156, 78.4257583618164, 82.13361358642578, 85.84146118164062, 89.54931640625, 93.25716400146484, 96.96501922607422, 100.67286682128906, 104.38072204589844, 108.08857727050781]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 3.0, 8.0, 9.0, 11.0, 20.0, 22.0, 31.0, 46.0, 129.0, 796.0, 51427168.0, 34027.0, 662.0, 108.0, 41.0, 18.0, 16.0, 9.0, 5.0, 8.0, 13.0, 3.0, 4.0, 6.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-947.4556884765625, -910.9619750976562, -874.46826171875, -837.9745483398438, -801.4808349609375, -764.9871826171875, -728.4934692382812, -691.999755859375, -655.5060424804688, -619.0123291015625, -582.5186157226562, -546.02490234375, -509.5312194824219, -473.0375061035156, -436.5438232421875, -400.05010986328125, -363.556396484375, -327.06268310546875, -290.5689697265625, -254.07528686523438, -217.58157348632812, -181.08786010742188, -144.5941619873047, -108.1004638671875, -71.60675048828125, -35.11304473876953, 1.3806610107421875, 37.874366760253906, 74.36807250976562, 110.86178588867188, 147.35548400878906, 183.84918212890625, 220.3427734375, 256.83648681640625, 293.3302001953125, 329.8238830566406, 366.3175964355469, 402.8113098144531, 439.30499267578125, 475.7987060546875, 512.2924194335938, 548.7861328125, 585.2798461914062, 621.7735595703125, 658.2672119140625, 694.760986328125, 731.254638671875, 767.7483520507812, 804.2420654296875, 840.7357788085938, 877.2294921875, 913.7232055664062, 950.2169189453125, 986.7105712890625, 1023.2042846679688, 1059.697998046875, 1096.191650390625, 1132.685302734375, 1169.1790771484375, 1205.6727294921875, 1242.16650390625, 1278.66015625, 1315.1539306640625, 1351.6475830078125, 1388.141357421875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 5.0, 5.0, 9.0, 7.0, 15.0, 22.0, 38.0, 78.0, 171.0, 239.0, 400.0, 516.0, 761.0, 1069.0, 1518.0, 2360.0, 3605.0, 5586.0, 8668.0, 14220.0, 22126.0, 36893.0, 61161.0, 104489.0, 182662.0, 339232.0, 686611.0, 3895359.0, 403631.0, 215679.0, 121105.0, 71208.0, 42044.0, 25633.0, 15983.0, 9860.0, 6256.0, 4240.0, 2722.0, 1786.0, 1171.0, 772.0, 456.0, 345.0, 214.0, 137.0, 98.0, 76.0, 74.0, 54.0, 34.0, 23.0, 8.0, 7.0, 0.0, 0.0, 2.0], "bins": [-1.248046875, -1.21148681640625, -1.1749267578125, -1.13836669921875, -1.101806640625, -1.06524658203125, -1.0286865234375, -0.99212646484375, -0.95556640625, -0.91900634765625, -0.8824462890625, -0.84588623046875, -0.809326171875, -0.77276611328125, -0.7362060546875, -0.69964599609375, -0.6630859375, -0.62652587890625, -0.5899658203125, -0.55340576171875, -0.516845703125, -0.48028564453125, -0.4437255859375, -0.40716552734375, -0.37060546875, -0.33404541015625, -0.2974853515625, -0.26092529296875, -0.224365234375, -0.18780517578125, -0.1512451171875, -0.11468505859375, -0.078125, -0.04156494140625, -0.0050048828125, 0.03155517578125, 0.068115234375, 0.10467529296875, 0.1412353515625, 0.17779541015625, 0.21435546875, 0.25091552734375, 0.2874755859375, 0.32403564453125, 0.360595703125, 0.39715576171875, 0.4337158203125, 0.47027587890625, 0.5068359375, 0.54339599609375, 0.5799560546875, 0.61651611328125, 0.653076171875, 0.68963623046875, 0.7261962890625, 0.76275634765625, 0.79931640625, 0.83587646484375, 0.8724365234375, 0.90899658203125, 0.945556640625, 0.98211669921875, 1.0186767578125, 1.05523681640625, 1.091796875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 5.0, 7.0, 11.0, 14.0, 10.0, 25.0, 16.0, 32.0, 26.0, 27.0, 42.0, 32.0, 41.0, 32.0, 37.0, 40.0, 39.0, 1087.0, 37.0, 51.0, 41.0, 35.0, 35.0, 44.0, 27.0, 33.0, 36.0, 24.0, 26.0, 27.0, 14.0, 10.0, 11.0, 7.0, 6.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 5.0, 0.0, 2.0], "bins": [-114.6875, -111.4384765625, -108.189453125, -104.9404296875, -101.69140625, -98.4423828125, -95.193359375, -91.9443359375, -88.6953125, -85.4462890625, -82.197265625, -78.9482421875, -75.69921875, -72.4501953125, -69.201171875, -65.9521484375, -62.703125, -59.4541015625, -56.205078125, -52.9560546875, -49.70703125, -46.4580078125, -43.208984375, -39.9599609375, -36.7109375, -33.4619140625, -30.212890625, -26.9638671875, -23.71484375, -20.4658203125, -17.216796875, -13.9677734375, -10.71875, -7.4697265625, -4.220703125, -0.9716796875, 2.27734375, 5.5263671875, 8.775390625, 12.0244140625, 15.2734375, 18.5224609375, 21.771484375, 25.0205078125, 28.26953125, 31.5185546875, 34.767578125, 38.0166015625, 41.265625, 44.5146484375, 47.763671875, 51.0126953125, 54.26171875, 57.5107421875, 60.759765625, 64.0087890625, 67.2578125, 70.5068359375, 73.755859375, 77.0048828125, 80.25390625, 83.5029296875, 86.751953125, 90.0009765625, 93.25]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 5.0, 5.0, 10.0, 18.0, 13.0, 30.0, 49.0, 54.0, 58.0, 122.0, 133.0, 216.0, 329.0, 497.0, 697.0, 1037.0, 1463.0, 2079.0, 3157.0, 4877.0, 7059.0, 10526.0, 16452.0, 24488.0, 37595.0, 57265.0, 88896.0, 143730.0, 249456.0, 474989.0, 4007283.0, 492365.0, 255988.0, 148192.0, 90765.0, 58786.0, 38065.0, 25262.0, 16427.0, 11012.0, 7142.0, 4888.0, 3155.0, 2086.0, 1489.0, 1044.0, 642.0, 455.0, 331.0, 245.0, 174.0, 114.0, 56.0, 59.0, 25.0, 28.0, 19.0, 12.0, 18.0, 10.0, 5.0], "bins": [-1.482421875, -1.438201904296875, -1.39398193359375, -1.349761962890625, -1.3055419921875, -1.261322021484375, -1.21710205078125, -1.172882080078125, -1.128662109375, -1.084442138671875, -1.04022216796875, -0.996002197265625, -0.9517822265625, -0.907562255859375, -0.86334228515625, -0.819122314453125, -0.77490234375, -0.730682373046875, -0.68646240234375, -0.642242431640625, -0.5980224609375, -0.553802490234375, -0.50958251953125, -0.465362548828125, -0.421142578125, -0.376922607421875, -0.33270263671875, -0.288482666015625, -0.2442626953125, -0.200042724609375, -0.15582275390625, -0.111602783203125, -0.0673828125, -0.023162841796875, 0.02105712890625, 0.065277099609375, 0.1094970703125, 0.153717041015625, 0.19793701171875, 0.242156982421875, 0.286376953125, 0.330596923828125, 0.37481689453125, 0.419036865234375, 0.4632568359375, 0.507476806640625, 0.55169677734375, 0.595916748046875, 0.64013671875, 0.684356689453125, 0.72857666015625, 0.772796630859375, 0.8170166015625, 0.861236572265625, 0.90545654296875, 0.949676513671875, 0.993896484375, 1.038116455078125, 1.08233642578125, 1.126556396484375, 1.1707763671875, 1.214996337890625, 1.25921630859375, 1.303436279296875, 1.34765625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 3.0, 4.0, 11.0, 15.0, 13.0, 14.0, 20.0, 21.0, 24.0, 24.0, 24.0, 30.0, 35.0, 33.0, 46.0, 35.0, 43.0, 40.0, 33.0, 1062.0, 29.0, 43.0, 34.0, 39.0, 36.0, 33.0, 26.0, 25.0, 25.0, 24.0, 22.0, 27.0, 23.0, 14.0, 17.0, 18.0, 5.0, 12.0, 11.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.5, -124.275390625, -120.05078125, -115.826171875, -111.6015625, -107.376953125, -103.15234375, -98.927734375, -94.703125, -90.478515625, -86.25390625, -82.029296875, -77.8046875, -73.580078125, -69.35546875, -65.130859375, -60.90625, -56.681640625, -52.45703125, -48.232421875, -44.0078125, -39.783203125, -35.55859375, -31.333984375, -27.109375, -22.884765625, -18.66015625, -14.435546875, -10.2109375, -5.986328125, -1.76171875, 2.462890625, 6.6875, 10.912109375, 15.13671875, 19.361328125, 23.5859375, 27.810546875, 32.03515625, 36.259765625, 40.484375, 44.708984375, 48.93359375, 53.158203125, 57.3828125, 61.607421875, 65.83203125, 70.056640625, 74.28125, 78.505859375, 82.73046875, 86.955078125, 91.1796875, 95.404296875, 99.62890625, 103.853515625, 108.078125, 112.302734375, 116.52734375, 120.751953125, 124.9765625, 129.201171875, 133.42578125, 137.650390625, 141.875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 14.0, 21.0, 13.0, 31.0, 55.0, 63.0, 109.0, 120.0, 150.0, 253.0, 382.0, 455.0, 644.0, 854.0, 1324.0, 1746.0, 2452.0, 3451.0, 5080.0, 7461.0, 10768.0, 16349.0, 26865.0, 48420.0, 141316.0, 5745100.0, 149459.0, 49473.0, 26939.0, 16649.0, 10720.0, 7543.0, 5030.0, 3426.0, 2367.0, 1833.0, 1219.0, 862.0, 687.0, 499.0, 322.0, 244.0, 184.0, 137.0, 81.0, 70.0, 42.0, 36.0, 54.0, 23.0, 10.0, 5.0, 3.0, 5.0, 7.0, 4.0], "bins": [-3.71875, -3.6077880859375, -3.496826171875, -3.3858642578125, -3.27490234375, -3.1639404296875, -3.052978515625, -2.9420166015625, -2.8310546875, -2.7200927734375, -2.609130859375, -2.4981689453125, -2.38720703125, -2.2762451171875, -2.165283203125, -2.0543212890625, -1.943359375, -1.8323974609375, -1.721435546875, -1.6104736328125, -1.49951171875, -1.3885498046875, -1.277587890625, -1.1666259765625, -1.0556640625, -0.9447021484375, -0.833740234375, -0.7227783203125, -0.61181640625, -0.5008544921875, -0.389892578125, -0.2789306640625, -0.16796875, -0.0570068359375, 0.053955078125, 0.1649169921875, 0.27587890625, 0.3868408203125, 0.497802734375, 0.6087646484375, 0.7197265625, 0.8306884765625, 0.941650390625, 1.0526123046875, 1.16357421875, 1.2745361328125, 1.385498046875, 1.4964599609375, 1.607421875, 1.7183837890625, 1.829345703125, 1.9403076171875, 2.05126953125, 2.1622314453125, 2.273193359375, 2.3841552734375, 2.4951171875, 2.6060791015625, 2.717041015625, 2.8280029296875, 2.93896484375, 3.0499267578125, 3.160888671875, 3.2718505859375, 3.3828125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 6.0, 11.0, 13.0, 12.0, 13.0, 13.0, 11.0, 25.0, 21.0, 31.0, 35.0, 33.0, 22.0, 35.0, 39.0, 48.0, 46.0, 44.0, 1069.0, 41.0, 38.0, 46.0, 34.0, 37.0, 31.0, 35.0, 33.0, 34.0, 20.0, 21.0, 17.0, 13.0, 15.0, 8.0, 15.0, 8.0, 10.0, 6.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-194.25, -188.568359375, -182.88671875, -177.205078125, -171.5234375, -165.841796875, -160.16015625, -154.478515625, -148.796875, -143.115234375, -137.43359375, -131.751953125, -126.0703125, -120.388671875, -114.70703125, -109.025390625, -103.34375, -97.662109375, -91.98046875, -86.298828125, -80.6171875, -74.935546875, -69.25390625, -63.572265625, -57.890625, -52.208984375, -46.52734375, -40.845703125, -35.1640625, -29.482421875, -23.80078125, -18.119140625, -12.4375, -6.755859375, -1.07421875, 4.607421875, 10.2890625, 15.970703125, 21.65234375, 27.333984375, 33.015625, 38.697265625, 44.37890625, 50.060546875, 55.7421875, 61.423828125, 67.10546875, 72.787109375, 78.46875, 84.150390625, 89.83203125, 95.513671875, 101.1953125, 106.876953125, 112.55859375, 118.240234375, 123.921875, 129.603515625, 135.28515625, 140.966796875, 146.6484375, 152.330078125, 158.01171875, 163.693359375, 169.375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 12.0, 8.0, 17.0, 30.0, 50.0, 94.0, 503.0, 135.0, 42.0, 34.0, 19.0, 11.0, 8.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.89189147949219, -105.8975601196289, -99.9032211303711, -93.90888977050781, -87.91455078125, -81.92021942138672, -75.92588806152344, -69.93154907226562, -63.937217712402344, -57.9428825378418, -51.94854736328125, -45.95421600341797, -39.95988082885742, -33.965545654296875, -27.971214294433594, -21.976879119873047, -15.9825439453125, -9.98820972442627, -3.993875503540039, 2.000457763671875, 7.994792938232422, 13.989128112792969, 19.98345947265625, 25.977794647216797, 31.972129821777344, 37.96646499633789, 43.96080017089844, 49.95513153076172, 55.949466705322266, 61.94380187988281, 67.9381332397461, 73.93246459960938, 79.92678833007812, 85.9211196899414, 91.91545867919922, 97.9097900390625, 103.90412902832031, 109.8984603881836, 115.89279174804688, 121.88713073730469, 127.88146209716797, 133.87579345703125, 139.87013244628906, 145.86447143554688, 151.85879516601562, 157.85313415527344, 163.84747314453125, 169.841796875, 175.8361358642578, 181.83047485351562, 187.82479858398438, 193.8191375732422, 199.8134765625, 205.80780029296875, 211.80213928222656, 217.79647827148438, 223.79080200195312, 229.78514099121094, 235.7794647216797, 241.7738037109375, 247.7681427001953, 253.76248168945312, 259.7568054199219, 265.7511291503906, 271.7454833984375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 4.0, 13.0, 50.0, 308.0, 463.0, 122.0, 18.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1459.41357421875, -1422.2220458984375, -1385.030517578125, -1347.8388671875, -1310.6473388671875, -1273.455810546875, -1236.2642822265625, -1199.07275390625, -1161.881103515625, -1124.6895751953125, -1087.498046875, -1050.306396484375, -1013.1148681640625, -975.92333984375, -938.7318115234375, -901.5402221679688, -864.3486938476562, -827.1571655273438, -789.965576171875, -752.7740478515625, -715.5824584960938, -678.3909301757812, -641.1993408203125, -604.0078125, -566.8162841796875, -529.624755859375, -492.43316650390625, -455.24163818359375, -418.050048828125, -380.8585205078125, -343.6669616699219, -306.47540283203125, -269.28375244140625, -232.09219360351562, -194.900634765625, -157.70909118652344, -120.51753234863281, -83.32597351074219, -46.134429931640625, -8.94287109375, 28.248687744140625, 65.44024658203125, 102.63179779052734, 139.82334899902344, 177.01490783691406, 214.2064666748047, 251.39801025390625, 288.5895690917969, 325.7811279296875, 362.9726867675781, 400.16424560546875, 437.35577392578125, 474.54736328125, 511.7388916015625, 548.930419921875, 586.1220092773438, 623.3135986328125, 660.505126953125, 697.6967163085938, 734.8882446289062, 772.079833984375, 809.2713623046875, 846.462890625, 883.6544799804688, 920.8460083007812]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 4.0, 6.0, 3.0, 8.0, 3.0, 7.0, 7.0, 6.0, 15.0, 7.0, 6.0, 21.0, 12.0, 14.0, 9.0, 16.0, 17.0, 15.0, 18.0, 9.0, 19.0, 19.0, 23.0, 28.0, 39.0, 46.0, 47.0, 66.0, 64.0, 76.0, 84.0, 89.0, 156.0, 257.0, 379.0, 647.0, 1059.0, 1865.0, 2874.0, 8490.0, 4126628.0, 34373.0, 7266.0, 4409.0, 2054.0, 1028.0, 562.0, 374.0, 263.0, 194.0, 159.0, 137.0, 94.0, 63.0, 56.0, 40.0, 24.0, 14.0, 9.0, 10.0, 7.0], "bins": [-11.703125, -11.43695068359375, -11.1707763671875, -10.90460205078125, -10.638427734375, -10.37225341796875, -10.1060791015625, -9.83990478515625, -9.57373046875, -9.30755615234375, -9.0413818359375, -8.77520751953125, -8.509033203125, -8.24285888671875, -7.9766845703125, -7.71051025390625, -7.4443359375, -7.17816162109375, -6.9119873046875, -6.64581298828125, -6.379638671875, -6.11346435546875, -5.8472900390625, -5.58111572265625, -5.31494140625, -5.04876708984375, -4.7825927734375, -4.51641845703125, -4.250244140625, -3.98406982421875, -3.7178955078125, -3.45172119140625, -3.185546875, -2.91937255859375, -2.6531982421875, -2.38702392578125, -2.120849609375, -1.85467529296875, -1.5885009765625, -1.32232666015625, -1.05615234375, -0.78997802734375, -0.5238037109375, -0.25762939453125, 0.008544921875, 0.27471923828125, 0.5408935546875, 0.80706787109375, 1.0732421875, 1.33941650390625, 1.6055908203125, 1.87176513671875, 2.137939453125, 2.40411376953125, 2.6702880859375, 2.93646240234375, 3.20263671875, 3.46881103515625, 3.7349853515625, 4.00115966796875, 4.267333984375, 4.53350830078125, 4.7996826171875, 5.06585693359375, 5.33203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 22.0, 27.0, 463.0, 403.0, 22.0, 14.0, 16.0, 10.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7610969543457031, -0.7433853149414062, -0.7256736755371094, -0.7079620361328125, -0.6902503967285156, -0.6725387573242188, -0.6548271179199219, -0.637115478515625, -0.6194038391113281, -0.6016921997070312, -0.5839805603027344, -0.5662689208984375, -0.5485572814941406, -0.5308456420898438, -0.5131340026855469, -0.49542236328125, -0.4777107238769531, -0.45999908447265625, -0.4422874450683594, -0.4245758056640625, -0.4068641662597656, -0.38915252685546875, -0.3714408874511719, -0.353729248046875, -0.3360176086425781, -0.31830596923828125, -0.3005943298339844, -0.2828826904296875, -0.2651710510253906, -0.24745941162109375, -0.22974777221679688, -0.2120361328125, -0.19432449340820312, -0.17661285400390625, -0.15890121459960938, -0.1411895751953125, -0.12347793579101562, -0.10576629638671875, -0.08805465698242188, -0.070343017578125, -0.052631378173828125, -0.03491973876953125, -0.017208099365234375, 0.0005035400390625, 0.018215179443359375, 0.03592681884765625, 0.053638458251953125, 0.07135009765625, 0.08906173706054688, 0.10677337646484375, 0.12448501586914062, 0.1421966552734375, 0.15990829467773438, 0.17761993408203125, 0.19533157348632812, 0.213043212890625, 0.23075485229492188, 0.24846649169921875, 0.2661781311035156, 0.2838897705078125, 0.3016014099121094, 0.31931304931640625, 0.3370246887207031, 0.354736328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 12.0, 15.0, 18.0, 24.0, 34.0, 45.0, 71.0, 102.0, 130.0, 197.0, 313.0, 458.0, 717.0, 1222.0, 1972.0, 3600.0, 6696.0, 14394.0, 49162.0, 4050491.0, 36487.0, 12906.0, 6212.0, 3552.0, 2036.0, 1260.0, 766.0, 511.0, 319.0, 190.0, 119.0, 87.0, 47.0, 29.0, 26.0, 13.0, 7.0, 8.0, 3.0, 7.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.431640625, -1.386016845703125, -1.34039306640625, -1.294769287109375, -1.2491455078125, -1.203521728515625, -1.15789794921875, -1.112274169921875, -1.066650390625, -1.021026611328125, -0.97540283203125, -0.929779052734375, -0.8841552734375, -0.838531494140625, -0.79290771484375, -0.747283935546875, -0.70166015625, -0.656036376953125, -0.61041259765625, -0.564788818359375, -0.5191650390625, -0.473541259765625, -0.42791748046875, -0.382293701171875, -0.336669921875, -0.291046142578125, -0.24542236328125, -0.199798583984375, -0.1541748046875, -0.108551025390625, -0.06292724609375, -0.017303466796875, 0.0283203125, 0.073944091796875, 0.11956787109375, 0.165191650390625, 0.2108154296875, 0.256439208984375, 0.30206298828125, 0.347686767578125, 0.393310546875, 0.438934326171875, 0.48455810546875, 0.530181884765625, 0.5758056640625, 0.621429443359375, 0.66705322265625, 0.712677001953125, 0.75830078125, 0.803924560546875, 0.84954833984375, 0.895172119140625, 0.9407958984375, 0.986419677734375, 1.03204345703125, 1.077667236328125, 1.123291015625, 1.168914794921875, 1.21453857421875, 1.260162353515625, 1.3057861328125, 1.351409912109375, 1.39703369140625, 1.442657470703125, 1.48828125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 8.0, 8.0, 10.0, 9.0, 14.0, 15.0, 22.0, 18.0, 144.0, 3635.0, 28.0, 21.0, 17.0, 22.0, 16.0, 15.0, 10.0, 11.0, 9.0, 9.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65478515625, -0.6380386352539062, -0.6212921142578125, -0.6045455932617188, -0.587799072265625, -0.5710525512695312, -0.5543060302734375, -0.5375595092773438, -0.52081298828125, -0.5040664672851562, -0.4873199462890625, -0.47057342529296875, -0.453826904296875, -0.43708038330078125, -0.4203338623046875, -0.40358734130859375, -0.3868408203125, -0.37009429931640625, -0.3533477783203125, -0.33660125732421875, -0.319854736328125, -0.30310821533203125, -0.2863616943359375, -0.26961517333984375, -0.25286865234375, -0.23612213134765625, -0.2193756103515625, -0.20262908935546875, -0.185882568359375, -0.16913604736328125, -0.1523895263671875, -0.13564300537109375, -0.118896484375, -0.10214996337890625, -0.0854034423828125, -0.06865692138671875, -0.051910400390625, -0.03516387939453125, -0.0184173583984375, -0.00167083740234375, 0.01507568359375, 0.03182220458984375, 0.0485687255859375, 0.06531524658203125, 0.082061767578125, 0.09880828857421875, 0.1155548095703125, 0.13230133056640625, 0.1490478515625, 0.16579437255859375, 0.1825408935546875, 0.19928741455078125, 0.216033935546875, 0.23278045654296875, 0.2495269775390625, 0.26627349853515625, 0.28302001953125, 0.29976654052734375, 0.3165130615234375, 0.33325958251953125, 0.350006103515625, 0.36675262451171875, 0.3834991455078125, 0.40024566650390625, 0.4169921875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 14.0, 66.0, 782.0, 95.0, 19.0, 15.0, 7.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5481555461883545, -2.2760331630706787, -2.003910541534424, -1.731788158416748, -1.4596656560897827, -1.1875431537628174, -0.9154207706451416, -0.6432982683181763, -0.37117576599121094, -0.099053293466568, 0.17306917905807495, 0.4451916217803955, 0.7173141241073608, 0.9894366264343262, 1.261559009552002, 1.5336815118789673, 1.8058040142059326, 2.0779263973236084, 2.3500490188598633, 2.622171401977539, 2.894293785095215, 3.1664164066314697, 3.4385387897491455, 3.7106614112854004, 3.982783794403076, 4.254906177520752, 4.527028560638428, 4.799151420593262, 5.0712738037109375, 5.343396186828613, 5.615518569946289, 5.887640953063965, 6.159763336181641, 6.431885719299316, 6.704008102416992, 6.976130485534668, 7.248253345489502, 7.520375728607178, 7.7924981117248535, 8.064620971679688, 8.336743354797363, 8.608865737915039, 8.880988121032715, 9.15311050415039, 9.425232887268066, 9.697355270385742, 9.969478607177734, 10.24160099029541, 10.513723373413086, 10.785845756530762, 11.057968139648438, 11.330090522766113, 11.602212905883789, 11.874336242675781, 12.14645767211914, 12.418581008911133, 12.690702438354492, 12.962824821472168, 13.234947204589844, 13.50706958770752, 13.779191970825195, 14.051315307617188, 14.323436737060547, 14.595560073852539, 14.867682456970215]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 7.0, 22.0, 30.0, 45.0, 71.0, 97.0, 136.0, 141.0, 160.0, 116.0, 60.0, 47.0, 21.0, 13.0, 15.0, 7.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.243732213973999, -3.1306803226470947, -3.0176284313201904, -2.904576539993286, -2.791524648666382, -2.6784727573394775, -2.5654208660125732, -2.452368974685669, -2.3393170833587646, -2.2262651920318604, -2.113213300704956, -2.0001614093780518, -1.8871095180511475, -1.7740576267242432, -1.6610057353973389, -1.5479538440704346, -1.4349019527435303, -1.321850061416626, -1.2087981700897217, -1.0957462787628174, -0.9826943874359131, -0.8696424961090088, -0.7565906047821045, -0.6435387134552002, -0.5304868221282959, -0.4174349308013916, -0.3043830394744873, -0.191331148147583, -0.07827925682067871, 0.034772634506225586, 0.14782452583312988, 0.2608764171600342, 0.3739280700683594, 0.48697996139526367, 0.600031852722168, 0.7130837440490723, 0.8261356353759766, 0.9391875267028809, 1.0522394180297852, 1.1652913093566895, 1.2783432006835938, 1.391395092010498, 1.5044469833374023, 1.6174988746643066, 1.730550765991211, 1.8436026573181152, 1.9566545486450195, 2.069706439971924, 2.182758331298828, 2.2958102226257324, 2.4088621139526367, 2.521914005279541, 2.6349658966064453, 2.7480177879333496, 2.861069679260254, 2.974121570587158, 3.0871734619140625, 3.200225353240967, 3.313277244567871, 3.4263291358947754, 3.5393810272216797, 3.652432918548584, 3.7654848098754883, 3.8785367012023926, 3.991588592529297]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 13.0, 6.0, 15.0, 12.0, 13.0, 24.0, 23.0, 35.0, 85.0, 99.0, 150.0, 211.0, 452.0, 896.0, 2239.0, 8225.0, 83593.0, 937778.0, 9856.0, 2598.0, 988.0, 457.0, 257.0, 165.0, 110.0, 59.0, 55.0, 30.0, 17.0, 21.0, 19.0, 10.0, 9.0, 6.0, 8.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.34765625, -5.203338623046875, -5.05902099609375, -4.914703369140625, -4.7703857421875, -4.626068115234375, -4.48175048828125, -4.337432861328125, -4.193115234375, -4.048797607421875, -3.90447998046875, -3.760162353515625, -3.6158447265625, -3.471527099609375, -3.32720947265625, -3.182891845703125, -3.03857421875, -2.894256591796875, -2.74993896484375, -2.605621337890625, -2.4613037109375, -2.316986083984375, -2.17266845703125, -2.028350830078125, -1.884033203125, -1.739715576171875, -1.59539794921875, -1.451080322265625, -1.3067626953125, -1.162445068359375, -1.01812744140625, -0.873809814453125, -0.7294921875, -0.585174560546875, -0.44085693359375, -0.296539306640625, -0.1522216796875, -0.007904052734375, 0.13641357421875, 0.280731201171875, 0.425048828125, 0.569366455078125, 0.71368408203125, 0.858001708984375, 1.0023193359375, 1.146636962890625, 1.29095458984375, 1.435272216796875, 1.57958984375, 1.723907470703125, 1.86822509765625, 2.012542724609375, 2.1568603515625, 2.301177978515625, 2.44549560546875, 2.589813232421875, 2.734130859375, 2.878448486328125, 3.02276611328125, 3.167083740234375, 3.3114013671875, 3.455718994140625, 3.60003662109375, 3.744354248046875, 3.888671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 9.0, 1.0, 10.0, 22.0, 30.0, 819.0, 44.0, 20.0, 17.0, 13.0, 9.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77197265625, -0.7543525695800781, -0.7367324829101562, -0.7191123962402344, -0.7014923095703125, -0.6838722229003906, -0.6662521362304688, -0.6486320495605469, -0.631011962890625, -0.6133918762207031, -0.5957717895507812, -0.5781517028808594, -0.5605316162109375, -0.5429115295410156, -0.5252914428710938, -0.5076713562011719, -0.49005126953125, -0.4724311828613281, -0.45481109619140625, -0.4371910095214844, -0.4195709228515625, -0.4019508361816406, -0.38433074951171875, -0.3667106628417969, -0.349090576171875, -0.3314704895019531, -0.31385040283203125, -0.2962303161621094, -0.2786102294921875, -0.2609901428222656, -0.24337005615234375, -0.22574996948242188, -0.2081298828125, -0.19050979614257812, -0.17288970947265625, -0.15526962280273438, -0.1376495361328125, -0.12002944946289062, -0.10240936279296875, -0.08478927612304688, -0.067169189453125, -0.049549102783203125, -0.03192901611328125, -0.014308929443359375, 0.0033111572265625, 0.020931243896484375, 0.03855133056640625, 0.056171417236328125, 0.07379150390625, 0.09141159057617188, 0.10903167724609375, 0.12665176391601562, 0.1442718505859375, 0.16189193725585938, 0.17951202392578125, 0.19713211059570312, 0.214752197265625, 0.23237228393554688, 0.24999237060546875, 0.2676124572753906, 0.2852325439453125, 0.3028526306152344, 0.32047271728515625, 0.3380928039550781, 0.355712890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 7.0, 2.0, 9.0, 21.0, 16.0, 27.0, 41.0, 44.0, 73.0, 102.0, 123.0, 182.0, 274.0, 417.0, 630.0, 921.0, 1374.0, 2149.0, 3589.0, 5943.0, 9665.0, 16955.0, 32085.0, 71849.0, 355580.0, 397627.0, 73494.0, 32439.0, 16800.0, 9871.0, 5989.0, 3587.0, 2274.0, 1506.0, 945.0, 635.0, 373.0, 279.0, 214.0, 133.0, 103.0, 68.0, 40.0, 17.0, 18.0, 26.0, 9.0, 8.0, 10.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.59814453125, -0.5800247192382812, -0.5619049072265625, -0.5437850952148438, -0.525665283203125, -0.5075454711914062, -0.4894256591796875, -0.47130584716796875, -0.45318603515625, -0.43506622314453125, -0.4169464111328125, -0.39882659912109375, -0.380706787109375, -0.36258697509765625, -0.3444671630859375, -0.32634735107421875, -0.3082275390625, -0.29010772705078125, -0.2719879150390625, -0.25386810302734375, -0.235748291015625, -0.21762847900390625, -0.1995086669921875, -0.18138885498046875, -0.16326904296875, -0.14514923095703125, -0.1270294189453125, -0.10890960693359375, -0.090789794921875, -0.07266998291015625, -0.0545501708984375, -0.03643035888671875, -0.018310546875, -0.00019073486328125, 0.0179290771484375, 0.03604888916015625, 0.054168701171875, 0.07228851318359375, 0.0904083251953125, 0.10852813720703125, 0.12664794921875, 0.14476776123046875, 0.1628875732421875, 0.18100738525390625, 0.199127197265625, 0.21724700927734375, 0.2353668212890625, 0.25348663330078125, 0.2716064453125, 0.28972625732421875, 0.3078460693359375, 0.32596588134765625, 0.344085693359375, 0.36220550537109375, 0.3803253173828125, 0.39844512939453125, 0.41656494140625, 0.43468475341796875, 0.4528045654296875, 0.47092437744140625, 0.489044189453125, 0.5071640014648438, 0.5252838134765625, 0.5434036254882812, 0.5615234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 12.0, 12.0, 17.0, 19.0, 15.0, 18.0, 26.0, 23.0, 36.0, 37.0, 38.0, 30.0, 34.0, 38.0, 36.0, 33.0, 53.0, 43.0, 51.0, 42.0, 53.0, 32.0, 37.0, 40.0, 35.0, 19.0, 25.0, 21.0, 20.0, 20.0, 17.0, 11.0, 14.0, 7.0, 7.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.63134765625, -0.6109695434570312, -0.5905914306640625, -0.5702133178710938, -0.549835205078125, -0.5294570922851562, -0.5090789794921875, -0.48870086669921875, -0.46832275390625, -0.44794464111328125, -0.4275665283203125, -0.40718841552734375, -0.386810302734375, -0.36643218994140625, -0.3460540771484375, -0.32567596435546875, -0.3052978515625, -0.28491973876953125, -0.2645416259765625, -0.24416351318359375, -0.223785400390625, -0.20340728759765625, -0.1830291748046875, -0.16265106201171875, -0.14227294921875, -0.12189483642578125, -0.1015167236328125, -0.08113861083984375, -0.060760498046875, -0.04038238525390625, -0.0200042724609375, 0.00037384033203125, 0.020751953125, 0.04113006591796875, 0.0615081787109375, 0.08188629150390625, 0.102264404296875, 0.12264251708984375, 0.1430206298828125, 0.16339874267578125, 0.18377685546875, 0.20415496826171875, 0.2245330810546875, 0.24491119384765625, 0.265289306640625, 0.28566741943359375, 0.3060455322265625, 0.32642364501953125, 0.3468017578125, 0.36717987060546875, 0.3875579833984375, 0.40793609619140625, 0.428314208984375, 0.44869232177734375, 0.4690704345703125, 0.48944854736328125, 0.50982666015625, 0.5302047729492188, 0.5505828857421875, 0.5709609985351562, 0.591339111328125, 0.6117172241210938, 0.6320953369140625, 0.6524734497070312, 0.6728515625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 9.0, 20.0, 52.0, 131.0, 489.0, 4846.0, 1032920.0, 9245.0, 548.0, 151.0, 69.0, 25.0, 17.0, 7.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.059326171875, -0.05799531936645508, -0.056664466857910156, -0.055333614349365234, -0.05400276184082031, -0.05267190933227539, -0.05134105682373047, -0.05001020431518555, -0.048679351806640625, -0.0473484992980957, -0.04601764678955078, -0.04468679428100586, -0.04335594177246094, -0.042025089263916016, -0.040694236755371094, -0.03936338424682617, -0.03803253173828125, -0.03670167922973633, -0.035370826721191406, -0.034039974212646484, -0.03270912170410156, -0.03137826919555664, -0.03004741668701172, -0.028716564178466797, -0.027385711669921875, -0.026054859161376953, -0.02472400665283203, -0.02339315414428711, -0.022062301635742188, -0.020731449127197266, -0.019400596618652344, -0.018069744110107422, -0.0167388916015625, -0.015408039093017578, -0.014077186584472656, -0.012746334075927734, -0.011415481567382812, -0.01008462905883789, -0.008753776550292969, -0.007422924041748047, -0.006092071533203125, -0.004761219024658203, -0.0034303665161132812, -0.0020995140075683594, -0.0007686614990234375, 0.0005621910095214844, 0.0018930435180664062, 0.003223896026611328, 0.00455474853515625, 0.005885601043701172, 0.007216453552246094, 0.008547306060791016, 0.009878158569335938, 0.01120901107788086, 0.012539863586425781, 0.013870716094970703, 0.015201568603515625, 0.016532421112060547, 0.01786327362060547, 0.01919412612915039, 0.020524978637695312, 0.021855831146240234, 0.023186683654785156, 0.024517536163330078, 0.025848388671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 15.0, 16.0, 28.0, 31.0, 65.0, 88.0, 117.0, 126.0, 103.0, 117.0, 78.0, 73.0, 40.0, 34.0, 17.0, 14.0, 5.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-06, -6.350688636302948e-06, -6.144866347312927e-06, -5.9390440583229065e-06, -5.733221769332886e-06, -5.527399480342865e-06, -5.321577191352844e-06, -5.1157549023628235e-06, -4.909932613372803e-06, -4.704110324382782e-06, -4.498288035392761e-06, -4.2924657464027405e-06, -4.08664345741272e-06, -3.880821168422699e-06, -3.6749988794326782e-06, -3.4691765904426575e-06, -3.2633543014526367e-06, -3.057532012462616e-06, -2.8517097234725952e-06, -2.6458874344825745e-06, -2.4400651454925537e-06, -2.234242856502533e-06, -2.028420567512512e-06, -1.8225982785224915e-06, -1.6167759895324707e-06, -1.41095370054245e-06, -1.2051314115524292e-06, -9.993091225624084e-07, -7.934868335723877e-07, -5.876645445823669e-07, -3.818422555923462e-07, -1.7601996660232544e-07, 2.9802322387695312e-08, 2.3562461137771606e-07, 4.414469003677368e-07, 6.472691893577576e-07, 8.530914783477783e-07, 1.058913767337799e-06, 1.2647360563278198e-06, 1.4705583453178406e-06, 1.6763806343078613e-06, 1.882202923297882e-06, 2.088025212287903e-06, 2.2938475012779236e-06, 2.4996697902679443e-06, 2.705492079257965e-06, 2.911314368247986e-06, 3.1171366572380066e-06, 3.3229589462280273e-06, 3.528781235218048e-06, 3.734603524208069e-06, 3.94042581319809e-06, 4.14624810218811e-06, 4.352070391178131e-06, 4.557892680168152e-06, 4.763714969158173e-06, 4.969537258148193e-06, 5.175359547138214e-06, 5.381181836128235e-06, 5.587004125118256e-06, 5.792826414108276e-06, 5.998648703098297e-06, 6.204470992088318e-06, 6.410293281078339e-06, 6.616115570068359e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 5.0, 8.0, 14.0, 11.0, 15.0, 18.0, 17.0, 28.0, 74.0, 117.0, 230.0, 530.0, 1195.0, 3029.0, 10624.0, 76234.0, 911645.0, 33979.0, 6932.0, 2109.0, 876.0, 378.0, 199.0, 97.0, 61.0, 24.0, 22.0, 17.0, 10.0, 12.0, 8.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006771087646484375, -0.006514012813568115, -0.0062569379806518555, -0.005999863147735596, -0.005742788314819336, -0.005485713481903076, -0.005228638648986816, -0.004971563816070557, -0.004714488983154297, -0.004457414150238037, -0.004200339317321777, -0.003943264484405518, -0.003686189651489258, -0.003429114818572998, -0.0031720399856567383, -0.0029149651527404785, -0.0026578903198242188, -0.002400815486907959, -0.0021437406539916992, -0.0018866658210754395, -0.0016295909881591797, -0.00137251615524292, -0.0011154413223266602, -0.0008583664894104004, -0.0006012916564941406, -0.00034421682357788086, -8.71419906616211e-05, 0.00016993284225463867, 0.00042700767517089844, 0.0006840825080871582, 0.000941157341003418, 0.0011982321739196777, 0.0014553070068359375, 0.0017123818397521973, 0.001969456672668457, 0.002226531505584717, 0.0024836063385009766, 0.0027406811714172363, 0.002997756004333496, 0.003254830837249756, 0.0035119056701660156, 0.0037689805030822754, 0.004026055335998535, 0.004283130168914795, 0.004540205001831055, 0.0047972798347473145, 0.005054354667663574, 0.005311429500579834, 0.005568504333496094, 0.0058255791664123535, 0.006082653999328613, 0.006339728832244873, 0.006596803665161133, 0.006853878498077393, 0.007110953330993652, 0.007368028163909912, 0.007625102996826172, 0.007882177829742432, 0.008139252662658691, 0.008396327495574951, 0.008653402328491211, 0.00891047716140747, 0.00916755199432373, 0.00942462682723999, 0.00968170166015625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 7.0, 12.0, 8.0, 13.0, 25.0, 36.0, 61.0, 111.0, 208.0, 233.0, 117.0, 63.0, 32.0, 24.0, 21.0, 15.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0107574462890625, -0.010528534650802612, -0.010299623012542725, -0.010070711374282837, -0.00984179973602295, -0.009612888097763062, -0.009383976459503174, -0.009155064821243286, -0.008926153182983398, -0.00869724154472351, -0.008468329906463623, -0.008239418268203735, -0.008010506629943848, -0.00778159499168396, -0.007552683353424072, -0.007323771715164185, -0.007094860076904297, -0.006865948438644409, -0.0066370368003845215, -0.006408125162124634, -0.006179213523864746, -0.005950301885604858, -0.005721390247344971, -0.005492478609085083, -0.005263566970825195, -0.005034655332565308, -0.00480574369430542, -0.004576832056045532, -0.0043479204177856445, -0.004119008779525757, -0.003890097141265869, -0.0036611855030059814, -0.0034322738647460938, -0.003203362226486206, -0.0029744505882263184, -0.0027455389499664307, -0.002516627311706543, -0.0022877156734466553, -0.0020588040351867676, -0.0018298923969268799, -0.0016009807586669922, -0.0013720691204071045, -0.0011431574821472168, -0.0009142458438873291, -0.0006853342056274414, -0.0004564225673675537, -0.00022751092910766602, 1.4007091522216797e-06, 0.00023031234741210938, 0.00045922398567199707, 0.0006881356239318848, 0.0009170472621917725, 0.0011459589004516602, 0.0013748705387115479, 0.0016037821769714355, 0.0018326938152313232, 0.002061605453491211, 0.0022905170917510986, 0.0025194287300109863, 0.002748340368270874, 0.0029772520065307617, 0.0032061636447906494, 0.003435075283050537, 0.003663986921310425, 0.0038928985595703125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 14.0, 17.0, 58.0, 483.0, 295.0, 81.0, 31.0, 17.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.689971923828125, -22.160972595214844, -21.631973266601562, -21.10297203063965, -20.573972702026367, -20.044973373413086, -19.515974044799805, -18.986974716186523, -18.45797348022461, -17.928974151611328, -17.399974822998047, -16.870973587036133, -16.34197425842285, -15.81297492980957, -15.283975601196289, -14.754976272583008, -14.225976943969727, -13.696977615356445, -13.167977333068848, -12.638978004455566, -12.109977722167969, -11.580978393554688, -11.051979064941406, -10.522979736328125, -9.993979454040527, -9.464980125427246, -8.935979843139648, -8.406980514526367, -7.877980709075928, -7.348980903625488, -6.819981575012207, -6.290981769561768, -5.761983871459961, -5.2329840660095215, -4.703984260559082, -4.174984931945801, -3.6459851264953613, -3.116985321044922, -2.5879857540130615, -2.058986186981201, -1.5299863815307617, -1.0009866952896118, -0.4719870090484619, 0.05701267719268799, 0.5860123634338379, 1.1150121688842773, 1.6440117359161377, 2.173011302947998, 2.7020111083984375, 3.231010913848877, 3.7600104808807373, 4.289010047912598, 4.818009853363037, 5.347009658813477, 5.876008987426758, 6.405008792877197, 6.934008598327637, 7.463008403778076, 7.992008209228516, 8.521007537841797, 9.050006866455078, 9.579007148742676, 10.108006477355957, 10.637006759643555, 11.166006088256836]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 9.0, 16.0, 28.0, 37.0, 70.0, 99.0, 133.0, 177.0, 160.0, 107.0, 54.0, 38.0, 18.0, 11.0, 7.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.262331008911133, -8.761574745178223, -8.260818481445312, -7.760062217712402, -7.259305953979492, -6.758549690246582, -6.25779390335083, -5.75703763961792, -5.25628137588501, -4.7555251121521, -4.2547688484191895, -3.7540128231048584, -3.2532565593719482, -2.752500295639038, -2.251744270324707, -1.7509880065917969, -1.2502317428588867, -0.7494755387306213, -0.24871933460235596, 0.25203680992126465, 0.7527930736541748, 1.253549337387085, 1.754305362701416, 2.255061626434326, 2.7558178901672363, 3.2565741539001465, 3.7573304176330566, 4.258086204528809, 4.758842468261719, 5.259598731994629, 5.760354995727539, 6.261111259460449, 6.761867523193359, 7.2626237869262695, 7.76338005065918, 8.26413631439209, 8.764892578125, 9.26564884185791, 9.76640510559082, 10.267160415649414, 10.76791763305664, 11.26867389678955, 11.769430160522461, 12.270186424255371, 12.770942687988281, 13.271698951721191, 13.772455215454102, 14.273210525512695, 14.773966789245605, 15.274723052978516, 15.775479316711426, 16.276235580444336, 16.77699089050293, 17.277748107910156, 17.77850341796875, 18.279260635375977, 18.78001594543457, 19.280771255493164, 19.78152847290039, 20.282283782958984, 20.78304100036621, 21.283796310424805, 21.78455352783203, 22.285308837890625, 22.78606605529785]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 6.0, 11.0, 8.0, 23.0, 44.0, 54.0, 103.0, 163.0, 350.0, 999.0, 11295.0, 4176424.0, 3838.0, 674.0, 180.0, 58.0, 27.0, 10.0, 3.0, 9.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.9375, -78.09130859375, -76.2451171875, -74.39892578125, -72.552734375, -70.70654296875, -68.8603515625, -67.01416015625, -65.16796875, -63.32177734375, -61.4755859375, -59.62939453125, -57.783203125, -55.93701171875, -54.0908203125, -52.24462890625, -50.3984375, -48.55224609375, -46.7060546875, -44.85986328125, -43.013671875, -41.16748046875, -39.3212890625, -37.47509765625, -35.62890625, -33.78271484375, -31.9365234375, -30.09033203125, -28.244140625, -26.39794921875, -24.5517578125, -22.70556640625, -20.859375, -19.01318359375, -17.1669921875, -15.32080078125, -13.474609375, -11.62841796875, -9.7822265625, -7.93603515625, -6.08984375, -4.24365234375, -2.3974609375, -0.55126953125, 1.294921875, 3.14111328125, 4.9873046875, 6.83349609375, 8.6796875, 10.52587890625, 12.3720703125, 14.21826171875, 16.064453125, 17.91064453125, 19.7568359375, 21.60302734375, 23.44921875, 25.29541015625, 27.1416015625, 28.98779296875, 30.833984375, 32.68017578125, 34.5263671875, 36.37255859375, 38.21875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 9.0, 11.0, 25.0, 49.0, 821.0, 26.0, 20.0, 16.0, 7.0, 6.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.7322006225585938, -0.7148895263671875, -0.6975784301757812, -0.680267333984375, -0.6629562377929688, -0.6456451416015625, -0.6283340454101562, -0.61102294921875, -0.5937118530273438, -0.5764007568359375, -0.5590896606445312, -0.541778564453125, -0.5244674682617188, -0.5071563720703125, -0.48984527587890625, -0.4725341796875, -0.45522308349609375, -0.4379119873046875, -0.42060089111328125, -0.403289794921875, -0.38597869873046875, -0.3686676025390625, -0.35135650634765625, -0.33404541015625, -0.31673431396484375, -0.2994232177734375, -0.28211212158203125, -0.264801025390625, -0.24748992919921875, -0.2301788330078125, -0.21286773681640625, -0.195556640625, -0.17824554443359375, -0.1609344482421875, -0.14362335205078125, -0.126312255859375, -0.10900115966796875, -0.0916900634765625, -0.07437896728515625, -0.05706787109375, -0.03975677490234375, -0.0224456787109375, -0.00513458251953125, 0.012176513671875, 0.02948760986328125, 0.0467987060546875, 0.06410980224609375, 0.0814208984375, 0.09873199462890625, 0.1160430908203125, 0.13335418701171875, 0.150665283203125, 0.16797637939453125, 0.1852874755859375, 0.20259857177734375, 0.21990966796875, 0.23722076416015625, 0.2545318603515625, 0.27184295654296875, 0.289154052734375, 0.30646514892578125, 0.3237762451171875, 0.34108734130859375, 0.3583984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 5.0, 6.0, 17.0, 10.0, 23.0, 36.0, 37.0, 69.0, 88.0, 150.0, 310.0, 554.0, 1021.0, 2145.0, 4729.0, 11657.0, 36460.0, 3933214.0, 159742.0, 27129.0, 9175.0, 3925.0, 1732.0, 900.0, 478.0, 252.0, 138.0, 84.0, 49.0, 39.0, 31.0, 17.0, 15.0, 15.0, 14.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.103515625, -2.01904296875, -1.9345703125, -1.85009765625, -1.765625, -1.68115234375, -1.5966796875, -1.51220703125, -1.427734375, -1.34326171875, -1.2587890625, -1.17431640625, -1.08984375, -1.00537109375, -0.9208984375, -0.83642578125, -0.751953125, -0.66748046875, -0.5830078125, -0.49853515625, -0.4140625, -0.32958984375, -0.2451171875, -0.16064453125, -0.076171875, 0.00830078125, 0.0927734375, 0.17724609375, 0.26171875, 0.34619140625, 0.4306640625, 0.51513671875, 0.599609375, 0.68408203125, 0.7685546875, 0.85302734375, 0.9375, 1.02197265625, 1.1064453125, 1.19091796875, 1.275390625, 1.35986328125, 1.4443359375, 1.52880859375, 1.61328125, 1.69775390625, 1.7822265625, 1.86669921875, 1.951171875, 2.03564453125, 2.1201171875, 2.20458984375, 2.2890625, 2.37353515625, 2.4580078125, 2.54248046875, 2.626953125, 2.71142578125, 2.7958984375, 2.88037109375, 2.96484375, 3.04931640625, 3.1337890625, 3.21826171875, 3.302734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 3.0, 2.0, 5.0, 5.0, 3.0, 9.0, 14.0, 12.0, 12.0, 19.0, 21.0, 20.0, 26.0, 35.0, 27.0, 32.0, 3558.0, 68.0, 36.0, 30.0, 22.0, 17.0, 17.0, 12.0, 15.0, 9.0, 12.0, 7.0, 7.0, 8.0, 4.0, 0.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.438720703125, -0.4274101257324219, -0.41609954833984375, -0.4047889709472656, -0.3934783935546875, -0.3821678161621094, -0.37085723876953125, -0.3595466613769531, -0.348236083984375, -0.3369255065917969, -0.32561492919921875, -0.3143043518066406, -0.3029937744140625, -0.2916831970214844, -0.28037261962890625, -0.2690620422363281, -0.25775146484375, -0.24644088745117188, -0.23513031005859375, -0.22381973266601562, -0.2125091552734375, -0.20119857788085938, -0.18988800048828125, -0.17857742309570312, -0.167266845703125, -0.15595626831054688, -0.14464569091796875, -0.13333511352539062, -0.1220245361328125, -0.11071395874023438, -0.09940338134765625, -0.08809280395507812, -0.0767822265625, -0.06547164916992188, -0.05416107177734375, -0.042850494384765625, -0.0315399169921875, -0.020229339599609375, -0.00891876220703125, 0.002391815185546875, 0.013702392578125, 0.025012969970703125, 0.03632354736328125, 0.047634124755859375, 0.0589447021484375, 0.07025527954101562, 0.08156585693359375, 0.09287643432617188, 0.10418701171875, 0.11549758911132812, 0.12680816650390625, 0.13811874389648438, 0.1494293212890625, 0.16073989868164062, 0.17205047607421875, 0.18336105346679688, 0.194671630859375, 0.20598220825195312, 0.21729278564453125, 0.22860336303710938, 0.2399139404296875, 0.2512245178222656, 0.26253509521484375, 0.2738456726074219, 0.28515625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 957.0, 42.0, 8.0, 2.0, 0.0, 1.0], "bins": [-30.43301010131836, -29.91424560546875, -29.39548110961914, -28.87671661376953, -28.357952117919922, -27.839187622070312, -27.320423126220703, -26.801658630371094, -26.282894134521484, -25.764129638671875, -25.245365142822266, -24.726600646972656, -24.207836151123047, -23.689071655273438, -23.170307159423828, -22.65154266357422, -22.132776260375977, -21.614011764526367, -21.095247268676758, -20.57648277282715, -20.05771827697754, -19.53895378112793, -19.02018928527832, -18.501422882080078, -17.98265838623047, -17.46389389038086, -16.94512939453125, -16.42636489868164, -15.907600402832031, -15.388835906982422, -14.870070457458496, -14.351305961608887, -13.832544326782227, -13.313779830932617, -12.795015335083008, -12.276250839233398, -11.757486343383789, -11.23872184753418, -10.719956398010254, -10.201191902160645, -9.682427406311035, -9.163662910461426, -8.644898414611816, -8.126133918762207, -7.6073689460754395, -7.08860445022583, -6.5698394775390625, -6.051074981689453, -5.532310485839844, -5.013545989990234, -4.494781494140625, -3.9760165214538574, -3.457252025604248, -2.9384875297546387, -2.41972279548645, -1.9009580612182617, -1.3821935653686523, -0.8634289503097534, -0.3446643352508545, 0.17410027980804443, 0.6928648948669434, 1.2116293907165527, 1.7303941249847412, 2.2491588592529297, 2.767923355102539]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 14.0, 18.0, 32.0, 45.0, 67.0, 124.0, 130.0, 135.0, 126.0, 95.0, 72.0, 48.0, 33.0, 14.0, 13.0, 3.0, 5.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4376091957092285, -1.3694449663162231, -1.3012807369232178, -1.233116626739502, -1.1649523973464966, -1.0967881679534912, -1.0286240577697754, -0.96045982837677, -0.8922955989837646, -0.8241313695907593, -0.7559671998023987, -0.6878030300140381, -0.6196388006210327, -0.5514745712280273, -0.48331040143966675, -0.41514620184898376, -0.3469820022583008, -0.2788178026676178, -0.21065360307693481, -0.14248940348625183, -0.07432520389556885, -0.006161004304885864, 0.06200319528579712, 0.1301673948764801, 0.19833159446716309, 0.26649579405784607, 0.33465999364852905, 0.40282419323921204, 0.470988392829895, 0.5391526222229004, 0.607316792011261, 0.6754809617996216, 0.743645191192627, 0.8118094205856323, 0.8799735903739929, 0.9481377601623535, 1.0163019895553589, 1.0844662189483643, 1.15263032913208, 1.2207945585250854, 1.2889587879180908, 1.3571230173110962, 1.4252872467041016, 1.4934513568878174, 1.5616155862808228, 1.6297798156738281, 1.697943925857544, 1.7661081552505493, 1.8342723846435547, 1.90243661403656, 1.9706008434295654, 2.0387649536132812, 2.106929302215576, 2.175093412399292, 2.243257522583008, 2.3114218711853027, 2.3795859813690186, 2.4477500915527344, 2.5159144401550293, 2.584078550338745, 2.652242660522461, 2.720407009124756, 2.7885711193084717, 2.8567354679107666, 2.9248995780944824]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 5.0, 7.0, 9.0, 11.0, 20.0, 27.0, 20.0, 23.0, 53.0, 67.0, 96.0, 164.0, 283.0, 461.0, 977.0, 2843.0, 13242.0, 995276.0, 27853.0, 4273.0, 1341.0, 582.0, 313.0, 193.0, 150.0, 62.0, 53.0, 38.0, 20.0, 24.0, 17.0, 12.0, 17.0, 5.0, 3.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0625, -4.9205322265625, -4.778564453125, -4.6365966796875, -4.49462890625, -4.3526611328125, -4.210693359375, -4.0687255859375, -3.9267578125, -3.7847900390625, -3.642822265625, -3.5008544921875, -3.35888671875, -3.2169189453125, -3.074951171875, -2.9329833984375, -2.791015625, -2.6490478515625, -2.507080078125, -2.3651123046875, -2.22314453125, -2.0811767578125, -1.939208984375, -1.7972412109375, -1.6552734375, -1.5133056640625, -1.371337890625, -1.2293701171875, -1.08740234375, -0.9454345703125, -0.803466796875, -0.6614990234375, -0.51953125, -0.3775634765625, -0.235595703125, -0.0936279296875, 0.04833984375, 0.1903076171875, 0.332275390625, 0.4742431640625, 0.6162109375, 0.7581787109375, 0.900146484375, 1.0421142578125, 1.18408203125, 1.3260498046875, 1.468017578125, 1.6099853515625, 1.751953125, 1.8939208984375, 2.035888671875, 2.1778564453125, 2.31982421875, 2.4617919921875, 2.603759765625, 2.7457275390625, 2.8876953125, 3.0296630859375, 3.171630859375, 3.3135986328125, 3.45556640625, 3.5975341796875, 3.739501953125, 3.8814697265625, 4.0234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 19.0, 35.0, 491.0, 382.0, 19.0, 17.0, 11.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73486328125, -0.7177467346191406, -0.7006301879882812, -0.6835136413574219, -0.6663970947265625, -0.6492805480957031, -0.6321640014648438, -0.6150474548339844, -0.597930908203125, -0.5808143615722656, -0.5636978149414062, -0.5465812683105469, -0.5294647216796875, -0.5123481750488281, -0.49523162841796875, -0.4781150817871094, -0.46099853515625, -0.4438819885253906, -0.42676544189453125, -0.4096488952636719, -0.3925323486328125, -0.3754158020019531, -0.35829925537109375, -0.3411827087402344, -0.324066162109375, -0.3069496154785156, -0.28983306884765625, -0.2727165222167969, -0.2555999755859375, -0.23848342895507812, -0.22136688232421875, -0.20425033569335938, -0.1871337890625, -0.17001724243164062, -0.15290069580078125, -0.13578414916992188, -0.1186676025390625, -0.10155105590820312, -0.08443450927734375, -0.06731796264648438, -0.050201416015625, -0.033084869384765625, -0.01596832275390625, 0.001148223876953125, 0.0182647705078125, 0.035381317138671875, 0.05249786376953125, 0.06961441040039062, 0.08673095703125, 0.10384750366210938, 0.12096405029296875, 0.13808059692382812, 0.1551971435546875, 0.17231369018554688, 0.18943023681640625, 0.20654678344726562, 0.223663330078125, 0.24077987670898438, 0.25789642333984375, 0.2750129699707031, 0.2921295166015625, 0.3092460632324219, 0.32636260986328125, 0.3434791564941406, 0.360595703125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 3.0, 13.0, 14.0, 15.0, 30.0, 33.0, 44.0, 78.0, 114.0, 218.0, 433.0, 1162.0, 4514.0, 28276.0, 736721.0, 254946.0, 17060.0, 3081.0, 911.0, 370.0, 177.0, 103.0, 68.0, 39.0, 30.0, 26.0, 20.0, 11.0, 9.0, 6.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6123046875, -1.5523223876953125, -1.492340087890625, -1.4323577880859375, -1.37237548828125, -1.3123931884765625, -1.252410888671875, -1.1924285888671875, -1.1324462890625, -1.0724639892578125, -1.012481689453125, -0.9524993896484375, -0.89251708984375, -0.8325347900390625, -0.772552490234375, -0.7125701904296875, -0.652587890625, -0.5926055908203125, -0.532623291015625, -0.4726409912109375, -0.41265869140625, -0.3526763916015625, -0.292694091796875, -0.2327117919921875, -0.1727294921875, -0.1127471923828125, -0.052764892578125, 0.0072174072265625, 0.06719970703125, 0.1271820068359375, 0.187164306640625, 0.2471466064453125, 0.30712890625, 0.3671112060546875, 0.427093505859375, 0.4870758056640625, 0.54705810546875, 0.6070404052734375, 0.667022705078125, 0.7270050048828125, 0.7869873046875, 0.8469696044921875, 0.906951904296875, 0.9669342041015625, 1.02691650390625, 1.0868988037109375, 1.146881103515625, 1.2068634033203125, 1.266845703125, 1.3268280029296875, 1.386810302734375, 1.4467926025390625, 1.50677490234375, 1.5667572021484375, 1.626739501953125, 1.6867218017578125, 1.7467041015625, 1.8066864013671875, 1.866668701171875, 1.9266510009765625, 1.98663330078125, 2.0466156005859375, 2.106597900390625, 2.1665802001953125, 2.2265625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 7.0, 9.0, 10.0, 17.0, 22.0, 19.0, 27.0, 41.0, 43.0, 35.0, 51.0, 48.0, 59.0, 50.0, 50.0, 56.0, 65.0, 50.0, 48.0, 37.0, 41.0, 36.0, 37.0, 26.0, 29.0, 22.0, 15.0, 12.0, 13.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.67626953125, -0.6580314636230469, -0.6397933959960938, -0.6215553283691406, -0.6033172607421875, -0.5850791931152344, -0.5668411254882812, -0.5486030578613281, -0.530364990234375, -0.5121269226074219, -0.49388885498046875, -0.4756507873535156, -0.4574127197265625, -0.4391746520996094, -0.42093658447265625, -0.4026985168457031, -0.38446044921875, -0.3662223815917969, -0.34798431396484375, -0.3297462463378906, -0.3115081787109375, -0.2932701110839844, -0.27503204345703125, -0.2567939758300781, -0.238555908203125, -0.22031784057617188, -0.20207977294921875, -0.18384170532226562, -0.1656036376953125, -0.14736557006835938, -0.12912750244140625, -0.11088943481445312, -0.0926513671875, -0.07441329956054688, -0.05617523193359375, -0.037937164306640625, -0.0196990966796875, -0.001461029052734375, 0.01677703857421875, 0.035015106201171875, 0.053253173828125, 0.07149124145507812, 0.08972930908203125, 0.10796737670898438, 0.1262054443359375, 0.14444351196289062, 0.16268157958984375, 0.18091964721679688, 0.19915771484375, 0.21739578247070312, 0.23563385009765625, 0.2538719177246094, 0.2721099853515625, 0.2903480529785156, 0.30858612060546875, 0.3268241882324219, 0.345062255859375, 0.3633003234863281, 0.38153839111328125, 0.3997764587402344, 0.4180145263671875, 0.4362525939941406, 0.45449066162109375, 0.4727287292480469, 0.490966796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 8.0, 12.0, 27.0, 32.0, 41.0, 85.0, 146.0, 336.0, 1108.0, 5489.0, 65537.0, 930444.0, 39715.0, 4029.0, 946.0, 281.0, 104.0, 79.0, 53.0, 20.0, 16.0, 20.0, 9.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09503173828125, -0.0924224853515625, -0.089813232421875, -0.0872039794921875, -0.0845947265625, -0.0819854736328125, -0.079376220703125, -0.0767669677734375, -0.07415771484375, -0.0715484619140625, -0.068939208984375, -0.0663299560546875, -0.063720703125, -0.0611114501953125, -0.058502197265625, -0.0558929443359375, -0.05328369140625, -0.0506744384765625, -0.048065185546875, -0.0454559326171875, -0.0428466796875, -0.0402374267578125, -0.037628173828125, -0.0350189208984375, -0.03240966796875, -0.0298004150390625, -0.027191162109375, -0.0245819091796875, -0.02197265625, -0.0193634033203125, -0.016754150390625, -0.0141448974609375, -0.01153564453125, -0.0089263916015625, -0.006317138671875, -0.0037078857421875, -0.0010986328125, 0.0015106201171875, 0.004119873046875, 0.0067291259765625, 0.00933837890625, 0.0119476318359375, 0.014556884765625, 0.0171661376953125, 0.019775390625, 0.0223846435546875, 0.024993896484375, 0.0276031494140625, 0.03021240234375, 0.0328216552734375, 0.035430908203125, 0.0380401611328125, 0.0406494140625, 0.0432586669921875, 0.045867919921875, 0.0484771728515625, 0.05108642578125, 0.0536956787109375, 0.056304931640625, 0.0589141845703125, 0.0615234375, 0.0641326904296875, 0.066741943359375, 0.0693511962890625, 0.07196044921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 6.0, 0.0, 9.0, 8.0, 14.0, 23.0, 32.0, 26.0, 43.0, 76.0, 108.0, 82.0, 145.0, 113.0, 76.0, 73.0, 60.0, 37.0, 21.0, 14.0, 10.0, 10.0, 10.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.033348083496094e-06, -6.810761988162994e-06, -6.588175892829895e-06, -6.365589797496796e-06, -6.143003702163696e-06, -5.920417606830597e-06, -5.6978315114974976e-06, -5.475245416164398e-06, -5.252659320831299e-06, -5.0300732254981995e-06, -4.8074871301651e-06, -4.584901034832001e-06, -4.362314939498901e-06, -4.139728844165802e-06, -3.917142748832703e-06, -3.6945566534996033e-06, -3.471970558166504e-06, -3.2493844628334045e-06, -3.026798367500305e-06, -2.804212272167206e-06, -2.5816261768341064e-06, -2.359040081501007e-06, -2.1364539861679077e-06, -1.9138678908348083e-06, -1.691281795501709e-06, -1.4686957001686096e-06, -1.2461096048355103e-06, -1.0235235095024109e-06, -8.009374141693115e-07, -5.783513188362122e-07, -3.557652235031128e-07, -1.3317912817001343e-07, 8.940696716308594e-08, 3.119930624961853e-07, 5.345791578292847e-07, 7.57165253162384e-07, 9.797513484954834e-07, 1.2023374438285828e-06, 1.4249235391616821e-06, 1.6475096344947815e-06, 1.8700957298278809e-06, 2.0926818251609802e-06, 2.3152679204940796e-06, 2.537854015827179e-06, 2.7604401111602783e-06, 2.9830262064933777e-06, 3.205612301826477e-06, 3.4281983971595764e-06, 3.6507844924926758e-06, 3.873370587825775e-06, 4.0959566831588745e-06, 4.318542778491974e-06, 4.541128873825073e-06, 4.763714969158173e-06, 4.986301064491272e-06, 5.208887159824371e-06, 5.431473255157471e-06, 5.65405935049057e-06, 5.8766454458236694e-06, 6.099231541156769e-06, 6.321817636489868e-06, 6.5444037318229675e-06, 6.766989827156067e-06, 6.989575922489166e-06, 7.212162017822266e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 5.0, 9.0, 10.0, 18.0, 15.0, 45.0, 57.0, 88.0, 228.0, 541.0, 1417.0, 5807.0, 60901.0, 945925.0, 27403.0, 4069.0, 1146.0, 413.0, 193.0, 80.0, 55.0, 44.0, 20.0, 17.0, 7.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08856201171875, -0.0857391357421875, -0.082916259765625, -0.0800933837890625, -0.0772705078125, -0.0744476318359375, -0.071624755859375, -0.0688018798828125, -0.06597900390625, -0.0631561279296875, -0.060333251953125, -0.0575103759765625, -0.0546875, -0.0518646240234375, -0.049041748046875, -0.0462188720703125, -0.04339599609375, -0.0405731201171875, -0.037750244140625, -0.0349273681640625, -0.0321044921875, -0.0292816162109375, -0.026458740234375, -0.0236358642578125, -0.02081298828125, -0.0179901123046875, -0.015167236328125, -0.0123443603515625, -0.009521484375, -0.0066986083984375, -0.003875732421875, -0.0010528564453125, 0.00177001953125, 0.0045928955078125, 0.007415771484375, 0.0102386474609375, 0.0130615234375, 0.0158843994140625, 0.018707275390625, 0.0215301513671875, 0.02435302734375, 0.0271759033203125, 0.029998779296875, 0.0328216552734375, 0.03564453125, 0.0384674072265625, 0.041290283203125, 0.0441131591796875, 0.04693603515625, 0.0497589111328125, 0.052581787109375, 0.0554046630859375, 0.0582275390625, 0.0610504150390625, 0.063873291015625, 0.0666961669921875, 0.06951904296875, 0.0723419189453125, 0.075164794921875, 0.0779876708984375, 0.080810546875, 0.0836334228515625, 0.086456298828125, 0.0892791748046875, 0.09210205078125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 12.0, 15.0, 10.0, 25.0, 37.0, 50.0, 75.0, 87.0, 138.0, 119.0, 124.0, 82.0, 56.0, 38.0, 28.0, 14.0, 16.0, 7.0, 11.0, 5.0, 7.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0290069580078125, -0.028110027313232422, -0.027213096618652344, -0.026316165924072266, -0.025419235229492188, -0.02452230453491211, -0.02362537384033203, -0.022728443145751953, -0.021831512451171875, -0.020934581756591797, -0.02003765106201172, -0.01914072036743164, -0.018243789672851562, -0.017346858978271484, -0.016449928283691406, -0.015552997589111328, -0.01465606689453125, -0.013759136199951172, -0.012862205505371094, -0.011965274810791016, -0.011068344116210938, -0.01017141342163086, -0.009274482727050781, -0.008377552032470703, -0.007480621337890625, -0.006583690643310547, -0.005686759948730469, -0.004789829254150391, -0.0038928985595703125, -0.0029959678649902344, -0.0020990371704101562, -0.0012021064758300781, -0.00030517578125, 0.0005917549133300781, 0.0014886856079101562, 0.0023856163024902344, 0.0032825469970703125, 0.004179477691650391, 0.005076408386230469, 0.005973339080810547, 0.006870269775390625, 0.007767200469970703, 0.008664131164550781, 0.00956106185913086, 0.010457992553710938, 0.011354923248291016, 0.012251853942871094, 0.013148784637451172, 0.01404571533203125, 0.014942646026611328, 0.015839576721191406, 0.016736507415771484, 0.017633438110351562, 0.01853036880493164, 0.01942729949951172, 0.020324230194091797, 0.021221160888671875, 0.022118091583251953, 0.02301502227783203, 0.02391195297241211, 0.024808883666992188, 0.025705814361572266, 0.026602745056152344, 0.027499675750732422, 0.0283966064453125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 14.0, 160.0, 792.0, 34.0, 8.0, 2.0, 6.0], "bins": [-47.23650360107422, -46.43891906738281, -45.64133071899414, -44.843746185302734, -44.04615783691406, -43.248573303222656, -42.450984954833984, -41.65340042114258, -40.855812072753906, -40.0582275390625, -39.26063919067383, -38.46305465698242, -37.66546630859375, -36.867881774902344, -36.07029342651367, -35.272708892822266, -34.47512435913086, -33.67753982543945, -32.87995147705078, -32.082366943359375, -31.284778594970703, -30.487194061279297, -29.689607620239258, -28.89202117919922, -28.09443473815918, -27.29684829711914, -26.4992618560791, -25.701675415039062, -24.904090881347656, -24.106504440307617, -23.308917999267578, -22.51133155822754, -21.7137451171875, -20.91615867614746, -20.118572235107422, -19.320985794067383, -18.523399353027344, -17.725814819335938, -16.9282283782959, -16.13064193725586, -15.33305549621582, -14.535469055175781, -13.737882614135742, -12.94029712677002, -12.14271068572998, -11.345124244689941, -10.547538757324219, -9.74995231628418, -8.95236587524414, -8.154779434204102, -7.357193470001221, -6.55960750579834, -5.762021064758301, -4.964434623718262, -4.166848659515381, -3.3692626953125, -2.571676015853882, -1.7740898132324219, -0.9765036106109619, -0.17891740798950195, 0.618668794631958, 1.416254997253418, 2.213841199874878, 3.011427164077759, 3.809013605117798]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 4.0, 12.0, 16.0, 25.0, 23.0, 37.0, 50.0, 61.0, 77.0, 74.0, 94.0, 86.0, 87.0, 84.0, 54.0, 51.0, 41.0, 34.0, 20.0, 22.0, 11.0, 10.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.451914310455322, -5.28645133972168, -5.120988845825195, -4.955526351928711, -4.790063381195068, -4.624600410461426, -4.459137916564941, -4.293675422668457, -4.1282124519348145, -3.962749719619751, -3.7972869873046875, -3.631824254989624, -3.4663615226745605, -3.300898790359497, -3.1354360580444336, -2.96997332572937, -2.8045105934143066, -2.639047861099243, -2.4735851287841797, -2.308122396469116, -2.1426596641540527, -1.9771969318389893, -1.8117341995239258, -1.6462714672088623, -1.4808087348937988, -1.3153460025787354, -1.1498832702636719, -0.9844205379486084, -0.8189578056335449, -0.6534950733184814, -0.48803234100341797, -0.3225696086883545, -0.1571063995361328, 0.008356332778930664, 0.17381906509399414, 0.3392817974090576, 0.5047445297241211, 0.6702072620391846, 0.835669994354248, 1.0011327266693115, 1.166595458984375, 1.3320581912994385, 1.497520923614502, 1.6629836559295654, 1.828446388244629, 1.9939091205596924, 2.159371852874756, 2.3248345851898193, 2.490297317504883, 2.6557600498199463, 2.8212227821350098, 2.9866855144500732, 3.1521482467651367, 3.3176109790802, 3.4830737113952637, 3.648536443710327, 3.8139991760253906, 3.979461908340454, 4.144924640655518, 4.31038761138916, 4.4758501052856445, 4.641312599182129, 4.8067755699157715, 4.972238540649414, 5.137701034545898]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 16.0, 51.0, 57.0, 98.0, 248.0, 505.0, 3050.0, 4179897.0, 9364.0, 776.0, 172.0, 31.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.28125, -35.4306640625, -34.580078125, -33.7294921875, -32.87890625, -32.0283203125, -31.177734375, -30.3271484375, -29.4765625, -28.6259765625, -27.775390625, -26.9248046875, -26.07421875, -25.2236328125, -24.373046875, -23.5224609375, -22.671875, -21.8212890625, -20.970703125, -20.1201171875, -19.26953125, -18.4189453125, -17.568359375, -16.7177734375, -15.8671875, -15.0166015625, -14.166015625, -13.3154296875, -12.46484375, -11.6142578125, -10.763671875, -9.9130859375, -9.0625, -8.2119140625, -7.361328125, -6.5107421875, -5.66015625, -4.8095703125, -3.958984375, -3.1083984375, -2.2578125, -1.4072265625, -0.556640625, 0.2939453125, 1.14453125, 1.9951171875, 2.845703125, 3.6962890625, 4.546875, 5.3974609375, 6.248046875, 7.0986328125, 7.94921875, 8.7998046875, 9.650390625, 10.5009765625, 11.3515625, 12.2021484375, 13.052734375, 13.9033203125, 14.75390625, 15.6044921875, 16.455078125, 17.3056640625, 18.15625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 8.0, 7.0, 21.0, 52.0, 745.0, 108.0, 31.0, 13.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72314453125, -0.7061920166015625, -0.689239501953125, -0.6722869873046875, -0.65533447265625, -0.6383819580078125, -0.621429443359375, -0.6044769287109375, -0.5875244140625, -0.5705718994140625, -0.553619384765625, -0.5366668701171875, -0.51971435546875, -0.5027618408203125, -0.485809326171875, -0.4688568115234375, -0.451904296875, -0.4349517822265625, -0.417999267578125, -0.4010467529296875, -0.38409423828125, -0.3671417236328125, -0.350189208984375, -0.3332366943359375, -0.3162841796875, -0.2993316650390625, -0.282379150390625, -0.2654266357421875, -0.24847412109375, -0.2315216064453125, -0.214569091796875, -0.1976165771484375, -0.1806640625, -0.1637115478515625, -0.146759033203125, -0.1298065185546875, -0.11285400390625, -0.0959014892578125, -0.078948974609375, -0.0619964599609375, -0.0450439453125, -0.0280914306640625, -0.011138916015625, 0.0058135986328125, 0.02276611328125, 0.0397186279296875, 0.056671142578125, 0.0736236572265625, 0.090576171875, 0.1075286865234375, 0.124481201171875, 0.1414337158203125, 0.15838623046875, 0.1753387451171875, 0.192291259765625, 0.2092437744140625, 0.2261962890625, 0.2431488037109375, 0.260101318359375, 0.2770538330078125, 0.29400634765625, 0.3109588623046875, 0.327911376953125, 0.3448638916015625, 0.36181640625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 4.0, 9.0, 12.0, 14.0, 15.0, 15.0, 27.0, 36.0, 52.0, 75.0, 145.0, 413.0, 1898.0, 17462.0, 4020071.0, 145773.0, 6373.0, 1075.0, 299.0, 146.0, 71.0, 58.0, 47.0, 39.0, 31.0, 27.0, 13.0, 19.0, 12.0, 10.0, 7.0, 5.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.11383056640625, -3.9659423828125, -3.81805419921875, -3.670166015625, -3.52227783203125, -3.3743896484375, -3.22650146484375, -3.07861328125, -2.93072509765625, -2.7828369140625, -2.63494873046875, -2.487060546875, -2.33917236328125, -2.1912841796875, -2.04339599609375, -1.8955078125, -1.74761962890625, -1.5997314453125, -1.45184326171875, -1.303955078125, -1.15606689453125, -1.0081787109375, -0.86029052734375, -0.71240234375, -0.56451416015625, -0.4166259765625, -0.26873779296875, -0.120849609375, 0.02703857421875, 0.1749267578125, 0.32281494140625, 0.470703125, 0.61859130859375, 0.7664794921875, 0.91436767578125, 1.062255859375, 1.21014404296875, 1.3580322265625, 1.50592041015625, 1.65380859375, 1.80169677734375, 1.9495849609375, 2.09747314453125, 2.245361328125, 2.39324951171875, 2.5411376953125, 2.68902587890625, 2.8369140625, 2.98480224609375, 3.1326904296875, 3.28057861328125, 3.428466796875, 3.57635498046875, 3.7242431640625, 3.87213134765625, 4.02001953125, 4.16790771484375, 4.3157958984375, 4.46368408203125, 4.611572265625, 4.75946044921875, 4.9073486328125, 5.05523681640625, 5.203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 3.0, 10.0, 9.0, 13.0, 19.0, 11.0, 23.0, 18.0, 31.0, 27.0, 29.0, 42.0, 50.0, 58.0, 91.0, 180.0, 2791.0, 247.0, 100.0, 69.0, 44.0, 42.0, 31.0, 30.0, 18.0, 11.0, 13.0, 12.0, 10.0, 8.0, 5.0, 2.0, 6.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.389892578125, -0.3789520263671875, -0.368011474609375, -0.3570709228515625, -0.34613037109375, -0.3351898193359375, -0.324249267578125, -0.3133087158203125, -0.3023681640625, -0.2914276123046875, -0.280487060546875, -0.2695465087890625, -0.25860595703125, -0.2476654052734375, -0.236724853515625, -0.2257843017578125, -0.21484375, -0.2039031982421875, -0.192962646484375, -0.1820220947265625, -0.17108154296875, -0.1601409912109375, -0.149200439453125, -0.1382598876953125, -0.1273193359375, -0.1163787841796875, -0.105438232421875, -0.0944976806640625, -0.08355712890625, -0.0726165771484375, -0.061676025390625, -0.0507354736328125, -0.039794921875, -0.0288543701171875, -0.017913818359375, -0.0069732666015625, 0.00396728515625, 0.0149078369140625, 0.025848388671875, 0.0367889404296875, 0.0477294921875, 0.0586700439453125, 0.069610595703125, 0.0805511474609375, 0.09149169921875, 0.1024322509765625, 0.113372802734375, 0.1243133544921875, 0.13525390625, 0.1461944580078125, 0.157135009765625, 0.1680755615234375, 0.17901611328125, 0.1899566650390625, 0.200897216796875, 0.2118377685546875, 0.2227783203125, 0.2337188720703125, 0.244659423828125, 0.2555999755859375, 0.26654052734375, 0.2774810791015625, 0.288421630859375, 0.2993621826171875, 0.310302734375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 10.0, 38.0, 685.0, 239.0, 26.0, 5.0, 3.0, 1.0, 1.0], "bins": [-11.203322410583496, -11.009543418884277, -10.815765380859375, -10.621986389160156, -10.428207397460938, -10.234429359436035, -10.040650367736816, -9.846872329711914, -9.653093338012695, -9.459314346313477, -9.265536308288574, -9.071757316589355, -8.877979278564453, -8.684200286865234, -8.490421295166016, -8.296643257141113, -8.102864265441895, -7.909085750579834, -7.715307235717773, -7.521528244018555, -7.327749729156494, -7.133971214294434, -6.940192222595215, -6.746413707733154, -6.552635192871094, -6.358856678009033, -6.165078163146973, -5.971299171447754, -5.777520656585693, -5.583742141723633, -5.389963150024414, -5.1961846351623535, -5.002406120300293, -4.808627605438232, -4.614849090576172, -4.421070098876953, -4.227291584014893, -4.033513069152832, -3.8397343158721924, -3.6459555625915527, -3.452176809310913, -3.2583980560302734, -3.064619541168213, -2.8708410263061523, -2.6770622730255127, -2.483283519744873, -2.2895050048828125, -2.095726490020752, -1.9019477367401123, -1.7081691026687622, -1.514390468597412, -1.320611834526062, -1.126833200454712, -0.9330545663833618, -0.7392759323120117, -0.5454972982406616, -0.3517186641693115, -0.15794003009796143, 0.03583860397338867, 0.22961723804473877, 0.42339587211608887, 0.617174506187439, 0.8109531402587891, 1.0047317743301392, 1.1985104084014893]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 13.0, 20.0, 17.0, 39.0, 59.0, 90.0, 105.0, 115.0, 108.0, 124.0, 103.0, 70.0, 57.0, 37.0, 18.0, 13.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40962553024292, -2.3139803409576416, -2.2183351516723633, -2.122690200805664, -2.0270450115203857, -1.9313998222351074, -1.835754632949829, -1.7401094436645508, -1.6444642543792725, -1.5488190650939941, -1.4531739950180054, -1.357528805732727, -1.2618836164474487, -1.16623854637146, -1.0705933570861816, -0.9749481678009033, -0.8793030977249146, -0.783657968044281, -0.6880127787590027, -0.5923676490783691, -0.4967224895954132, -0.4010773301124573, -0.30543220043182373, -0.2097870111465454, -0.11414188146591187, -0.01849672943353653, 0.0771484225988388, 0.17279356718063354, 0.2684387266635895, 0.3640838861465454, 0.45972901582717896, 0.5553742051124573, 0.6510193347930908, 0.7466644644737244, 0.8423096537590027, 0.9379547834396362, 1.0335999727249146, 1.1292450428009033, 1.2248902320861816, 1.32053542137146, 1.4161806106567383, 1.5118257999420166, 1.6074708700180054, 1.7031160593032837, 1.798761248588562, 1.8944063186645508, 1.990051507949829, 2.0856966972351074, 2.1813416481018066, 2.276986837387085, 2.3726320266723633, 2.4682769775390625, 2.563922166824341, 2.659567356109619, 2.7552125453948975, 2.850857734680176, 2.946502923965454, 3.0421481132507324, 3.1377933025360107, 3.233438491821289, 3.3290834426879883, 3.4247286319732666, 3.520373821258545, 3.6160190105438232, 3.7116641998291016]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 6.0, 4.0, 7.0, 3.0, 7.0, 12.0, 18.0, 15.0, 14.0, 30.0, 52.0, 67.0, 76.0, 123.0, 206.0, 374.0, 613.0, 1310.0, 3806.0, 27881.0, 994686.0, 13800.0, 2895.0, 1092.0, 558.0, 316.0, 159.0, 144.0, 75.0, 50.0, 40.0, 25.0, 20.0, 17.0, 13.0, 10.0, 6.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.802734375, -3.692138671875, -3.58154296875, -3.470947265625, -3.3603515625, -3.249755859375, -3.13916015625, -3.028564453125, -2.91796875, -2.807373046875, -2.69677734375, -2.586181640625, -2.4755859375, -2.364990234375, -2.25439453125, -2.143798828125, -2.033203125, -1.922607421875, -1.81201171875, -1.701416015625, -1.5908203125, -1.480224609375, -1.36962890625, -1.259033203125, -1.1484375, -1.037841796875, -0.92724609375, -0.816650390625, -0.7060546875, -0.595458984375, -0.48486328125, -0.374267578125, -0.263671875, -0.153076171875, -0.04248046875, 0.068115234375, 0.1787109375, 0.289306640625, 0.39990234375, 0.510498046875, 0.62109375, 0.731689453125, 0.84228515625, 0.952880859375, 1.0634765625, 1.174072265625, 1.28466796875, 1.395263671875, 1.505859375, 1.616455078125, 1.72705078125, 1.837646484375, 1.9482421875, 2.058837890625, 2.16943359375, 2.280029296875, 2.390625, 2.501220703125, 2.61181640625, 2.722412109375, 2.8330078125, 2.943603515625, 3.05419921875, 3.164794921875, 3.275390625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 13.0, 34.0, 332.0, 501.0, 73.0, 16.0, 7.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67431640625, -0.6583137512207031, -0.6423110961914062, -0.6263084411621094, -0.6103057861328125, -0.5943031311035156, -0.5783004760742188, -0.5622978210449219, -0.546295166015625, -0.5302925109863281, -0.5142898559570312, -0.4982872009277344, -0.4822845458984375, -0.4662818908691406, -0.45027923583984375, -0.4342765808105469, -0.41827392578125, -0.4022712707519531, -0.38626861572265625, -0.3702659606933594, -0.3542633056640625, -0.3382606506347656, -0.32225799560546875, -0.3062553405761719, -0.290252685546875, -0.2742500305175781, -0.25824737548828125, -0.24224472045898438, -0.2262420654296875, -0.21023941040039062, -0.19423675537109375, -0.17823410034179688, -0.1622314453125, -0.14622879028320312, -0.13022613525390625, -0.11422348022460938, -0.0982208251953125, -0.08221817016601562, -0.06621551513671875, -0.050212860107421875, -0.034210205078125, -0.018207550048828125, -0.00220489501953125, 0.013797760009765625, 0.0298004150390625, 0.045803070068359375, 0.06180572509765625, 0.07780838012695312, 0.09381103515625, 0.10981369018554688, 0.12581634521484375, 0.14181900024414062, 0.1578216552734375, 0.17382431030273438, 0.18982696533203125, 0.20582962036132812, 0.221832275390625, 0.23783493041992188, 0.25383758544921875, 0.2698402404785156, 0.2858428955078125, 0.3018455505371094, 0.31784820556640625, 0.3338508605957031, 0.349853515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 0.0, 4.0, 0.0, 6.0, 4.0, 10.0, 2.0, 7.0, 8.0, 13.0, 16.0, 17.0, 26.0, 28.0, 38.0, 47.0, 58.0, 97.0, 134.0, 228.0, 383.0, 741.0, 2018.0, 8788.0, 104758.0, 869254.0, 52860.0, 5835.0, 1493.0, 644.0, 356.0, 204.0, 138.0, 84.0, 54.0, 48.0, 32.0, 23.0, 22.0, 15.0, 10.0, 13.0, 6.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.64453125, -1.592132568359375, -1.53973388671875, -1.487335205078125, -1.4349365234375, -1.382537841796875, -1.33013916015625, -1.277740478515625, -1.225341796875, -1.172943115234375, -1.12054443359375, -1.068145751953125, -1.0157470703125, -0.963348388671875, -0.91094970703125, -0.858551025390625, -0.80615234375, -0.753753662109375, -0.70135498046875, -0.648956298828125, -0.5965576171875, -0.544158935546875, -0.49176025390625, -0.439361572265625, -0.386962890625, -0.334564208984375, -0.28216552734375, -0.229766845703125, -0.1773681640625, -0.124969482421875, -0.07257080078125, -0.020172119140625, 0.0322265625, 0.084625244140625, 0.13702392578125, 0.189422607421875, 0.2418212890625, 0.294219970703125, 0.34661865234375, 0.399017333984375, 0.451416015625, 0.503814697265625, 0.55621337890625, 0.608612060546875, 0.6610107421875, 0.713409423828125, 0.76580810546875, 0.818206787109375, 0.87060546875, 0.923004150390625, 0.97540283203125, 1.027801513671875, 1.0802001953125, 1.132598876953125, 1.18499755859375, 1.237396240234375, 1.289794921875, 1.342193603515625, 1.39459228515625, 1.446990966796875, 1.4993896484375, 1.551788330078125, 1.60418701171875, 1.656585693359375, 1.708984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 8.0, 8.0, 9.0, 14.0, 10.0, 17.0, 20.0, 18.0, 27.0, 26.0, 29.0, 35.0, 32.0, 45.0, 41.0, 39.0, 41.0, 34.0, 39.0, 42.0, 48.0, 43.0, 38.0, 30.0, 34.0, 31.0, 29.0, 23.0, 25.0, 26.0, 19.0, 16.0, 14.0, 21.0, 9.0, 8.0, 5.0, 6.0, 6.0, 6.0, 4.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.498046875, -0.4827423095703125, -0.467437744140625, -0.4521331787109375, -0.43682861328125, -0.4215240478515625, -0.406219482421875, -0.3909149169921875, -0.3756103515625, -0.3603057861328125, -0.345001220703125, -0.3296966552734375, -0.31439208984375, -0.2990875244140625, -0.283782958984375, -0.2684783935546875, -0.253173828125, -0.2378692626953125, -0.222564697265625, -0.2072601318359375, -0.19195556640625, -0.1766510009765625, -0.161346435546875, -0.1460418701171875, -0.1307373046875, -0.1154327392578125, -0.100128173828125, -0.0848236083984375, -0.06951904296875, -0.0542144775390625, -0.038909912109375, -0.0236053466796875, -0.00830078125, 0.0070037841796875, 0.022308349609375, 0.0376129150390625, 0.05291748046875, 0.0682220458984375, 0.083526611328125, 0.0988311767578125, 0.1141357421875, 0.1294403076171875, 0.144744873046875, 0.1600494384765625, 0.17535400390625, 0.1906585693359375, 0.205963134765625, 0.2212677001953125, 0.236572265625, 0.2518768310546875, 0.267181396484375, 0.2824859619140625, 0.29779052734375, 0.3130950927734375, 0.328399658203125, 0.3437042236328125, 0.3590087890625, 0.3743133544921875, 0.389617919921875, 0.4049224853515625, 0.42022705078125, 0.4355316162109375, 0.450836181640625, 0.4661407470703125, 0.4814453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 7.0, 12.0, 12.0, 19.0, 33.0, 27.0, 41.0, 90.0, 118.0, 184.0, 403.0, 1054.0, 3671.0, 24909.0, 779110.0, 222613.0, 12389.0, 2286.0, 707.0, 352.0, 160.0, 109.0, 78.0, 41.0, 34.0, 18.0, 15.0, 11.0, 13.0, 7.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28369140625, -0.2744941711425781, -0.26529693603515625, -0.2560997009277344, -0.2469024658203125, -0.23770523071289062, -0.22850799560546875, -0.21931076049804688, -0.210113525390625, -0.20091629028320312, -0.19171905517578125, -0.18252182006835938, -0.1733245849609375, -0.16412734985351562, -0.15493011474609375, -0.14573287963867188, -0.13653564453125, -0.12733840942382812, -0.11814117431640625, -0.10894393920898438, -0.0997467041015625, -0.09054946899414062, -0.08135223388671875, -0.07215499877929688, -0.062957763671875, -0.053760528564453125, -0.04456329345703125, -0.035366058349609375, -0.0261688232421875, -0.016971588134765625, -0.00777435302734375, 0.001422882080078125, 0.0106201171875, 0.019817352294921875, 0.02901458740234375, 0.038211822509765625, 0.0474090576171875, 0.056606292724609375, 0.06580352783203125, 0.07500076293945312, 0.084197998046875, 0.09339523315429688, 0.10259246826171875, 0.11178970336914062, 0.1209869384765625, 0.13018417358398438, 0.13938140869140625, 0.14857864379882812, 0.15777587890625, 0.16697311401367188, 0.17617034912109375, 0.18536758422851562, 0.1945648193359375, 0.20376205444335938, 0.21295928955078125, 0.22215652465820312, 0.231353759765625, 0.24055099487304688, 0.24974822998046875, 0.2589454650878906, 0.2681427001953125, 0.2773399353027344, 0.28653717041015625, 0.2957344055175781, 0.304931640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 10.0, 15.0, 24.0, 25.0, 29.0, 54.0, 64.0, 103.0, 117.0, 115.0, 108.0, 98.0, 61.0, 32.0, 35.0, 16.0, 17.0, 13.0, 9.0, 5.0, 7.0, 5.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4543533325195312e-05, -1.4077872037887573e-05, -1.3612210750579834e-05, -1.3146549463272095e-05, -1.2680888175964355e-05, -1.2215226888656616e-05, -1.1749565601348877e-05, -1.1283904314041138e-05, -1.0818243026733398e-05, -1.035258173942566e-05, -9.88692045211792e-06, -9.42125916481018e-06, -8.955597877502441e-06, -8.489936590194702e-06, -8.024275302886963e-06, -7.558614015579224e-06, -7.092952728271484e-06, -6.627291440963745e-06, -6.161630153656006e-06, -5.695968866348267e-06, -5.230307579040527e-06, -4.764646291732788e-06, -4.298985004425049e-06, -3.8333237171173096e-06, -3.3676624298095703e-06, -2.902001142501831e-06, -2.436339855194092e-06, -1.9706785678863525e-06, -1.5050172805786133e-06, -1.039355993270874e-06, -5.736947059631348e-07, -1.0803341865539551e-07, 3.5762786865234375e-07, 8.23289155960083e-07, 1.2889504432678223e-06, 1.7546117305755615e-06, 2.2202730178833008e-06, 2.68593430519104e-06, 3.1515955924987793e-06, 3.6172568798065186e-06, 4.082918167114258e-06, 4.548579454421997e-06, 5.014240741729736e-06, 5.479902029037476e-06, 5.945563316345215e-06, 6.411224603652954e-06, 6.876885890960693e-06, 7.342547178268433e-06, 7.808208465576172e-06, 8.273869752883911e-06, 8.73953104019165e-06, 9.20519232749939e-06, 9.670853614807129e-06, 1.0136514902114868e-05, 1.0602176189422607e-05, 1.1067837476730347e-05, 1.1533498764038086e-05, 1.1999160051345825e-05, 1.2464821338653564e-05, 1.2930482625961304e-05, 1.3396143913269043e-05, 1.3861805200576782e-05, 1.4327466487884521e-05, 1.479312777519226e-05, 1.52587890625e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 8.0, 16.0, 19.0, 43.0, 64.0, 79.0, 163.0, 359.0, 991.0, 5172.0, 133943.0, 894274.0, 10755.0, 1640.0, 506.0, 194.0, 106.0, 47.0, 51.0, 33.0, 15.0, 12.0, 5.0, 8.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.5057601928710938, -0.4900360107421875, -0.47431182861328125, -0.458587646484375, -0.44286346435546875, -0.4271392822265625, -0.41141510009765625, -0.39569091796875, -0.37996673583984375, -0.3642425537109375, -0.34851837158203125, -0.332794189453125, -0.31707000732421875, -0.3013458251953125, -0.28562164306640625, -0.2698974609375, -0.25417327880859375, -0.2384490966796875, -0.22272491455078125, -0.207000732421875, -0.19127655029296875, -0.1755523681640625, -0.15982818603515625, -0.14410400390625, -0.12837982177734375, -0.1126556396484375, -0.09693145751953125, -0.081207275390625, -0.06548309326171875, -0.0497589111328125, -0.03403472900390625, -0.018310546875, -0.00258636474609375, 0.0131378173828125, 0.02886199951171875, 0.044586181640625, 0.06031036376953125, 0.0760345458984375, 0.09175872802734375, 0.10748291015625, 0.12320709228515625, 0.1389312744140625, 0.15465545654296875, 0.170379638671875, 0.18610382080078125, 0.2018280029296875, 0.21755218505859375, 0.2332763671875, 0.24900054931640625, 0.2647247314453125, 0.28044891357421875, 0.296173095703125, 0.31189727783203125, 0.3276214599609375, 0.34334564208984375, 0.35906982421875, 0.37479400634765625, 0.3905181884765625, 0.40624237060546875, 0.421966552734375, 0.43769073486328125, 0.4534149169921875, 0.46913909912109375, 0.48486328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 7.0, 8.0, 3.0, 5.0, 9.0, 13.0, 17.0, 14.0, 22.0, 27.0, 40.0, 56.0, 89.0, 107.0, 107.0, 111.0, 87.0, 70.0, 58.0, 29.0, 18.0, 19.0, 23.0, 13.0, 9.0, 7.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1275634765625, -0.12325859069824219, -0.11895370483398438, -0.11464881896972656, -0.11034393310546875, -0.10603904724121094, -0.10173416137695312, -0.09742927551269531, -0.0931243896484375, -0.08881950378417969, -0.08451461791992188, -0.08020973205566406, -0.07590484619140625, -0.07159996032714844, -0.06729507446289062, -0.06299018859863281, -0.058685302734375, -0.05438041687011719, -0.050075531005859375, -0.04577064514160156, -0.04146575927734375, -0.03716087341308594, -0.032855987548828125, -0.028551101684570312, -0.0242462158203125, -0.019941329956054688, -0.015636444091796875, -0.011331558227539062, -0.00702667236328125, -0.0027217864990234375, 0.001583099365234375, 0.0058879852294921875, 0.01019287109375, 0.014497756958007812, 0.018802642822265625, 0.023107528686523438, 0.02741241455078125, 0.03171730041503906, 0.036022186279296875, 0.04032707214355469, 0.0446319580078125, 0.04893684387207031, 0.053241729736328125, 0.05754661560058594, 0.06185150146484375, 0.06615638732910156, 0.07046127319335938, 0.07476615905761719, 0.079071044921875, 0.08337593078613281, 0.08768081665039062, 0.09198570251464844, 0.09629058837890625, 0.10059547424316406, 0.10490036010742188, 0.10920524597167969, 0.1135101318359375, 0.11781501770019531, 0.12211990356445312, 0.12642478942871094, 0.13072967529296875, 0.13503456115722656, 0.13933944702148438, 0.1436443328857422, 0.14794921875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 11.0, 767.0, 237.0, 5.0], "bins": [-83.30458068847656, -81.95889282226562, -80.61321258544922, -79.26752471923828, -77.92184448242188, -76.57615661621094, -75.23047637939453, -73.8847885131836, -72.53910827636719, -71.19342041015625, -69.84774017333984, -68.5020523071289, -67.1563720703125, -65.81068420410156, -64.46500396728516, -63.11931610107422, -61.77362823486328, -60.42794418334961, -59.08226013183594, -57.736576080322266, -56.390892028808594, -55.045204162597656, -53.69952392578125, -52.35383605957031, -51.008155822753906, -49.662471771240234, -48.31678771972656, -46.97110366821289, -45.62541961669922, -44.27973175048828, -42.934051513671875, -41.58836364746094, -40.24268341064453, -38.89699935913086, -37.55131530761719, -36.205631256103516, -34.859947204589844, -33.514259338378906, -32.1685791015625, -30.822891235351562, -29.47720718383789, -28.13152313232422, -26.785839080810547, -25.440155029296875, -24.09446907043457, -22.7487850189209, -21.403100967407227, -20.057415008544922, -18.711732864379883, -17.36604881286621, -16.02036476135254, -14.67467975616455, -13.328994750976562, -11.98331069946289, -10.637626647949219, -9.29194164276123, -7.946257591247559, -6.6005730628967285, -5.254888534545898, -3.9092044830322266, -2.5635199546813965, -1.2178354263305664, 0.12784862518310547, 1.4735336303710938, 2.8192179203033447]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 13.0, 18.0, 21.0, 45.0, 53.0, 64.0, 68.0, 86.0, 77.0, 84.0, 75.0, 80.0, 77.0, 70.0, 55.0, 30.0, 26.0, 15.0, 8.0, 11.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.881531715393066, -8.656502723693848, -8.431473731994629, -8.20644474029541, -7.981415748596191, -7.756386756896973, -7.531358242034912, -7.306329250335693, -7.081300258636475, -6.856271266937256, -6.631242275238037, -6.406213283538818, -6.181184768676758, -5.956155776977539, -5.73112678527832, -5.506097793579102, -5.281068801879883, -5.056039810180664, -4.831010818481445, -4.605981826782227, -4.380952835083008, -4.155923843383789, -3.9308953285217285, -3.7058663368225098, -3.480837345123291, -3.2558083534240723, -3.0307793617248535, -2.805750608444214, -2.580721616744995, -2.3556926250457764, -2.1306638717651367, -1.905634880065918, -1.6806058883666992, -1.4555768966674805, -1.2305480241775513, -1.005519151687622, -0.7804901599884033, -0.5554611682891846, -0.33043229579925537, -0.10540342330932617, 0.11962556838989258, 0.34465450048446655, 0.5696834325790405, 0.7947123646736145, 1.0197412967681885, 1.2447702884674072, 1.4697991609573364, 1.6948280334472656, 1.9198570251464844, 2.144886016845703, 2.369915008544922, 2.5949437618255615, 2.8199727535247803, 3.045001745223999, 3.2700304985046387, 3.4950594902038574, 3.720088481903076, 3.945117473602295, 4.170146465301514, 4.395175457000732, 4.620203971862793, 4.845232963562012, 5.0702619552612305, 5.295290946960449, 5.520319938659668]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 13.0, 25.0, 35.0, 57.0, 153.0, 377.0, 3446.0, 4187331.0, 2425.0, 300.0, 72.0, 21.0, 11.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.375, -17.9520263671875, -17.529052734375, -17.1060791015625, -16.68310546875, -16.2601318359375, -15.837158203125, -15.4141845703125, -14.9912109375, -14.5682373046875, -14.145263671875, -13.7222900390625, -13.29931640625, -12.8763427734375, -12.453369140625, -12.0303955078125, -11.607421875, -11.1844482421875, -10.761474609375, -10.3385009765625, -9.91552734375, -9.4925537109375, -9.069580078125, -8.6466064453125, -8.2236328125, -7.8006591796875, -7.377685546875, -6.9547119140625, -6.53173828125, -6.1087646484375, -5.685791015625, -5.2628173828125, -4.83984375, -4.4168701171875, -3.993896484375, -3.5709228515625, -3.14794921875, -2.7249755859375, -2.302001953125, -1.8790283203125, -1.4560546875, -1.0330810546875, -0.610107421875, -0.1871337890625, 0.23583984375, 0.6588134765625, 1.081787109375, 1.5047607421875, 1.927734375, 2.3507080078125, 2.773681640625, 3.1966552734375, 3.61962890625, 4.0426025390625, 4.465576171875, 4.8885498046875, 5.3115234375, 5.7344970703125, 6.157470703125, 6.5804443359375, 7.00341796875, 7.4263916015625, 7.849365234375, 8.2723388671875, 8.6953125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 15.0, 33.0, 227.0, 477.0, 176.0, 35.0, 13.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72998046875, -0.713165283203125, -0.69635009765625, -0.679534912109375, -0.6627197265625, -0.645904541015625, -0.62908935546875, -0.612274169921875, -0.595458984375, -0.578643798828125, -0.56182861328125, -0.545013427734375, -0.5281982421875, -0.511383056640625, -0.49456787109375, -0.477752685546875, -0.4609375, -0.444122314453125, -0.42730712890625, -0.410491943359375, -0.3936767578125, -0.376861572265625, -0.36004638671875, -0.343231201171875, -0.326416015625, -0.309600830078125, -0.29278564453125, -0.275970458984375, -0.2591552734375, -0.242340087890625, -0.22552490234375, -0.208709716796875, -0.19189453125, -0.175079345703125, -0.15826416015625, -0.141448974609375, -0.1246337890625, -0.107818603515625, -0.09100341796875, -0.074188232421875, -0.057373046875, -0.040557861328125, -0.02374267578125, -0.006927490234375, 0.0098876953125, 0.026702880859375, 0.04351806640625, 0.060333251953125, 0.0771484375, 0.093963623046875, 0.11077880859375, 0.127593994140625, 0.1444091796875, 0.161224365234375, 0.17803955078125, 0.194854736328125, 0.211669921875, 0.228485107421875, 0.24530029296875, 0.262115478515625, 0.2789306640625, 0.295745849609375, 0.31256103515625, 0.329376220703125, 0.34619140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 9.0, 10.0, 6.0, 20.0, 10.0, 28.0, 45.0, 58.0, 139.0, 381.0, 1294.0, 4851.0, 30343.0, 4093876.0, 53959.0, 6754.0, 1572.0, 502.0, 174.0, 76.0, 50.0, 26.0, 19.0, 21.0, 12.0, 7.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.28515625, -2.2171630859375, -2.149169921875, -2.0811767578125, -2.01318359375, -1.9451904296875, -1.877197265625, -1.8092041015625, -1.7412109375, -1.6732177734375, -1.605224609375, -1.5372314453125, -1.46923828125, -1.4012451171875, -1.333251953125, -1.2652587890625, -1.197265625, -1.1292724609375, -1.061279296875, -0.9932861328125, -0.92529296875, -0.8572998046875, -0.789306640625, -0.7213134765625, -0.6533203125, -0.5853271484375, -0.517333984375, -0.4493408203125, -0.38134765625, -0.3133544921875, -0.245361328125, -0.1773681640625, -0.109375, -0.0413818359375, 0.026611328125, 0.0946044921875, 0.16259765625, 0.2305908203125, 0.298583984375, 0.3665771484375, 0.4345703125, 0.5025634765625, 0.570556640625, 0.6385498046875, 0.70654296875, 0.7745361328125, 0.842529296875, 0.9105224609375, 0.978515625, 1.0465087890625, 1.114501953125, 1.1824951171875, 1.25048828125, 1.3184814453125, 1.386474609375, 1.4544677734375, 1.5224609375, 1.5904541015625, 1.658447265625, 1.7264404296875, 1.79443359375, 1.8624267578125, 1.930419921875, 1.9984130859375, 2.06640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 4.0, 10.0, 6.0, 9.0, 7.0, 16.0, 12.0, 16.0, 30.0, 36.0, 58.0, 132.0, 2817.0, 594.0, 100.0, 62.0, 30.0, 25.0, 16.0, 12.0, 11.0, 11.0, 3.0, 8.0, 4.0, 6.0, 4.0, 5.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.299072265625, -0.2896919250488281, -0.28031158447265625, -0.2709312438964844, -0.2615509033203125, -0.2521705627441406, -0.24279022216796875, -0.23340988159179688, -0.224029541015625, -0.21464920043945312, -0.20526885986328125, -0.19588851928710938, -0.1865081787109375, -0.17712783813476562, -0.16774749755859375, -0.15836715698242188, -0.14898681640625, -0.13960647583007812, -0.13022613525390625, -0.12084579467773438, -0.1114654541015625, -0.10208511352539062, -0.09270477294921875, -0.08332443237304688, -0.073944091796875, -0.06456375122070312, -0.05518341064453125, -0.045803070068359375, -0.0364227294921875, -0.027042388916015625, -0.01766204833984375, -0.008281707763671875, 0.0010986328125, 0.010478973388671875, 0.01985931396484375, 0.029239654541015625, 0.0386199951171875, 0.048000335693359375, 0.05738067626953125, 0.06676101684570312, 0.076141357421875, 0.08552169799804688, 0.09490203857421875, 0.10428237915039062, 0.1136627197265625, 0.12304306030273438, 0.13242340087890625, 0.14180374145507812, 0.15118408203125, 0.16056442260742188, 0.16994476318359375, 0.17932510375976562, 0.1887054443359375, 0.19808578491210938, 0.20746612548828125, 0.21684646606445312, 0.226226806640625, 0.23560714721679688, 0.24498748779296875, 0.2543678283691406, 0.2637481689453125, 0.2731285095214844, 0.28250885009765625, 0.2918891906738281, 0.30126953125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 51.0, 963.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9768232107162476, -0.5497756600379944, -0.12272810935974121, 0.30431950092315674, 0.7313669919967651, 1.1584144830703735, 1.585462212562561, 2.012509822845459, 2.4395570755004883, 2.8666045665740967, 3.293652057647705, 3.7206997871398926, 4.147747039794922, 4.574794769287109, 5.001842498779297, 5.428890228271484, 5.855937480926514, 6.282985210418701, 6.7100324630737305, 7.137080192565918, 7.5641279220581055, 7.991175174713135, 8.418222427368164, 8.845270156860352, 9.272317886352539, 9.699365615844727, 10.126413345336914, 10.553461074829102, 10.980507850646973, 11.40755558013916, 11.834603309631348, 12.261651039123535, 12.688697814941406, 13.115745544433594, 13.542793273925781, 13.969841003417969, 14.39688777923584, 14.823935508728027, 15.250983238220215, 15.678030967712402, 16.105077743530273, 16.53212547302246, 16.95917320251465, 17.386220932006836, 17.813268661499023, 18.240314483642578, 18.667362213134766, 19.094409942626953, 19.52145767211914, 19.948505401611328, 20.375553131103516, 20.802600860595703, 21.22964859008789, 21.656696319580078, 22.083744049072266, 22.51078987121582, 22.93783950805664, 23.364887237548828, 23.791934967041016, 24.218982696533203, 24.64603042602539, 25.073078155517578, 25.500125885009766, 25.92717170715332, 26.354219436645508]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 11.0, 21.0, 54.0, 68.0, 107.0, 141.0, 123.0, 134.0, 118.0, 81.0, 47.0, 44.0, 32.0, 5.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.183340072631836, -2.110987901687622, -2.038635730743408, -1.9662833213806152, -1.8939311504364014, -1.8215789794921875, -1.749226689338684, -1.6768743991851807, -1.6045222282409668, -1.532170057296753, -1.4598177671432495, -1.387465476989746, -1.3151133060455322, -1.2427611351013184, -1.170408844947815, -1.0980565547943115, -1.0257043838500977, -0.953352153301239, -0.8809999227523804, -0.8086476922035217, -0.7362954616546631, -0.6639432311058044, -0.5915910005569458, -0.5192387700080872, -0.4468865394592285, -0.3745343089103699, -0.30218207836151123, -0.2298298478126526, -0.15747761726379395, -0.0851253867149353, -0.01277315616607666, 0.05957907438278198, 0.13193154335021973, 0.20428377389907837, 0.276636004447937, 0.34898823499679565, 0.4213404655456543, 0.49369269609451294, 0.5660449266433716, 0.6383971571922302, 0.7107493877410889, 0.7831016182899475, 0.8554538488388062, 0.9278060793876648, 1.0001583099365234, 1.0725104808807373, 1.1448627710342407, 1.2172150611877441, 1.289567232131958, 1.3619194030761719, 1.4342716932296753, 1.5066239833831787, 1.5789761543273926, 1.6513283252716064, 1.7236806154251099, 1.7960329055786133, 1.8683850765228271, 1.940737247467041, 2.013089656829834, 2.085441827774048, 2.1577939987182617, 2.2301461696624756, 2.3024983406066895, 2.3748507499694824, 2.4472029209136963]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 2.0, 4.0, 8.0, 7.0, 9.0, 8.0, 16.0, 20.0, 30.0, 54.0, 45.0, 79.0, 117.0, 194.0, 353.0, 568.0, 1379.0, 3836.0, 29829.0, 989515.0, 16875.0, 3028.0, 1131.0, 565.0, 330.0, 172.0, 107.0, 86.0, 53.0, 31.0, 28.0, 20.0, 12.0, 8.0, 8.0, 4.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.166015625, -3.071258544921875, -2.97650146484375, -2.881744384765625, -2.7869873046875, -2.692230224609375, -2.59747314453125, -2.502716064453125, -2.407958984375, -2.313201904296875, -2.21844482421875, -2.123687744140625, -2.0289306640625, -1.934173583984375, -1.83941650390625, -1.744659423828125, -1.64990234375, -1.555145263671875, -1.46038818359375, -1.365631103515625, -1.2708740234375, -1.176116943359375, -1.08135986328125, -0.986602783203125, -0.891845703125, -0.797088623046875, -0.70233154296875, -0.607574462890625, -0.5128173828125, -0.418060302734375, -0.32330322265625, -0.228546142578125, -0.1337890625, -0.039031982421875, 0.05572509765625, 0.150482177734375, 0.2452392578125, 0.339996337890625, 0.43475341796875, 0.529510498046875, 0.624267578125, 0.719024658203125, 0.81378173828125, 0.908538818359375, 1.0032958984375, 1.098052978515625, 1.19281005859375, 1.287567138671875, 1.38232421875, 1.477081298828125, 1.57183837890625, 1.666595458984375, 1.7613525390625, 1.856109619140625, 1.95086669921875, 2.045623779296875, 2.140380859375, 2.235137939453125, 2.32989501953125, 2.424652099609375, 2.5194091796875, 2.614166259765625, 2.70892333984375, 2.803680419921875, 2.8984375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 11.0, 16.0, 147.0, 447.0, 293.0, 47.0, 15.0, 9.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69189453125, -0.6756973266601562, -0.6595001220703125, -0.6433029174804688, -0.627105712890625, -0.6109085083007812, -0.5947113037109375, -0.5785140991210938, -0.56231689453125, -0.5461196899414062, -0.5299224853515625, -0.5137252807617188, -0.497528076171875, -0.48133087158203125, -0.4651336669921875, -0.44893646240234375, -0.4327392578125, -0.41654205322265625, -0.4003448486328125, -0.38414764404296875, -0.367950439453125, -0.35175323486328125, -0.3355560302734375, -0.31935882568359375, -0.30316162109375, -0.28696441650390625, -0.2707672119140625, -0.25457000732421875, -0.238372802734375, -0.22217559814453125, -0.2059783935546875, -0.18978118896484375, -0.173583984375, -0.15738677978515625, -0.1411895751953125, -0.12499237060546875, -0.108795166015625, -0.09259796142578125, -0.0764007568359375, -0.06020355224609375, -0.04400634765625, -0.02780914306640625, -0.0116119384765625, 0.00458526611328125, 0.020782470703125, 0.03697967529296875, 0.0531768798828125, 0.06937408447265625, 0.0855712890625, 0.10176849365234375, 0.1179656982421875, 0.13416290283203125, 0.150360107421875, 0.16655731201171875, 0.1827545166015625, 0.19895172119140625, 0.21514892578125, 0.23134613037109375, 0.2475433349609375, 0.26374053955078125, 0.279937744140625, 0.29613494873046875, 0.3123321533203125, 0.32852935791015625, 0.3447265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 7.0, 5.0, 7.0, 11.0, 18.0, 27.0, 29.0, 45.0, 39.0, 74.0, 127.0, 206.0, 463.0, 1145.0, 6883.0, 224796.0, 798741.0, 13041.0, 1616.0, 559.0, 268.0, 139.0, 77.0, 46.0, 50.0, 26.0, 22.0, 15.0, 19.0, 14.0, 9.0, 7.0, 5.0, 6.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69140625, -2.618927001953125, -2.54644775390625, -2.473968505859375, -2.4014892578125, -2.329010009765625, -2.25653076171875, -2.184051513671875, -2.111572265625, -2.039093017578125, -1.96661376953125, -1.894134521484375, -1.8216552734375, -1.749176025390625, -1.67669677734375, -1.604217529296875, -1.53173828125, -1.459259033203125, -1.38677978515625, -1.314300537109375, -1.2418212890625, -1.169342041015625, -1.09686279296875, -1.024383544921875, -0.951904296875, -0.879425048828125, -0.80694580078125, -0.734466552734375, -0.6619873046875, -0.589508056640625, -0.51702880859375, -0.444549560546875, -0.3720703125, -0.299591064453125, -0.22711181640625, -0.154632568359375, -0.0821533203125, -0.009674072265625, 0.06280517578125, 0.135284423828125, 0.207763671875, 0.280242919921875, 0.35272216796875, 0.425201416015625, 0.4976806640625, 0.570159912109375, 0.64263916015625, 0.715118408203125, 0.78759765625, 0.860076904296875, 0.93255615234375, 1.005035400390625, 1.0775146484375, 1.149993896484375, 1.22247314453125, 1.294952392578125, 1.367431640625, 1.439910888671875, 1.51239013671875, 1.584869384765625, 1.6573486328125, 1.729827880859375, 1.80230712890625, 1.874786376953125, 1.947265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 7.0, 5.0, 14.0, 9.0, 17.0, 17.0, 20.0, 24.0, 26.0, 33.0, 43.0, 49.0, 44.0, 49.0, 58.0, 46.0, 48.0, 52.0, 52.0, 66.0, 50.0, 46.0, 33.0, 30.0, 31.0, 31.0, 29.0, 17.0, 14.0, 10.0, 7.0, 5.0, 6.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.634765625, -0.6110763549804688, -0.5873870849609375, -0.5636978149414062, -0.540008544921875, -0.5163192749023438, -0.4926300048828125, -0.46894073486328125, -0.44525146484375, -0.42156219482421875, -0.3978729248046875, -0.37418365478515625, -0.350494384765625, -0.32680511474609375, -0.3031158447265625, -0.27942657470703125, -0.2557373046875, -0.23204803466796875, -0.2083587646484375, -0.18466949462890625, -0.160980224609375, -0.13729095458984375, -0.1136016845703125, -0.08991241455078125, -0.06622314453125, -0.04253387451171875, -0.0188446044921875, 0.00484466552734375, 0.028533935546875, 0.05222320556640625, 0.0759124755859375, 0.09960174560546875, 0.123291015625, 0.14698028564453125, 0.1706695556640625, 0.19435882568359375, 0.218048095703125, 0.24173736572265625, 0.2654266357421875, 0.28911590576171875, 0.31280517578125, 0.33649444580078125, 0.3601837158203125, 0.38387298583984375, 0.407562255859375, 0.43125152587890625, 0.4549407958984375, 0.47863006591796875, 0.5023193359375, 0.5260086059570312, 0.5496978759765625, 0.5733871459960938, 0.597076416015625, 0.6207656860351562, 0.6444549560546875, 0.6681442260742188, 0.69183349609375, 0.7155227661132812, 0.7392120361328125, 0.7629013061523438, 0.786590576171875, 0.8102798461914062, 0.8339691162109375, 0.8576583862304688, 0.88134765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 8.0, 6.0, 4.0, 8.0, 14.0, 27.0, 31.0, 60.0, 101.0, 205.0, 560.0, 2577.0, 53870.0, 974102.0, 14871.0, 1363.0, 366.0, 159.0, 95.0, 39.0, 32.0, 16.0, 11.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.67236328125, -0.6533355712890625, -0.634307861328125, -0.6152801513671875, -0.59625244140625, -0.5772247314453125, -0.558197021484375, -0.5391693115234375, -0.5201416015625, -0.5011138916015625, -0.482086181640625, -0.4630584716796875, -0.44403076171875, -0.4250030517578125, -0.405975341796875, -0.3869476318359375, -0.367919921875, -0.3488922119140625, -0.329864501953125, -0.3108367919921875, -0.29180908203125, -0.2727813720703125, -0.253753662109375, -0.2347259521484375, -0.2156982421875, -0.1966705322265625, -0.177642822265625, -0.1586151123046875, -0.13958740234375, -0.1205596923828125, -0.101531982421875, -0.0825042724609375, -0.0634765625, -0.0444488525390625, -0.025421142578125, -0.0063934326171875, 0.01263427734375, 0.0316619873046875, 0.050689697265625, 0.0697174072265625, 0.0887451171875, 0.1077728271484375, 0.126800537109375, 0.1458282470703125, 0.16485595703125, 0.1838836669921875, 0.202911376953125, 0.2219390869140625, 0.240966796875, 0.2599945068359375, 0.279022216796875, 0.2980499267578125, 0.31707763671875, 0.3361053466796875, 0.355133056640625, 0.3741607666015625, 0.3931884765625, 0.4122161865234375, 0.431243896484375, 0.4502716064453125, 0.46929931640625, 0.4883270263671875, 0.507354736328125, 0.5263824462890625, 0.54541015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 10.0, 12.0, 19.0, 20.0, 33.0, 59.0, 129.0, 165.0, 141.0, 155.0, 94.0, 61.0, 35.0, 26.0, 12.0, 10.0, 5.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.378225326538086e-05, -2.3089349269866943e-05, -2.2396445274353027e-05, -2.170354127883911e-05, -2.1010637283325195e-05, -2.031773328781128e-05, -1.9624829292297363e-05, -1.8931925296783447e-05, -1.823902130126953e-05, -1.7546117305755615e-05, -1.68532133102417e-05, -1.6160309314727783e-05, -1.5467405319213867e-05, -1.4774501323699951e-05, -1.4081597328186035e-05, -1.3388693332672119e-05, -1.2695789337158203e-05, -1.2002885341644287e-05, -1.1309981346130371e-05, -1.0617077350616455e-05, -9.924173355102539e-06, -9.231269359588623e-06, -8.538365364074707e-06, -7.845461368560791e-06, -7.152557373046875e-06, -6.459653377532959e-06, -5.766749382019043e-06, -5.073845386505127e-06, -4.380941390991211e-06, -3.688037395477295e-06, -2.995133399963379e-06, -2.302229404449463e-06, -1.6093254089355469e-06, -9.164214134216309e-07, -2.2351741790771484e-07, 4.6938657760620117e-07, 1.1622905731201172e-06, 1.8551945686340332e-06, 2.5480985641479492e-06, 3.2410025596618652e-06, 3.933906555175781e-06, 4.626810550689697e-06, 5.319714546203613e-06, 6.012618541717529e-06, 6.705522537231445e-06, 7.398426532745361e-06, 8.091330528259277e-06, 8.784234523773193e-06, 9.47713851928711e-06, 1.0170042514801025e-05, 1.0862946510314941e-05, 1.1555850505828857e-05, 1.2248754501342773e-05, 1.294165849685669e-05, 1.3634562492370605e-05, 1.4327466487884521e-05, 1.5020370483398438e-05, 1.5713274478912354e-05, 1.640617847442627e-05, 1.7099082469940186e-05, 1.77919864654541e-05, 1.8484890460968018e-05, 1.9177794456481934e-05, 1.987069845199585e-05, 2.0563602447509766e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 11.0, 10.0, 15.0, 12.0, 25.0, 42.0, 61.0, 117.0, 200.0, 441.0, 1872.0, 17194.0, 952340.0, 70721.0, 3963.0, 855.0, 295.0, 138.0, 86.0, 38.0, 31.0, 22.0, 14.0, 6.0, 6.0, 7.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.6865234375, -0.6687812805175781, -0.6510391235351562, -0.6332969665527344, -0.6155548095703125, -0.5978126525878906, -0.5800704956054688, -0.5623283386230469, -0.544586181640625, -0.5268440246582031, -0.5091018676757812, -0.4913597106933594, -0.4736175537109375, -0.4558753967285156, -0.43813323974609375, -0.4203910827636719, -0.40264892578125, -0.3849067687988281, -0.36716461181640625, -0.3494224548339844, -0.3316802978515625, -0.3139381408691406, -0.29619598388671875, -0.2784538269042969, -0.260711669921875, -0.24296951293945312, -0.22522735595703125, -0.20748519897460938, -0.1897430419921875, -0.17200088500976562, -0.15425872802734375, -0.13651657104492188, -0.1187744140625, -0.10103225708007812, -0.08329010009765625, -0.06554794311523438, -0.0478057861328125, -0.030063629150390625, -0.01232147216796875, 0.005420684814453125, 0.023162841796875, 0.040904998779296875, 0.05864715576171875, 0.07638931274414062, 0.0941314697265625, 0.11187362670898438, 0.12961578369140625, 0.14735794067382812, 0.16510009765625, 0.18284225463867188, 0.20058441162109375, 0.21832656860351562, 0.2360687255859375, 0.2538108825683594, 0.27155303955078125, 0.2892951965332031, 0.307037353515625, 0.3247795104980469, 0.34252166748046875, 0.3602638244628906, 0.3780059814453125, 0.3957481384277344, 0.41349029541015625, 0.4312324523925781, 0.448974609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 9.0, 7.0, 10.0, 7.0, 18.0, 29.0, 35.0, 51.0, 70.0, 82.0, 103.0, 127.0, 120.0, 79.0, 75.0, 38.0, 34.0, 26.0, 18.0, 6.0, 13.0, 10.0, 8.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1480712890625, -0.14200782775878906, -0.13594436645507812, -0.1298809051513672, -0.12381744384765625, -0.11775398254394531, -0.11169052124023438, -0.10562705993652344, -0.0995635986328125, -0.09350013732910156, -0.08743667602539062, -0.08137321472167969, -0.07530975341796875, -0.06924629211425781, -0.06318283081054688, -0.05711936950683594, -0.051055908203125, -0.04499244689941406, -0.038928985595703125, -0.03286552429199219, -0.02680206298828125, -0.020738601684570312, -0.014675140380859375, -0.008611679077148438, -0.0025482177734375, 0.0035152435302734375, 0.009578704833984375, 0.015642166137695312, 0.02170562744140625, 0.027769088745117188, 0.033832550048828125, 0.03989601135253906, 0.04595947265625, 0.05202293395996094, 0.058086395263671875, 0.06414985656738281, 0.07021331787109375, 0.07627677917480469, 0.08234024047851562, 0.08840370178222656, 0.0944671630859375, 0.10053062438964844, 0.10659408569335938, 0.11265754699707031, 0.11872100830078125, 0.12478446960449219, 0.13084793090820312, 0.13691139221191406, 0.142974853515625, 0.14903831481933594, 0.15510177612304688, 0.1611652374267578, 0.16722869873046875, 0.1732921600341797, 0.17935562133789062, 0.18541908264160156, 0.1914825439453125, 0.19754600524902344, 0.20360946655273438, 0.2096729278564453, 0.21573638916015625, 0.2217998504638672, 0.22786331176757812, 0.23392677307128906, 0.239990234375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 20.0, 227.0, 716.0, 43.0, 5.0, 0.0, 1.0], "bins": [-41.116172790527344, -40.42205047607422, -39.72792434692383, -39.0338020324707, -38.33967590332031, -37.64555358886719, -36.95143127441406, -36.25730514526367, -35.56318283081055, -34.86906051635742, -34.17493438720703, -33.480812072753906, -32.786685943603516, -32.09256362915039, -31.398439407348633, -30.704315185546875, -30.010189056396484, -29.316064834594727, -28.62194061279297, -27.927818298339844, -27.233694076538086, -26.539569854736328, -25.84544563293457, -25.151321411132812, -24.457199096679688, -23.76307487487793, -23.068950653076172, -22.374828338623047, -21.68070411682129, -20.98657989501953, -20.292455673217773, -19.598331451416016, -18.904207229614258, -18.2100830078125, -17.515958786010742, -16.821834564208984, -16.12771224975586, -15.433588027954102, -14.739463806152344, -14.045339584350586, -13.351215362548828, -12.65709114074707, -11.962967872619629, -11.268843650817871, -10.574719429016113, -9.880596160888672, -9.186471939086914, -8.492347717285156, -7.798224449157715, -7.104100704193115, -6.409976482391357, -5.715852737426758, -5.021728515625, -4.3276047706604, -3.633481025695801, -2.939356803894043, -2.2452330589294434, -1.5511090755462646, -0.8569852113723755, -0.16286134719848633, 0.5312626361846924, 1.225386619567871, 1.9195103645324707, 2.6136345863342285, 3.307758331298828]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 11.0, 15.0, 25.0, 27.0, 24.0, 33.0, 36.0, 45.0, 49.0, 54.0, 61.0, 74.0, 69.0, 76.0, 60.0, 56.0, 52.0, 48.0, 31.0, 32.0, 29.0, 24.0, 19.0, 14.0, 6.0, 11.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.673714637756348, -4.497820854187012, -4.321927070617676, -4.14603328704834, -3.970139503479004, -3.794245719909668, -3.618351936340332, -3.442458152770996, -3.26656436920166, -3.090670585632324, -2.9147768020629883, -2.7388830184936523, -2.5629892349243164, -2.3870954513549805, -2.2112016677856445, -2.0353078842163086, -1.8594141006469727, -1.6835203170776367, -1.5076265335083008, -1.3317327499389648, -1.155838966369629, -0.979945182800293, -0.804051399230957, -0.6281576156616211, -0.45226383209228516, -0.2763700485229492, -0.10047626495361328, 0.07541751861572266, 0.2513113021850586, 0.42720508575439453, 0.6030988693237305, 0.7789926528930664, 0.9548859596252441, 1.13077974319458, 1.306673526763916, 1.482567310333252, 1.658461093902588, 1.8343548774719238, 2.0102486610412598, 2.1861424446105957, 2.3620362281799316, 2.5379300117492676, 2.7138237953186035, 2.8897175788879395, 3.0656113624572754, 3.2415051460266113, 3.4173989295959473, 3.593292713165283, 3.769186496734619, 3.945080280303955, 4.120974063873291, 4.296867847442627, 4.472761631011963, 4.648655414581299, 4.824549198150635, 5.000442981719971, 5.176336765289307, 5.352230548858643, 5.5281243324279785, 5.7040181159973145, 5.87991189956665, 6.055805683135986, 6.231699466705322, 6.407593250274658, 6.583487033843994]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 10.0, 16.0, 12.0, 23.0, 37.0, 106.0, 201.0, 956.0, 393109.0, 3798517.0, 962.0, 196.0, 65.0, 37.0, 10.0, 11.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.19921875, -7.031829833984375, -6.86444091796875, -6.697052001953125, -6.5296630859375, -6.362274169921875, -6.19488525390625, -6.027496337890625, -5.860107421875, -5.692718505859375, -5.52532958984375, -5.357940673828125, -5.1905517578125, -5.023162841796875, -4.85577392578125, -4.688385009765625, -4.52099609375, -4.353607177734375, -4.18621826171875, -4.018829345703125, -3.8514404296875, -3.684051513671875, -3.51666259765625, -3.349273681640625, -3.181884765625, -3.014495849609375, -2.84710693359375, -2.679718017578125, -2.5123291015625, -2.344940185546875, -2.17755126953125, -2.010162353515625, -1.8427734375, -1.675384521484375, -1.50799560546875, -1.340606689453125, -1.1732177734375, -1.005828857421875, -0.83843994140625, -0.671051025390625, -0.503662109375, -0.336273193359375, -0.16888427734375, -0.001495361328125, 0.1658935546875, 0.333282470703125, 0.50067138671875, 0.668060302734375, 0.83544921875, 1.002838134765625, 1.17022705078125, 1.337615966796875, 1.5050048828125, 1.672393798828125, 1.83978271484375, 2.007171630859375, 2.174560546875, 2.341949462890625, 2.50933837890625, 2.676727294921875, 2.8441162109375, 3.011505126953125, 3.17889404296875, 3.346282958984375, 3.513671875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 10.0, 17.0, 102.0, 263.0, 375.0, 163.0, 45.0, 12.0, 7.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.7054595947265625, -0.688751220703125, -0.6720428466796875, -0.65533447265625, -0.6386260986328125, -0.621917724609375, -0.6052093505859375, -0.5885009765625, -0.5717926025390625, -0.555084228515625, -0.5383758544921875, -0.52166748046875, -0.5049591064453125, -0.488250732421875, -0.4715423583984375, -0.454833984375, -0.4381256103515625, -0.421417236328125, -0.4047088623046875, -0.38800048828125, -0.3712921142578125, -0.354583740234375, -0.3378753662109375, -0.3211669921875, -0.3044586181640625, -0.287750244140625, -0.2710418701171875, -0.25433349609375, -0.2376251220703125, -0.220916748046875, -0.2042083740234375, -0.1875, -0.1707916259765625, -0.154083251953125, -0.1373748779296875, -0.12066650390625, -0.1039581298828125, -0.087249755859375, -0.0705413818359375, -0.0538330078125, -0.0371246337890625, -0.020416259765625, -0.0037078857421875, 0.01300048828125, 0.0297088623046875, 0.046417236328125, 0.0631256103515625, 0.079833984375, 0.0965423583984375, 0.113250732421875, 0.1299591064453125, 0.14666748046875, 0.1633758544921875, 0.180084228515625, 0.1967926025390625, 0.2135009765625, 0.2302093505859375, 0.246917724609375, 0.2636260986328125, 0.28033447265625, 0.2970428466796875, 0.313751220703125, 0.3304595947265625, 0.34716796875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 12.0, 11.0, 24.0, 51.0, 91.0, 204.0, 675.0, 2005.0, 8554.0, 195867.0, 3971307.0, 12140.0, 2263.0, 631.0, 206.0, 110.0, 45.0, 18.0, 15.0, 11.0, 6.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44140625, -1.3935394287109375, -1.345672607421875, -1.2978057861328125, -1.24993896484375, -1.2020721435546875, -1.154205322265625, -1.1063385009765625, -1.0584716796875, -1.0106048583984375, -0.962738037109375, -0.9148712158203125, -0.86700439453125, -0.8191375732421875, -0.771270751953125, -0.7234039306640625, -0.675537109375, -0.6276702880859375, -0.579803466796875, -0.5319366455078125, -0.48406982421875, -0.4362030029296875, -0.388336181640625, -0.3404693603515625, -0.2926025390625, -0.2447357177734375, -0.196868896484375, -0.1490020751953125, -0.10113525390625, -0.0532684326171875, -0.005401611328125, 0.0424652099609375, 0.09033203125, 0.1381988525390625, 0.186065673828125, 0.2339324951171875, 0.28179931640625, 0.3296661376953125, 0.377532958984375, 0.4253997802734375, 0.4732666015625, 0.5211334228515625, 0.569000244140625, 0.6168670654296875, 0.66473388671875, 0.7126007080078125, 0.760467529296875, 0.8083343505859375, 0.856201171875, 0.9040679931640625, 0.951934814453125, 0.9998016357421875, 1.04766845703125, 1.0955352783203125, 1.143402099609375, 1.1912689208984375, 1.2391357421875, 1.2870025634765625, 1.334869384765625, 1.3827362060546875, 1.43060302734375, 1.4784698486328125, 1.526336669921875, 1.5742034912109375, 1.6220703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 7.0, 6.0, 15.0, 18.0, 38.0, 50.0, 113.0, 1190.0, 2374.0, 114.0, 42.0, 23.0, 19.0, 10.0, 9.0, 2.0, 5.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33935546875, -0.3296661376953125, -0.319976806640625, -0.3102874755859375, -0.30059814453125, -0.2909088134765625, -0.281219482421875, -0.2715301513671875, -0.2618408203125, -0.2521514892578125, -0.242462158203125, -0.2327728271484375, -0.22308349609375, -0.2133941650390625, -0.203704833984375, -0.1940155029296875, -0.184326171875, -0.1746368408203125, -0.164947509765625, -0.1552581787109375, -0.14556884765625, -0.1358795166015625, -0.126190185546875, -0.1165008544921875, -0.1068115234375, -0.0971221923828125, -0.087432861328125, -0.0777435302734375, -0.06805419921875, -0.0583648681640625, -0.048675537109375, -0.0389862060546875, -0.029296875, -0.0196075439453125, -0.009918212890625, -0.0002288818359375, 0.00946044921875, 0.0191497802734375, 0.028839111328125, 0.0385284423828125, 0.0482177734375, 0.0579071044921875, 0.067596435546875, 0.0772857666015625, 0.08697509765625, 0.0966644287109375, 0.106353759765625, 0.1160430908203125, 0.125732421875, 0.1354217529296875, 0.145111083984375, 0.1548004150390625, 0.16448974609375, 0.1741790771484375, 0.183868408203125, 0.1935577392578125, 0.2032470703125, 0.2129364013671875, 0.222625732421875, 0.2323150634765625, 0.24200439453125, 0.2516937255859375, 0.261383056640625, 0.2710723876953125, 0.28076171875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 15.0, 60.0, 323.0, 477.0, 88.0, 27.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5450942516326904, -1.488369107246399, -1.4316439628601074, -1.374918818473816, -1.3181936740875244, -1.2614684104919434, -1.2047433853149414, -1.1480181217193604, -1.0912929773330688, -1.0345678329467773, -0.9778426885604858, -0.9211175441741943, -0.8643923401832581, -0.8076671957969666, -0.750942051410675, -0.6942168474197388, -0.637491762638092, -0.5807666182518005, -0.524041473865509, -0.46731629967689514, -0.41059112548828125, -0.35386598110198975, -0.29714083671569824, -0.24041566252708435, -0.18369051814079285, -0.12696535885334015, -0.07024020701646805, -0.013515055179595947, 0.04321010410785675, 0.09993526339530945, 0.15666040778160095, 0.21338558197021484, 0.27011072635650635, 0.32683587074279785, 0.38356104493141174, 0.44028618931770325, 0.49701136350631714, 0.5537365078926086, 0.6104616522789001, 0.6671868562698364, 0.7239120006561279, 0.7806371450424194, 0.8373622894287109, 0.8940874338150024, 0.9508126378059387, 1.007537841796875, 1.064262866973877, 1.120988130569458, 1.17771315574646, 1.2344383001327515, 1.291163444519043, 1.3478885889053345, 1.404613733291626, 1.461338996887207, 1.518064022064209, 1.57478928565979, 1.6315144300460815, 1.688239574432373, 1.7449647188186646, 1.801689863204956, 1.8584150075912476, 1.915140151977539, 1.9718654155731201, 2.028590440750122, 2.085315704345703]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 14.0, 16.0, 12.0, 23.0, 20.0, 45.0, 56.0, 57.0, 75.0, 74.0, 83.0, 92.0, 78.0, 69.0, 56.0, 55.0, 42.0, 43.0, 32.0, 13.0, 17.0, 8.0, 10.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8000990748405457, -0.7672092318534851, -0.7343193888664246, -0.701429545879364, -0.6685397028923035, -0.6356498599052429, -0.6027599573135376, -0.569870114326477, -0.5369802713394165, -0.504090428352356, -0.4712005853652954, -0.43831074237823486, -0.4054208993911743, -0.37253105640411377, -0.33964118361473083, -0.3067513406276703, -0.27386152744293213, -0.24097168445587158, -0.20808184146881104, -0.1751919835805893, -0.14230214059352875, -0.1094122976064682, -0.07652243971824646, -0.04363259673118591, -0.010742753744125366, 0.02214709296822548, 0.055036939680576324, 0.08792679011821747, 0.12081663310527802, 0.15370647609233856, 0.1865963339805603, 0.21948617696762085, 0.2523759603500366, 0.28526580333709717, 0.3181556463241577, 0.35104548931121826, 0.3839353322982788, 0.41682517528533936, 0.4497150480747223, 0.48260489106178284, 0.515494704246521, 0.5483845472335815, 0.5812743902206421, 0.6141642332077026, 0.6470540761947632, 0.6799439191818237, 0.7128337621688843, 0.7457236051559448, 0.7786135077476501, 0.8115033507347107, 0.8443931937217712, 0.8772830367088318, 0.9101728796958923, 0.9430627226829529, 0.9759526252746582, 1.0088424682617188, 1.0417323112487793, 1.0746221542358398, 1.1075119972229004, 1.140401840209961, 1.1732916831970215, 1.206181526184082, 1.2390713691711426, 1.2719612121582031, 1.3048510551452637]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 4.0, 9.0, 8.0, 18.0, 26.0, 26.0, 36.0, 59.0, 89.0, 124.0, 243.0, 419.0, 832.0, 1837.0, 6113.0, 201654.0, 822506.0, 10041.0, 2291.0, 966.0, 486.0, 268.0, 138.0, 84.0, 84.0, 44.0, 28.0, 34.0, 19.0, 8.0, 13.0, 10.0, 7.0, 5.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.6361541748046875, -1.577972412109375, -1.5197906494140625, -1.46160888671875, -1.4034271240234375, -1.345245361328125, -1.2870635986328125, -1.2288818359375, -1.1707000732421875, -1.112518310546875, -1.0543365478515625, -0.99615478515625, -0.9379730224609375, -0.879791259765625, -0.8216094970703125, -0.763427734375, -0.7052459716796875, -0.647064208984375, -0.5888824462890625, -0.53070068359375, -0.4725189208984375, -0.414337158203125, -0.3561553955078125, -0.2979736328125, -0.2397918701171875, -0.181610107421875, -0.1234283447265625, -0.06524658203125, -0.0070648193359375, 0.051116943359375, 0.1092987060546875, 0.16748046875, 0.2256622314453125, 0.283843994140625, 0.3420257568359375, 0.40020751953125, 0.4583892822265625, 0.516571044921875, 0.5747528076171875, 0.6329345703125, 0.6911163330078125, 0.749298095703125, 0.8074798583984375, 0.86566162109375, 0.9238433837890625, 0.982025146484375, 1.0402069091796875, 1.098388671875, 1.1565704345703125, 1.214752197265625, 1.2729339599609375, 1.33111572265625, 1.3892974853515625, 1.447479248046875, 1.5056610107421875, 1.5638427734375, 1.6220245361328125, 1.680206298828125, 1.7383880615234375, 1.79656982421875, 1.8547515869140625, 1.912933349609375, 1.9711151123046875, 2.029296875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 34.0, 162.0, 343.0, 302.0, 98.0, 25.0, 15.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70068359375, -0.684326171875, -0.66796875, -0.651611328125, -0.63525390625, -0.618896484375, -0.6025390625, -0.586181640625, -0.56982421875, -0.553466796875, -0.537109375, -0.520751953125, -0.50439453125, -0.488037109375, -0.4716796875, -0.455322265625, -0.43896484375, -0.422607421875, -0.40625, -0.389892578125, -0.37353515625, -0.357177734375, -0.3408203125, -0.324462890625, -0.30810546875, -0.291748046875, -0.275390625, -0.259033203125, -0.24267578125, -0.226318359375, -0.2099609375, -0.193603515625, -0.17724609375, -0.160888671875, -0.14453125, -0.128173828125, -0.11181640625, -0.095458984375, -0.0791015625, -0.062744140625, -0.04638671875, -0.030029296875, -0.013671875, 0.002685546875, 0.01904296875, 0.035400390625, 0.0517578125, 0.068115234375, 0.08447265625, 0.100830078125, 0.1171875, 0.133544921875, 0.14990234375, 0.166259765625, 0.1826171875, 0.198974609375, 0.21533203125, 0.231689453125, 0.248046875, 0.264404296875, 0.28076171875, 0.297119140625, 0.3134765625, 0.329833984375, 0.34619140625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 15.0, 15.0, 18.0, 18.0, 13.0, 45.0, 35.0, 42.0, 81.0, 126.0, 248.0, 499.0, 1552.0, 9899.0, 218602.0, 788827.0, 24418.0, 2538.0, 745.0, 321.0, 151.0, 97.0, 62.0, 36.0, 27.0, 15.0, 14.0, 17.0, 14.0, 9.0, 10.0, 9.0, 5.0, 8.0, 1.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5751953125, -1.5290985107421875, -1.483001708984375, -1.4369049072265625, -1.39080810546875, -1.3447113037109375, -1.298614501953125, -1.2525177001953125, -1.2064208984375, -1.1603240966796875, -1.114227294921875, -1.0681304931640625, -1.02203369140625, -0.9759368896484375, -0.929840087890625, -0.8837432861328125, -0.837646484375, -0.7915496826171875, -0.745452880859375, -0.6993560791015625, -0.65325927734375, -0.6071624755859375, -0.561065673828125, -0.5149688720703125, -0.4688720703125, -0.4227752685546875, -0.376678466796875, -0.3305816650390625, -0.28448486328125, -0.2383880615234375, -0.192291259765625, -0.1461944580078125, -0.10009765625, -0.0540008544921875, -0.007904052734375, 0.0381927490234375, 0.08428955078125, 0.1303863525390625, 0.176483154296875, 0.2225799560546875, 0.2686767578125, 0.3147735595703125, 0.360870361328125, 0.4069671630859375, 0.45306396484375, 0.4991607666015625, 0.545257568359375, 0.5913543701171875, 0.637451171875, 0.6835479736328125, 0.729644775390625, 0.7757415771484375, 0.82183837890625, 0.8679351806640625, 0.914031982421875, 0.9601287841796875, 1.0062255859375, 1.0523223876953125, 1.098419189453125, 1.1445159912109375, 1.19061279296875, 1.2367095947265625, 1.282806396484375, 1.3289031982421875, 1.375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 3.0, 11.0, 9.0, 6.0, 15.0, 16.0, 11.0, 15.0, 20.0, 27.0, 32.0, 39.0, 44.0, 34.0, 35.0, 53.0, 48.0, 49.0, 58.0, 61.0, 48.0, 45.0, 42.0, 43.0, 39.0, 26.0, 22.0, 31.0, 17.0, 20.0, 16.0, 17.0, 13.0, 12.0, 5.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62255859375, -0.601898193359375, -0.58123779296875, -0.560577392578125, -0.5399169921875, -0.519256591796875, -0.49859619140625, -0.477935791015625, -0.457275390625, -0.436614990234375, -0.41595458984375, -0.395294189453125, -0.3746337890625, -0.353973388671875, -0.33331298828125, -0.312652587890625, -0.2919921875, -0.271331787109375, -0.25067138671875, -0.230010986328125, -0.2093505859375, -0.188690185546875, -0.16802978515625, -0.147369384765625, -0.126708984375, -0.106048583984375, -0.08538818359375, -0.064727783203125, -0.0440673828125, -0.023406982421875, -0.00274658203125, 0.017913818359375, 0.03857421875, 0.059234619140625, 0.07989501953125, 0.100555419921875, 0.1212158203125, 0.141876220703125, 0.16253662109375, 0.183197021484375, 0.203857421875, 0.224517822265625, 0.24517822265625, 0.265838623046875, 0.2864990234375, 0.307159423828125, 0.32781982421875, 0.348480224609375, 0.369140625, 0.389801025390625, 0.41046142578125, 0.431121826171875, 0.4517822265625, 0.472442626953125, 0.49310302734375, 0.513763427734375, 0.534423828125, 0.555084228515625, 0.57574462890625, 0.596405029296875, 0.6170654296875, 0.637725830078125, 0.65838623046875, 0.679046630859375, 0.69970703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 9.0, 9.0, 11.0, 10.0, 27.0, 45.0, 78.0, 124.0, 240.0, 399.0, 1020.0, 2681.0, 9628.0, 70576.0, 821431.0, 123401.0, 13391.0, 3264.0, 1138.0, 472.0, 247.0, 123.0, 72.0, 50.0, 30.0, 25.0, 15.0, 15.0, 2.0, 6.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.157958984375, -0.15262222290039062, -0.14728546142578125, -0.14194869995117188, -0.1366119384765625, -0.13127517700195312, -0.12593841552734375, -0.12060165405273438, -0.115264892578125, -0.10992813110351562, -0.10459136962890625, -0.09925460815429688, -0.0939178466796875, -0.08858108520507812, -0.08324432373046875, -0.07790756225585938, -0.07257080078125, -0.06723403930664062, -0.06189727783203125, -0.056560516357421875, -0.0512237548828125, -0.045886993408203125, -0.04055023193359375, -0.035213470458984375, -0.029876708984375, -0.024539947509765625, -0.01920318603515625, -0.013866424560546875, -0.0085296630859375, -0.003192901611328125, 0.00214385986328125, 0.007480621337890625, 0.0128173828125, 0.018154144287109375, 0.02349090576171875, 0.028827667236328125, 0.0341644287109375, 0.039501190185546875, 0.04483795166015625, 0.050174713134765625, 0.055511474609375, 0.060848236083984375, 0.06618499755859375, 0.07152175903320312, 0.0768585205078125, 0.08219528198242188, 0.08753204345703125, 0.09286880493164062, 0.09820556640625, 0.10354232788085938, 0.10887908935546875, 0.11421585083007812, 0.1195526123046875, 0.12488937377929688, 0.13022613525390625, 0.13556289672851562, 0.140899658203125, 0.14623641967773438, 0.15157318115234375, 0.15690994262695312, 0.1622467041015625, 0.16758346557617188, 0.17292022705078125, 0.17825698852539062, 0.18359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 11.0, 20.0, 17.0, 33.0, 47.0, 78.0, 108.0, 133.0, 158.0, 139.0, 82.0, 64.0, 47.0, 32.0, 13.0, 8.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806020736694336e-05, -1.7463229596614838e-05, -1.6866251826286316e-05, -1.6269274055957794e-05, -1.5672296285629272e-05, -1.507531851530075e-05, -1.4478340744972229e-05, -1.3881362974643707e-05, -1.3284385204315186e-05, -1.2687407433986664e-05, -1.2090429663658142e-05, -1.149345189332962e-05, -1.0896474123001099e-05, -1.0299496352672577e-05, -9.702518582344055e-06, -9.105540812015533e-06, -8.508563041687012e-06, -7.91158527135849e-06, -7.314607501029968e-06, -6.7176297307014465e-06, -6.120651960372925e-06, -5.523674190044403e-06, -4.926696419715881e-06, -4.32971864938736e-06, -3.732740879058838e-06, -3.135763108730316e-06, -2.5387853384017944e-06, -1.9418075680732727e-06, -1.344829797744751e-06, -7.478520274162292e-07, -1.5087425708770752e-07, 4.461035132408142e-07, 1.043081283569336e-06, 1.6400590538978577e-06, 2.2370368242263794e-06, 2.834014594554901e-06, 3.430992364883423e-06, 4.027970135211945e-06, 4.624947905540466e-06, 5.221925675868988e-06, 5.81890344619751e-06, 6.4158812165260315e-06, 7.012858986854553e-06, 7.609836757183075e-06, 8.206814527511597e-06, 8.803792297840118e-06, 9.40077006816864e-06, 9.997747838497162e-06, 1.0594725608825684e-05, 1.1191703379154205e-05, 1.1788681149482727e-05, 1.2385658919811249e-05, 1.298263669013977e-05, 1.3579614460468292e-05, 1.4176592230796814e-05, 1.4773570001125336e-05, 1.5370547771453857e-05, 1.596752554178238e-05, 1.65645033121109e-05, 1.7161481082439423e-05, 1.7758458852767944e-05, 1.8355436623096466e-05, 1.8952414393424988e-05, 1.954939216375351e-05, 2.014636993408203e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 12.0, 13.0, 15.0, 19.0, 28.0, 58.0, 90.0, 215.0, 562.0, 2878.0, 49304.0, 972425.0, 20064.0, 2009.0, 465.0, 176.0, 80.0, 48.0, 34.0, 16.0, 9.0, 7.0, 5.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4345703125, -0.4215507507324219, -0.40853118896484375, -0.3955116271972656, -0.3824920654296875, -0.3694725036621094, -0.35645294189453125, -0.3434333801269531, -0.330413818359375, -0.3173942565917969, -0.30437469482421875, -0.2913551330566406, -0.2783355712890625, -0.2653160095214844, -0.25229644775390625, -0.23927688598632812, -0.22625732421875, -0.21323776245117188, -0.20021820068359375, -0.18719863891601562, -0.1741790771484375, -0.16115951538085938, -0.14813995361328125, -0.13512039184570312, -0.122100830078125, -0.10908126831054688, -0.09606170654296875, -0.08304214477539062, -0.0700225830078125, -0.057003021240234375, -0.04398345947265625, -0.030963897705078125, -0.0179443359375, -0.004924774169921875, 0.00809478759765625, 0.021114349365234375, 0.0341339111328125, 0.047153472900390625, 0.06017303466796875, 0.07319259643554688, 0.086212158203125, 0.09923171997070312, 0.11225128173828125, 0.12527084350585938, 0.1382904052734375, 0.15130996704101562, 0.16432952880859375, 0.17734909057617188, 0.19036865234375, 0.20338821411132812, 0.21640777587890625, 0.22942733764648438, 0.2424468994140625, 0.2554664611816406, 0.26848602294921875, 0.2815055847167969, 0.294525146484375, 0.3075447082519531, 0.32056427001953125, 0.3335838317871094, 0.3466033935546875, 0.3596229553222656, 0.37264251708984375, 0.3856620788574219, 0.398681640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 7.0, 6.0, 8.0, 24.0, 29.0, 31.0, 60.0, 57.0, 87.0, 97.0, 110.0, 104.0, 90.0, 78.0, 53.0, 40.0, 24.0, 25.0, 12.0, 11.0, 8.0, 8.0, 10.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1566162109375, -0.1513347625732422, -0.14605331420898438, -0.14077186584472656, -0.13549041748046875, -0.13020896911621094, -0.12492752075195312, -0.11964607238769531, -0.1143646240234375, -0.10908317565917969, -0.10380172729492188, -0.09852027893066406, -0.09323883056640625, -0.08795738220214844, -0.08267593383789062, -0.07739448547363281, -0.072113037109375, -0.06683158874511719, -0.061550140380859375, -0.05626869201660156, -0.05098724365234375, -0.04570579528808594, -0.040424346923828125, -0.03514289855957031, -0.0298614501953125, -0.024580001831054688, -0.019298553466796875, -0.014017105102539062, -0.00873565673828125, -0.0034542083740234375, 0.001827239990234375, 0.0071086883544921875, 0.01239013671875, 0.017671585083007812, 0.022953033447265625, 0.028234481811523438, 0.03351593017578125, 0.03879737854003906, 0.044078826904296875, 0.04936027526855469, 0.0546417236328125, 0.05992317199707031, 0.06520462036132812, 0.07048606872558594, 0.07576751708984375, 0.08104896545410156, 0.08633041381835938, 0.09161186218261719, 0.096893310546875, 0.10217475891113281, 0.10745620727539062, 0.11273765563964844, 0.11801910400390625, 0.12330055236816406, 0.12858200073242188, 0.1338634490966797, 0.1391448974609375, 0.1444263458251953, 0.14970779418945312, 0.15498924255371094, 0.16027069091796875, 0.16555213928222656, 0.17083358764648438, 0.1761150360107422, 0.181396484375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 20.0, 30.0, 73.0, 171.0, 334.0, 195.0, 78.0, 36.0, 26.0, 12.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.589051246643066, -5.455007553100586, -5.320964336395264, -5.186920642852783, -5.052877426147461, -4.9188337326049805, -4.784790515899658, -4.650746822357178, -4.5167036056518555, -4.382659912109375, -4.248616695404053, -4.114573001861572, -3.98052978515625, -3.8464863300323486, -3.7124428749084473, -3.578399181365967, -3.4443557262420654, -3.310312271118164, -3.1762688159942627, -3.0422253608703613, -2.90818190574646, -2.7741384506225586, -2.640094757080078, -2.506051540374756, -2.3720078468322754, -2.237964391708374, -2.1039209365844727, -1.9698774814605713, -1.83583402633667, -1.7017905712127686, -1.5677469968795776, -1.4337035417556763, -1.2996599674224854, -1.165616512298584, -1.0315730571746826, -0.8975295424461365, -0.7634860873222351, -0.6294426321983337, -0.4953991174697876, -0.36135566234588623, -0.22731220722198486, -0.0932687371969223, 0.04077473282814026, 0.174818217754364, 0.3088616728782654, 0.44290512800216675, 0.5769486427307129, 0.7109920978546143, 0.8450355529785156, 0.979079008102417, 1.1131224632263184, 1.2471659183502197, 1.381209373474121, 1.5152528285980225, 1.6492964029312134, 1.7833398580551147, 1.9173833131790161, 2.051426887512207, 2.1854703426361084, 2.3195137977600098, 2.453557252883911, 2.5876007080078125, 2.721644163131714, 2.8556876182556152, 2.9897310733795166]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 6.0, 4.0, 10.0, 8.0, 9.0, 18.0, 16.0, 18.0, 24.0, 24.0, 31.0, 31.0, 33.0, 43.0, 45.0, 48.0, 51.0, 44.0, 54.0, 60.0, 47.0, 49.0, 37.0, 35.0, 35.0, 31.0, 28.0, 28.0, 20.0, 24.0, 21.0, 14.0, 14.0, 9.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11759090423584, -3.0048656463623047, -2.8921406269073486, -2.7794156074523926, -2.6666903495788574, -2.5539650917053223, -2.441240072250366, -2.32851505279541, -2.215789794921875, -2.10306453704834, -1.9903395175933838, -1.8776143789291382, -1.7648892402648926, -1.652164101600647, -1.5394389629364014, -1.4267138242721558, -1.3139886856079102, -1.2012635469436646, -1.088538408279419, -0.9758132696151733, -0.8630881309509277, -0.7503629922866821, -0.6376378536224365, -0.5249127149581909, -0.4121875762939453, -0.2994624376296997, -0.1867372989654541, -0.0740121603012085, 0.03871297836303711, 0.15143811702728271, 0.2641632556915283, 0.3768883943557739, 0.48961353302001953, 0.6023386716842651, 0.7150638103485107, 0.8277889490127563, 0.940514087677002, 1.0532392263412476, 1.1659643650054932, 1.2786895036697388, 1.3914146423339844, 1.50413978099823, 1.6168649196624756, 1.7295900583267212, 1.8423151969909668, 1.9550403356552124, 2.067765474319458, 2.180490493774414, 2.293215751647949, 2.4059410095214844, 2.5186660289764404, 2.6313910484313965, 2.7441163063049316, 2.856841564178467, 2.969566583633423, 3.082291603088379, 3.195016860961914, 3.307742118835449, 3.4204671382904053, 3.5331921577453613, 3.6459174156188965, 3.7586426734924316, 3.8713676929473877, 3.9840927124023438, 4.096817970275879]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 8.0, 11.0, 21.0, 53.0, 233.0, 2143.0, 4190961.0, 684.0, 105.0, 34.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.29296875, -7.1246337890625, -6.956298828125, -6.7879638671875, -6.61962890625, -6.4512939453125, -6.282958984375, -6.1146240234375, -5.9462890625, -5.7779541015625, -5.609619140625, -5.4412841796875, -5.27294921875, -5.1046142578125, -4.936279296875, -4.7679443359375, -4.599609375, -4.4312744140625, -4.262939453125, -4.0946044921875, -3.92626953125, -3.7579345703125, -3.589599609375, -3.4212646484375, -3.2529296875, -3.0845947265625, -2.916259765625, -2.7479248046875, -2.57958984375, -2.4112548828125, -2.242919921875, -2.0745849609375, -1.90625, -1.7379150390625, -1.569580078125, -1.4012451171875, -1.23291015625, -1.0645751953125, -0.896240234375, -0.7279052734375, -0.5595703125, -0.3912353515625, -0.222900390625, -0.0545654296875, 0.11376953125, 0.2821044921875, 0.450439453125, 0.6187744140625, 0.787109375, 0.9554443359375, 1.123779296875, 1.2921142578125, 1.46044921875, 1.6287841796875, 1.797119140625, 1.9654541015625, 2.1337890625, 2.3021240234375, 2.470458984375, 2.6387939453125, 2.80712890625, 2.9754638671875, 3.143798828125, 3.3121337890625, 3.48046875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 17.0, 74.0, 179.0, 351.0, 248.0, 79.0, 26.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7177734375, -0.7013053894042969, -0.6848373413085938, -0.6683692932128906, -0.6519012451171875, -0.6354331970214844, -0.6189651489257812, -0.6024971008300781, -0.586029052734375, -0.5695610046386719, -0.5530929565429688, -0.5366249084472656, -0.5201568603515625, -0.5036888122558594, -0.48722076416015625, -0.4707527160644531, -0.45428466796875, -0.4378166198730469, -0.42134857177734375, -0.4048805236816406, -0.3884124755859375, -0.3719444274902344, -0.35547637939453125, -0.3390083312988281, -0.322540283203125, -0.3060722351074219, -0.28960418701171875, -0.2731361389160156, -0.2566680908203125, -0.24020004272460938, -0.22373199462890625, -0.20726394653320312, -0.1907958984375, -0.17432785034179688, -0.15785980224609375, -0.14139175415039062, -0.1249237060546875, -0.10845565795898438, -0.09198760986328125, -0.07551956176757812, -0.059051513671875, -0.042583465576171875, -0.02611541748046875, -0.009647369384765625, 0.0068206787109375, 0.023288726806640625, 0.03975677490234375, 0.056224822998046875, 0.07269287109375, 0.08916091918945312, 0.10562896728515625, 0.12209701538085938, 0.1385650634765625, 0.15503311157226562, 0.17150115966796875, 0.18796920776367188, 0.204437255859375, 0.22090530395507812, 0.23737335205078125, 0.2538414001464844, 0.2703094482421875, 0.2867774963378906, 0.30324554443359375, 0.3197135925292969, 0.336181640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 0.0, 8.0, 10.0, 27.0, 50.0, 81.0, 177.0, 428.0, 1198.0, 4495.0, 49177.0, 4115217.0, 19232.0, 2854.0, 772.0, 264.0, 131.0, 61.0, 34.0, 27.0, 13.0, 14.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9931640625, -0.965850830078125, -0.93853759765625, -0.911224365234375, -0.8839111328125, -0.856597900390625, -0.82928466796875, -0.801971435546875, -0.774658203125, -0.747344970703125, -0.72003173828125, -0.692718505859375, -0.6654052734375, -0.638092041015625, -0.61077880859375, -0.583465576171875, -0.55615234375, -0.528839111328125, -0.50152587890625, -0.474212646484375, -0.4468994140625, -0.419586181640625, -0.39227294921875, -0.364959716796875, -0.337646484375, -0.310333251953125, -0.28302001953125, -0.255706787109375, -0.2283935546875, -0.201080322265625, -0.17376708984375, -0.146453857421875, -0.119140625, -0.091827392578125, -0.06451416015625, -0.037200927734375, -0.0098876953125, 0.017425537109375, 0.04473876953125, 0.072052001953125, 0.099365234375, 0.126678466796875, 0.15399169921875, 0.181304931640625, 0.2086181640625, 0.235931396484375, 0.26324462890625, 0.290557861328125, 0.31787109375, 0.345184326171875, 0.37249755859375, 0.399810791015625, 0.4271240234375, 0.454437255859375, 0.48175048828125, 0.509063720703125, 0.536376953125, 0.563690185546875, 0.59100341796875, 0.618316650390625, 0.6456298828125, 0.672943115234375, 0.70025634765625, 0.727569580078125, 0.7548828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 11.0, 7.0, 10.0, 18.0, 45.0, 106.0, 1009.0, 2657.0, 115.0, 35.0, 23.0, 16.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1885986328125, -0.18136024475097656, -0.17412185668945312, -0.1668834686279297, -0.15964508056640625, -0.1524066925048828, -0.14516830444335938, -0.13792991638183594, -0.1306915283203125, -0.12345314025878906, -0.11621475219726562, -0.10897636413574219, -0.10173797607421875, -0.09449958801269531, -0.08726119995117188, -0.08002281188964844, -0.072784423828125, -0.06554603576660156, -0.058307647705078125, -0.05106925964355469, -0.04383087158203125, -0.03659248352050781, -0.029354095458984375, -0.022115707397460938, -0.0148773193359375, -0.0076389312744140625, -0.000400543212890625, 0.0068378448486328125, 0.01407623291015625, 0.021314620971679688, 0.028553009033203125, 0.03579139709472656, 0.04302978515625, 0.05026817321777344, 0.057506561279296875, 0.06474494934082031, 0.07198333740234375, 0.07922172546386719, 0.08646011352539062, 0.09369850158691406, 0.1009368896484375, 0.10817527770996094, 0.11541366577148438, 0.12265205383300781, 0.12989044189453125, 0.1371288299560547, 0.14436721801757812, 0.15160560607910156, 0.158843994140625, 0.16608238220214844, 0.17332077026367188, 0.1805591583251953, 0.18779754638671875, 0.1950359344482422, 0.20227432250976562, 0.20951271057128906, 0.2167510986328125, 0.22398948669433594, 0.23122787475585938, 0.2384662628173828, 0.24570465087890625, 0.2529430389404297, 0.2601814270019531, 0.26741981506347656, 0.274658203125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 165.0, 847.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3448017835617065, -1.1571334600448608, -0.9694650173187256, -0.7817966938018799, -0.5941283106803894, -0.4064599275588989, -0.21879160404205322, -0.03112316131591797, 0.15654516220092773, 0.3442135453224182, 0.5318819284439087, 0.7195502519607544, 0.9072186350822449, 1.0948870182037354, 1.282555341720581, 1.4702237844467163, 1.657892107963562, 1.8455604314804077, 2.033228874206543, 2.2208971977233887, 2.4085655212402344, 2.59623384475708, 2.783902168273926, 2.9715707302093506, 3.1592390537261963, 3.346907377243042, 3.5345757007598877, 3.7222442626953125, 3.909912586212158, 4.097580909729004, 4.28524923324585, 4.472917556762695, 4.660585880279541, 4.848254203796387, 5.035922527313232, 5.223590850830078, 5.411259174346924, 5.5989274978637695, 5.786596298217773, 5.974264621734619, 6.161932945251465, 6.3496012687683105, 6.537269592285156, 6.724937915802002, 6.912606239318848, 7.100275039672852, 7.287942886352539, 7.475611686706543, 7.6632795333862305, 7.850947856903076, 8.038616180419922, 8.226284980773926, 8.413952827453613, 8.601621627807617, 8.789289474487305, 8.976958274841309, 9.164627075195312, 9.352295875549316, 9.539963722229004, 9.727632522583008, 9.915300369262695, 10.1029691696167, 10.290637016296387, 10.47830581665039, 10.665973663330078]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 5.0, 7.0, 10.0, 16.0, 18.0, 23.0, 30.0, 37.0, 35.0, 50.0, 61.0, 43.0, 51.0, 74.0, 68.0, 65.0, 71.0, 54.0, 43.0, 50.0, 38.0, 31.0, 19.0, 15.0, 20.0, 21.0, 13.0, 6.0, 7.0, 7.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47241783142089844, -0.4569101929664612, -0.4414025545120239, -0.42589494585990906, -0.4103873074054718, -0.39487966895103455, -0.3793720602989197, -0.3638644218444824, -0.34835678339004517, -0.3328491449356079, -0.31734150648117065, -0.3018338978290558, -0.28632625937461853, -0.2708186209201813, -0.2553110122680664, -0.23980337381362915, -0.2242957353591919, -0.20878809690475464, -0.19328047335147858, -0.17777284979820251, -0.16226521134376526, -0.146757572889328, -0.13124994933605194, -0.11574231833219528, -0.10023468732833862, -0.08472705632448196, -0.0692194253206253, -0.053711794316768646, -0.03820416331291199, -0.02269653230905533, -0.007188901305198669, 0.00831872969865799, 0.02382636070251465, 0.03933399170637131, 0.054841622710227966, 0.07034925371408463, 0.08585688471794128, 0.10136451572179794, 0.1168721467256546, 0.13237977027893066, 0.14788740873336792, 0.16339504718780518, 0.17890267074108124, 0.1944102942943573, 0.20991793274879456, 0.2254255712032318, 0.24093319475650787, 0.25644081830978394, 0.2719484567642212, 0.28745609521865845, 0.3029637336730957, 0.31847134232521057, 0.3339789807796478, 0.3494866192340851, 0.36499422788619995, 0.3805018663406372, 0.39600950479507446, 0.4115171432495117, 0.427024781703949, 0.44253239035606384, 0.4580400288105011, 0.47354766726493835, 0.4890552759170532, 0.5045629143714905, 0.5200705528259277]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 8.0, 3.0, 3.0, 11.0, 9.0, 7.0, 10.0, 22.0, 27.0, 29.0, 32.0, 56.0, 88.0, 136.0, 183.0, 380.0, 615.0, 1332.0, 3474.0, 24567.0, 927429.0, 80722.0, 5634.0, 1781.0, 823.0, 406.0, 264.0, 165.0, 96.0, 56.0, 48.0, 34.0, 24.0, 14.0, 11.0, 13.0, 8.0, 6.0, 9.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3466796875, -1.3041534423828125, -1.261627197265625, -1.2191009521484375, -1.17657470703125, -1.1340484619140625, -1.091522216796875, -1.0489959716796875, -1.0064697265625, -0.9639434814453125, -0.921417236328125, -0.8788909912109375, -0.83636474609375, -0.7938385009765625, -0.751312255859375, -0.7087860107421875, -0.666259765625, -0.6237335205078125, -0.581207275390625, -0.5386810302734375, -0.49615478515625, -0.4536285400390625, -0.411102294921875, -0.3685760498046875, -0.3260498046875, -0.2835235595703125, -0.240997314453125, -0.1984710693359375, -0.15594482421875, -0.1134185791015625, -0.070892333984375, -0.0283660888671875, 0.01416015625, 0.0566864013671875, 0.099212646484375, 0.1417388916015625, 0.18426513671875, 0.2267913818359375, 0.269317626953125, 0.3118438720703125, 0.3543701171875, 0.3968963623046875, 0.439422607421875, 0.4819488525390625, 0.52447509765625, 0.5670013427734375, 0.609527587890625, 0.6520538330078125, 0.694580078125, 0.7371063232421875, 0.779632568359375, 0.8221588134765625, 0.86468505859375, 0.9072113037109375, 0.949737548828125, 0.9922637939453125, 1.0347900390625, 1.0773162841796875, 1.119842529296875, 1.1623687744140625, 1.20489501953125, 1.2474212646484375, 1.289947509765625, 1.3324737548828125, 1.375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 22.0, 79.0, 217.0, 346.0, 221.0, 69.0, 22.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70947265625, -0.693145751953125, -0.67681884765625, -0.660491943359375, -0.6441650390625, -0.627838134765625, -0.61151123046875, -0.595184326171875, -0.578857421875, -0.562530517578125, -0.54620361328125, -0.529876708984375, -0.5135498046875, -0.497222900390625, -0.48089599609375, -0.464569091796875, -0.4482421875, -0.431915283203125, -0.41558837890625, -0.399261474609375, -0.3829345703125, -0.366607666015625, -0.35028076171875, -0.333953857421875, -0.317626953125, -0.301300048828125, -0.28497314453125, -0.268646240234375, -0.2523193359375, -0.235992431640625, -0.21966552734375, -0.203338623046875, -0.18701171875, -0.170684814453125, -0.15435791015625, -0.138031005859375, -0.1217041015625, -0.105377197265625, -0.08905029296875, -0.072723388671875, -0.056396484375, -0.040069580078125, -0.02374267578125, -0.007415771484375, 0.0089111328125, 0.025238037109375, 0.04156494140625, 0.057891845703125, 0.07421875, 0.090545654296875, 0.10687255859375, 0.123199462890625, 0.1395263671875, 0.155853271484375, 0.17218017578125, 0.188507080078125, 0.204833984375, 0.221160888671875, 0.23748779296875, 0.253814697265625, 0.2701416015625, 0.286468505859375, 0.30279541015625, 0.319122314453125, 0.33544921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 5.0, 10.0, 9.0, 8.0, 8.0, 13.0, 20.0, 22.0, 20.0, 27.0, 46.0, 67.0, 117.0, 179.0, 347.0, 915.0, 3391.0, 19494.0, 259359.0, 716084.0, 40300.0, 5624.0, 1375.0, 443.0, 230.0, 132.0, 85.0, 53.0, 34.0, 24.0, 19.0, 12.0, 13.0, 11.0, 6.0, 8.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.00390625, -0.9706268310546875, -0.937347412109375, -0.9040679931640625, -0.87078857421875, -0.8375091552734375, -0.804229736328125, -0.7709503173828125, -0.7376708984375, -0.7043914794921875, -0.671112060546875, -0.6378326416015625, -0.60455322265625, -0.5712738037109375, -0.537994384765625, -0.5047149658203125, -0.471435546875, -0.4381561279296875, -0.404876708984375, -0.3715972900390625, -0.33831787109375, -0.3050384521484375, -0.271759033203125, -0.2384796142578125, -0.2052001953125, -0.1719207763671875, -0.138641357421875, -0.1053619384765625, -0.07208251953125, -0.0388031005859375, -0.005523681640625, 0.0277557373046875, 0.06103515625, 0.0943145751953125, 0.127593994140625, 0.1608734130859375, 0.19415283203125, 0.2274322509765625, 0.260711669921875, 0.2939910888671875, 0.3272705078125, 0.3605499267578125, 0.393829345703125, 0.4271087646484375, 0.46038818359375, 0.4936676025390625, 0.526947021484375, 0.5602264404296875, 0.593505859375, 0.6267852783203125, 0.660064697265625, 0.6933441162109375, 0.72662353515625, 0.7599029541015625, 0.793182373046875, 0.8264617919921875, 0.8597412109375, 0.8930206298828125, 0.926300048828125, 0.9595794677734375, 0.99285888671875, 1.0261383056640625, 1.059417724609375, 1.0926971435546875, 1.1259765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 6.0, 7.0, 9.0, 7.0, 10.0, 14.0, 12.0, 16.0, 19.0, 24.0, 33.0, 27.0, 37.0, 48.0, 51.0, 45.0, 49.0, 36.0, 42.0, 41.0, 49.0, 53.0, 47.0, 40.0, 44.0, 35.0, 23.0, 29.0, 19.0, 17.0, 17.0, 22.0, 6.0, 8.0, 9.0, 13.0, 5.0, 2.0, 11.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.63134765625, -0.6125640869140625, -0.593780517578125, -0.5749969482421875, -0.55621337890625, -0.5374298095703125, -0.518646240234375, -0.4998626708984375, -0.4810791015625, -0.4622955322265625, -0.443511962890625, -0.4247283935546875, -0.40594482421875, -0.3871612548828125, -0.368377685546875, -0.3495941162109375, -0.330810546875, -0.3120269775390625, -0.293243408203125, -0.2744598388671875, -0.25567626953125, -0.2368927001953125, -0.218109130859375, -0.1993255615234375, -0.1805419921875, -0.1617584228515625, -0.142974853515625, -0.1241912841796875, -0.10540771484375, -0.0866241455078125, -0.067840576171875, -0.0490570068359375, -0.0302734375, -0.0114898681640625, 0.007293701171875, 0.0260772705078125, 0.04486083984375, 0.0636444091796875, 0.082427978515625, 0.1012115478515625, 0.1199951171875, 0.1387786865234375, 0.157562255859375, 0.1763458251953125, 0.19512939453125, 0.2139129638671875, 0.232696533203125, 0.2514801025390625, 0.270263671875, 0.2890472412109375, 0.307830810546875, 0.3266143798828125, 0.34539794921875, 0.3641815185546875, 0.382965087890625, 0.4017486572265625, 0.4205322265625, 0.4393157958984375, 0.458099365234375, 0.4768829345703125, 0.49566650390625, 0.5144500732421875, 0.533233642578125, 0.5520172119140625, 0.57080078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 7.0, 12.0, 20.0, 41.0, 63.0, 111.0, 208.0, 443.0, 1179.0, 4575.0, 32712.0, 738718.0, 251722.0, 14512.0, 2664.0, 848.0, 335.0, 162.0, 74.0, 39.0, 31.0, 22.0, 16.0, 12.0, 12.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1451416015625, -0.1399250030517578, -0.13470840454101562, -0.12949180603027344, -0.12427520751953125, -0.11905860900878906, -0.11384201049804688, -0.10862541198730469, -0.1034088134765625, -0.09819221496582031, -0.09297561645507812, -0.08775901794433594, -0.08254241943359375, -0.07732582092285156, -0.07210922241210938, -0.06689262390136719, -0.061676025390625, -0.05645942687988281, -0.051242828369140625, -0.04602622985839844, -0.04080963134765625, -0.03559303283691406, -0.030376434326171875, -0.025159835815429688, -0.0199432373046875, -0.014726638793945312, -0.009510040283203125, -0.0042934417724609375, 0.00092315673828125, 0.0061397552490234375, 0.011356353759765625, 0.016572952270507812, 0.02178955078125, 0.027006149291992188, 0.032222747802734375, 0.03743934631347656, 0.04265594482421875, 0.04787254333496094, 0.053089141845703125, 0.05830574035644531, 0.0635223388671875, 0.06873893737792969, 0.07395553588867188, 0.07917213439941406, 0.08438873291015625, 0.08960533142089844, 0.09482192993164062, 0.10003852844238281, 0.105255126953125, 0.11047172546386719, 0.11568832397460938, 0.12090492248535156, 0.12612152099609375, 0.13133811950683594, 0.13655471801757812, 0.1417713165283203, 0.1469879150390625, 0.1522045135498047, 0.15742111206054688, 0.16263771057128906, 0.16785430908203125, 0.17307090759277344, 0.17828750610351562, 0.1835041046142578, 0.188720703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 7.0, 8.0, 10.0, 11.0, 13.0, 12.0, 24.0, 28.0, 31.0, 40.0, 47.0, 38.0, 76.0, 92.0, 79.0, 59.0, 76.0, 69.0, 64.0, 44.0, 42.0, 22.0, 13.0, 21.0, 19.0, 16.0, 8.0, 6.0, 6.0, 1.0, 7.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.417533874511719e-06, -9.120441973209381e-06, -8.823350071907043e-06, -8.526258170604706e-06, -8.229166269302368e-06, -7.93207436800003e-06, -7.634982466697693e-06, -7.337890565395355e-06, -7.040798664093018e-06, -6.74370676279068e-06, -6.446614861488342e-06, -6.149522960186005e-06, -5.852431058883667e-06, -5.555339157581329e-06, -5.258247256278992e-06, -4.961155354976654e-06, -4.664063453674316e-06, -4.366971552371979e-06, -4.069879651069641e-06, -3.7727877497673035e-06, -3.475695848464966e-06, -3.178603947162628e-06, -2.8815120458602905e-06, -2.584420144557953e-06, -2.2873282432556152e-06, -1.9902363419532776e-06, -1.69314444065094e-06, -1.3960525393486023e-06, -1.0989606380462646e-06, -8.01868736743927e-07, -5.047768354415894e-07, -2.076849341392517e-07, 8.940696716308594e-08, 3.864988684654236e-07, 6.835907697677612e-07, 9.806826710700989e-07, 1.2777745723724365e-06, 1.5748664736747742e-06, 1.8719583749771118e-06, 2.1690502762794495e-06, 2.466142177581787e-06, 2.7632340788841248e-06, 3.0603259801864624e-06, 3.3574178814888e-06, 3.6545097827911377e-06, 3.951601684093475e-06, 4.248693585395813e-06, 4.545785486698151e-06, 4.842877388000488e-06, 5.139969289302826e-06, 5.4370611906051636e-06, 5.734153091907501e-06, 6.031244993209839e-06, 6.3283368945121765e-06, 6.625428795814514e-06, 6.922520697116852e-06, 7.2196125984191895e-06, 7.516704499721527e-06, 7.813796401023865e-06, 8.110888302326202e-06, 8.40798020362854e-06, 8.705072104930878e-06, 9.002164006233215e-06, 9.299255907535553e-06, 9.59634780883789e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 7.0, 10.0, 9.0, 13.0, 19.0, 24.0, 45.0, 52.0, 105.0, 212.0, 568.0, 1994.0, 12251.0, 391001.0, 623049.0, 15754.0, 2279.0, 629.0, 231.0, 98.0, 62.0, 42.0, 22.0, 24.0, 14.0, 17.0, 9.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2203369140625, -0.21300506591796875, -0.2056732177734375, -0.19834136962890625, -0.191009521484375, -0.18367767333984375, -0.1763458251953125, -0.16901397705078125, -0.16168212890625, -0.15435028076171875, -0.1470184326171875, -0.13968658447265625, -0.132354736328125, -0.12502288818359375, -0.1176910400390625, -0.11035919189453125, -0.10302734375, -0.09569549560546875, -0.0883636474609375, -0.08103179931640625, -0.073699951171875, -0.06636810302734375, -0.0590362548828125, -0.05170440673828125, -0.04437255859375, -0.03704071044921875, -0.0297088623046875, -0.02237701416015625, -0.015045166015625, -0.00771331787109375, -0.0003814697265625, 0.00695037841796875, 0.0142822265625, 0.02161407470703125, 0.0289459228515625, 0.03627777099609375, 0.043609619140625, 0.05094146728515625, 0.0582733154296875, 0.06560516357421875, 0.07293701171875, 0.08026885986328125, 0.0876007080078125, 0.09493255615234375, 0.102264404296875, 0.10959625244140625, 0.1169281005859375, 0.12425994873046875, 0.131591796875, 0.13892364501953125, 0.1462554931640625, 0.15358734130859375, 0.160919189453125, 0.16825103759765625, 0.1755828857421875, 0.18291473388671875, 0.19024658203125, 0.19757843017578125, 0.2049102783203125, 0.21224212646484375, 0.219573974609375, 0.22690582275390625, 0.2342376708984375, 0.24156951904296875, 0.2489013671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 5.0, 14.0, 16.0, 12.0, 24.0, 24.0, 31.0, 41.0, 56.0, 65.0, 85.0, 89.0, 109.0, 94.0, 67.0, 59.0, 41.0, 38.0, 29.0, 18.0, 19.0, 16.0, 9.0, 7.0, 4.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134033203125, -0.1301097869873047, -0.12618637084960938, -0.12226295471191406, -0.11833953857421875, -0.11441612243652344, -0.11049270629882812, -0.10656929016113281, -0.1026458740234375, -0.09872245788574219, -0.09479904174804688, -0.09087562561035156, -0.08695220947265625, -0.08302879333496094, -0.07910537719726562, -0.07518196105957031, -0.071258544921875, -0.06733512878417969, -0.06341171264648438, -0.05948829650878906, -0.05556488037109375, -0.05164146423339844, -0.047718048095703125, -0.04379463195800781, -0.0398712158203125, -0.03594779968261719, -0.032024383544921875, -0.028100967407226562, -0.02417755126953125, -0.020254135131835938, -0.016330718994140625, -0.012407302856445312, -0.00848388671875, -0.0045604705810546875, -0.000637054443359375, 0.0032863616943359375, 0.00720977783203125, 0.011133193969726562, 0.015056610107421875, 0.018980026245117188, 0.0229034423828125, 0.026826858520507812, 0.030750274658203125, 0.03467369079589844, 0.03859710693359375, 0.04252052307128906, 0.046443939208984375, 0.05036735534667969, 0.054290771484375, 0.05821418762207031, 0.062137603759765625, 0.06606101989746094, 0.06998443603515625, 0.07390785217285156, 0.07783126831054688, 0.08175468444824219, 0.0856781005859375, 0.08960151672363281, 0.09352493286132812, 0.09744834899902344, 0.10137176513671875, 0.10529518127441406, 0.10921859741210938, 0.11314201354980469, 0.1170654296875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 3.0, 14.0, 13.0, 24.0, 38.0, 79.0, 178.0, 280.0, 182.0, 75.0, 38.0, 34.0, 19.0, 8.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.151472091674805, -5.03578519821167, -4.920098304748535, -4.8044114112854, -4.688724517822266, -4.573037624359131, -4.457350730895996, -4.341663837432861, -4.225976943969727, -4.110290050506592, -3.994603157043457, -3.8789162635803223, -3.7632293701171875, -3.6475424766540527, -3.531855583190918, -3.416168689727783, -3.3004820346832275, -3.1847951412200928, -3.069108247756958, -2.9534213542938232, -2.8377344608306885, -2.7220475673675537, -2.606360912322998, -2.4906740188598633, -2.3749871253967285, -2.2593002319335938, -2.143613338470459, -2.027926445007324, -1.9122395515441895, -1.7965526580810547, -1.6808658838272095, -1.5651789903640747, -1.4494922161102295, -1.3338053226470947, -1.21811842918396, -1.1024315357208252, -0.9867447018623352, -0.8710578083992004, -0.7553709745407104, -0.6396840810775757, -0.5239971876144409, -0.40831029415130615, -0.2926234304904938, -0.1769365668296814, -0.06124967336654663, 0.054437220096588135, 0.17012405395507812, 0.2858109474182129, 0.40149784088134766, 0.5171847343444824, 0.6328716278076172, 0.7485584616661072, 0.8642453551292419, 0.9799322485923767, 1.0956190824508667, 1.2113059759140015, 1.3269928693771362, 1.442679762840271, 1.5583666563034058, 1.674053430557251, 1.7897403240203857, 1.9054272174835205, 2.0211141109466553, 2.13680100440979, 2.252487897872925]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 1.0, 5.0, 6.0, 8.0, 10.0, 8.0, 17.0, 21.0, 13.0, 24.0, 40.0, 37.0, 30.0, 44.0, 48.0, 56.0, 49.0, 55.0, 47.0, 43.0, 50.0, 57.0, 60.0, 50.0, 32.0, 25.0, 32.0, 33.0, 19.0, 17.0, 14.0, 15.0, 3.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.053379058837891, -3.934798002243042, -3.8162171840667725, -3.697636127471924, -3.5790553092956543, -3.4604742527008057, -3.341893196105957, -3.2233123779296875, -3.104731321334839, -2.9861502647399902, -2.8675694465637207, -2.748988389968872, -2.6304073333740234, -2.511826515197754, -2.3932454586029053, -2.2746644020080566, -2.156083583831787, -2.0375025272369385, -1.918921709060669, -1.8003406524658203, -1.6817597150802612, -1.5631787776947021, -1.4445977210998535, -1.3260167837142944, -1.2074358463287354, -1.0888549089431763, -0.9702739119529724, -0.8516929149627686, -0.7331119775772095, -0.6145310401916504, -0.49595004320144653, -0.3773690462112427, -0.2587881088256836, -0.14020714163780212, -0.021626174449920654, 0.09695479273796082, 0.21553575992584229, 0.33411669731140137, 0.4526976943016052, 0.5712786912918091, 0.6898596286773682, 0.8084405660629272, 0.9270215630531311, 1.045602560043335, 1.164183497428894, 1.2827644348144531, 1.4013454914093018, 1.5199264287948608, 1.63850736618042, 1.757088303565979, 1.875669240951538, 1.9942502975463867, 2.1128311157226562, 2.231412172317505, 2.3499932289123535, 2.468574047088623, 2.5871551036834717, 2.7057361602783203, 2.82431697845459, 2.9428980350494385, 3.061479091644287, 3.1800599098205566, 3.2986409664154053, 3.417222023010254, 3.5358028411865234]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 6.0, 12.0, 17.0, 18.0, 20.0, 42.0, 84.0, 145.0, 288.0, 1039.0, 8329.0, 4170192.0, 12353.0, 1152.0, 320.0, 112.0, 55.0, 40.0, 18.0, 13.0, 5.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01171875, -2.94256591796875, -2.8734130859375, -2.80426025390625, -2.735107421875, -2.66595458984375, -2.5968017578125, -2.52764892578125, -2.45849609375, -2.38934326171875, -2.3201904296875, -2.25103759765625, -2.181884765625, -2.11273193359375, -2.0435791015625, -1.97442626953125, -1.9052734375, -1.83612060546875, -1.7669677734375, -1.69781494140625, -1.628662109375, -1.55950927734375, -1.4903564453125, -1.42120361328125, -1.35205078125, -1.28289794921875, -1.2137451171875, -1.14459228515625, -1.075439453125, -1.00628662109375, -0.9371337890625, -0.86798095703125, -0.798828125, -0.72967529296875, -0.6605224609375, -0.59136962890625, -0.522216796875, -0.45306396484375, -0.3839111328125, -0.31475830078125, -0.24560546875, -0.17645263671875, -0.1072998046875, -0.03814697265625, 0.031005859375, 0.10015869140625, 0.1693115234375, 0.23846435546875, 0.3076171875, 0.37677001953125, 0.4459228515625, 0.51507568359375, 0.584228515625, 0.65338134765625, 0.7225341796875, 0.79168701171875, 0.86083984375, 0.92999267578125, 0.9991455078125, 1.06829833984375, 1.137451171875, 1.20660400390625, 1.2757568359375, 1.34490966796875, 1.4140625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 9.0, 21.0, 75.0, 193.0, 306.0, 261.0, 79.0, 35.0, 8.0, 5.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7294921875, -0.7127761840820312, -0.6960601806640625, -0.6793441772460938, -0.662628173828125, -0.6459121704101562, -0.6291961669921875, -0.6124801635742188, -0.59576416015625, -0.5790481567382812, -0.5623321533203125, -0.5456161499023438, -0.528900146484375, -0.5121841430664062, -0.4954681396484375, -0.47875213623046875, -0.4620361328125, -0.44532012939453125, -0.4286041259765625, -0.41188812255859375, -0.395172119140625, -0.37845611572265625, -0.3617401123046875, -0.34502410888671875, -0.32830810546875, -0.31159210205078125, -0.2948760986328125, -0.27816009521484375, -0.261444091796875, -0.24472808837890625, -0.2280120849609375, -0.21129608154296875, -0.194580078125, -0.17786407470703125, -0.1611480712890625, -0.14443206787109375, -0.127716064453125, -0.11100006103515625, -0.0942840576171875, -0.07756805419921875, -0.06085205078125, -0.04413604736328125, -0.0274200439453125, -0.01070404052734375, 0.006011962890625, 0.02272796630859375, 0.0394439697265625, 0.05615997314453125, 0.0728759765625, 0.08959197998046875, 0.1063079833984375, 0.12302398681640625, 0.139739990234375, 0.15645599365234375, 0.1731719970703125, 0.18988800048828125, 0.20660400390625, 0.22332000732421875, 0.2400360107421875, 0.25675201416015625, 0.273468017578125, 0.29018402099609375, 0.3069000244140625, 0.32361602783203125, 0.34033203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 9.0, 2.0, 5.0, 7.0, 23.0, 45.0, 89.0, 302.0, 1170.0, 6840.0, 4122682.0, 59438.0, 2796.0, 513.0, 167.0, 93.0, 43.0, 22.0, 22.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.570159912109375, -2.50555419921875, -2.440948486328125, -2.3763427734375, -2.311737060546875, -2.24713134765625, -2.182525634765625, -2.117919921875, -2.053314208984375, -1.98870849609375, -1.924102783203125, -1.8594970703125, -1.794891357421875, -1.73028564453125, -1.665679931640625, -1.60107421875, -1.536468505859375, -1.47186279296875, -1.407257080078125, -1.3426513671875, -1.278045654296875, -1.21343994140625, -1.148834228515625, -1.084228515625, -1.019622802734375, -0.95501708984375, -0.890411376953125, -0.8258056640625, -0.761199951171875, -0.69659423828125, -0.631988525390625, -0.5673828125, -0.502777099609375, -0.43817138671875, -0.373565673828125, -0.3089599609375, -0.244354248046875, -0.17974853515625, -0.115142822265625, -0.050537109375, 0.014068603515625, 0.07867431640625, 0.143280029296875, 0.2078857421875, 0.272491455078125, 0.33709716796875, 0.401702880859375, 0.46630859375, 0.530914306640625, 0.59552001953125, 0.660125732421875, 0.7247314453125, 0.789337158203125, 0.85394287109375, 0.918548583984375, 0.983154296875, 1.047760009765625, 1.11236572265625, 1.176971435546875, 1.2415771484375, 1.306182861328125, 1.37078857421875, 1.435394287109375, 1.5]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 10.0, 17.0, 29.0, 91.0, 271.0, 3305.0, 228.0, 53.0, 29.0, 11.0, 9.0, 7.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.466552734375, -0.4466972351074219, -0.42684173583984375, -0.4069862365722656, -0.3871307373046875, -0.3672752380371094, -0.34741973876953125, -0.3275642395019531, -0.307708740234375, -0.2878532409667969, -0.26799774169921875, -0.24814224243164062, -0.2282867431640625, -0.20843124389648438, -0.18857574462890625, -0.16872024536132812, -0.14886474609375, -0.12900924682617188, -0.10915374755859375, -0.08929824829101562, -0.0694427490234375, -0.049587249755859375, -0.02973175048828125, -0.009876251220703125, 0.009979248046875, 0.029834747314453125, 0.04969024658203125, 0.06954574584960938, 0.0894012451171875, 0.10925674438476562, 0.12911224365234375, 0.14896774291992188, 0.1688232421875, 0.18867874145507812, 0.20853424072265625, 0.22838973999023438, 0.2482452392578125, 0.2681007385253906, 0.28795623779296875, 0.3078117370605469, 0.327667236328125, 0.3475227355957031, 0.36737823486328125, 0.3872337341308594, 0.4070892333984375, 0.4269447326660156, 0.44680023193359375, 0.4666557312011719, 0.48651123046875, 0.5063667297363281, 0.5262222290039062, 0.5460777282714844, 0.5659332275390625, 0.5857887268066406, 0.6056442260742188, 0.6254997253417969, 0.645355224609375, 0.6652107238769531, 0.6850662231445312, 0.7049217224121094, 0.7247772216796875, 0.7446327209472656, 0.7644882202148438, 0.7843437194824219, 0.80419921875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 6.0, 10.0, 50.0, 431.0, 431.0, 50.0, 18.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.220455169677734, -4.1127448081970215, -4.005034446716309, -3.8973240852355957, -3.789613723754883, -3.68190336227417, -3.574192762374878, -3.466482400894165, -3.358772039413452, -3.2510616779327393, -3.1433513164520264, -3.0356409549713135, -2.9279303550720215, -2.8202199935913086, -2.7125096321105957, -2.604799270629883, -2.49708890914917, -2.389378547668457, -2.281668186187744, -2.1739578247070312, -2.0662474632263184, -1.958536982536316, -1.8508265018463135, -1.7431161403656006, -1.6354057788848877, -1.5276954174041748, -1.419985055923462, -1.3122745752334595, -1.2045642137527466, -1.0968538522720337, -0.989143431186676, -0.8814330101013184, -0.7737228870391846, -0.6660125255584717, -0.558302104473114, -0.45059171319007874, -0.34288132190704346, -0.23517096042633057, -0.1274605393409729, -0.019750118255615234, 0.08796024322509766, 0.19567063450813293, 0.3033810257911682, 0.4110914170742035, 0.5188018083572388, 0.6265121698379517, 0.7342225909233093, 0.841933012008667, 0.9496433734893799, 1.0573537349700928, 1.1650640964508057, 1.272774577140808, 1.380484938621521, 1.4881953001022339, 1.5959057807922363, 1.7036161422729492, 1.811326503753662, 1.919036865234375, 2.026747226715088, 2.134457588195801, 2.2421679496765137, 2.3498783111572266, 2.4575889110565186, 2.5652992725372314, 2.6730096340179443]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 26.0, 33.0, 64.0, 95.0, 107.0, 133.0, 119.0, 110.0, 116.0, 75.0, 57.0, 27.0, 19.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8339438438415527, -2.7609875202178955, -2.6880311965942383, -2.615074634552002, -2.5421183109283447, -2.4691619873046875, -2.3962056636810303, -2.323249340057373, -2.2502927780151367, -2.1773364543914795, -2.1043801307678223, -2.031423568725586, -1.9584672451019287, -1.8855109214782715, -1.8125545978546143, -1.7395981550216675, -1.6666418313980103, -1.593685507774353, -1.5207290649414062, -1.447772741317749, -1.3748162984848022, -1.301859974861145, -1.2289035320281982, -1.155947208404541, -1.0829908847808838, -1.0100345611572266, -0.9370781183242798, -0.8641217947006226, -0.7911653518676758, -0.7182090282440186, -0.6452526450157166, -0.5722962617874146, -0.4993398189544678, -0.42638343572616577, -0.35342705249786377, -0.28047069907188416, -0.20751431584358215, -0.13455793261528015, -0.06160157918930054, 0.011354804039001465, 0.08431118726730347, 0.15726757049560547, 0.23022393882274628, 0.3031803071498871, 0.3761366903781891, 0.4490930736064911, 0.5220494270324707, 0.5950058102607727, 0.6679621934890747, 0.7409185767173767, 0.8138749599456787, 0.8868312835693359, 0.9597877264022827, 1.03274405002594, 1.1057004928588867, 1.178656816482544, 1.2516131401062012, 1.3245694637298584, 1.3975259065628052, 1.4704822301864624, 1.5434386730194092, 1.6163949966430664, 1.6893513202667236, 1.7623077630996704, 1.8352642059326172]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 8.0, 7.0, 18.0, 10.0, 14.0, 29.0, 24.0, 46.0, 53.0, 107.0, 169.0, 284.0, 542.0, 1012.0, 2544.0, 12164.0, 764936.0, 254048.0, 8391.0, 2125.0, 874.0, 437.0, 264.0, 142.0, 93.0, 52.0, 41.0, 27.0, 24.0, 13.0, 11.0, 7.0, 9.0, 5.0, 2.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.107421875, -2.0452728271484375, -1.983123779296875, -1.9209747314453125, -1.85882568359375, -1.7966766357421875, -1.734527587890625, -1.6723785400390625, -1.6102294921875, -1.5480804443359375, -1.485931396484375, -1.4237823486328125, -1.36163330078125, -1.2994842529296875, -1.237335205078125, -1.1751861572265625, -1.113037109375, -1.0508880615234375, -0.988739013671875, -0.9265899658203125, -0.86444091796875, -0.8022918701171875, -0.740142822265625, -0.6779937744140625, -0.6158447265625, -0.5536956787109375, -0.491546630859375, -0.4293975830078125, -0.36724853515625, -0.3050994873046875, -0.242950439453125, -0.1808013916015625, -0.11865234375, -0.0565032958984375, 0.005645751953125, 0.0677947998046875, 0.12994384765625, 0.1920928955078125, 0.254241943359375, 0.3163909912109375, 0.3785400390625, 0.4406890869140625, 0.502838134765625, 0.5649871826171875, 0.62713623046875, 0.6892852783203125, 0.751434326171875, 0.8135833740234375, 0.875732421875, 0.9378814697265625, 1.000030517578125, 1.0621795654296875, 1.12432861328125, 1.1864776611328125, 1.248626708984375, 1.3107757568359375, 1.3729248046875, 1.4350738525390625, 1.497222900390625, 1.5593719482421875, 1.62152099609375, 1.6836700439453125, 1.745819091796875, 1.8079681396484375, 1.8701171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 45.0, 115.0, 242.0, 314.0, 175.0, 56.0, 21.0, 9.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6863784790039062, -0.6701202392578125, -0.6538619995117188, -0.637603759765625, -0.6213455200195312, -0.6050872802734375, -0.5888290405273438, -0.57257080078125, -0.5563125610351562, -0.5400543212890625, -0.5237960815429688, -0.507537841796875, -0.49127960205078125, -0.4750213623046875, -0.45876312255859375, -0.4425048828125, -0.42624664306640625, -0.4099884033203125, -0.39373016357421875, -0.377471923828125, -0.36121368408203125, -0.3449554443359375, -0.32869720458984375, -0.31243896484375, -0.29618072509765625, -0.2799224853515625, -0.26366424560546875, -0.247406005859375, -0.23114776611328125, -0.2148895263671875, -0.19863128662109375, -0.182373046875, -0.16611480712890625, -0.1498565673828125, -0.13359832763671875, -0.117340087890625, -0.10108184814453125, -0.0848236083984375, -0.06856536865234375, -0.05230712890625, -0.03604888916015625, -0.0197906494140625, -0.00353240966796875, 0.012725830078125, 0.02898406982421875, 0.0452423095703125, 0.06150054931640625, 0.0777587890625, 0.09401702880859375, 0.1102752685546875, 0.12653350830078125, 0.142791748046875, 0.15904998779296875, 0.1753082275390625, 0.19156646728515625, 0.20782470703125, 0.22408294677734375, 0.2403411865234375, 0.25659942626953125, 0.272857666015625, 0.28911590576171875, 0.3053741455078125, 0.32163238525390625, 0.337890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 12.0, 5.0, 11.0, 5.0, 16.0, 14.0, 15.0, 19.0, 23.0, 23.0, 43.0, 73.0, 120.0, 277.0, 863.0, 3136.0, 18032.0, 167766.0, 775208.0, 70466.0, 9394.0, 1907.0, 539.0, 201.0, 103.0, 56.0, 39.0, 19.0, 30.0, 21.0, 19.0, 17.0, 23.0, 9.0, 12.0, 7.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.1904296875, -1.1567306518554688, -1.1230316162109375, -1.0893325805664062, -1.055633544921875, -1.0219345092773438, -0.9882354736328125, -0.9545364379882812, -0.92083740234375, -0.8871383666992188, -0.8534393310546875, -0.8197402954101562, -0.786041259765625, -0.7523422241210938, -0.7186431884765625, -0.6849441528320312, -0.6512451171875, -0.6175460815429688, -0.5838470458984375, -0.5501480102539062, -0.516448974609375, -0.48274993896484375, -0.4490509033203125, -0.41535186767578125, -0.38165283203125, -0.34795379638671875, -0.3142547607421875, -0.28055572509765625, -0.246856689453125, -0.21315765380859375, -0.1794586181640625, -0.14575958251953125, -0.112060546875, -0.07836151123046875, -0.0446624755859375, -0.01096343994140625, 0.022735595703125, 0.05643463134765625, 0.0901336669921875, 0.12383270263671875, 0.15753173828125, 0.19123077392578125, 0.2249298095703125, 0.25862884521484375, 0.292327880859375, 0.32602691650390625, 0.3597259521484375, 0.39342498779296875, 0.4271240234375, 0.46082305908203125, 0.4945220947265625, 0.5282211303710938, 0.561920166015625, 0.5956192016601562, 0.6293182373046875, 0.6630172729492188, 0.69671630859375, 0.7304153442382812, 0.7641143798828125, 0.7978134155273438, 0.831512451171875, 0.8652114868164062, 0.8989105224609375, 0.9326095581054688, 0.96630859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 8.0, 10.0, 13.0, 20.0, 15.0, 21.0, 28.0, 26.0, 15.0, 31.0, 37.0, 41.0, 35.0, 44.0, 37.0, 38.0, 45.0, 40.0, 56.0, 53.0, 44.0, 47.0, 37.0, 36.0, 37.0, 26.0, 22.0, 15.0, 22.0, 11.0, 17.0, 13.0, 7.0, 10.0, 7.0, 6.0, 6.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54296875, -0.5238113403320312, -0.5046539306640625, -0.48549652099609375, -0.466339111328125, -0.44718170166015625, -0.4280242919921875, -0.40886688232421875, -0.38970947265625, -0.37055206298828125, -0.3513946533203125, -0.33223724365234375, -0.313079833984375, -0.29392242431640625, -0.2747650146484375, -0.25560760498046875, -0.2364501953125, -0.21729278564453125, -0.1981353759765625, -0.17897796630859375, -0.159820556640625, -0.14066314697265625, -0.1215057373046875, -0.10234832763671875, -0.08319091796875, -0.06403350830078125, -0.0448760986328125, -0.02571868896484375, -0.006561279296875, 0.01259613037109375, 0.0317535400390625, 0.05091094970703125, 0.070068359375, 0.08922576904296875, 0.1083831787109375, 0.12754058837890625, 0.146697998046875, 0.16585540771484375, 0.1850128173828125, 0.20417022705078125, 0.22332763671875, 0.24248504638671875, 0.2616424560546875, 0.28079986572265625, 0.299957275390625, 0.31911468505859375, 0.3382720947265625, 0.35742950439453125, 0.3765869140625, 0.39574432373046875, 0.4149017333984375, 0.43405914306640625, 0.453216552734375, 0.47237396240234375, 0.4915313720703125, 0.5106887817382812, 0.52984619140625, 0.5490036010742188, 0.5681610107421875, 0.5873184204101562, 0.606475830078125, 0.6256332397460938, 0.6447906494140625, 0.6639480590820312, 0.68310546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 8.0, 15.0, 19.0, 23.0, 53.0, 70.0, 122.0, 285.0, 551.0, 1077.0, 2355.0, 6812.0, 30985.0, 669660.0, 307677.0, 19897.0, 5109.0, 1984.0, 870.0, 386.0, 225.0, 104.0, 76.0, 50.0, 36.0, 23.0, 26.0, 8.0, 7.0, 5.0, 6.0, 2.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.250244140625, -0.24158096313476562, -0.23291778564453125, -0.22425460815429688, -0.2155914306640625, -0.20692825317382812, -0.19826507568359375, -0.18960189819335938, -0.180938720703125, -0.17227554321289062, -0.16361236572265625, -0.15494918823242188, -0.1462860107421875, -0.13762283325195312, -0.12895965576171875, -0.12029647827148438, -0.11163330078125, -0.10297012329101562, -0.09430694580078125, -0.08564376831054688, -0.0769805908203125, -0.06831741333007812, -0.05965423583984375, -0.050991058349609375, -0.042327880859375, -0.033664703369140625, -0.02500152587890625, -0.016338348388671875, -0.0076751708984375, 0.000988006591796875, 0.00965118408203125, 0.018314361572265625, 0.0269775390625, 0.035640716552734375, 0.04430389404296875, 0.052967071533203125, 0.0616302490234375, 0.07029342651367188, 0.07895660400390625, 0.08761978149414062, 0.096282958984375, 0.10494613647460938, 0.11360931396484375, 0.12227249145507812, 0.1309356689453125, 0.13959884643554688, 0.14826202392578125, 0.15692520141601562, 0.16558837890625, 0.17425155639648438, 0.18291473388671875, 0.19157791137695312, 0.2002410888671875, 0.20890426635742188, 0.21756744384765625, 0.22623062133789062, 0.234893798828125, 0.24355697631835938, 0.25222015380859375, 0.2608833312988281, 0.2695465087890625, 0.2782096862792969, 0.28687286376953125, 0.2955360412597656, 0.30419921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 11.0, 13.0, 48.0, 72.0, 134.0, 258.0, 220.0, 132.0, 49.0, 30.0, 11.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.910064697265625e-05, -3.7913210690021515e-05, -3.672577440738678e-05, -3.5538338124752045e-05, -3.435090184211731e-05, -3.3163465559482574e-05, -3.197602927684784e-05, -3.0788592994213104e-05, -2.960115671157837e-05, -2.8413720428943634e-05, -2.72262841463089e-05, -2.6038847863674164e-05, -2.485141158103943e-05, -2.3663975298404694e-05, -2.247653901576996e-05, -2.1289102733135223e-05, -2.0101666450500488e-05, -1.8914230167865753e-05, -1.7726793885231018e-05, -1.6539357602596283e-05, -1.5351921319961548e-05, -1.4164485037326813e-05, -1.2977048754692078e-05, -1.1789612472057343e-05, -1.0602176189422607e-05, -9.414739906787872e-06, -8.227303624153137e-06, -7.039867341518402e-06, -5.852431058883667e-06, -4.664994776248932e-06, -3.4775584936141968e-06, -2.2901222109794617e-06, -1.1026859283447266e-06, 8.475035429000854e-08, 1.2721866369247437e-06, 2.4596229195594788e-06, 3.647059202194214e-06, 4.834495484828949e-06, 6.021931767463684e-06, 7.209368050098419e-06, 8.396804332733154e-06, 9.58424061536789e-06, 1.0771676898002625e-05, 1.195911318063736e-05, 1.3146549463272095e-05, 1.433398574590683e-05, 1.5521422028541565e-05, 1.67088583111763e-05, 1.7896294593811035e-05, 1.908373087644577e-05, 2.0271167159080505e-05, 2.145860344171524e-05, 2.2646039724349976e-05, 2.383347600698471e-05, 2.5020912289619446e-05, 2.620834857225418e-05, 2.7395784854888916e-05, 2.858322113752365e-05, 2.9770657420158386e-05, 3.095809370279312e-05, 3.2145529985427856e-05, 3.333296626806259e-05, 3.452040255069733e-05, 3.570783883333206e-05, 3.68952751159668e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 7.0, 7.0, 16.0, 28.0, 53.0, 130.0, 386.0, 1778.0, 26249.0, 999757.0, 18079.0, 1482.0, 367.0, 110.0, 48.0, 21.0, 9.0, 9.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7021484375, -0.680511474609375, -0.65887451171875, -0.637237548828125, -0.6156005859375, -0.593963623046875, -0.57232666015625, -0.550689697265625, -0.529052734375, -0.507415771484375, -0.48577880859375, -0.464141845703125, -0.4425048828125, -0.420867919921875, -0.39923095703125, -0.377593994140625, -0.35595703125, -0.334320068359375, -0.31268310546875, -0.291046142578125, -0.2694091796875, -0.247772216796875, -0.22613525390625, -0.204498291015625, -0.182861328125, -0.161224365234375, -0.13958740234375, -0.117950439453125, -0.0963134765625, -0.074676513671875, -0.05303955078125, -0.031402587890625, -0.009765625, 0.011871337890625, 0.03350830078125, 0.055145263671875, 0.0767822265625, 0.098419189453125, 0.12005615234375, 0.141693115234375, 0.163330078125, 0.184967041015625, 0.20660400390625, 0.228240966796875, 0.2498779296875, 0.271514892578125, 0.29315185546875, 0.314788818359375, 0.33642578125, 0.358062744140625, 0.37969970703125, 0.401336669921875, 0.4229736328125, 0.444610595703125, 0.46624755859375, 0.487884521484375, 0.509521484375, 0.531158447265625, 0.55279541015625, 0.574432373046875, 0.5960693359375, 0.617706298828125, 0.63934326171875, 0.660980224609375, 0.6826171875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 8.0, 5.0, 3.0, 10.0, 9.0, 18.0, 50.0, 88.0, 167.0, 236.0, 163.0, 99.0, 54.0, 41.0, 18.0, 11.0, 8.0, 4.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368408203125, -0.3567466735839844, -0.34508514404296875, -0.3334236145019531, -0.3217620849609375, -0.3101005554199219, -0.29843902587890625, -0.2867774963378906, -0.275115966796875, -0.2634544372558594, -0.25179290771484375, -0.24013137817382812, -0.2284698486328125, -0.21680831909179688, -0.20514678955078125, -0.19348526000976562, -0.18182373046875, -0.17016220092773438, -0.15850067138671875, -0.14683914184570312, -0.1351776123046875, -0.12351608276367188, -0.11185455322265625, -0.10019302368164062, -0.088531494140625, -0.07686996459960938, -0.06520843505859375, -0.053546905517578125, -0.0418853759765625, -0.030223846435546875, -0.01856231689453125, -0.006900787353515625, 0.0047607421875, 0.016422271728515625, 0.02808380126953125, 0.039745330810546875, 0.0514068603515625, 0.06306838989257812, 0.07472991943359375, 0.08639144897460938, 0.098052978515625, 0.10971450805664062, 0.12137603759765625, 0.13303756713867188, 0.1446990966796875, 0.15636062622070312, 0.16802215576171875, 0.17968368530273438, 0.19134521484375, 0.20300674438476562, 0.21466827392578125, 0.22632980346679688, 0.2379913330078125, 0.24965286254882812, 0.26131439208984375, 0.2729759216308594, 0.284637451171875, 0.2962989807128906, 0.30796051025390625, 0.3196220397949219, 0.3312835693359375, 0.3429450988769531, 0.35460662841796875, 0.3662681579589844, 0.3779296875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 20.0, 52.0, 160.0, 442.0, 200.0, 79.0, 23.0, 17.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.938676834106445, -5.698006629943848, -5.45733642578125, -5.216666221618652, -4.975996017456055, -4.735325813293457, -4.494655609130859, -4.253985404968262, -4.013315200805664, -3.7726449966430664, -3.5319747924804688, -3.291304588317871, -3.0506343841552734, -2.809964179992676, -2.5692942142486572, -2.3286240100860596, -2.087954044342041, -1.8472838401794434, -1.6066136360168457, -1.3659435510635376, -1.12527334690094, -0.8846031427383423, -0.6439330577850342, -0.4032628536224365, -0.16259264945983887, 0.0780775249004364, 0.31874769926071167, 0.5594178438186646, 0.8000880479812622, 1.0407582521438599, 1.281428337097168, 1.5220985412597656, 1.7627687454223633, 2.003438949584961, 2.2441091537475586, 2.4847793579101562, 2.725449562072754, 2.9661197662353516, 3.20678973197937, 3.4474599361419678, 3.6881301403045654, 3.928800344467163, 4.169470310211182, 4.410140514373779, 4.650810718536377, 4.891480922698975, 5.132151126861572, 5.37282133102417, 5.613491535186768, 5.854161739349365, 6.094831943511963, 6.3355021476745605, 6.576172351837158, 6.816842555999756, 7.057512283325195, 7.298182487487793, 7.538852691650391, 7.779522895812988, 8.020193099975586, 8.260863304138184, 8.501533508300781, 8.742203712463379, 8.982873916625977, 9.223544120788574, 9.464214324951172]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 9.0, 14.0, 15.0, 15.0, 21.0, 22.0, 31.0, 37.0, 34.0, 57.0, 60.0, 62.0, 65.0, 84.0, 69.0, 51.0, 66.0, 61.0, 47.0, 44.0, 25.0, 33.0, 20.0, 15.0, 15.0, 8.0, 6.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.111644744873047, -3.957146167755127, -3.802647590637207, -3.648149013519287, -3.493650197982788, -3.339151620864868, -3.1846530437469482, -3.030154228210449, -2.8756556510925293, -2.7211570739746094, -2.5666584968566895, -2.4121599197387695, -2.2576611042022705, -2.1031625270843506, -1.9486639499664307, -1.7941652536392212, -1.6396667957305908, -1.485168218612671, -1.3306695222854614, -1.1761709451675415, -1.021672248840332, -0.8671736717224121, -0.7126750946044922, -0.5581763982772827, -0.4036778211593628, -0.2491791993379593, -0.09468057751655579, 0.05981802940368652, 0.21431666612625122, 0.3688153028488159, 0.5233138799667358, 0.6778125762939453, 0.8323111534118652, 0.9868097901344299, 1.1413084268569946, 1.2958070039749146, 1.450305700302124, 1.604804277420044, 1.7593028545379639, 1.9138015508651733, 2.068300247192383, 2.2227988243103027, 2.3772974014282227, 2.5317959785461426, 2.6862947940826416, 2.8407933712005615, 2.9952919483184814, 3.1497907638549805, 3.3042891025543213, 3.458787679672241, 3.613286256790161, 3.76778507232666, 3.92228364944458, 4.0767822265625, 4.23128080368042, 4.38577938079834, 4.54027795791626, 4.69477653503418, 4.8492751121521, 5.0037736892700195, 5.1582722663879395, 5.312770843505859, 5.4672698974609375, 5.621768474578857, 5.776267051696777]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 22.0, 42.0, 150.0, 643.0, 302639.0, 3889996.0, 546.0, 130.0, 45.0, 15.0, 9.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.17578125, -6.032196044921875, -5.88861083984375, -5.745025634765625, -5.6014404296875, -5.457855224609375, -5.31427001953125, -5.170684814453125, -5.027099609375, -4.883514404296875, -4.73992919921875, -4.596343994140625, -4.4527587890625, -4.309173583984375, -4.16558837890625, -4.022003173828125, -3.87841796875, -3.734832763671875, -3.59124755859375, -3.447662353515625, -3.3040771484375, -3.160491943359375, -3.01690673828125, -2.873321533203125, -2.729736328125, -2.586151123046875, -2.44256591796875, -2.298980712890625, -2.1553955078125, -2.011810302734375, -1.86822509765625, -1.724639892578125, -1.5810546875, -1.437469482421875, -1.29388427734375, -1.150299072265625, -1.0067138671875, -0.863128662109375, -0.71954345703125, -0.575958251953125, -0.432373046875, -0.288787841796875, -0.14520263671875, -0.001617431640625, 0.1419677734375, 0.285552978515625, 0.42913818359375, 0.572723388671875, 0.71630859375, 0.859893798828125, 1.00347900390625, 1.147064208984375, 1.2906494140625, 1.434234619140625, 1.57781982421875, 1.721405029296875, 1.864990234375, 2.008575439453125, 2.15216064453125, 2.295745849609375, 2.4393310546875, 2.582916259765625, 2.72650146484375, 2.870086669921875, 3.013671875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 15.0, 36.0, 115.0, 197.0, 290.0, 207.0, 79.0, 33.0, 12.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71630859375, -0.6998023986816406, -0.6832962036132812, -0.6667900085449219, -0.6502838134765625, -0.6337776184082031, -0.6172714233398438, -0.6007652282714844, -0.584259033203125, -0.5677528381347656, -0.5512466430664062, -0.5347404479980469, -0.5182342529296875, -0.5017280578613281, -0.48522186279296875, -0.4687156677246094, -0.45220947265625, -0.4357032775878906, -0.41919708251953125, -0.4026908874511719, -0.3861846923828125, -0.3696784973144531, -0.35317230224609375, -0.3366661071777344, -0.320159912109375, -0.3036537170410156, -0.28714752197265625, -0.2706413269042969, -0.2541351318359375, -0.23762893676757812, -0.22112274169921875, -0.20461654663085938, -0.1881103515625, -0.17160415649414062, -0.15509796142578125, -0.13859176635742188, -0.1220855712890625, -0.10557937622070312, -0.08907318115234375, -0.07256698608398438, -0.056060791015625, -0.039554595947265625, -0.02304840087890625, -0.006542205810546875, 0.0099639892578125, 0.026470184326171875, 0.04297637939453125, 0.059482574462890625, 0.07598876953125, 0.09249496459960938, 0.10900115966796875, 0.12550735473632812, 0.1420135498046875, 0.15851974487304688, 0.17502593994140625, 0.19153213500976562, 0.208038330078125, 0.22454452514648438, 0.24105072021484375, 0.2575569152832031, 0.2740631103515625, 0.2905693054199219, 0.30707550048828125, 0.3235816955566406, 0.340087890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 9.0, 17.0, 37.0, 48.0, 114.0, 188.0, 458.0, 1188.0, 4644.0, 32358.0, 4081709.0, 64205.0, 6761.0, 1619.0, 504.0, 202.0, 112.0, 45.0, 21.0, 9.0, 11.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58740234375, -0.5614242553710938, -0.5354461669921875, -0.5094680786132812, -0.483489990234375, -0.45751190185546875, -0.4315338134765625, -0.40555572509765625, -0.37957763671875, -0.35359954833984375, -0.3276214599609375, -0.30164337158203125, -0.275665283203125, -0.24968719482421875, -0.2237091064453125, -0.19773101806640625, -0.1717529296875, -0.14577484130859375, -0.1197967529296875, -0.09381866455078125, -0.067840576171875, -0.04186248779296875, -0.0158843994140625, 0.01009368896484375, 0.03607177734375, 0.06204986572265625, 0.0880279541015625, 0.11400604248046875, 0.139984130859375, 0.16596221923828125, 0.1919403076171875, 0.21791839599609375, 0.243896484375, 0.26987457275390625, 0.2958526611328125, 0.32183074951171875, 0.347808837890625, 0.37378692626953125, 0.3997650146484375, 0.42574310302734375, 0.45172119140625, 0.47769927978515625, 0.5036773681640625, 0.5296554565429688, 0.555633544921875, 0.5816116333007812, 0.6075897216796875, 0.6335678100585938, 0.6595458984375, 0.6855239868164062, 0.7115020751953125, 0.7374801635742188, 0.763458251953125, 0.7894363403320312, 0.8154144287109375, 0.8413925170898438, 0.86737060546875, 0.8933486938476562, 0.9193267822265625, 0.9453048706054688, 0.971282958984375, 0.9972610473632812, 1.0232391357421875, 1.0492172241210938, 1.0751953125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 8.0, 14.0, 22.0, 48.0, 122.0, 497.0, 3038.0, 175.0, 44.0, 23.0, 23.0, 19.0, 8.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318115234375, -0.3095703125, -0.301025390625, -0.29248046875, -0.283935546875, -0.275390625, -0.266845703125, -0.25830078125, -0.249755859375, -0.2412109375, -0.232666015625, -0.22412109375, -0.215576171875, -0.20703125, -0.198486328125, -0.18994140625, -0.181396484375, -0.1728515625, -0.164306640625, -0.15576171875, -0.147216796875, -0.138671875, -0.130126953125, -0.12158203125, -0.113037109375, -0.1044921875, -0.095947265625, -0.08740234375, -0.078857421875, -0.0703125, -0.061767578125, -0.05322265625, -0.044677734375, -0.0361328125, -0.027587890625, -0.01904296875, -0.010498046875, -0.001953125, 0.006591796875, 0.01513671875, 0.023681640625, 0.0322265625, 0.040771484375, 0.04931640625, 0.057861328125, 0.06640625, 0.074951171875, 0.08349609375, 0.092041015625, 0.1005859375, 0.109130859375, 0.11767578125, 0.126220703125, 0.134765625, 0.143310546875, 0.15185546875, 0.160400390625, 0.1689453125, 0.177490234375, 0.18603515625, 0.194580078125, 0.203125, 0.211669921875, 0.22021484375, 0.228759765625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 33.0, 147.0, 533.0, 241.0, 41.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.640495777130127, -3.567335605621338, -3.494175434112549, -3.4210152626037598, -3.3478550910949707, -3.2746951580047607, -3.2015349864959717, -3.1283748149871826, -3.0552146434783936, -2.9820544719696045, -2.9088943004608154, -2.8357341289520264, -2.7625741958618164, -2.6894140243530273, -2.6162538528442383, -2.543093681335449, -2.46993350982666, -2.396773338317871, -2.323613166809082, -2.250452995300293, -2.177292823791504, -2.104132890701294, -2.030972719192505, -1.9578125476837158, -1.8846523761749268, -1.8114922046661377, -1.7383320331573486, -1.6651719808578491, -1.59201180934906, -1.518851637840271, -1.4456915855407715, -1.3725314140319824, -1.2993710041046143, -1.2262108325958252, -1.1530506610870361, -1.0798906087875366, -1.0067304372787476, -0.9335702657699585, -0.8604101538658142, -0.7872500419616699, -0.7140898704528809, -0.6409296989440918, -0.5677695870399475, -0.49460944533348083, -0.42144930362701416, -0.3482891619205475, -0.2751290202140808, -0.20196890830993652, -0.12880873680114746, -0.055648595094680786, 0.01751154661178589, 0.09067168831825256, 0.16383183002471924, 0.2369919717311859, 0.3101521134376526, 0.3833122253417969, 0.45647239685058594, 0.529632568359375, 0.6027926802635193, 0.6759527921676636, 0.7491129636764526, 0.8222731351852417, 0.895433247089386, 0.9685933589935303, 1.0417535305023193]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 5.0, 7.0, 11.0, 18.0, 15.0, 29.0, 32.0, 26.0, 44.0, 64.0, 55.0, 60.0, 50.0, 48.0, 51.0, 69.0, 51.0, 56.0, 64.0, 48.0, 40.0, 40.0, 30.0, 32.0, 18.0, 10.0, 12.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8985940217971802, -0.8755716681480408, -0.8525493144989014, -0.8295270204544067, -0.8065046668052673, -0.7834823131561279, -0.7604599595069885, -0.7374376058578491, -0.7144153118133545, -0.6913929581642151, -0.6683706045150757, -0.645348310470581, -0.6223259568214417, -0.5993036031723022, -0.5762812495231628, -0.5532588958740234, -0.530236542224884, -0.5072141885757446, -0.4841918647289276, -0.4611695110797882, -0.4381471872329712, -0.4151248335838318, -0.3921024799346924, -0.369080126285553, -0.34605780243873596, -0.32303544878959656, -0.30001312494277954, -0.27699077129364014, -0.25396841764450073, -0.23094609379768372, -0.2079237401485443, -0.1849014014005661, -0.16187900304794312, -0.1388566642999649, -0.1158343181014061, -0.09281197190284729, -0.06978963315486908, -0.04676729440689087, -0.023744940757751465, -0.0007226020097732544, 0.022299736738204956, 0.045322079211473465, 0.06834442168474197, 0.09136676788330078, 0.11438910663127899, 0.1374114453792572, 0.1604337990283966, 0.18345613777637482, 0.20647847652435303, 0.22950081527233124, 0.25252315402030945, 0.27554550766944885, 0.29856783151626587, 0.3215901851654053, 0.3446125388145447, 0.3676348924636841, 0.3906572163105011, 0.4136795699596405, 0.4367018938064575, 0.4597242474555969, 0.48274660110473633, 0.505768895149231, 0.5287913084030151, 0.5518136024475098, 0.5748359560966492]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 17.0, 12.0, 19.0, 30.0, 46.0, 64.0, 72.0, 123.0, 246.0, 477.0, 1053.0, 2690.0, 14797.0, 835382.0, 182714.0, 7199.0, 1906.0, 772.0, 389.0, 192.0, 109.0, 55.0, 33.0, 46.0, 23.0, 21.0, 13.0, 14.0, 6.0, 7.0, 8.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.189453125, -2.122772216796875, -2.05609130859375, -1.989410400390625, -1.9227294921875, -1.856048583984375, -1.78936767578125, -1.722686767578125, -1.656005859375, -1.589324951171875, -1.52264404296875, -1.455963134765625, -1.3892822265625, -1.322601318359375, -1.25592041015625, -1.189239501953125, -1.12255859375, -1.055877685546875, -0.98919677734375, -0.922515869140625, -0.8558349609375, -0.789154052734375, -0.72247314453125, -0.655792236328125, -0.589111328125, -0.522430419921875, -0.45574951171875, -0.389068603515625, -0.3223876953125, -0.255706787109375, -0.18902587890625, -0.122344970703125, -0.0556640625, 0.011016845703125, 0.07769775390625, 0.144378662109375, 0.2110595703125, 0.277740478515625, 0.34442138671875, 0.411102294921875, 0.477783203125, 0.544464111328125, 0.61114501953125, 0.677825927734375, 0.7445068359375, 0.811187744140625, 0.87786865234375, 0.944549560546875, 1.01123046875, 1.077911376953125, 1.14459228515625, 1.211273193359375, 1.2779541015625, 1.344635009765625, 1.41131591796875, 1.477996826171875, 1.544677734375, 1.611358642578125, 1.67803955078125, 1.744720458984375, 1.8114013671875, 1.878082275390625, 1.94476318359375, 2.011444091796875, 2.078125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 9.0, 16.0, 44.0, 125.0, 229.0, 258.0, 196.0, 71.0, 35.0, 8.0, 3.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7109375, -0.6945114135742188, -0.6780853271484375, -0.6616592407226562, -0.645233154296875, -0.6288070678710938, -0.6123809814453125, -0.5959548950195312, -0.57952880859375, -0.5631027221679688, -0.5466766357421875, -0.5302505493164062, -0.513824462890625, -0.49739837646484375, -0.4809722900390625, -0.46454620361328125, -0.4481201171875, -0.43169403076171875, -0.4152679443359375, -0.39884185791015625, -0.382415771484375, -0.36598968505859375, -0.3495635986328125, -0.33313751220703125, -0.31671142578125, -0.30028533935546875, -0.2838592529296875, -0.26743316650390625, -0.251007080078125, -0.23458099365234375, -0.2181549072265625, -0.20172882080078125, -0.185302734375, -0.16887664794921875, -0.1524505615234375, -0.13602447509765625, -0.119598388671875, -0.10317230224609375, -0.0867462158203125, -0.07032012939453125, -0.05389404296875, -0.03746795654296875, -0.0210418701171875, -0.00461578369140625, 0.011810302734375, 0.02823638916015625, 0.0446624755859375, 0.06108856201171875, 0.0775146484375, 0.09394073486328125, 0.1103668212890625, 0.12679290771484375, 0.143218994140625, 0.15964508056640625, 0.1760711669921875, 0.19249725341796875, 0.20892333984375, 0.22534942626953125, 0.2417755126953125, 0.25820159912109375, 0.274627685546875, 0.29105377197265625, 0.3074798583984375, 0.32390594482421875, 0.34033203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 12.0, 12.0, 15.0, 22.0, 25.0, 27.0, 25.0, 50.0, 52.0, 115.0, 255.0, 737.0, 2519.0, 13124.0, 110679.0, 804216.0, 100729.0, 12228.0, 2378.0, 682.0, 252.0, 121.0, 56.0, 48.0, 29.0, 23.0, 23.0, 17.0, 12.0, 15.0, 9.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2626953125, -1.22607421875, -1.189453125, -1.15283203125, -1.1162109375, -1.07958984375, -1.04296875, -1.00634765625, -0.9697265625, -0.93310546875, -0.896484375, -0.85986328125, -0.8232421875, -0.78662109375, -0.75, -0.71337890625, -0.6767578125, -0.64013671875, -0.603515625, -0.56689453125, -0.5302734375, -0.49365234375, -0.45703125, -0.42041015625, -0.3837890625, -0.34716796875, -0.310546875, -0.27392578125, -0.2373046875, -0.20068359375, -0.1640625, -0.12744140625, -0.0908203125, -0.05419921875, -0.017578125, 0.01904296875, 0.0556640625, 0.09228515625, 0.12890625, 0.16552734375, 0.2021484375, 0.23876953125, 0.275390625, 0.31201171875, 0.3486328125, 0.38525390625, 0.421875, 0.45849609375, 0.4951171875, 0.53173828125, 0.568359375, 0.60498046875, 0.6416015625, 0.67822265625, 0.71484375, 0.75146484375, 0.7880859375, 0.82470703125, 0.861328125, 0.89794921875, 0.9345703125, 0.97119140625, 1.0078125, 1.04443359375, 1.0810546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 16.0, 11.0, 19.0, 21.0, 22.0, 27.0, 35.0, 34.0, 37.0, 36.0, 41.0, 44.0, 54.0, 44.0, 56.0, 56.0, 48.0, 52.0, 31.0, 44.0, 33.0, 32.0, 31.0, 17.0, 35.0, 17.0, 17.0, 16.0, 13.0, 8.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6220703125, -0.6008453369140625, -0.579620361328125, -0.5583953857421875, -0.53717041015625, -0.5159454345703125, -0.494720458984375, -0.4734954833984375, -0.4522705078125, -0.4310455322265625, -0.409820556640625, -0.3885955810546875, -0.36737060546875, -0.3461456298828125, -0.324920654296875, -0.3036956787109375, -0.282470703125, -0.2612457275390625, -0.240020751953125, -0.2187957763671875, -0.19757080078125, -0.1763458251953125, -0.155120849609375, -0.1338958740234375, -0.1126708984375, -0.0914459228515625, -0.070220947265625, -0.0489959716796875, -0.02777099609375, -0.0065460205078125, 0.014678955078125, 0.0359039306640625, 0.05712890625, 0.0783538818359375, 0.099578857421875, 0.1208038330078125, 0.14202880859375, 0.1632537841796875, 0.184478759765625, 0.2057037353515625, 0.2269287109375, 0.2481536865234375, 0.269378662109375, 0.2906036376953125, 0.31182861328125, 0.3330535888671875, 0.354278564453125, 0.3755035400390625, 0.396728515625, 0.4179534912109375, 0.439178466796875, 0.4604034423828125, 0.48162841796875, 0.5028533935546875, 0.524078369140625, 0.5453033447265625, 0.5665283203125, 0.5877532958984375, 0.608978271484375, 0.6302032470703125, 0.65142822265625, 0.6726531982421875, 0.693878173828125, 0.7151031494140625, 0.736328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 12.0, 8.0, 18.0, 22.0, 37.0, 52.0, 78.0, 158.0, 244.0, 533.0, 1176.0, 3359.0, 13484.0, 92631.0, 770763.0, 141505.0, 17625.0, 4168.0, 1396.0, 577.0, 291.0, 139.0, 102.0, 64.0, 32.0, 31.0, 13.0, 7.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2410888671875, -0.23320579528808594, -0.22532272338867188, -0.2174396514892578, -0.20955657958984375, -0.2016735076904297, -0.19379043579101562, -0.18590736389160156, -0.1780242919921875, -0.17014122009277344, -0.16225814819335938, -0.1543750762939453, -0.14649200439453125, -0.1386089324951172, -0.13072586059570312, -0.12284278869628906, -0.114959716796875, -0.10707664489746094, -0.09919357299804688, -0.09131050109863281, -0.08342742919921875, -0.07554435729980469, -0.06766128540039062, -0.05977821350097656, -0.0518951416015625, -0.04401206970214844, -0.036128997802734375, -0.028245925903320312, -0.02036285400390625, -0.012479782104492188, -0.004596710205078125, 0.0032863616943359375, 0.01116943359375, 0.019052505493164062, 0.026935577392578125, 0.03481864929199219, 0.04270172119140625, 0.05058479309082031, 0.058467864990234375, 0.06635093688964844, 0.0742340087890625, 0.08211708068847656, 0.09000015258789062, 0.09788322448730469, 0.10576629638671875, 0.11364936828613281, 0.12153244018554688, 0.12941551208496094, 0.137298583984375, 0.14518165588378906, 0.15306472778320312, 0.1609477996826172, 0.16883087158203125, 0.1767139434814453, 0.18459701538085938, 0.19248008728027344, 0.2003631591796875, 0.20824623107910156, 0.21612930297851562, 0.2240123748779297, 0.23189544677734375, 0.2397785186767578, 0.24766159057617188, 0.25554466247558594, 0.263427734375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 12.0, 7.0, 15.0, 33.0, 35.0, 53.0, 88.0, 112.0, 161.0, 118.0, 124.0, 89.0, 57.0, 30.0, 22.0, 11.0, 9.0, 11.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.297494888305664e-05, -4.209205508232117e-05, -4.120916128158569e-05, -4.032626748085022e-05, -3.9443373680114746e-05, -3.856047987937927e-05, -3.76775860786438e-05, -3.6794692277908325e-05, -3.591179847717285e-05, -3.502890467643738e-05, -3.4146010875701904e-05, -3.326311707496643e-05, -3.238022327423096e-05, -3.1497329473495483e-05, -3.061443567276001e-05, -2.9731541872024536e-05, -2.8848648071289062e-05, -2.796575427055359e-05, -2.7082860469818115e-05, -2.619996666908264e-05, -2.5317072868347168e-05, -2.4434179067611694e-05, -2.355128526687622e-05, -2.2668391466140747e-05, -2.1785497665405273e-05, -2.09026038646698e-05, -2.0019710063934326e-05, -1.9136816263198853e-05, -1.825392246246338e-05, -1.7371028661727905e-05, -1.648813486099243e-05, -1.5605241060256958e-05, -1.4722347259521484e-05, -1.383945345878601e-05, -1.2956559658050537e-05, -1.2073665857315063e-05, -1.119077205657959e-05, -1.0307878255844116e-05, -9.424984455108643e-06, -8.542090654373169e-06, -7.659196853637695e-06, -6.776303052902222e-06, -5.893409252166748e-06, -5.010515451431274e-06, -4.127621650695801e-06, -3.244727849960327e-06, -2.3618340492248535e-06, -1.4789402484893799e-06, -5.960464477539062e-07, 2.868473529815674e-07, 1.169741153717041e-06, 2.0526349544525146e-06, 2.9355287551879883e-06, 3.818422555923462e-06, 4.7013163566589355e-06, 5.584210157394409e-06, 6.467103958129883e-06, 7.3499977588653564e-06, 8.23289155960083e-06, 9.115785360336304e-06, 9.998679161071777e-06, 1.0881572961807251e-05, 1.1764466762542725e-05, 1.2647360563278198e-05, 1.3530254364013672e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 11.0, 2.0, 11.0, 6.0, 12.0, 15.0, 12.0, 23.0, 42.0, 71.0, 111.0, 282.0, 625.0, 2113.0, 10111.0, 83117.0, 840726.0, 96757.0, 10901.0, 2323.0, 673.0, 251.0, 123.0, 69.0, 36.0, 20.0, 23.0, 19.0, 12.0, 12.0, 8.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26513671875, -0.25615692138671875, -0.2471771240234375, -0.23819732666015625, -0.229217529296875, -0.22023773193359375, -0.2112579345703125, -0.20227813720703125, -0.19329833984375, -0.18431854248046875, -0.1753387451171875, -0.16635894775390625, -0.157379150390625, -0.14839935302734375, -0.1394195556640625, -0.13043975830078125, -0.1214599609375, -0.11248016357421875, -0.1035003662109375, -0.09452056884765625, -0.085540771484375, -0.07656097412109375, -0.0675811767578125, -0.05860137939453125, -0.04962158203125, -0.04064178466796875, -0.0316619873046875, -0.02268218994140625, -0.013702392578125, -0.00472259521484375, 0.0042572021484375, 0.01323699951171875, 0.022216796875, 0.03119659423828125, 0.0401763916015625, 0.04915618896484375, 0.058135986328125, 0.06711578369140625, 0.0760955810546875, 0.08507537841796875, 0.09405517578125, 0.10303497314453125, 0.1120147705078125, 0.12099456787109375, 0.129974365234375, 0.13895416259765625, 0.1479339599609375, 0.15691375732421875, 0.1658935546875, 0.17487335205078125, 0.1838531494140625, 0.19283294677734375, 0.201812744140625, 0.21079254150390625, 0.2197723388671875, 0.22875213623046875, 0.23773193359375, 0.24671173095703125, 0.2556915283203125, 0.26467132568359375, 0.273651123046875, 0.28263092041015625, 0.2916107177734375, 0.30059051513671875, 0.3095703125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 5.0, 6.0, 6.0, 5.0, 5.0, 8.0, 13.0, 15.0, 12.0, 15.0, 26.0, 23.0, 39.0, 32.0, 65.0, 81.0, 76.0, 81.0, 72.0, 68.0, 55.0, 54.0, 47.0, 42.0, 30.0, 25.0, 15.0, 11.0, 12.0, 8.0, 11.0, 9.0, 4.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1651611328125, -0.16042709350585938, -0.15569305419921875, -0.15095901489257812, -0.1462249755859375, -0.14149093627929688, -0.13675689697265625, -0.13202285766601562, -0.127288818359375, -0.12255477905273438, -0.11782073974609375, -0.11308670043945312, -0.1083526611328125, -0.10361862182617188, -0.09888458251953125, -0.09415054321289062, -0.08941650390625, -0.08468246459960938, -0.07994842529296875, -0.07521438598632812, -0.0704803466796875, -0.06574630737304688, -0.06101226806640625, -0.056278228759765625, -0.051544189453125, -0.046810150146484375, -0.04207611083984375, -0.037342071533203125, -0.0326080322265625, -0.027873992919921875, -0.02313995361328125, -0.018405914306640625, -0.013671875, -0.008937835693359375, -0.00420379638671875, 0.000530242919921875, 0.0052642822265625, 0.009998321533203125, 0.01473236083984375, 0.019466400146484375, 0.024200439453125, 0.028934478759765625, 0.03366851806640625, 0.038402557373046875, 0.0431365966796875, 0.047870635986328125, 0.05260467529296875, 0.057338714599609375, 0.06207275390625, 0.06680679321289062, 0.07154083251953125, 0.07627487182617188, 0.0810089111328125, 0.08574295043945312, 0.09047698974609375, 0.09521102905273438, 0.099945068359375, 0.10467910766601562, 0.10941314697265625, 0.11414718627929688, 0.1188812255859375, 0.12361526489257812, 0.12834930419921875, 0.13308334350585938, 0.1378173828125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 18.0, 50.0, 187.0, 503.0, 171.0, 49.0, 16.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.74199104309082, -16.41053009033203, -16.079071044921875, -15.747610092163086, -15.416150093078613, -15.08469009399414, -14.753229141235352, -14.421769142150879, -14.090309143066406, -13.758849143981934, -13.427389144897461, -13.095928192138672, -12.7644681930542, -12.433008193969727, -12.101547241210938, -11.770087242126465, -11.438627243041992, -11.10716724395752, -10.775707244873047, -10.444246292114258, -10.112786293029785, -9.781326293945312, -9.449865341186523, -9.11840534210205, -8.786945343017578, -8.455485343933105, -8.124025344848633, -7.792564392089844, -7.461104393005371, -7.129644393920898, -6.798183917999268, -6.466723442077637, -6.135263442993164, -5.803803443908691, -5.4723429679870605, -5.14088249206543, -4.809422492980957, -4.477962493896484, -4.1465020179748535, -3.8150417804718018, -3.48358154296875, -3.1521213054656982, -2.8206610679626465, -2.4892008304595947, -2.157740592956543, -1.8262803554534912, -1.4948201179504395, -1.1633598804473877, -0.8318996429443359, -0.5004394054412842, -0.16897916793823242, 0.16248106956481934, 0.4939413070678711, 0.8254015445709229, 1.1568617820739746, 1.4883220195770264, 1.8197822570800781, 2.15124249458313, 2.4827027320861816, 2.8141629695892334, 3.145623207092285, 3.477083444595337, 3.8085436820983887, 4.1400041580200195, 4.471464157104492]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 10.0, 4.0, 5.0, 8.0, 8.0, 12.0, 15.0, 15.0, 22.0, 24.0, 32.0, 39.0, 37.0, 34.0, 28.0, 46.0, 45.0, 35.0, 44.0, 51.0, 52.0, 42.0, 44.0, 46.0, 35.0, 31.0, 36.0, 35.0, 34.0, 23.0, 23.0, 19.0, 15.0, 10.0, 9.0, 4.0, 5.0, 7.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.852600574493408, -3.736675262451172, -3.6207501888275146, -3.5048248767852783, -3.388899803161621, -3.2729744911193848, -3.1570494174957275, -3.041124105453491, -2.925199031829834, -2.8092737197875977, -2.6933486461639404, -2.577423334121704, -2.461498260498047, -2.3455729484558105, -2.2296478748321533, -2.113722562789917, -1.9977973699569702, -1.8818721771240234, -1.7659469842910767, -1.6500217914581299, -1.534096598625183, -1.4181714057922363, -1.30224609375, -1.1863210201263428, -1.0703957080841064, -0.9544705152511597, -0.8385453224182129, -0.7226201295852661, -0.6066949367523193, -0.4907696843147278, -0.374844491481781, -0.25891929864883423, -0.14299416542053223, -0.027068965137004852, 0.08885623514652252, 0.2047814428806305, 0.32070663571357727, 0.43663185834884644, 0.5525570511817932, 0.66848224401474, 0.7844074368476868, 0.9003326296806335, 1.016257882118225, 1.1321830749511719, 1.2481082677841187, 1.3640334606170654, 1.4799586534500122, 1.595883846282959, 1.7118090391159058, 1.8277342319488525, 1.9436594247817993, 2.059584617614746, 2.1755099296569824, 2.2914350032806396, 2.407360315322876, 2.523285388946533, 2.6392107009887695, 2.755136013031006, 2.871061086654663, 2.9869863986968994, 3.1029114723205566, 3.218836784362793, 3.33476185798645, 3.4506871700286865, 3.5666122436523438]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 15.0, 12.0, 13.0, 25.0, 43.0, 79.0, 242.0, 928.0, 7104.0, 4179547.0, 5250.0, 702.0, 165.0, 54.0, 35.0, 23.0, 15.0, 7.0, 4.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.5863037109375, -5.457763671875, -5.3292236328125, -5.20068359375, -5.0721435546875, -4.943603515625, -4.8150634765625, -4.6865234375, -4.5579833984375, -4.429443359375, -4.3009033203125, -4.17236328125, -4.0438232421875, -3.915283203125, -3.7867431640625, -3.658203125, -3.5296630859375, -3.401123046875, -3.2725830078125, -3.14404296875, -3.0155029296875, -2.886962890625, -2.7584228515625, -2.6298828125, -2.5013427734375, -2.372802734375, -2.2442626953125, -2.11572265625, -1.9871826171875, -1.858642578125, -1.7301025390625, -1.6015625, -1.4730224609375, -1.344482421875, -1.2159423828125, -1.08740234375, -0.9588623046875, -0.830322265625, -0.7017822265625, -0.5732421875, -0.4447021484375, -0.316162109375, -0.1876220703125, -0.05908203125, 0.0694580078125, 0.197998046875, 0.3265380859375, 0.455078125, 0.5836181640625, 0.712158203125, 0.8406982421875, 0.96923828125, 1.0977783203125, 1.226318359375, 1.3548583984375, 1.4833984375, 1.6119384765625, 1.740478515625, 1.8690185546875, 1.99755859375, 2.1260986328125, 2.254638671875, 2.3831787109375, 2.51171875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 21.0, 72.0, 107.0, 191.0, 241.0, 168.0, 114.0, 39.0, 20.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74072265625, -0.7240219116210938, -0.7073211669921875, -0.6906204223632812, -0.673919677734375, -0.6572189331054688, -0.6405181884765625, -0.6238174438476562, -0.60711669921875, -0.5904159545898438, -0.5737152099609375, -0.5570144653320312, -0.540313720703125, -0.5236129760742188, -0.5069122314453125, -0.49021148681640625, -0.4735107421875, -0.45680999755859375, -0.4401092529296875, -0.42340850830078125, -0.406707763671875, -0.39000701904296875, -0.3733062744140625, -0.35660552978515625, -0.33990478515625, -0.32320404052734375, -0.3065032958984375, -0.28980255126953125, -0.273101806640625, -0.25640106201171875, -0.2397003173828125, -0.22299957275390625, -0.206298828125, -0.18959808349609375, -0.1728973388671875, -0.15619659423828125, -0.139495849609375, -0.12279510498046875, -0.1060943603515625, -0.08939361572265625, -0.07269287109375, -0.05599212646484375, -0.0392913818359375, -0.02259063720703125, -0.005889892578125, 0.01081085205078125, 0.0275115966796875, 0.04421234130859375, 0.0609130859375, 0.07761383056640625, 0.0943145751953125, 0.11101531982421875, 0.127716064453125, 0.14441680908203125, 0.1611175537109375, 0.17781829833984375, 0.19451904296875, 0.21121978759765625, 0.2279205322265625, 0.24462127685546875, 0.261322021484375, 0.27802276611328125, 0.2947235107421875, 0.31142425537109375, 0.328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 14.0, 14.0, 25.0, 56.0, 113.0, 243.0, 527.0, 1504.0, 5411.0, 39492.0, 4048861.0, 86290.0, 8116.0, 2161.0, 785.0, 316.0, 160.0, 77.0, 36.0, 36.0, 16.0, 7.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.548828125, -1.5107040405273438, -1.4725799560546875, -1.4344558715820312, -1.396331787109375, -1.3582077026367188, -1.3200836181640625, -1.2819595336914062, -1.24383544921875, -1.2057113647460938, -1.1675872802734375, -1.1294631958007812, -1.091339111328125, -1.0532150268554688, -1.0150909423828125, -0.9769668579101562, -0.9388427734375, -0.9007186889648438, -0.8625946044921875, -0.8244705200195312, -0.786346435546875, -0.7482223510742188, -0.7100982666015625, -0.6719741821289062, -0.63385009765625, -0.5957260131835938, -0.5576019287109375, -0.5194778442382812, -0.481353759765625, -0.44322967529296875, -0.4051055908203125, -0.36698150634765625, -0.328857421875, -0.29073333740234375, -0.2526092529296875, -0.21448516845703125, -0.176361083984375, -0.13823699951171875, -0.1001129150390625, -0.06198883056640625, -0.02386474609375, 0.01425933837890625, 0.0523834228515625, 0.09050750732421875, 0.128631591796875, 0.16675567626953125, 0.2048797607421875, 0.24300384521484375, 0.2811279296875, 0.31925201416015625, 0.3573760986328125, 0.39550018310546875, 0.433624267578125, 0.47174835205078125, 0.5098724365234375, 0.5479965209960938, 0.58612060546875, 0.6242446899414062, 0.6623687744140625, 0.7004928588867188, 0.738616943359375, 0.7767410278320312, 0.8148651123046875, 0.8529891967773438, 0.89111328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 4.0, 15.0, 27.0, 39.0, 72.0, 169.0, 767.0, 2625.0, 158.0, 58.0, 44.0, 28.0, 12.0, 10.0, 7.0, 7.0, 2.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305419921875, -0.2922325134277344, -0.27904510498046875, -0.2658576965332031, -0.2526702880859375, -0.23948287963867188, -0.22629547119140625, -0.21310806274414062, -0.199920654296875, -0.18673324584960938, -0.17354583740234375, -0.16035842895507812, -0.1471710205078125, -0.13398361206054688, -0.12079620361328125, -0.10760879516601562, -0.09442138671875, -0.08123397827148438, -0.06804656982421875, -0.054859161376953125, -0.0416717529296875, -0.028484344482421875, -0.01529693603515625, -0.002109527587890625, 0.011077880859375, 0.024265289306640625, 0.03745269775390625, 0.050640106201171875, 0.0638275146484375, 0.07701492309570312, 0.09020233154296875, 0.10338973999023438, 0.1165771484375, 0.12976455688476562, 0.14295196533203125, 0.15613937377929688, 0.1693267822265625, 0.18251419067382812, 0.19570159912109375, 0.20888900756835938, 0.222076416015625, 0.23526382446289062, 0.24845123291015625, 0.2616386413574219, 0.2748260498046875, 0.2880134582519531, 0.30120086669921875, 0.3143882751464844, 0.32757568359375, 0.3407630920410156, 0.35395050048828125, 0.3671379089355469, 0.3803253173828125, 0.3935127258300781, 0.40670013427734375, 0.4198875427246094, 0.433074951171875, 0.4462623596191406, 0.45944976806640625, 0.4726371765136719, 0.4858245849609375, 0.4990119934082031, 0.5121994018554688, 0.5253868103027344, 0.53857421875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 7.0, 6.0, 26.0, 78.0, 232.0, 384.0, 176.0, 57.0, 23.0, 12.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.161806344985962, -3.0679574012756348, -2.9741084575653076, -2.8802595138549805, -2.786410331726074, -2.692561388015747, -2.59871244430542, -2.5048635005950928, -2.4110145568847656, -2.3171656131744385, -2.2233166694641113, -2.129467725753784, -2.035618782043457, -1.9417697191238403, -1.8479206562042236, -1.7540717124938965, -1.6602227687835693, -1.5663738250732422, -1.472524881362915, -1.3786758184432983, -1.2848268747329712, -1.190977931022644, -1.0971288681030273, -1.0032799243927002, -0.909430980682373, -0.8155820369720459, -0.721733033657074, -0.627884030342102, -0.5340350866317749, -0.44018611311912537, -0.34633713960647583, -0.2524881362915039, -0.15863895416259766, -0.06478998064994812, 0.029058992862701416, 0.12290796637535095, 0.2167569398880005, 0.31060591340065, 0.40445488691329956, 0.4983038902282715, 0.5921528339385986, 0.6860017776489258, 0.7798507809638977, 0.8736997842788696, 0.9675487279891968, 1.061397671699524, 1.1552467346191406, 1.2490956783294678, 1.342944622039795, 1.436793565750122, 1.5306425094604492, 1.624491572380066, 1.718340516090393, 1.8121894598007202, 1.906038522720337, 1.999887466430664, 2.093736410140991, 2.1875853538513184, 2.2814342975616455, 2.3752832412719727, 2.469132423400879, 2.562981367111206, 2.656830310821533, 2.7506792545318604, 2.8445281982421875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 6.0, 4.0, 10.0, 12.0, 16.0, 20.0, 37.0, 44.0, 61.0, 74.0, 59.0, 74.0, 70.0, 77.0, 96.0, 74.0, 62.0, 51.0, 28.0, 34.0, 38.0, 20.0, 11.0, 11.0, 10.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4109008312225342, -1.3583920001983643, -1.3058831691741943, -1.2533743381500244, -1.2008655071258545, -1.1483566761016846, -1.0958478450775146, -1.0433388948440552, -0.9908300638198853, -0.9383212327957153, -0.8858124017715454, -0.8333035707473755, -0.7807946801185608, -0.7282858490943909, -0.675777018070221, -0.6232681274414062, -0.5707593560218811, -0.5182505249977112, -0.46574166417121887, -0.41323283314704895, -0.36072397232055664, -0.3082151412963867, -0.2557063102722168, -0.2031974494457245, -0.15068861842155457, -0.09817977249622345, -0.04567093402147293, 0.006837904453277588, 0.059346750378608704, 0.11185559630393982, 0.16436442732810974, 0.21687328815460205, 0.269382119178772, 0.3218909502029419, 0.3743998110294342, 0.4269086420536041, 0.47941750288009644, 0.5319263339042664, 0.5844351649284363, 0.636944055557251, 0.6894528865814209, 0.7419617176055908, 0.7944705486297607, 0.8469793796539307, 0.8994882702827454, 0.9519971013069153, 1.0045058727264404, 1.0570148229599, 1.1095235347747803, 1.1620323657989502, 1.2145411968231201, 1.26705002784729, 1.31955885887146, 1.3720676898956299, 1.4245765209197998, 1.4770854711532593, 1.5295943021774292, 1.5821031332015991, 1.634611964225769, 1.687120795249939, 1.7396296262741089, 1.7921385765075684, 1.8446474075317383, 1.8971562385559082, 1.9496650695800781]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 8.0, 13.0, 13.0, 17.0, 24.0, 33.0, 61.0, 87.0, 174.0, 393.0, 874.0, 2919.0, 21923.0, 929899.0, 84672.0, 4977.0, 1420.0, 466.0, 227.0, 129.0, 72.0, 44.0, 36.0, 25.0, 14.0, 6.0, 5.0, 8.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.412109375, -2.342559814453125, -2.27301025390625, -2.203460693359375, -2.1339111328125, -2.064361572265625, -1.99481201171875, -1.925262451171875, -1.855712890625, -1.786163330078125, -1.71661376953125, -1.647064208984375, -1.5775146484375, -1.507965087890625, -1.43841552734375, -1.368865966796875, -1.29931640625, -1.229766845703125, -1.16021728515625, -1.090667724609375, -1.0211181640625, -0.951568603515625, -0.88201904296875, -0.812469482421875, -0.742919921875, -0.673370361328125, -0.60382080078125, -0.534271240234375, -0.4647216796875, -0.395172119140625, -0.32562255859375, -0.256072998046875, -0.1865234375, -0.116973876953125, -0.04742431640625, 0.022125244140625, 0.0916748046875, 0.161224365234375, 0.23077392578125, 0.300323486328125, 0.369873046875, 0.439422607421875, 0.50897216796875, 0.578521728515625, 0.6480712890625, 0.717620849609375, 0.78717041015625, 0.856719970703125, 0.92626953125, 0.995819091796875, 1.06536865234375, 1.134918212890625, 1.2044677734375, 1.274017333984375, 1.34356689453125, 1.413116455078125, 1.482666015625, 1.552215576171875, 1.62176513671875, 1.691314697265625, 1.7608642578125, 1.830413818359375, 1.89996337890625, 1.969512939453125, 2.0390625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 15.0, 43.0, 98.0, 139.0, 213.0, 218.0, 147.0, 65.0, 33.0, 13.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7099609375, -0.6937675476074219, -0.6775741577148438, -0.6613807678222656, -0.6451873779296875, -0.6289939880371094, -0.6128005981445312, -0.5966072082519531, -0.580413818359375, -0.5642204284667969, -0.5480270385742188, -0.5318336486816406, -0.5156402587890625, -0.4994468688964844, -0.48325347900390625, -0.4670600891113281, -0.45086669921875, -0.4346733093261719, -0.41847991943359375, -0.4022865295410156, -0.3860931396484375, -0.3698997497558594, -0.35370635986328125, -0.3375129699707031, -0.321319580078125, -0.3051261901855469, -0.28893280029296875, -0.2727394104003906, -0.2565460205078125, -0.24035263061523438, -0.22415924072265625, -0.20796585083007812, -0.1917724609375, -0.17557907104492188, -0.15938568115234375, -0.14319229125976562, -0.1269989013671875, -0.11080551147460938, -0.09461212158203125, -0.07841873168945312, -0.062225341796875, -0.046031951904296875, -0.02983856201171875, -0.013645172119140625, 0.0025482177734375, 0.018741607666015625, 0.03493499755859375, 0.051128387451171875, 0.06732177734375, 0.08351516723632812, 0.09970855712890625, 0.11590194702148438, 0.1320953369140625, 0.14828872680664062, 0.16448211669921875, 0.18067550659179688, 0.196868896484375, 0.21306228637695312, 0.22925567626953125, 0.24544906616210938, 0.2616424560546875, 0.2778358459472656, 0.29402923583984375, 0.3102226257324219, 0.326416015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 6.0, 5.0, 13.0, 7.0, 20.0, 24.0, 36.0, 53.0, 88.0, 130.0, 276.0, 756.0, 2182.0, 8570.0, 55370.0, 736635.0, 216026.0, 21710.0, 4267.0, 1322.0, 505.0, 217.0, 120.0, 62.0, 34.0, 26.0, 36.0, 18.0, 11.0, 10.0, 10.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4228515625, -1.3841552734375, -1.345458984375, -1.3067626953125, -1.26806640625, -1.2293701171875, -1.190673828125, -1.1519775390625, -1.11328125, -1.0745849609375, -1.035888671875, -0.9971923828125, -0.95849609375, -0.9197998046875, -0.881103515625, -0.8424072265625, -0.8037109375, -0.7650146484375, -0.726318359375, -0.6876220703125, -0.64892578125, -0.6102294921875, -0.571533203125, -0.5328369140625, -0.494140625, -0.4554443359375, -0.416748046875, -0.3780517578125, -0.33935546875, -0.3006591796875, -0.261962890625, -0.2232666015625, -0.1845703125, -0.1458740234375, -0.107177734375, -0.0684814453125, -0.02978515625, 0.0089111328125, 0.047607421875, 0.0863037109375, 0.125, 0.1636962890625, 0.202392578125, 0.2410888671875, 0.27978515625, 0.3184814453125, 0.357177734375, 0.3958740234375, 0.4345703125, 0.4732666015625, 0.511962890625, 0.5506591796875, 0.58935546875, 0.6280517578125, 0.666748046875, 0.7054443359375, 0.744140625, 0.7828369140625, 0.821533203125, 0.8602294921875, 0.89892578125, 0.9376220703125, 0.976318359375, 1.0150146484375, 1.0537109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 9.0, 10.0, 8.0, 13.0, 23.0, 16.0, 23.0, 23.0, 21.0, 46.0, 49.0, 46.0, 51.0, 59.0, 84.0, 86.0, 54.0, 63.0, 65.0, 42.0, 37.0, 34.0, 27.0, 29.0, 21.0, 19.0, 13.0, 9.0, 8.0, 7.0, 4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77490234375, -0.7454910278320312, -0.7160797119140625, -0.6866683959960938, -0.657257080078125, -0.6278457641601562, -0.5984344482421875, -0.5690231323242188, -0.53961181640625, -0.5102005004882812, -0.4807891845703125, -0.45137786865234375, -0.421966552734375, -0.39255523681640625, -0.3631439208984375, -0.33373260498046875, -0.3043212890625, -0.27490997314453125, -0.2454986572265625, -0.21608734130859375, -0.186676025390625, -0.15726470947265625, -0.1278533935546875, -0.09844207763671875, -0.06903076171875, -0.03961944580078125, -0.0102081298828125, 0.01920318603515625, 0.048614501953125, 0.07802581787109375, 0.1074371337890625, 0.13684844970703125, 0.166259765625, 0.19567108154296875, 0.2250823974609375, 0.25449371337890625, 0.283905029296875, 0.31331634521484375, 0.3427276611328125, 0.37213897705078125, 0.40155029296875, 0.43096160888671875, 0.4603729248046875, 0.48978424072265625, 0.519195556640625, 0.5486068725585938, 0.5780181884765625, 0.6074295043945312, 0.6368408203125, 0.6662521362304688, 0.6956634521484375, 0.7250747680664062, 0.754486083984375, 0.7838973999023438, 0.8133087158203125, 0.8427200317382812, 0.87213134765625, 0.9015426635742188, 0.9309539794921875, 0.9603652954101562, 0.989776611328125, 1.0191879272460938, 1.0485992431640625, 1.0780105590820312, 1.107421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 10.0, 3.0, 6.0, 16.0, 19.0, 35.0, 67.0, 136.0, 278.0, 759.0, 2383.0, 11664.0, 123056.0, 851382.0, 49440.0, 6720.0, 1596.0, 521.0, 193.0, 86.0, 58.0, 29.0, 30.0, 14.0, 9.0, 6.0, 12.0, 7.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3359375, -0.3255500793457031, -0.31516265869140625, -0.3047752380371094, -0.2943878173828125, -0.2840003967285156, -0.27361297607421875, -0.2632255554199219, -0.252838134765625, -0.24245071411132812, -0.23206329345703125, -0.22167587280273438, -0.2112884521484375, -0.20090103149414062, -0.19051361083984375, -0.18012619018554688, -0.16973876953125, -0.15935134887695312, -0.14896392822265625, -0.13857650756835938, -0.1281890869140625, -0.11780166625976562, -0.10741424560546875, -0.09702682495117188, -0.086639404296875, -0.07625198364257812, -0.06586456298828125, -0.055477142333984375, -0.0450897216796875, -0.034702301025390625, -0.02431488037109375, -0.013927459716796875, -0.0035400390625, 0.006847381591796875, 0.01723480224609375, 0.027622222900390625, 0.0380096435546875, 0.048397064208984375, 0.05878448486328125, 0.06917190551757812, 0.079559326171875, 0.08994674682617188, 0.10033416748046875, 0.11072158813476562, 0.1211090087890625, 0.13149642944335938, 0.14188385009765625, 0.15227127075195312, 0.16265869140625, 0.17304611206054688, 0.18343353271484375, 0.19382095336914062, 0.2042083740234375, 0.21459579467773438, 0.22498321533203125, 0.23537063598632812, 0.245758056640625, 0.2561454772949219, 0.26653289794921875, 0.2769203186035156, 0.2873077392578125, 0.2976951599121094, 0.30808258056640625, 0.3184700012207031, 0.328857421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 2.0, 2.0, 9.0, 9.0, 8.0, 13.0, 20.0, 17.0, 28.0, 40.0, 47.0, 72.0, 112.0, 107.0, 144.0, 104.0, 87.0, 47.0, 32.0, 22.0, 26.0, 8.0, 7.0, 8.0, 9.0, 5.0, 3.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6927719116210938e-05, -1.6219913959503174e-05, -1.551210880279541e-05, -1.4804303646087646e-05, -1.4096498489379883e-05, -1.3388693332672119e-05, -1.2680888175964355e-05, -1.1973083019256592e-05, -1.1265277862548828e-05, -1.0557472705841064e-05, -9.8496675491333e-06, -9.141862392425537e-06, -8.434057235717773e-06, -7.72625207901001e-06, -7.018446922302246e-06, -6.310641765594482e-06, -5.602836608886719e-06, -4.895031452178955e-06, -4.187226295471191e-06, -3.4794211387634277e-06, -2.771615982055664e-06, -2.0638108253479004e-06, -1.3560056686401367e-06, -6.48200511932373e-07, 5.960464477539063e-08, 7.674098014831543e-07, 1.475214958190918e-06, 2.1830201148986816e-06, 2.8908252716064453e-06, 3.598630428314209e-06, 4.306435585021973e-06, 5.014240741729736e-06, 5.7220458984375e-06, 6.429851055145264e-06, 7.137656211853027e-06, 7.845461368560791e-06, 8.553266525268555e-06, 9.261071681976318e-06, 9.968876838684082e-06, 1.0676681995391846e-05, 1.138448715209961e-05, 1.2092292308807373e-05, 1.2800097465515137e-05, 1.35079026222229e-05, 1.4215707778930664e-05, 1.4923512935638428e-05, 1.563131809234619e-05, 1.6339123249053955e-05, 1.704692840576172e-05, 1.7754733562469482e-05, 1.8462538719177246e-05, 1.917034387588501e-05, 1.9878149032592773e-05, 2.0585954189300537e-05, 2.12937593460083e-05, 2.2001564502716064e-05, 2.2709369659423828e-05, 2.3417174816131592e-05, 2.4124979972839355e-05, 2.483278512954712e-05, 2.5540590286254883e-05, 2.6248395442962646e-05, 2.695620059967041e-05, 2.7664005756378174e-05, 2.8371810913085938e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 9.0, 7.0, 7.0, 12.0, 16.0, 26.0, 34.0, 86.0, 161.0, 396.0, 1402.0, 7958.0, 145647.0, 870567.0, 18483.0, 2622.0, 627.0, 240.0, 110.0, 53.0, 22.0, 14.0, 20.0, 10.0, 10.0, 7.0, 4.0, 3.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3740234375, -0.3597412109375, -0.345458984375, -0.3311767578125, -0.31689453125, -0.3026123046875, -0.288330078125, -0.2740478515625, -0.259765625, -0.2454833984375, -0.231201171875, -0.2169189453125, -0.20263671875, -0.1883544921875, -0.174072265625, -0.1597900390625, -0.1455078125, -0.1312255859375, -0.116943359375, -0.1026611328125, -0.08837890625, -0.0740966796875, -0.059814453125, -0.0455322265625, -0.03125, -0.0169677734375, -0.002685546875, 0.0115966796875, 0.02587890625, 0.0401611328125, 0.054443359375, 0.0687255859375, 0.0830078125, 0.0972900390625, 0.111572265625, 0.1258544921875, 0.14013671875, 0.1544189453125, 0.168701171875, 0.1829833984375, 0.197265625, 0.2115478515625, 0.225830078125, 0.2401123046875, 0.25439453125, 0.2686767578125, 0.282958984375, 0.2972412109375, 0.3115234375, 0.3258056640625, 0.340087890625, 0.3543701171875, 0.36865234375, 0.3829345703125, 0.397216796875, 0.4114990234375, 0.42578125, 0.4400634765625, 0.454345703125, 0.4686279296875, 0.48291015625, 0.4971923828125, 0.511474609375, 0.5257568359375, 0.5400390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 4.0, 3.0, 3.0, 6.0, 6.0, 8.0, 8.0, 7.0, 15.0, 16.0, 35.0, 45.0, 66.0, 110.0, 138.0, 149.0, 123.0, 66.0, 60.0, 34.0, 23.0, 15.0, 13.0, 10.0, 9.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 3.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.15757369995117188, -0.15157318115234375, -0.14557266235351562, -0.1395721435546875, -0.13357162475585938, -0.12757110595703125, -0.12157058715820312, -0.115570068359375, -0.10956954956054688, -0.10356903076171875, -0.09756851196289062, -0.0915679931640625, -0.08556747436523438, -0.07956695556640625, -0.07356643676757812, -0.06756591796875, -0.061565399169921875, -0.05556488037109375, -0.049564361572265625, -0.0435638427734375, -0.037563323974609375, -0.03156280517578125, -0.025562286376953125, -0.019561767578125, -0.013561248779296875, -0.00756072998046875, -0.001560211181640625, 0.0044403076171875, 0.010440826416015625, 0.01644134521484375, 0.022441864013671875, 0.0284423828125, 0.034442901611328125, 0.04044342041015625, 0.046443939208984375, 0.0524444580078125, 0.058444976806640625, 0.06444549560546875, 0.07044601440429688, 0.076446533203125, 0.08244705200195312, 0.08844757080078125, 0.09444808959960938, 0.1004486083984375, 0.10644912719726562, 0.11244964599609375, 0.11845016479492188, 0.12445068359375, 0.13045120239257812, 0.13645172119140625, 0.14245223999023438, 0.1484527587890625, 0.15445327758789062, 0.16045379638671875, 0.16645431518554688, 0.172454833984375, 0.17845535278320312, 0.18445587158203125, 0.19045639038085938, 0.1964569091796875, 0.20245742797851562, 0.20845794677734375, 0.21445846557617188, 0.220458984375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 13.0, 65.0, 278.0, 451.0, 142.0, 39.0, 14.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.783329010009766, -21.350446701049805, -20.917564392089844, -20.484683990478516, -20.051801681518555, -19.618919372558594, -19.186037063598633, -18.753154754638672, -18.320274353027344, -17.887392044067383, -17.454509735107422, -17.021629333496094, -16.588747024536133, -16.155864715576172, -15.722982406616211, -15.290101051330566, -14.857217788696289, -14.424335479736328, -13.991454124450684, -13.558571815490723, -13.125690460205078, -12.692808151245117, -12.259925842285156, -11.827044486999512, -11.394163131713867, -10.961280822753906, -10.528399467468262, -10.0955171585083, -9.662635803222656, -9.229753494262695, -8.796871185302734, -8.36398983001709, -7.931107997894287, -7.498226165771484, -7.065344333648682, -6.632462501525879, -6.199580192565918, -5.766698360443115, -5.3338165283203125, -4.900934219360352, -4.468052864074707, -4.035171031951904, -3.6022889614105225, -3.1694071292877197, -2.736525058746338, -2.303643226623535, -1.8707613945007324, -1.4378793239593506, -1.0049972534179688, -0.5721153020858765, -0.13923341035842896, 0.29364848136901855, 0.7265304327011108, 1.1594123840332031, 1.5922942161560059, 2.0251762866973877, 2.4580581188201904, 2.890939950942993, 3.323822021484375, 3.7567038536071777, 4.1895856857299805, 4.622467994689941, 5.055349349975586, 5.488231658935547, 5.92111349105835]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 3.0, 3.0, 7.0, 9.0, 18.0, 9.0, 14.0, 24.0, 23.0, 34.0, 34.0, 30.0, 34.0, 31.0, 40.0, 36.0, 45.0, 34.0, 52.0, 42.0, 47.0, 34.0, 54.0, 32.0, 37.0, 43.0, 34.0, 34.0, 25.0, 28.0, 22.0, 13.0, 16.0, 13.0, 9.0, 17.0, 3.0, 1.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.39192008972168, -4.265620231628418, -4.139319896697998, -4.013020038604736, -3.8867197036743164, -3.7604198455810547, -3.634119749069214, -3.507819652557373, -3.3815195560455322, -3.2552194595336914, -3.1289193630218506, -3.0026192665100098, -2.876319408416748, -2.750019073486328, -2.6237192153930664, -2.4974191188812256, -2.3711190223693848, -2.244818925857544, -2.118518829345703, -1.9922188520431519, -1.865918755531311, -1.7396186590194702, -1.613318681716919, -1.4870185852050781, -1.3607184886932373, -1.2344183921813965, -1.1081182956695557, -0.9818183183670044, -0.8555182218551636, -0.7292181253433228, -0.6029180884361267, -0.47661805152893066, -0.35031771659851074, -0.2240176498889923, -0.09771758317947388, 0.028582483530044556, 0.154882550239563, 0.2811826467514038, 0.40748268365859985, 0.5337827205657959, 0.6600828170776367, 0.7863829135894775, 0.9126829504966736, 1.0389829874038696, 1.1652830839157104, 1.2915831804275513, 1.4178831577301025, 1.5441832542419434, 1.6704833507537842, 1.796783447265625, 1.9230835437774658, 2.0493836402893066, 2.1756834983825684, 2.3019838333129883, 2.42828369140625, 2.554583787918091, 2.6808838844299316, 2.8071839809417725, 2.9334840774536133, 3.059784173965454, 3.186084270477295, 3.3123841285705566, 3.4386842250823975, 3.5649843215942383, 3.691284418106079]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 11.0, 15.0, 10.0, 26.0, 25.0, 31.0, 48.0, 67.0, 83.0, 141.0, 232.0, 415.0, 907.0, 2314.0, 8263.0, 67130.0, 4062687.0, 42200.0, 6460.0, 1863.0, 702.0, 288.0, 146.0, 80.0, 37.0, 32.0, 17.0, 9.0, 10.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4609375, -1.42803955078125, -1.3951416015625, -1.36224365234375, -1.329345703125, -1.29644775390625, -1.2635498046875, -1.23065185546875, -1.19775390625, -1.16485595703125, -1.1319580078125, -1.09906005859375, -1.066162109375, -1.03326416015625, -1.0003662109375, -0.96746826171875, -0.9345703125, -0.90167236328125, -0.8687744140625, -0.83587646484375, -0.802978515625, -0.77008056640625, -0.7371826171875, -0.70428466796875, -0.67138671875, -0.63848876953125, -0.6055908203125, -0.57269287109375, -0.539794921875, -0.50689697265625, -0.4739990234375, -0.44110107421875, -0.408203125, -0.37530517578125, -0.3424072265625, -0.30950927734375, -0.276611328125, -0.24371337890625, -0.2108154296875, -0.17791748046875, -0.14501953125, -0.11212158203125, -0.0792236328125, -0.04632568359375, -0.013427734375, 0.01947021484375, 0.0523681640625, 0.08526611328125, 0.1181640625, 0.15106201171875, 0.1839599609375, 0.21685791015625, 0.249755859375, 0.28265380859375, 0.3155517578125, 0.34844970703125, 0.38134765625, 0.41424560546875, 0.4471435546875, 0.48004150390625, 0.512939453125, 0.54583740234375, 0.5787353515625, 0.61163330078125, 0.64453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 18.0, 41.0, 75.0, 127.0, 169.0, 184.0, 146.0, 116.0, 67.0, 24.0, 15.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.75537109375, -0.7386932373046875, -0.722015380859375, -0.7053375244140625, -0.68865966796875, -0.6719818115234375, -0.655303955078125, -0.6386260986328125, -0.6219482421875, -0.6052703857421875, -0.588592529296875, -0.5719146728515625, -0.55523681640625, -0.5385589599609375, -0.521881103515625, -0.5052032470703125, -0.488525390625, -0.4718475341796875, -0.455169677734375, -0.4384918212890625, -0.42181396484375, -0.4051361083984375, -0.388458251953125, -0.3717803955078125, -0.3551025390625, -0.3384246826171875, -0.321746826171875, -0.3050689697265625, -0.28839111328125, -0.2717132568359375, -0.255035400390625, -0.2383575439453125, -0.2216796875, -0.2050018310546875, -0.188323974609375, -0.1716461181640625, -0.15496826171875, -0.1382904052734375, -0.121612548828125, -0.1049346923828125, -0.0882568359375, -0.0715789794921875, -0.054901123046875, -0.0382232666015625, -0.02154541015625, -0.0048675537109375, 0.011810302734375, 0.0284881591796875, 0.045166015625, 0.0618438720703125, 0.078521728515625, 0.0951995849609375, 0.11187744140625, 0.1285552978515625, 0.145233154296875, 0.1619110107421875, 0.1785888671875, 0.1952667236328125, 0.211944580078125, 0.2286224365234375, 0.24530029296875, 0.2619781494140625, 0.278656005859375, 0.2953338623046875, 0.31201171875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 7.0, 14.0, 23.0, 54.0, 120.0, 260.0, 666.0, 1587.0, 3657.0, 11130.0, 57778.0, 3978020.0, 115552.0, 16466.0, 5120.0, 2133.0, 926.0, 421.0, 176.0, 73.0, 29.0, 20.0, 7.0, 8.0, 3.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.96533203125, -0.9374618530273438, -0.9095916748046875, -0.8817214965820312, -0.853851318359375, -0.8259811401367188, -0.7981109619140625, -0.7702407836914062, -0.74237060546875, -0.7145004272460938, -0.6866302490234375, -0.6587600708007812, -0.630889892578125, -0.6030197143554688, -0.5751495361328125, -0.5472793579101562, -0.5194091796875, -0.49153900146484375, -0.4636688232421875, -0.43579864501953125, -0.407928466796875, -0.38005828857421875, -0.3521881103515625, -0.32431793212890625, -0.29644775390625, -0.26857757568359375, -0.2407073974609375, -0.21283721923828125, -0.184967041015625, -0.15709686279296875, -0.1292266845703125, -0.10135650634765625, -0.073486328125, -0.04561614990234375, -0.0177459716796875, 0.01012420654296875, 0.037994384765625, 0.06586456298828125, 0.0937347412109375, 0.12160491943359375, 0.14947509765625, 0.17734527587890625, 0.2052154541015625, 0.23308563232421875, 0.260955810546875, 0.28882598876953125, 0.3166961669921875, 0.34456634521484375, 0.3724365234375, 0.40030670166015625, 0.4281768798828125, 0.45604705810546875, 0.483917236328125, 0.5117874145507812, 0.5396575927734375, 0.5675277709960938, 0.59539794921875, 0.6232681274414062, 0.6511383056640625, 0.6790084838867188, 0.706878662109375, 0.7347488403320312, 0.7626190185546875, 0.7904891967773438, 0.818359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 9.0, 14.0, 28.0, 16.0, 27.0, 64.0, 108.0, 302.0, 2960.0, 264.0, 93.0, 37.0, 29.0, 21.0, 15.0, 17.0, 11.0, 8.0, 2.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24819183349609375, -0.2397918701171875, -0.23139190673828125, -0.222991943359375, -0.21459197998046875, -0.2061920166015625, -0.19779205322265625, -0.18939208984375, -0.18099212646484375, -0.1725921630859375, -0.16419219970703125, -0.155792236328125, -0.14739227294921875, -0.1389923095703125, -0.13059234619140625, -0.1221923828125, -0.11379241943359375, -0.1053924560546875, -0.09699249267578125, -0.088592529296875, -0.08019256591796875, -0.0717926025390625, -0.06339263916015625, -0.05499267578125, -0.04659271240234375, -0.0381927490234375, -0.02979278564453125, -0.021392822265625, -0.01299285888671875, -0.0045928955078125, 0.00380706787109375, 0.01220703125, 0.02060699462890625, 0.0290069580078125, 0.03740692138671875, 0.045806884765625, 0.05420684814453125, 0.0626068115234375, 0.07100677490234375, 0.07940673828125, 0.08780670166015625, 0.0962066650390625, 0.10460662841796875, 0.113006591796875, 0.12140655517578125, 0.1298065185546875, 0.13820648193359375, 0.1466064453125, 0.15500640869140625, 0.1634063720703125, 0.17180633544921875, 0.180206298828125, 0.18860626220703125, 0.1970062255859375, 0.20540618896484375, 0.21380615234375, 0.22220611572265625, 0.2306060791015625, 0.23900604248046875, 0.247406005859375, 0.25580596923828125, 0.2642059326171875, 0.27260589599609375, 0.281005859375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 10.0, 18.0, 25.0, 78.0, 225.0, 342.0, 199.0, 72.0, 18.0, 8.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5095571279525757, -1.4336057901382446, -1.3576544523239136, -1.2817031145095825, -1.205751657485962, -1.1298003196716309, -1.0538489818572998, -0.9778976440429688, -0.9019463062286377, -0.8259949684143066, -0.7500436305999756, -0.6740922331809998, -0.5981408953666687, -0.5221895575523376, -0.4462381899356842, -0.37028682231903076, -0.2943354845046997, -0.21838413178920746, -0.1424327790737152, -0.06648142635822296, 0.009469926357269287, 0.08542126417160034, 0.16137263178825378, 0.23732399940490723, 0.3132753372192383, 0.38922667503356934, 0.4651780426502228, 0.5411294102668762, 0.6170807480812073, 0.6930320858955383, 0.7689834833145142, 0.8449348211288452, 0.9208860397338867, 0.9968373775482178, 1.0727887153625488, 1.1487400531768799, 1.224691390991211, 1.300642728805542, 1.3765941858291626, 1.4525455236434937, 1.5284968614578247, 1.6044481992721558, 1.6803995370864868, 1.7563508749008179, 1.8323023319244385, 1.9082536697387695, 1.9842050075531006, 2.0601563453674316, 2.1361076831817627, 2.2120590209960938, 2.288010358810425, 2.363961696624756, 2.439913034439087, 2.515864372253418, 2.591815710067749, 2.66776704788208, 2.7437186241149902, 2.8196699619293213, 2.8956212997436523, 2.9715726375579834, 3.0475239753723145, 3.1234753131866455, 3.1994266510009766, 3.2753782272338867, 3.3513293266296387]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 3.0, 6.0, 8.0, 19.0, 19.0, 47.0, 40.0, 49.0, 59.0, 57.0, 65.0, 65.0, 90.0, 79.0, 64.0, 74.0, 59.0, 37.0, 45.0, 27.0, 18.0, 15.0, 14.0, 11.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.409222960472107, -1.3669484853744507, -1.3246738910675049, -1.2823994159698486, -1.2401249408721924, -1.1978504657745361, -1.1555758714675903, -1.113301396369934, -1.0710268020629883, -1.028752326965332, -0.986477792263031, -0.94420325756073, -0.9019287824630737, -0.8596542477607727, -0.8173797130584717, -0.7751052379608154, -0.7328307628631592, -0.6905562281608582, -0.6482817530632019, -0.6060072183609009, -0.5637327432632446, -0.5214582085609436, -0.4791836738586426, -0.43690916895866394, -0.3946346640586853, -0.35236015915870667, -0.310085654258728, -0.267811119556427, -0.22553661465644836, -0.18326210975646973, -0.1409875750541687, -0.09871307015419006, -0.05643868446350098, -0.014164172112941742, 0.028110340237617493, 0.07038486003875732, 0.11265936493873596, 0.1549338698387146, 0.19720840454101562, 0.23948290944099426, 0.2817574143409729, 0.32403191924095154, 0.3663064241409302, 0.4085809588432312, 0.45085546374320984, 0.4931299686431885, 0.5354045033454895, 0.5776790380477905, 0.6199535131454468, 0.6622280478477478, 0.704502522945404, 0.7467770576477051, 0.7890515327453613, 0.8313260674476624, 0.8736006021499634, 0.9158750772476196, 0.9581496119499207, 1.0004241466522217, 1.042698621749878, 1.0849730968475342, 1.12724769115448, 1.1695221662521362, 1.211796760559082, 1.2540712356567383, 1.2963457107543945]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 3.0, 7.0, 4.0, 9.0, 15.0, 19.0, 21.0, 23.0, 38.0, 55.0, 129.0, 259.0, 525.0, 1215.0, 4196.0, 42626.0, 887011.0, 102476.0, 6845.0, 1667.0, 660.0, 346.0, 156.0, 85.0, 48.0, 29.0, 28.0, 12.0, 13.0, 7.0, 9.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.271484375, -2.21417236328125, -2.1568603515625, -2.09954833984375, -2.042236328125, -1.98492431640625, -1.9276123046875, -1.87030029296875, -1.81298828125, -1.75567626953125, -1.6983642578125, -1.64105224609375, -1.583740234375, -1.52642822265625, -1.4691162109375, -1.41180419921875, -1.3544921875, -1.29718017578125, -1.2398681640625, -1.18255615234375, -1.125244140625, -1.06793212890625, -1.0106201171875, -0.95330810546875, -0.89599609375, -0.83868408203125, -0.7813720703125, -0.72406005859375, -0.666748046875, -0.60943603515625, -0.5521240234375, -0.49481201171875, -0.4375, -0.38018798828125, -0.3228759765625, -0.26556396484375, -0.208251953125, -0.15093994140625, -0.0936279296875, -0.03631591796875, 0.02099609375, 0.07830810546875, 0.1356201171875, 0.19293212890625, 0.250244140625, 0.30755615234375, 0.3648681640625, 0.42218017578125, 0.4794921875, 0.53680419921875, 0.5941162109375, 0.65142822265625, 0.708740234375, 0.76605224609375, 0.8233642578125, 0.88067626953125, 0.93798828125, 0.99530029296875, 1.0526123046875, 1.10992431640625, 1.167236328125, 1.22454833984375, 1.2818603515625, 1.33917236328125, 1.396484375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 34.0, 58.0, 85.0, 165.0, 167.0, 160.0, 131.0, 91.0, 52.0, 21.0, 10.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.73486328125, -0.7188224792480469, -0.7027816772460938, -0.6867408752441406, -0.6707000732421875, -0.6546592712402344, -0.6386184692382812, -0.6225776672363281, -0.606536865234375, -0.5904960632324219, -0.5744552612304688, -0.5584144592285156, -0.5423736572265625, -0.5263328552246094, -0.5102920532226562, -0.4942512512207031, -0.47821044921875, -0.4621696472167969, -0.44612884521484375, -0.4300880432128906, -0.4140472412109375, -0.3980064392089844, -0.38196563720703125, -0.3659248352050781, -0.349884033203125, -0.3338432312011719, -0.31780242919921875, -0.3017616271972656, -0.2857208251953125, -0.2696800231933594, -0.25363922119140625, -0.23759841918945312, -0.2215576171875, -0.20551681518554688, -0.18947601318359375, -0.17343521118164062, -0.1573944091796875, -0.14135360717773438, -0.12531280517578125, -0.10927200317382812, -0.093231201171875, -0.07719039916992188, -0.06114959716796875, -0.045108795166015625, -0.0290679931640625, -0.013027191162109375, 0.00301361083984375, 0.019054412841796875, 0.03509521484375, 0.051136016845703125, 0.06717681884765625, 0.08321762084960938, 0.0992584228515625, 0.11529922485351562, 0.13134002685546875, 0.14738082885742188, 0.163421630859375, 0.17946243286132812, 0.19550323486328125, 0.21154403686523438, 0.2275848388671875, 0.24362564086914062, 0.25966644287109375, 0.2757072448730469, 0.291748046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 9.0, 19.0, 14.0, 12.0, 23.0, 29.0, 48.0, 64.0, 94.0, 194.0, 413.0, 1113.0, 3450.0, 13706.0, 87596.0, 759456.0, 154933.0, 20334.0, 4593.0, 1352.0, 516.0, 213.0, 108.0, 67.0, 45.0, 36.0, 22.0, 31.0, 11.0, 10.0, 8.0, 5.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0498046875, -1.01312255859375, -0.9764404296875, -0.93975830078125, -0.903076171875, -0.86639404296875, -0.8297119140625, -0.79302978515625, -0.75634765625, -0.71966552734375, -0.6829833984375, -0.64630126953125, -0.609619140625, -0.57293701171875, -0.5362548828125, -0.49957275390625, -0.462890625, -0.42620849609375, -0.3895263671875, -0.35284423828125, -0.316162109375, -0.27947998046875, -0.2427978515625, -0.20611572265625, -0.16943359375, -0.13275146484375, -0.0960693359375, -0.05938720703125, -0.022705078125, 0.01397705078125, 0.0506591796875, 0.08734130859375, 0.1240234375, 0.16070556640625, 0.1973876953125, 0.23406982421875, 0.270751953125, 0.30743408203125, 0.3441162109375, 0.38079833984375, 0.41748046875, 0.45416259765625, 0.4908447265625, 0.52752685546875, 0.564208984375, 0.60089111328125, 0.6375732421875, 0.67425537109375, 0.7109375, 0.74761962890625, 0.7843017578125, 0.82098388671875, 0.857666015625, 0.89434814453125, 0.9310302734375, 0.96771240234375, 1.00439453125, 1.04107666015625, 1.0777587890625, 1.11444091796875, 1.151123046875, 1.18780517578125, 1.2244873046875, 1.26116943359375, 1.2978515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 2.0, 9.0, 15.0, 24.0, 16.0, 28.0, 22.0, 27.0, 33.0, 45.0, 37.0, 55.0, 54.0, 51.0, 45.0, 56.0, 67.0, 61.0, 57.0, 52.0, 37.0, 31.0, 34.0, 27.0, 21.0, 13.0, 13.0, 9.0, 14.0, 11.0, 4.0, 1.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.94091796875, -0.9139404296875, -0.886962890625, -0.8599853515625, -0.8330078125, -0.8060302734375, -0.779052734375, -0.7520751953125, -0.72509765625, -0.6981201171875, -0.671142578125, -0.6441650390625, -0.6171875, -0.5902099609375, -0.563232421875, -0.5362548828125, -0.50927734375, -0.4822998046875, -0.455322265625, -0.4283447265625, -0.4013671875, -0.3743896484375, -0.347412109375, -0.3204345703125, -0.29345703125, -0.2664794921875, -0.239501953125, -0.2125244140625, -0.185546875, -0.1585693359375, -0.131591796875, -0.1046142578125, -0.07763671875, -0.0506591796875, -0.023681640625, 0.0032958984375, 0.0302734375, 0.0572509765625, 0.084228515625, 0.1112060546875, 0.13818359375, 0.1651611328125, 0.192138671875, 0.2191162109375, 0.24609375, 0.2730712890625, 0.300048828125, 0.3270263671875, 0.35400390625, 0.3809814453125, 0.407958984375, 0.4349365234375, 0.4619140625, 0.4888916015625, 0.515869140625, 0.5428466796875, 0.56982421875, 0.5968017578125, 0.623779296875, 0.6507568359375, 0.677734375, 0.7047119140625, 0.731689453125, 0.7586669921875, 0.78564453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 12.0, 19.0, 23.0, 39.0, 55.0, 99.0, 188.0, 492.0, 2039.0, 13718.0, 441339.0, 571901.0, 15451.0, 2163.0, 553.0, 207.0, 99.0, 52.0, 40.0, 13.0, 7.0, 9.0, 6.0, 3.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.468017578125, -0.4485359191894531, -0.42905426025390625, -0.4095726013183594, -0.3900909423828125, -0.3706092834472656, -0.35112762451171875, -0.3316459655761719, -0.312164306640625, -0.2926826477050781, -0.27320098876953125, -0.2537193298339844, -0.2342376708984375, -0.21475601196289062, -0.19527435302734375, -0.17579269409179688, -0.15631103515625, -0.13682937622070312, -0.11734771728515625, -0.09786605834960938, -0.0783843994140625, -0.058902740478515625, -0.03942108154296875, -0.019939422607421875, -0.000457763671875, 0.019023895263671875, 0.03850555419921875, 0.057987213134765625, 0.0774688720703125, 0.09695053100585938, 0.11643218994140625, 0.13591384887695312, 0.1553955078125, 0.17487716674804688, 0.19435882568359375, 0.21384048461914062, 0.2333221435546875, 0.2528038024902344, 0.27228546142578125, 0.2917671203613281, 0.311248779296875, 0.3307304382324219, 0.35021209716796875, 0.3696937561035156, 0.3891754150390625, 0.4086570739746094, 0.42813873291015625, 0.4476203918457031, 0.46710205078125, 0.4865837097167969, 0.5060653686523438, 0.5255470275878906, 0.5450286865234375, 0.5645103454589844, 0.5839920043945312, 0.6034736633300781, 0.622955322265625, 0.6424369812011719, 0.6619186401367188, 0.6814002990722656, 0.7008819580078125, 0.7203636169433594, 0.7398452758789062, 0.7593269348144531, 0.77880859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 5.0, 5.0, 13.0, 18.0, 24.0, 44.0, 131.0, 377.0, 217.0, 77.0, 38.0, 18.0, 17.0, 8.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2067298889160156e-05, -2.9535964131355286e-05, -2.7004629373550415e-05, -2.4473294615745544e-05, -2.1941959857940674e-05, -1.9410625100135803e-05, -1.6879290342330933e-05, -1.4347955584526062e-05, -1.1816620826721191e-05, -9.28528606891632e-06, -6.75395131111145e-06, -4.22261655330658e-06, -1.691281795501709e-06, 8.400529623031616e-07, 3.3713877201080322e-06, 5.902722477912903e-06, 8.434057235717773e-06, 1.0965391993522644e-05, 1.3496726751327515e-05, 1.6028061509132385e-05, 1.8559396266937256e-05, 2.1090731024742126e-05, 2.3622065782546997e-05, 2.6153400540351868e-05, 2.8684735298156738e-05, 3.121607005596161e-05, 3.374740481376648e-05, 3.627873957157135e-05, 3.881007432937622e-05, 4.134140908718109e-05, 4.387274384498596e-05, 4.640407860279083e-05, 4.89354133605957e-05, 5.1466748118400574e-05, 5.3998082876205444e-05, 5.6529417634010315e-05, 5.9060752391815186e-05, 6.159208714962006e-05, 6.412342190742493e-05, 6.66547566652298e-05, 6.918609142303467e-05, 7.171742618083954e-05, 7.424876093864441e-05, 7.678009569644928e-05, 7.931143045425415e-05, 8.184276521205902e-05, 8.437409996986389e-05, 8.690543472766876e-05, 8.943676948547363e-05, 9.19681042432785e-05, 9.449943900108337e-05, 9.703077375888824e-05, 9.956210851669312e-05, 0.00010209344327449799, 0.00010462477803230286, 0.00010715611279010773, 0.0001096874475479126, 0.00011221878230571747, 0.00011475011706352234, 0.00011728145182132721, 0.00011981278657913208, 0.00012234412133693695, 0.00012487545609474182, 0.0001274067908525467, 0.00012993812561035156]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 12.0, 28.0, 58.0, 93.0, 198.0, 616.0, 5950.0, 958701.0, 80393.0, 1902.0, 348.0, 125.0, 48.0, 43.0, 21.0, 10.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75390625, -0.719329833984375, -0.68475341796875, -0.650177001953125, -0.6156005859375, -0.581024169921875, -0.54644775390625, -0.511871337890625, -0.477294921875, -0.442718505859375, -0.40814208984375, -0.373565673828125, -0.3389892578125, -0.304412841796875, -0.26983642578125, -0.235260009765625, -0.20068359375, -0.166107177734375, -0.13153076171875, -0.096954345703125, -0.0623779296875, -0.027801513671875, 0.00677490234375, 0.041351318359375, 0.075927734375, 0.110504150390625, 0.14508056640625, 0.179656982421875, 0.2142333984375, 0.248809814453125, 0.28338623046875, 0.317962646484375, 0.3525390625, 0.387115478515625, 0.42169189453125, 0.456268310546875, 0.4908447265625, 0.525421142578125, 0.55999755859375, 0.594573974609375, 0.629150390625, 0.663726806640625, 0.69830322265625, 0.732879638671875, 0.7674560546875, 0.802032470703125, 0.83660888671875, 0.871185302734375, 0.90576171875, 0.940338134765625, 0.97491455078125, 1.009490966796875, 1.0440673828125, 1.078643798828125, 1.11322021484375, 1.147796630859375, 1.182373046875, 1.216949462890625, 1.25152587890625, 1.286102294921875, 1.3206787109375, 1.355255126953125, 1.38983154296875, 1.424407958984375, 1.458984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 3.0, 14.0, 30.0, 54.0, 108.0, 241.0, 288.0, 148.0, 49.0, 20.0, 15.0, 13.0, 9.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95166015625, -0.9326629638671875, -0.913665771484375, -0.8946685791015625, -0.87567138671875, -0.8566741943359375, -0.837677001953125, -0.8186798095703125, -0.7996826171875, -0.7806854248046875, -0.761688232421875, -0.7426910400390625, -0.72369384765625, -0.7046966552734375, -0.685699462890625, -0.6667022705078125, -0.647705078125, -0.6287078857421875, -0.609710693359375, -0.5907135009765625, -0.57171630859375, -0.5527191162109375, -0.533721923828125, -0.5147247314453125, -0.4957275390625, -0.4767303466796875, -0.457733154296875, -0.4387359619140625, -0.41973876953125, -0.4007415771484375, -0.381744384765625, -0.3627471923828125, -0.34375, -0.3247528076171875, -0.305755615234375, -0.2867584228515625, -0.26776123046875, -0.2487640380859375, -0.229766845703125, -0.2107696533203125, -0.1917724609375, -0.1727752685546875, -0.153778076171875, -0.1347808837890625, -0.11578369140625, -0.0967864990234375, -0.077789306640625, -0.0587921142578125, -0.039794921875, -0.0207977294921875, -0.001800537109375, 0.0171966552734375, 0.03619384765625, 0.0551910400390625, 0.074188232421875, 0.0931854248046875, 0.1121826171875, 0.1311798095703125, 0.150177001953125, 0.1691741943359375, 0.18817138671875, 0.2071685791015625, 0.226165771484375, 0.2451629638671875, 0.26416015625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 20.0, 49.0, 98.0, 268.0, 320.0, 139.0, 58.0, 28.0, 13.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.300485610961914, -12.002562522888184, -11.704639434814453, -11.406717300415039, -11.108794212341309, -10.810871124267578, -10.512948989868164, -10.215025901794434, -9.917102813720703, -9.619179725646973, -9.321256637573242, -9.023334503173828, -8.725411415100098, -8.427488327026367, -8.129566192626953, -7.831643104553223, -7.533720016479492, -7.235796928405762, -6.9378743171691895, -6.639951705932617, -6.342028617858887, -6.044105529785156, -5.746182918548584, -5.448260307312012, -5.150337219238281, -4.852414131164551, -4.5544915199279785, -4.256568908691406, -3.958645820617676, -3.6607229709625244, -3.362800121307373, -3.0648772716522217, -2.766953945159912, -2.4690310955047607, -2.1711082458496094, -1.873185396194458, -1.5752625465393066, -1.2773396968841553, -0.9794168472290039, -0.6814939975738525, -0.38357114791870117, -0.0856482982635498, 0.21227455139160156, 0.5101974010467529, 0.8081202507019043, 1.1060431003570557, 1.403965950012207, 1.7018887996673584, 1.9998116493225098, 2.297734498977661, 2.5956573486328125, 2.893580198287964, 3.1915030479431152, 3.4894258975982666, 3.787348747253418, 4.085271835327148, 4.383194446563721, 4.681117057800293, 4.979040145874023, 5.276963233947754, 5.574885845184326, 5.872808456420898, 6.170731544494629, 6.468654632568359, 6.766577243804932]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 7.0, 1.0, 6.0, 9.0, 15.0, 14.0, 4.0, 13.0, 12.0, 18.0, 23.0, 23.0, 21.0, 33.0, 23.0, 32.0, 44.0, 43.0, 37.0, 41.0, 34.0, 36.0, 37.0, 37.0, 39.0, 41.0, 38.0, 34.0, 33.0, 32.0, 29.0, 26.0, 38.0, 24.0, 12.0, 14.0, 18.0, 5.0, 11.0, 11.0, 12.0, 8.0, 6.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.060755968093872, -2.9560089111328125, -2.851261615753174, -2.7465145587921143, -2.6417675018310547, -2.537020206451416, -2.4322731494903564, -2.327526092529297, -2.222778797149658, -2.1180317401885986, -2.01328444480896, -1.9085373878479004, -1.8037902116775513, -1.6990430355072021, -1.5942959785461426, -1.4895488023757935, -1.3848016262054443, -1.2800544500350952, -1.175307273864746, -1.0705602169036865, -0.9658130407333374, -0.8610658645629883, -0.7563187479972839, -0.6515716314315796, -0.5468244552612305, -0.44207730889320374, -0.337330162525177, -0.23258301615715027, -0.12783586978912354, -0.023088693618774414, 0.08165842294692993, 0.18640553951263428, 0.2911524772644043, 0.39589962363243103, 0.5006467700004578, 0.6053938865661621, 0.7101410627365112, 0.8148882389068604, 0.9196353554725647, 1.024382472038269, 1.1291296482086182, 1.2338768243789673, 1.3386240005493164, 1.443371057510376, 1.548118233680725, 1.6528654098510742, 1.7576124668121338, 1.862359642982483, 1.967106819152832, 2.0718538761138916, 2.1766011714935303, 2.28134822845459, 2.3860955238342285, 2.490842580795288, 2.5955896377563477, 2.7003369331359863, 2.805083990097046, 2.9098310470581055, 3.014578342437744, 3.1193253993988037, 3.2240724563598633, 3.328819751739502, 3.4335668087005615, 3.538313865661621, 3.6430611610412598]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 11.0, 5.0, 7.0, 7.0, 11.0, 15.0, 10.0, 34.0, 48.0, 102.0, 205.0, 426.0, 1105.0, 4347.0, 75013.0, 4100315.0, 9852.0, 1778.0, 546.0, 229.0, 104.0, 44.0, 32.0, 13.0, 8.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.0859375, -4.9781951904296875, -4.870452880859375, -4.7627105712890625, -4.65496826171875, -4.5472259521484375, -4.439483642578125, -4.3317413330078125, -4.2239990234375, -4.1162567138671875, -4.008514404296875, -3.9007720947265625, -3.79302978515625, -3.6852874755859375, -3.577545166015625, -3.4698028564453125, -3.362060546875, -3.2543182373046875, -3.146575927734375, -3.0388336181640625, -2.93109130859375, -2.8233489990234375, -2.715606689453125, -2.6078643798828125, -2.5001220703125, -2.3923797607421875, -2.284637451171875, -2.1768951416015625, -2.06915283203125, -1.9614105224609375, -1.853668212890625, -1.7459259033203125, -1.63818359375, -1.5304412841796875, -1.422698974609375, -1.3149566650390625, -1.20721435546875, -1.0994720458984375, -0.991729736328125, -0.8839874267578125, -0.7762451171875, -0.6685028076171875, -0.560760498046875, -0.4530181884765625, -0.34527587890625, -0.2375335693359375, -0.129791259765625, -0.0220489501953125, 0.085693359375, 0.1934356689453125, 0.301177978515625, 0.4089202880859375, 0.51666259765625, 0.6244049072265625, 0.732147216796875, 0.8398895263671875, 0.9476318359375, 1.0553741455078125, 1.163116455078125, 1.2708587646484375, 1.37860107421875, 1.4863433837890625, 1.594085693359375, 1.7018280029296875, 1.8095703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 16.0, 26.0, 43.0, 79.0, 107.0, 144.0, 154.0, 133.0, 118.0, 85.0, 42.0, 24.0, 13.0, 10.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.759765625, -0.7434196472167969, -0.7270736694335938, -0.7107276916503906, -0.6943817138671875, -0.6780357360839844, -0.6616897583007812, -0.6453437805175781, -0.628997802734375, -0.6126518249511719, -0.5963058471679688, -0.5799598693847656, -0.5636138916015625, -0.5472679138183594, -0.5309219360351562, -0.5145759582519531, -0.49822998046875, -0.4818840026855469, -0.46553802490234375, -0.4491920471191406, -0.4328460693359375, -0.4165000915527344, -0.40015411376953125, -0.3838081359863281, -0.367462158203125, -0.3511161804199219, -0.33477020263671875, -0.3184242248535156, -0.3020782470703125, -0.2857322692871094, -0.26938629150390625, -0.2530403137207031, -0.2366943359375, -0.22034835815429688, -0.20400238037109375, -0.18765640258789062, -0.1713104248046875, -0.15496444702148438, -0.13861846923828125, -0.12227249145507812, -0.105926513671875, -0.08958053588867188, -0.07323455810546875, -0.056888580322265625, -0.0405426025390625, -0.024196624755859375, -0.00785064697265625, 0.008495330810546875, 0.02484130859375, 0.041187286376953125, 0.05753326416015625, 0.07387924194335938, 0.0902252197265625, 0.10657119750976562, 0.12291717529296875, 0.13926315307617188, 0.155609130859375, 0.17195510864257812, 0.18830108642578125, 0.20464706420898438, 0.2209930419921875, 0.23733901977539062, 0.25368499755859375, 0.2700309753417969, 0.286376953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 8.0, 5.0, 4.0, 5.0, 9.0, 18.0, 23.0, 35.0, 49.0, 98.0, 133.0, 209.0, 397.0, 695.0, 1558.0, 3836.0, 11837.0, 54698.0, 3874788.0, 208041.0, 25037.0, 7281.0, 2753.0, 1226.0, 582.0, 361.0, 217.0, 150.0, 96.0, 42.0, 42.0, 18.0, 14.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.33203125, -1.2947845458984375, -1.257537841796875, -1.2202911376953125, -1.18304443359375, -1.1457977294921875, -1.108551025390625, -1.0713043212890625, -1.0340576171875, -0.9968109130859375, -0.959564208984375, -0.9223175048828125, -0.88507080078125, -0.8478240966796875, -0.810577392578125, -0.7733306884765625, -0.736083984375, -0.6988372802734375, -0.661590576171875, -0.6243438720703125, -0.58709716796875, -0.5498504638671875, -0.512603759765625, -0.4753570556640625, -0.4381103515625, -0.4008636474609375, -0.363616943359375, -0.3263702392578125, -0.28912353515625, -0.2518768310546875, -0.214630126953125, -0.1773834228515625, -0.14013671875, -0.1028900146484375, -0.065643310546875, -0.0283966064453125, 0.00885009765625, 0.0460968017578125, 0.083343505859375, 0.1205902099609375, 0.1578369140625, 0.1950836181640625, 0.232330322265625, 0.2695770263671875, 0.30682373046875, 0.3440704345703125, 0.381317138671875, 0.4185638427734375, 0.455810546875, 0.4930572509765625, 0.530303955078125, 0.5675506591796875, 0.60479736328125, 0.6420440673828125, 0.679290771484375, 0.7165374755859375, 0.7537841796875, 0.7910308837890625, 0.828277587890625, 0.8655242919921875, 0.90277099609375, 0.9400177001953125, 0.977264404296875, 1.0145111083984375, 1.0517578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 9.0, 9.0, 19.0, 23.0, 33.0, 63.0, 123.0, 769.0, 2628.0, 153.0, 66.0, 48.0, 33.0, 18.0, 12.0, 14.0, 11.0, 8.0, 6.0, 5.0, 6.0, 5.0, 1.0, 0.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35498046875, -0.34137725830078125, -0.3277740478515625, -0.31417083740234375, -0.300567626953125, -0.28696441650390625, -0.2733612060546875, -0.25975799560546875, -0.24615478515625, -0.23255157470703125, -0.2189483642578125, -0.20534515380859375, -0.191741943359375, -0.17813873291015625, -0.1645355224609375, -0.15093231201171875, -0.1373291015625, -0.12372589111328125, -0.1101226806640625, -0.09651947021484375, -0.082916259765625, -0.06931304931640625, -0.0557098388671875, -0.04210662841796875, -0.02850341796875, -0.01490020751953125, -0.0012969970703125, 0.01230621337890625, 0.025909423828125, 0.03951263427734375, 0.0531158447265625, 0.06671905517578125, 0.080322265625, 0.09392547607421875, 0.1075286865234375, 0.12113189697265625, 0.134735107421875, 0.14833831787109375, 0.1619415283203125, 0.17554473876953125, 0.18914794921875, 0.20275115966796875, 0.2163543701171875, 0.22995758056640625, 0.243560791015625, 0.25716400146484375, 0.2707672119140625, 0.28437042236328125, 0.2979736328125, 0.31157684326171875, 0.3251800537109375, 0.33878326416015625, 0.352386474609375, 0.36598968505859375, 0.3795928955078125, 0.39319610595703125, 0.40679931640625, 0.42040252685546875, 0.4340057373046875, 0.44760894775390625, 0.461212158203125, 0.47481536865234375, 0.4884185791015625, 0.5020217895507812, 0.515625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 11.0, 53.0, 248.0, 441.0, 164.0, 52.0, 24.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.920597076416016, -4.764099597930908, -4.607602596282959, -4.451105117797852, -4.294608116149902, -4.138110637664795, -3.9816133975982666, -3.8251161575317383, -3.66861891746521, -3.5121216773986816, -3.3556244373321533, -3.199127197265625, -3.0426297187805176, -2.8861327171325684, -2.729635238647461, -2.5731379985809326, -2.4166407585144043, -2.260143518447876, -2.1036462783813477, -1.9471489191055298, -1.7906516790390015, -1.6341544389724731, -1.4776570796966553, -1.321159839630127, -1.1646625995635986, -1.0081653594970703, -0.8516680598258972, -0.6951707601547241, -0.5386735200881958, -0.3821762800216675, -0.22567898035049438, -0.06918168067932129, 0.08731555938720703, 0.24381282925605774, 0.40031009912490845, 0.5568073987960815, 0.7133046388626099, 0.8698018789291382, 1.026299238204956, 1.1827964782714844, 1.3392937183380127, 1.495790958404541, 1.6522881984710693, 1.8087855577468872, 1.9652827978134155, 2.1217799186706543, 2.2782773971557617, 2.43477463722229, 2.5912718772888184, 2.7477691173553467, 2.904266357421875, 3.0607635974884033, 3.2172608375549316, 3.373758316040039, 3.5302555561065674, 3.6867527961730957, 3.843250036239624, 3.9997472763061523, 4.15624475479126, 4.312741756439209, 4.469239234924316, 4.625736236572266, 4.782233715057373, 4.9387311935424805, 5.09522819519043]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 15.0, 16.0, 22.0, 27.0, 49.0, 62.0, 70.0, 82.0, 85.0, 96.0, 81.0, 84.0, 78.0, 62.0, 47.0, 36.0, 40.0, 16.0, 14.0, 4.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9566502571105957, -1.8838406801223755, -1.8110312223434448, -1.7382216453552246, -1.665412187576294, -1.5926026105880737, -1.5197930335998535, -1.4469835758209229, -1.3741739988327026, -1.3013644218444824, -1.2285549640655518, -1.1557453870773315, -1.0829358100891113, -1.0101263523101807, -0.9373167753219604, -0.864507257938385, -0.7916977405548096, -0.7188882231712341, -0.6460787057876587, -0.5732691287994385, -0.500459611415863, -0.4276500940322876, -0.35484054684638977, -0.28203099966049194, -0.2092214822769165, -0.13641194999217987, -0.06360241770744324, 0.009207114577293396, 0.08201664686203003, 0.15482616424560547, 0.2276357114315033, 0.3004452586174011, 0.37325501441955566, 0.4460645318031311, 0.5188740491867065, 0.5916836261749268, 0.6644931435585022, 0.7373026609420776, 0.8101122379302979, 0.8829217553138733, 0.9557312726974487, 1.028540849685669, 1.1013503074645996, 1.1741598844528198, 1.24696946144104, 1.3197789192199707, 1.392588496208191, 1.4653980731964111, 1.5382075309753418, 1.611017107963562, 1.6838265657424927, 1.756636142730713, 1.8294456005096436, 1.9022551774978638, 1.975064754486084, 2.0478742122650146, 2.1206836700439453, 2.193493127822876, 2.2663028240203857, 2.3391122817993164, 2.411921739578247, 2.4847311973571777, 2.5575408935546875, 2.630350351333618, 2.703160047531128]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 5.0, 6.0, 5.0, 8.0, 9.0, 14.0, 20.0, 12.0, 22.0, 48.0, 50.0, 69.0, 102.0, 143.0, 369.0, 612.0, 1397.0, 3723.0, 14554.0, 80670.0, 683550.0, 222724.0, 29541.0, 6764.0, 2189.0, 865.0, 441.0, 237.0, 96.0, 94.0, 43.0, 51.0, 29.0, 25.0, 15.0, 10.0, 7.0, 8.0, 7.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.6064453125, -1.5573577880859375, -1.508270263671875, -1.4591827392578125, -1.41009521484375, -1.3610076904296875, -1.311920166015625, -1.2628326416015625, -1.2137451171875, -1.1646575927734375, -1.115570068359375, -1.0664825439453125, -1.01739501953125, -0.9683074951171875, -0.919219970703125, -0.8701324462890625, -0.821044921875, -0.7719573974609375, -0.722869873046875, -0.6737823486328125, -0.62469482421875, -0.5756072998046875, -0.526519775390625, -0.4774322509765625, -0.4283447265625, -0.3792572021484375, -0.330169677734375, -0.2810821533203125, -0.23199462890625, -0.1829071044921875, -0.133819580078125, -0.0847320556640625, -0.03564453125, 0.0134429931640625, 0.062530517578125, 0.1116180419921875, 0.16070556640625, 0.2097930908203125, 0.258880615234375, 0.3079681396484375, 0.3570556640625, 0.4061431884765625, 0.455230712890625, 0.5043182373046875, 0.55340576171875, 0.6024932861328125, 0.651580810546875, 0.7006683349609375, 0.749755859375, 0.7988433837890625, 0.847930908203125, 0.8970184326171875, 0.94610595703125, 0.9951934814453125, 1.044281005859375, 1.0933685302734375, 1.1424560546875, 1.1915435791015625, 1.240631103515625, 1.2897186279296875, 1.33880615234375, 1.3878936767578125, 1.436981201171875, 1.4860687255859375, 1.53515625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 20.0, 20.0, 46.0, 80.0, 87.0, 129.0, 129.0, 133.0, 115.0, 95.0, 63.0, 31.0, 19.0, 13.0, 14.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.72998046875, -0.7140464782714844, -0.6981124877929688, -0.6821784973144531, -0.6662445068359375, -0.6503105163574219, -0.6343765258789062, -0.6184425354003906, -0.602508544921875, -0.5865745544433594, -0.5706405639648438, -0.5547065734863281, -0.5387725830078125, -0.5228385925292969, -0.5069046020507812, -0.4909706115722656, -0.47503662109375, -0.4591026306152344, -0.44316864013671875, -0.4272346496582031, -0.4113006591796875, -0.3953666687011719, -0.37943267822265625, -0.3634986877441406, -0.347564697265625, -0.3316307067871094, -0.31569671630859375, -0.2997627258300781, -0.2838287353515625, -0.2678947448730469, -0.25196075439453125, -0.23602676391601562, -0.2200927734375, -0.20415878295898438, -0.18822479248046875, -0.17229080200195312, -0.1563568115234375, -0.14042282104492188, -0.12448883056640625, -0.10855484008789062, -0.092620849609375, -0.07668685913085938, -0.06075286865234375, -0.044818878173828125, -0.0288848876953125, -0.012950897216796875, 0.00298309326171875, 0.018917083740234375, 0.03485107421875, 0.050785064697265625, 0.06671905517578125, 0.08265304565429688, 0.0985870361328125, 0.11452102661132812, 0.13045501708984375, 0.14638900756835938, 0.162322998046875, 0.17825698852539062, 0.19419097900390625, 0.21012496948242188, 0.2260589599609375, 0.24199295043945312, 0.25792694091796875, 0.2738609313964844, 0.289794921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 5.0, 5.0, 14.0, 13.0, 21.0, 25.0, 39.0, 55.0, 81.0, 140.0, 228.0, 427.0, 776.0, 1597.0, 3513.0, 9316.0, 30409.0, 141664.0, 665351.0, 146531.0, 31341.0, 9604.0, 3676.0, 1705.0, 826.0, 463.0, 278.0, 166.0, 89.0, 58.0, 53.0, 23.0, 18.0, 11.0, 11.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.1819610595703125, -1.143218994140625, -1.1044769287109375, -1.06573486328125, -1.0269927978515625, -0.988250732421875, -0.9495086669921875, -0.9107666015625, -0.8720245361328125, -0.833282470703125, -0.7945404052734375, -0.75579833984375, -0.7170562744140625, -0.678314208984375, -0.6395721435546875, -0.600830078125, -0.5620880126953125, -0.523345947265625, -0.4846038818359375, -0.44586181640625, -0.4071197509765625, -0.368377685546875, -0.3296356201171875, -0.2908935546875, -0.2521514892578125, -0.213409423828125, -0.1746673583984375, -0.13592529296875, -0.0971832275390625, -0.058441162109375, -0.0196990966796875, 0.01904296875, 0.0577850341796875, 0.096527099609375, 0.1352691650390625, 0.17401123046875, 0.2127532958984375, 0.251495361328125, 0.2902374267578125, 0.3289794921875, 0.3677215576171875, 0.406463623046875, 0.4452056884765625, 0.48394775390625, 0.5226898193359375, 0.561431884765625, 0.6001739501953125, 0.638916015625, 0.6776580810546875, 0.716400146484375, 0.7551422119140625, 0.79388427734375, 0.8326263427734375, 0.871368408203125, 0.9101104736328125, 0.9488525390625, 0.9875946044921875, 1.026336669921875, 1.0650787353515625, 1.10382080078125, 1.1425628662109375, 1.181304931640625, 1.2200469970703125, 1.2587890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 11.0, 7.0, 12.0, 16.0, 21.0, 30.0, 40.0, 39.0, 44.0, 59.0, 60.0, 57.0, 70.0, 71.0, 85.0, 71.0, 63.0, 47.0, 46.0, 29.0, 27.0, 25.0, 16.0, 7.0, 11.0, 9.0, 9.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4599609375, -1.4111785888671875, -1.362396240234375, -1.3136138916015625, -1.26483154296875, -1.2160491943359375, -1.167266845703125, -1.1184844970703125, -1.0697021484375, -1.0209197998046875, -0.972137451171875, -0.9233551025390625, -0.87457275390625, -0.8257904052734375, -0.777008056640625, -0.7282257080078125, -0.679443359375, -0.6306610107421875, -0.581878662109375, -0.5330963134765625, -0.48431396484375, -0.4355316162109375, -0.386749267578125, -0.3379669189453125, -0.2891845703125, -0.2404022216796875, -0.191619873046875, -0.1428375244140625, -0.09405517578125, -0.0452728271484375, 0.003509521484375, 0.0522918701171875, 0.10107421875, 0.1498565673828125, 0.198638916015625, 0.2474212646484375, 0.29620361328125, 0.3449859619140625, 0.393768310546875, 0.4425506591796875, 0.4913330078125, 0.5401153564453125, 0.588897705078125, 0.6376800537109375, 0.68646240234375, 0.7352447509765625, 0.784027099609375, 0.8328094482421875, 0.881591796875, 0.9303741455078125, 0.979156494140625, 1.0279388427734375, 1.07672119140625, 1.1255035400390625, 1.174285888671875, 1.2230682373046875, 1.2718505859375, 1.3206329345703125, 1.369415283203125, 1.4181976318359375, 1.46697998046875, 1.5157623291015625, 1.564544677734375, 1.6133270263671875, 1.662109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 9.0, 11.0, 10.0, 17.0, 39.0, 62.0, 110.0, 177.0, 329.0, 598.0, 1177.0, 2503.0, 6954.0, 28276.0, 647902.0, 328059.0, 21957.0, 5847.0, 2275.0, 1039.0, 524.0, 285.0, 154.0, 100.0, 53.0, 24.0, 15.0, 18.0, 5.0, 2.0, 9.0, 1.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9443359375, -0.9147567749023438, -0.8851776123046875, -0.8555984497070312, -0.826019287109375, -0.7964401245117188, -0.7668609619140625, -0.7372817993164062, -0.70770263671875, -0.6781234741210938, -0.6485443115234375, -0.6189651489257812, -0.589385986328125, -0.5598068237304688, -0.5302276611328125, -0.5006484985351562, -0.4710693359375, -0.44149017333984375, -0.4119110107421875, -0.38233184814453125, -0.352752685546875, -0.32317352294921875, -0.2935943603515625, -0.26401519775390625, -0.23443603515625, -0.20485687255859375, -0.1752777099609375, -0.14569854736328125, -0.116119384765625, -0.08654022216796875, -0.0569610595703125, -0.02738189697265625, 0.002197265625, 0.03177642822265625, 0.0613555908203125, 0.09093475341796875, 0.120513916015625, 0.15009307861328125, 0.1796722412109375, 0.20925140380859375, 0.23883056640625, 0.26840972900390625, 0.2979888916015625, 0.32756805419921875, 0.357147216796875, 0.38672637939453125, 0.4163055419921875, 0.44588470458984375, 0.4754638671875, 0.5050430297851562, 0.5346221923828125, 0.5642013549804688, 0.593780517578125, 0.6233596801757812, 0.6529388427734375, 0.6825180053710938, 0.71209716796875, 0.7416763305664062, 0.7712554931640625, 0.8008346557617188, 0.830413818359375, 0.8599929809570312, 0.8895721435546875, 0.9191513061523438, 0.94873046875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 11.0, 11.0, 21.0, 28.0, 30.0, 65.0, 98.0, 138.0, 190.0, 136.0, 99.0, 41.0, 28.0, 22.0, 13.0, 14.0, 3.0, 1.0, 6.0, 4.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.052587509155273e-05, -7.837172597646713e-05, -7.621757686138153e-05, -7.406342774629593e-05, -7.190927863121033e-05, -6.975512951612473e-05, -6.760098040103912e-05, -6.544683128595352e-05, -6.329268217086792e-05, -6.113853305578232e-05, -5.8984383940696716e-05, -5.6830234825611115e-05, -5.467608571052551e-05, -5.252193659543991e-05, -5.036778748035431e-05, -4.821363836526871e-05, -4.6059489250183105e-05, -4.3905340135097504e-05, -4.17511910200119e-05, -3.95970419049263e-05, -3.74428927898407e-05, -3.5288743674755096e-05, -3.3134594559669495e-05, -3.098044544458389e-05, -2.882629632949829e-05, -2.667214721441269e-05, -2.4517998099327087e-05, -2.2363848984241486e-05, -2.0209699869155884e-05, -1.8055550754070282e-05, -1.590140163898468e-05, -1.3747252523899078e-05, -1.1593103408813477e-05, -9.438954293727875e-06, -7.284805178642273e-06, -5.130656063556671e-06, -2.9765069484710693e-06, -8.223578333854675e-07, 1.3317912817001343e-06, 3.485940396785736e-06, 5.640089511871338e-06, 7.79423862695694e-06, 9.948387742042542e-06, 1.2102536857128143e-05, 1.4256685972213745e-05, 1.6410835087299347e-05, 1.856498420238495e-05, 2.071913331747055e-05, 2.2873282432556152e-05, 2.5027431547641754e-05, 2.7181580662727356e-05, 2.9335729777812958e-05, 3.148987889289856e-05, 3.364402800798416e-05, 3.579817712306976e-05, 3.7952326238155365e-05, 4.010647535324097e-05, 4.226062446832657e-05, 4.441477358341217e-05, 4.656892269849777e-05, 4.8723071813583374e-05, 5.0877220928668976e-05, 5.303137004375458e-05, 5.518551915884018e-05, 5.733966827392578e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 5.0, 13.0, 24.0, 43.0, 77.0, 193.0, 522.0, 1807.0, 9182.0, 739834.0, 287583.0, 7055.0, 1444.0, 440.0, 149.0, 73.0, 33.0, 22.0, 17.0, 9.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7578125, -1.707489013671875, -1.65716552734375, -1.606842041015625, -1.5565185546875, -1.506195068359375, -1.45587158203125, -1.405548095703125, -1.355224609375, -1.304901123046875, -1.25457763671875, -1.204254150390625, -1.1539306640625, -1.103607177734375, -1.05328369140625, -1.002960205078125, -0.95263671875, -0.902313232421875, -0.85198974609375, -0.801666259765625, -0.7513427734375, -0.701019287109375, -0.65069580078125, -0.600372314453125, -0.550048828125, -0.499725341796875, -0.44940185546875, -0.399078369140625, -0.3487548828125, -0.298431396484375, -0.24810791015625, -0.197784423828125, -0.1474609375, -0.097137451171875, -0.04681396484375, 0.003509521484375, 0.0538330078125, 0.104156494140625, 0.15447998046875, 0.204803466796875, 0.255126953125, 0.305450439453125, 0.35577392578125, 0.406097412109375, 0.4564208984375, 0.506744384765625, 0.55706787109375, 0.607391357421875, 0.65771484375, 0.708038330078125, 0.75836181640625, 0.808685302734375, 0.8590087890625, 0.909332275390625, 0.95965576171875, 1.009979248046875, 1.060302734375, 1.110626220703125, 1.16094970703125, 1.211273193359375, 1.2615966796875, 1.311920166015625, 1.36224365234375, 1.412567138671875, 1.462890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 7.0, 4.0, 12.0, 19.0, 28.0, 39.0, 64.0, 112.0, 155.0, 180.0, 134.0, 88.0, 45.0, 22.0, 21.0, 21.0, 9.0, 7.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.85693359375, -0.8319168090820312, -0.8069000244140625, -0.7818832397460938, -0.756866455078125, -0.7318496704101562, -0.7068328857421875, -0.6818161010742188, -0.65679931640625, -0.6317825317382812, -0.6067657470703125, -0.5817489624023438, -0.556732177734375, -0.5317153930664062, -0.5066986083984375, -0.48168182373046875, -0.4566650390625, -0.43164825439453125, -0.4066314697265625, -0.38161468505859375, -0.356597900390625, -0.33158111572265625, -0.3065643310546875, -0.28154754638671875, -0.25653076171875, -0.23151397705078125, -0.2064971923828125, -0.18148040771484375, -0.156463623046875, -0.13144683837890625, -0.1064300537109375, -0.08141326904296875, -0.056396484375, -0.03137969970703125, -0.0063629150390625, 0.01865386962890625, 0.043670654296875, 0.06868743896484375, 0.0937042236328125, 0.11872100830078125, 0.14373779296875, 0.16875457763671875, 0.1937713623046875, 0.21878814697265625, 0.243804931640625, 0.26882171630859375, 0.2938385009765625, 0.31885528564453125, 0.3438720703125, 0.36888885498046875, 0.3939056396484375, 0.41892242431640625, 0.443939208984375, 0.46895599365234375, 0.4939727783203125, 0.5189895629882812, 0.54400634765625, 0.5690231323242188, 0.5940399169921875, 0.6190567016601562, 0.644073486328125, 0.6690902709960938, 0.6941070556640625, 0.7191238403320312, 0.744140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 41.0, 99.0, 383.0, 328.0, 86.0, 35.0, 17.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.99549865722656, -43.13209915161133, -42.268699645996094, -41.405303955078125, -40.54190444946289, -39.678504943847656, -38.81510543823242, -37.95170593261719, -37.08831024169922, -36.224910736083984, -35.36151123046875, -34.49811553955078, -33.63471603393555, -32.77131652832031, -31.907917022705078, -31.044519424438477, -30.181119918823242, -29.317720413208008, -28.454322814941406, -27.590923309326172, -26.72752571105957, -25.864126205444336, -25.000728607177734, -24.1373291015625, -23.273929595947266, -22.41053009033203, -21.54713249206543, -20.683732986450195, -19.820335388183594, -18.95693588256836, -18.093536376953125, -17.230138778686523, -16.366741180419922, -15.503342628479004, -14.639944076538086, -13.776544570922852, -12.91314697265625, -12.049747467041016, -11.186348915100098, -10.32295036315918, -9.459550857543945, -8.596152305603027, -7.732753753662109, -6.869354724884033, -6.005956172943115, -5.142557621002197, -4.279158592224121, -3.415760040283203, -2.552361488342285, -1.6889628171920776, -0.8255641460418701, 0.03783464431762695, 0.9012331962585449, 1.764631748199463, 2.628030776977539, 3.491429328918457, 4.354827880859375, 5.218226432800293, 6.081624984741211, 6.945024013519287, 7.808422565460205, 8.671821594238281, 9.5352201461792, 10.398618698120117, 11.262017250061035]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 10.0, 8.0, 11.0, 18.0, 26.0, 13.0, 14.0, 30.0, 21.0, 30.0, 38.0, 34.0, 40.0, 34.0, 42.0, 45.0, 36.0, 48.0, 34.0, 31.0, 41.0, 37.0, 42.0, 39.0, 32.0, 31.0, 25.0, 26.0, 31.0, 23.0, 17.0, 17.0, 14.0, 10.0, 10.0, 10.0, 1.0, 7.0, 6.0, 6.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.0648722648620605, -6.840939998626709, -6.617007255554199, -6.393074989318848, -6.169142723083496, -5.9452104568481445, -5.721277713775635, -5.497345447540283, -5.273412704467773, -5.049480438232422, -4.825547695159912, -4.6016154289245605, -4.377683162689209, -4.153750419616699, -3.9298181533813477, -3.705885887145996, -3.4819536209106445, -3.258021116256714, -3.0340888500213623, -2.8101563453674316, -2.58622407913208, -2.3622915744781494, -2.1383590698242188, -1.9144266843795776, -1.6904942989349365, -1.4665619134902954, -1.2426295280456543, -1.0186970233917236, -0.7947646379470825, -0.5708322525024414, -0.34689974784851074, -0.12296736240386963, 0.10096454620361328, 0.3248969614505768, 0.5488293766975403, 0.7727618217468262, 0.9966942071914673, 1.2206265926361084, 1.444559097290039, 1.6684914827346802, 1.8924238681793213, 2.116356372833252, 2.3402886390686035, 2.564221143722534, 2.788153648376465, 3.0120859146118164, 3.236018419265747, 3.4599509239196777, 3.6838831901550293, 3.90781569480896, 4.131748199462891, 4.355680465698242, 4.579612731933594, 4.803544998168945, 5.027477741241455, 5.251410007476807, 5.475342750549316, 5.699275016784668, 5.923207759857178, 6.147140026092529, 6.371072292327881, 6.595005035400391, 6.818937301635742, 7.042869567871094, 7.266801834106445]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 13.0, 11.0, 20.0, 18.0, 24.0, 35.0, 51.0, 67.0, 139.0, 242.0, 502.0, 1150.0, 2639.0, 7669.0, 39533.0, 3961892.0, 156422.0, 16643.0, 4222.0, 1574.0, 714.0, 317.0, 178.0, 83.0, 48.0, 28.0, 12.0, 6.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0], "bins": [-3.640625, -3.561065673828125, -3.48150634765625, -3.401947021484375, -3.3223876953125, -3.242828369140625, -3.16326904296875, -3.083709716796875, -3.004150390625, -2.924591064453125, -2.84503173828125, -2.765472412109375, -2.6859130859375, -2.606353759765625, -2.52679443359375, -2.447235107421875, -2.36767578125, -2.288116455078125, -2.20855712890625, -2.128997802734375, -2.0494384765625, -1.969879150390625, -1.89031982421875, -1.810760498046875, -1.731201171875, -1.651641845703125, -1.57208251953125, -1.492523193359375, -1.4129638671875, -1.333404541015625, -1.25384521484375, -1.174285888671875, -1.0947265625, -1.015167236328125, -0.93560791015625, -0.856048583984375, -0.7764892578125, -0.696929931640625, -0.61737060546875, -0.537811279296875, -0.458251953125, -0.378692626953125, -0.29913330078125, -0.219573974609375, -0.1400146484375, -0.060455322265625, 0.01910400390625, 0.098663330078125, 0.17822265625, 0.257781982421875, 0.33734130859375, 0.416900634765625, 0.4964599609375, 0.576019287109375, 0.65557861328125, 0.735137939453125, 0.814697265625, 0.894256591796875, 0.97381591796875, 1.053375244140625, 1.1329345703125, 1.212493896484375, 1.29205322265625, 1.371612548828125, 1.451171875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 14.0, 23.0, 51.0, 64.0, 67.0, 70.0, 98.0, 88.0, 102.0, 108.0, 94.0, 61.0, 60.0, 27.0, 29.0, 17.0, 11.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.7958984375, -0.7785758972167969, -0.7612533569335938, -0.7439308166503906, -0.7266082763671875, -0.7092857360839844, -0.6919631958007812, -0.6746406555175781, -0.657318115234375, -0.6399955749511719, -0.6226730346679688, -0.6053504943847656, -0.5880279541015625, -0.5707054138183594, -0.5533828735351562, -0.5360603332519531, -0.51873779296875, -0.5014152526855469, -0.48409271240234375, -0.4667701721191406, -0.4494476318359375, -0.4321250915527344, -0.41480255126953125, -0.3974800109863281, -0.380157470703125, -0.3628349304199219, -0.34551239013671875, -0.3281898498535156, -0.3108673095703125, -0.2935447692871094, -0.27622222900390625, -0.2588996887207031, -0.2415771484375, -0.22425460815429688, -0.20693206787109375, -0.18960952758789062, -0.1722869873046875, -0.15496444702148438, -0.13764190673828125, -0.12031936645507812, -0.102996826171875, -0.08567428588867188, -0.06835174560546875, -0.051029205322265625, -0.0337066650390625, -0.016384124755859375, 0.00093841552734375, 0.018260955810546875, 0.03558349609375, 0.052906036376953125, 0.07022857666015625, 0.08755111694335938, 0.1048736572265625, 0.12219619750976562, 0.13951873779296875, 0.15684127807617188, 0.174163818359375, 0.19148635864257812, 0.20880889892578125, 0.22613143920898438, 0.2434539794921875, 0.2607765197753906, 0.27809906005859375, 0.2954216003417969, 0.312744140625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 10.0, 15.0, 19.0, 19.0, 31.0, 51.0, 80.0, 133.0, 167.0, 271.0, 407.0, 686.0, 1134.0, 2009.0, 3732.0, 7749.0, 18883.0, 67658.0, 2933291.0, 1060787.0, 62977.0, 18255.0, 7378.0, 3512.0, 1960.0, 1102.0, 700.0, 424.0, 275.0, 181.0, 125.0, 84.0, 50.0, 38.0, 26.0, 16.0, 10.0, 10.0, 8.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0], "bins": [-1.4951171875, -1.454681396484375, -1.41424560546875, -1.373809814453125, -1.3333740234375, -1.292938232421875, -1.25250244140625, -1.212066650390625, -1.171630859375, -1.131195068359375, -1.09075927734375, -1.050323486328125, -1.0098876953125, -0.969451904296875, -0.92901611328125, -0.888580322265625, -0.84814453125, -0.807708740234375, -0.76727294921875, -0.726837158203125, -0.6864013671875, -0.645965576171875, -0.60552978515625, -0.565093994140625, -0.524658203125, -0.484222412109375, -0.44378662109375, -0.403350830078125, -0.3629150390625, -0.322479248046875, -0.28204345703125, -0.241607666015625, -0.201171875, -0.160736083984375, -0.12030029296875, -0.079864501953125, -0.0394287109375, 0.001007080078125, 0.04144287109375, 0.081878662109375, 0.122314453125, 0.162750244140625, 0.20318603515625, 0.243621826171875, 0.2840576171875, 0.324493408203125, 0.36492919921875, 0.405364990234375, 0.44580078125, 0.486236572265625, 0.52667236328125, 0.567108154296875, 0.6075439453125, 0.647979736328125, 0.68841552734375, 0.728851318359375, 0.769287109375, 0.809722900390625, 0.85015869140625, 0.890594482421875, 0.9310302734375, 0.971466064453125, 1.01190185546875, 1.052337646484375, 1.0927734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 7.0, 2.0, 2.0, 7.0, 9.0, 5.0, 15.0, 15.0, 31.0, 62.0, 83.0, 162.0, 2696.0, 532.0, 169.0, 87.0, 60.0, 27.0, 18.0, 24.0, 13.0, 13.0, 9.0, 6.0, 4.0, 2.0, 3.0, 3.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6350479125976562, -0.6104278564453125, -0.5858078002929688, -0.561187744140625, -0.5365676879882812, -0.5119476318359375, -0.48732757568359375, -0.46270751953125, -0.43808746337890625, -0.4134674072265625, -0.38884735107421875, -0.364227294921875, -0.33960723876953125, -0.3149871826171875, -0.29036712646484375, -0.2657470703125, -0.24112701416015625, -0.2165069580078125, -0.19188690185546875, -0.167266845703125, -0.14264678955078125, -0.1180267333984375, -0.09340667724609375, -0.06878662109375, -0.04416656494140625, -0.0195465087890625, 0.00507354736328125, 0.029693603515625, 0.05431365966796875, 0.0789337158203125, 0.10355377197265625, 0.128173828125, 0.15279388427734375, 0.1774139404296875, 0.20203399658203125, 0.226654052734375, 0.25127410888671875, 0.2758941650390625, 0.30051422119140625, 0.32513427734375, 0.34975433349609375, 0.3743743896484375, 0.39899444580078125, 0.423614501953125, 0.44823455810546875, 0.4728546142578125, 0.49747467041015625, 0.5220947265625, 0.5467147827148438, 0.5713348388671875, 0.5959548950195312, 0.620574951171875, 0.6451950073242188, 0.6698150634765625, 0.6944351196289062, 0.71905517578125, 0.7436752319335938, 0.7682952880859375, 0.7929153442382812, 0.817535400390625, 0.8421554565429688, 0.8667755126953125, 0.8913955688476562, 0.916015625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 9.0, 23.0, 38.0, 107.0, 216.0, 254.0, 151.0, 98.0, 44.0, 19.0, 19.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4229354858398438, -3.2424254417419434, -3.061915636062622, -2.8814055919647217, -2.7008957862854004, -2.5203857421875, -2.3398756980895996, -2.1593658924102783, -1.9788559675216675, -1.7983460426330566, -1.6178361177444458, -1.437326192855835, -1.2568161487579346, -1.0763063430786133, -0.8957962989807129, -0.715286374092102, -0.5347764492034912, -0.35426652431488037, -0.17375656962394714, 0.006753385066986084, 0.18726330995559692, 0.36777323484420776, 0.5482832193374634, 0.7287931442260742, 0.9093030691146851, 1.089812994003296, 1.2703229188919067, 1.4508328437805176, 1.631342887878418, 1.8118526935577393, 1.9923627376556396, 2.172872543334961, 2.3533825874328613, 2.5338926315307617, 2.714402437210083, 2.8949124813079834, 3.0754222869873047, 3.255932331085205, 3.4364423751831055, 3.6169521808624268, 3.797461986541748, 3.9779720306396484, 4.158482074737549, 4.338991641998291, 4.519501686096191, 4.700011730194092, 4.880521774291992, 5.061031341552734, 5.241541862487793, 5.422051906585693, 5.602561950683594, 5.783071517944336, 5.963581562042236, 6.144091606140137, 6.324601650238037, 6.5051116943359375, 6.68562126159668, 6.86613130569458, 7.0466413497924805, 7.227150917053223, 7.407660961151123, 7.588171005249023, 7.768681049346924, 7.949191093444824, 8.129700660705566]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 9.0, 8.0, 13.0, 21.0, 32.0, 25.0, 34.0, 35.0, 33.0, 51.0, 50.0, 62.0, 61.0, 70.0, 47.0, 56.0, 50.0, 60.0, 36.0, 48.0, 37.0, 33.0, 29.0, 30.0, 19.0, 13.0, 11.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.947227954864502, -2.8547418117523193, -2.7622554302215576, -2.669769287109375, -2.5772831439971924, -2.4847970008850098, -2.392310619354248, -2.2998244762420654, -2.207338333129883, -2.1148521900177, -2.0223658084869385, -1.9298796653747559, -1.8373935222625732, -1.744907259941101, -1.652420997619629, -1.5599348545074463, -1.4674485921859741, -1.374962329864502, -1.2824761867523193, -1.1899899244308472, -1.0975037813186646, -1.0050175189971924, -0.912531316280365, -0.8200451135635376, -0.7275589108467102, -0.6350727081298828, -0.5425865054130554, -0.45010027289390564, -0.35761407017707825, -0.26512786746025085, -0.17264163494110107, -0.08015543222427368, 0.012330770492553711, 0.1048169806599617, 0.1973031908273697, 0.2897894084453583, 0.38227561116218567, 0.47476181387901306, 0.5672480463981628, 0.6597342491149902, 0.7522204518318176, 0.844706654548645, 0.9371928572654724, 1.0296790599822998, 1.122165322303772, 1.2146514654159546, 1.3071377277374268, 1.3996238708496094, 1.4921101331710815, 1.5845963954925537, 1.6770825386047363, 1.7695688009262085, 1.8620549440383911, 1.9545412063598633, 2.047027349472046, 2.1395134925842285, 2.2319998741149902, 2.324486017227173, 2.4169723987579346, 2.509458541870117, 2.6019446849823, 2.6944308280944824, 2.786917209625244, 2.8794033527374268, 2.9718894958496094]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 4.0, 9.0, 9.0, 16.0, 11.0, 26.0, 42.0, 44.0, 62.0, 94.0, 171.0, 429.0, 902.0, 2186.0, 6167.0, 23313.0, 103050.0, 620274.0, 232183.0, 42574.0, 11164.0, 3366.0, 1298.0, 566.0, 239.0, 117.0, 74.0, 49.0, 39.0, 23.0, 15.0, 12.0, 8.0, 6.0, 8.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.208984375, -2.145355224609375, -2.08172607421875, -2.018096923828125, -1.9544677734375, -1.890838623046875, -1.82720947265625, -1.763580322265625, -1.699951171875, -1.636322021484375, -1.57269287109375, -1.509063720703125, -1.4454345703125, -1.381805419921875, -1.31817626953125, -1.254547119140625, -1.19091796875, -1.127288818359375, -1.06365966796875, -1.000030517578125, -0.9364013671875, -0.872772216796875, -0.80914306640625, -0.745513916015625, -0.681884765625, -0.618255615234375, -0.55462646484375, -0.490997314453125, -0.4273681640625, -0.363739013671875, -0.30010986328125, -0.236480712890625, -0.1728515625, -0.109222412109375, -0.04559326171875, 0.018035888671875, 0.0816650390625, 0.145294189453125, 0.20892333984375, 0.272552490234375, 0.336181640625, 0.399810791015625, 0.46343994140625, 0.527069091796875, 0.5906982421875, 0.654327392578125, 0.71795654296875, 0.781585693359375, 0.84521484375, 0.908843994140625, 0.97247314453125, 1.036102294921875, 1.0997314453125, 1.163360595703125, 1.22698974609375, 1.290618896484375, 1.354248046875, 1.417877197265625, 1.48150634765625, 1.545135498046875, 1.6087646484375, 1.672393798828125, 1.73602294921875, 1.799652099609375, 1.86328125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 10.0, 12.0, 31.0, 46.0, 57.0, 65.0, 73.0, 66.0, 95.0, 100.0, 98.0, 90.0, 69.0, 57.0, 32.0, 29.0, 28.0, 14.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.748046875, -0.73114013671875, -0.7142333984375, -0.69732666015625, -0.680419921875, -0.66351318359375, -0.6466064453125, -0.62969970703125, -0.61279296875, -0.59588623046875, -0.5789794921875, -0.56207275390625, -0.545166015625, -0.52825927734375, -0.5113525390625, -0.49444580078125, -0.4775390625, -0.46063232421875, -0.4437255859375, -0.42681884765625, -0.409912109375, -0.39300537109375, -0.3760986328125, -0.35919189453125, -0.34228515625, -0.32537841796875, -0.3084716796875, -0.29156494140625, -0.274658203125, -0.25775146484375, -0.2408447265625, -0.22393798828125, -0.20703125, -0.19012451171875, -0.1732177734375, -0.15631103515625, -0.139404296875, -0.12249755859375, -0.1055908203125, -0.08868408203125, -0.07177734375, -0.05487060546875, -0.0379638671875, -0.02105712890625, -0.004150390625, 0.01275634765625, 0.0296630859375, 0.04656982421875, 0.0634765625, 0.08038330078125, 0.0972900390625, 0.11419677734375, 0.131103515625, 0.14801025390625, 0.1649169921875, 0.18182373046875, 0.19873046875, 0.21563720703125, 0.2325439453125, 0.24945068359375, 0.266357421875, 0.28326416015625, 0.3001708984375, 0.31707763671875, 0.333984375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 1.0, 6.0, 4.0, 14.0, 8.0, 21.0, 27.0, 38.0, 60.0, 79.0, 99.0, 195.0, 286.0, 451.0, 783.0, 1396.0, 2670.0, 5758.0, 13439.0, 36128.0, 117413.0, 521079.0, 248490.0, 61800.0, 21377.0, 8691.0, 3762.0, 1878.0, 996.0, 559.0, 367.0, 222.0, 165.0, 93.0, 72.0, 42.0, 29.0, 16.0, 11.0, 10.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5654296875, -1.5145111083984375, -1.463592529296875, -1.4126739501953125, -1.36175537109375, -1.3108367919921875, -1.259918212890625, -1.2089996337890625, -1.1580810546875, -1.1071624755859375, -1.056243896484375, -1.0053253173828125, -0.95440673828125, -0.9034881591796875, -0.852569580078125, -0.8016510009765625, -0.750732421875, -0.6998138427734375, -0.648895263671875, -0.5979766845703125, -0.54705810546875, -0.4961395263671875, -0.445220947265625, -0.3943023681640625, -0.3433837890625, -0.2924652099609375, -0.241546630859375, -0.1906280517578125, -0.13970947265625, -0.0887908935546875, -0.037872314453125, 0.0130462646484375, 0.06396484375, 0.1148834228515625, 0.165802001953125, 0.2167205810546875, 0.26763916015625, 0.3185577392578125, 0.369476318359375, 0.4203948974609375, 0.4713134765625, 0.5222320556640625, 0.573150634765625, 0.6240692138671875, 0.67498779296875, 0.7259063720703125, 0.776824951171875, 0.8277435302734375, 0.878662109375, 0.9295806884765625, 0.980499267578125, 1.0314178466796875, 1.08233642578125, 1.1332550048828125, 1.184173583984375, 1.2350921630859375, 1.2860107421875, 1.3369293212890625, 1.387847900390625, 1.4387664794921875, 1.48968505859375, 1.5406036376953125, 1.591522216796875, 1.6424407958984375, 1.693359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 10.0, 9.0, 18.0, 16.0, 17.0, 26.0, 27.0, 35.0, 39.0, 38.0, 41.0, 49.0, 54.0, 54.0, 54.0, 48.0, 52.0, 59.0, 46.0, 41.0, 46.0, 45.0, 36.0, 28.0, 26.0, 17.0, 13.0, 12.0, 10.0, 10.0, 1.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.288116455078125, -2.21881103515625, -2.149505615234375, -2.0802001953125, -2.010894775390625, -1.94158935546875, -1.872283935546875, -1.802978515625, -1.733673095703125, -1.66436767578125, -1.595062255859375, -1.5257568359375, -1.456451416015625, -1.38714599609375, -1.317840576171875, -1.24853515625, -1.179229736328125, -1.10992431640625, -1.040618896484375, -0.9713134765625, -0.902008056640625, -0.83270263671875, -0.763397216796875, -0.694091796875, -0.624786376953125, -0.55548095703125, -0.486175537109375, -0.4168701171875, -0.347564697265625, -0.27825927734375, -0.208953857421875, -0.1396484375, -0.070343017578125, -0.00103759765625, 0.068267822265625, 0.1375732421875, 0.206878662109375, 0.27618408203125, 0.345489501953125, 0.414794921875, 0.484100341796875, 0.55340576171875, 0.622711181640625, 0.6920166015625, 0.761322021484375, 0.83062744140625, 0.899932861328125, 0.96923828125, 1.038543701171875, 1.10784912109375, 1.177154541015625, 1.2464599609375, 1.315765380859375, 1.38507080078125, 1.454376220703125, 1.523681640625, 1.592987060546875, 1.66229248046875, 1.731597900390625, 1.8009033203125, 1.870208740234375, 1.93951416015625, 2.008819580078125, 2.078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 8.0, 12.0, 18.0, 20.0, 43.0, 65.0, 96.0, 134.0, 256.0, 429.0, 812.0, 1680.0, 4412.0, 18028.0, 412152.0, 580704.0, 21186.0, 4701.0, 1813.0, 795.0, 457.0, 294.0, 161.0, 92.0, 58.0, 41.0, 27.0, 17.0, 16.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4599609375, -1.4096832275390625, -1.359405517578125, -1.3091278076171875, -1.25885009765625, -1.2085723876953125, -1.158294677734375, -1.1080169677734375, -1.0577392578125, -1.0074615478515625, -0.957183837890625, -0.9069061279296875, -0.85662841796875, -0.8063507080078125, -0.756072998046875, -0.7057952880859375, -0.655517578125, -0.6052398681640625, -0.554962158203125, -0.5046844482421875, -0.45440673828125, -0.4041290283203125, -0.353851318359375, -0.3035736083984375, -0.2532958984375, -0.2030181884765625, -0.152740478515625, -0.1024627685546875, -0.05218505859375, -0.0019073486328125, 0.048370361328125, 0.0986480712890625, 0.14892578125, 0.1992034912109375, 0.249481201171875, 0.2997589111328125, 0.35003662109375, 0.4003143310546875, 0.450592041015625, 0.5008697509765625, 0.5511474609375, 0.6014251708984375, 0.651702880859375, 0.7019805908203125, 0.75225830078125, 0.8025360107421875, 0.852813720703125, 0.9030914306640625, 0.953369140625, 1.0036468505859375, 1.053924560546875, 1.1042022705078125, 1.15447998046875, 1.2047576904296875, 1.255035400390625, 1.3053131103515625, 1.3555908203125, 1.4058685302734375, 1.456146240234375, 1.5064239501953125, 1.55670166015625, 1.6069793701171875, 1.657257080078125, 1.7075347900390625, 1.7578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 9.0, 17.0, 21.0, 50.0, 102.0, 162.0, 204.0, 171.0, 116.0, 54.0, 33.0, 14.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015807151794433594, -0.00015350431203842163, -0.00014893710613250732, -0.00014436990022659302, -0.0001398026943206787, -0.0001352354884147644, -0.0001306682825088501, -0.0001261010766029358, -0.00012153387069702148, -0.00011696666479110718, -0.00011239945888519287, -0.00010783225297927856, -0.00010326504707336426, -9.869784116744995e-05, -9.413063526153564e-05, -8.956342935562134e-05, -8.499622344970703e-05, -8.042901754379272e-05, -7.586181163787842e-05, -7.129460573196411e-05, -6.67273998260498e-05, -6.21601939201355e-05, -5.759298801422119e-05, -5.3025782108306885e-05, -4.845857620239258e-05, -4.389137029647827e-05, -3.9324164390563965e-05, -3.475695848464966e-05, -3.018975257873535e-05, -2.5622546672821045e-05, -2.1055340766906738e-05, -1.648813486099243e-05, -1.1920928955078125e-05, -7.353723049163818e-06, -2.7865171432495117e-06, 1.780688762664795e-06, 6.3478946685791016e-06, 1.0915100574493408e-05, 1.5482306480407715e-05, 2.004951238632202e-05, 2.4616718292236328e-05, 2.9183924198150635e-05, 3.375113010406494e-05, 3.831833600997925e-05, 4.2885541915893555e-05, 4.745274782180786e-05, 5.201995372772217e-05, 5.6587159633636475e-05, 6.115436553955078e-05, 6.572157144546509e-05, 7.02887773513794e-05, 7.48559832572937e-05, 7.942318916320801e-05, 8.399039506912231e-05, 8.855760097503662e-05, 9.312480688095093e-05, 9.769201278686523e-05, 0.00010225921869277954, 0.00010682642459869385, 0.00011139363050460815, 0.00011596083641052246, 0.00012052804231643677, 0.00012509524822235107, 0.00012966245412826538, 0.0001342296600341797]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 5.0, 6.0, 10.0, 14.0, 23.0, 34.0, 61.0, 85.0, 130.0, 218.0, 368.0, 700.0, 1477.0, 3616.0, 11393.0, 83809.0, 848821.0, 80007.0, 11170.0, 3465.0, 1467.0, 692.0, 371.0, 213.0, 136.0, 89.0, 58.0, 25.0, 32.0, 14.0, 13.0, 12.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3203125, -1.283111572265625, -1.24591064453125, -1.208709716796875, -1.1715087890625, -1.134307861328125, -1.09710693359375, -1.059906005859375, -1.022705078125, -0.985504150390625, -0.94830322265625, -0.911102294921875, -0.8739013671875, -0.836700439453125, -0.79949951171875, -0.762298583984375, -0.72509765625, -0.687896728515625, -0.65069580078125, -0.613494873046875, -0.5762939453125, -0.539093017578125, -0.50189208984375, -0.464691162109375, -0.427490234375, -0.390289306640625, -0.35308837890625, -0.315887451171875, -0.2786865234375, -0.241485595703125, -0.20428466796875, -0.167083740234375, -0.1298828125, -0.092681884765625, -0.05548095703125, -0.018280029296875, 0.0189208984375, 0.056121826171875, 0.09332275390625, 0.130523681640625, 0.167724609375, 0.204925537109375, 0.24212646484375, 0.279327392578125, 0.3165283203125, 0.353729248046875, 0.39093017578125, 0.428131103515625, 0.46533203125, 0.502532958984375, 0.53973388671875, 0.576934814453125, 0.6141357421875, 0.651336669921875, 0.68853759765625, 0.725738525390625, 0.762939453125, 0.800140380859375, 0.83734130859375, 0.874542236328125, 0.9117431640625, 0.948944091796875, 0.98614501953125, 1.023345947265625, 1.060546875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 1.0, 3.0, 4.0, 10.0, 17.0, 26.0, 43.0, 66.0, 107.0, 219.0, 205.0, 119.0, 72.0, 35.0, 24.0, 12.0, 9.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.296875, -1.25042724609375, -1.2039794921875, -1.15753173828125, -1.111083984375, -1.06463623046875, -1.0181884765625, -0.97174072265625, -0.92529296875, -0.87884521484375, -0.8323974609375, -0.78594970703125, -0.739501953125, -0.69305419921875, -0.6466064453125, -0.60015869140625, -0.5537109375, -0.50726318359375, -0.4608154296875, -0.41436767578125, -0.367919921875, -0.32147216796875, -0.2750244140625, -0.22857666015625, -0.18212890625, -0.13568115234375, -0.0892333984375, -0.04278564453125, 0.003662109375, 0.05010986328125, 0.0965576171875, 0.14300537109375, 0.189453125, 0.23590087890625, 0.2823486328125, 0.32879638671875, 0.375244140625, 0.42169189453125, 0.4681396484375, 0.51458740234375, 0.56103515625, 0.60748291015625, 0.6539306640625, 0.70037841796875, 0.746826171875, 0.79327392578125, 0.8397216796875, 0.88616943359375, 0.9326171875, 0.97906494140625, 1.0255126953125, 1.07196044921875, 1.118408203125, 1.16485595703125, 1.2113037109375, 1.25775146484375, 1.30419921875, 1.35064697265625, 1.3970947265625, 1.44354248046875, 1.489990234375, 1.53643798828125, 1.5828857421875, 1.62933349609375, 1.67578125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 11.0, 16.0, 26.0, 52.0, 124.0, 225.0, 295.0, 138.0, 51.0, 33.0, 21.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.71803283691406, -41.811527252197266, -40.90502166748047, -39.99851608276367, -39.092010498046875, -38.18550491333008, -37.27899932861328, -36.372493743896484, -35.46598815917969, -34.55948257446289, -33.652976989746094, -32.7464714050293, -31.8399658203125, -30.933460235595703, -30.026954650878906, -29.12044906616211, -28.213943481445312, -27.307437896728516, -26.40093231201172, -25.494426727294922, -24.587921142578125, -23.681415557861328, -22.77490997314453, -21.868404388427734, -20.96190071105957, -20.055395126342773, -19.148889541625977, -18.24238395690918, -17.335878372192383, -16.429372787475586, -15.522867202758789, -14.616361618041992, -13.709855079650879, -12.803349494934082, -11.896843910217285, -10.990338325500488, -10.083832740783691, -9.177328109741211, -8.270822525024414, -7.364316463470459, -6.457810878753662, -5.551305294036865, -4.644799709320068, -3.7382943630218506, -2.8317887783050537, -1.925283432006836, -1.018777847290039, -0.11227226257324219, 0.7942333221435547, 1.7007389068603516, 2.6072444915771484, 3.513749837875366, 4.420255661010742, 5.326760768890381, 6.233266353607178, 7.139771938323975, 8.04627799987793, 8.952783584594727, 9.859289169311523, 10.76579475402832, 11.672300338745117, 12.578805923461914, 13.485311508178711, 14.391817092895508, 15.298321723937988]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0, 3.0, 12.0, 12.0, 7.0, 10.0, 12.0, 21.0, 13.0, 26.0, 21.0, 29.0, 28.0, 26.0, 30.0, 59.0, 48.0, 47.0, 48.0, 51.0, 59.0, 52.0, 55.0, 45.0, 37.0, 31.0, 38.0, 38.0, 20.0, 26.0, 15.0, 17.0, 17.0, 6.0, 12.0, 4.0, 3.0, 8.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.458839416503906, -14.010566711425781, -13.562294006347656, -13.114022254943848, -12.665749549865723, -12.217476844787598, -11.769204139709473, -11.320932388305664, -10.872659683227539, -10.424386978149414, -9.976114273071289, -9.52784252166748, -9.079569816589355, -8.63129711151123, -8.183024406433105, -7.734752178192139, -7.286479473114014, -6.838206768035889, -6.389934539794922, -5.941661834716797, -5.49338960647583, -5.045116901397705, -4.596844673156738, -4.148571968078613, -3.7002995014190674, -3.2520270347595215, -2.8037545680999756, -2.3554821014404297, -1.9072095155715942, -1.4589369297027588, -1.010664463043213, -0.562391996383667, -0.1141195297241211, 0.3341529667377472, 0.7824254631996155, 1.2306979894638062, 1.678970456123352, 2.1272430419921875, 2.5755155086517334, 3.0237879753112793, 3.472060441970825, 3.920332908630371, 4.368605613708496, 4.816877841949463, 5.265150547027588, 5.713422775268555, 6.16169548034668, 6.609968185424805, 7.0582404136657715, 7.5065131187438965, 7.954785346984863, 8.403058052062988, 8.851330757141113, 9.299602508544922, 9.747875213623047, 10.196147918701172, 10.644420623779297, 11.092693328857422, 11.540966033935547, 11.989237785339355, 12.43751049041748, 12.885783195495605, 13.33405590057373, 13.782327651977539, 14.230600357055664]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 1.0, 3.0, 3.0, 14.0, 14.0, 21.0, 26.0, 28.0, 69.0, 93.0, 148.0, 251.0, 389.0, 635.0, 1131.0, 2186.0, 4513.0, 20267.0, 4144184.0, 12124.0, 3813.0, 1863.0, 1048.0, 554.0, 328.0, 213.0, 131.0, 73.0, 63.0, 33.0, 20.0, 16.0, 6.0, 12.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.703125, -4.5894775390625, -4.475830078125, -4.3621826171875, -4.24853515625, -4.1348876953125, -4.021240234375, -3.9075927734375, -3.7939453125, -3.6802978515625, -3.566650390625, -3.4530029296875, -3.33935546875, -3.2257080078125, -3.112060546875, -2.9984130859375, -2.884765625, -2.7711181640625, -2.657470703125, -2.5438232421875, -2.43017578125, -2.3165283203125, -2.202880859375, -2.0892333984375, -1.9755859375, -1.8619384765625, -1.748291015625, -1.6346435546875, -1.52099609375, -1.4073486328125, -1.293701171875, -1.1800537109375, -1.06640625, -0.9527587890625, -0.839111328125, -0.7254638671875, -0.61181640625, -0.4981689453125, -0.384521484375, -0.2708740234375, -0.1572265625, -0.0435791015625, 0.070068359375, 0.1837158203125, 0.29736328125, 0.4110107421875, 0.524658203125, 0.6383056640625, 0.751953125, 0.8656005859375, 0.979248046875, 1.0928955078125, 1.20654296875, 1.3201904296875, 1.433837890625, 1.5474853515625, 1.6611328125, 1.7747802734375, 1.888427734375, 2.0020751953125, 2.11572265625, 2.2293701171875, 2.343017578125, 2.4566650390625, 2.5703125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 4.0, 8.0, 14.0, 15.0, 16.0, 22.0, 30.0, 45.0, 42.0, 62.0, 68.0, 60.0, 58.0, 72.0, 79.0, 81.0, 74.0, 57.0, 46.0, 37.0, 25.0, 24.0, 14.0, 4.0, 15.0, 10.0, 11.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8076171875, -0.7876091003417969, -0.7676010131835938, -0.7475929260253906, -0.7275848388671875, -0.7075767517089844, -0.6875686645507812, -0.6675605773925781, -0.647552490234375, -0.6275444030761719, -0.6075363159179688, -0.5875282287597656, -0.5675201416015625, -0.5475120544433594, -0.5275039672851562, -0.5074958801269531, -0.48748779296875, -0.4674797058105469, -0.44747161865234375, -0.4274635314941406, -0.4074554443359375, -0.3874473571777344, -0.36743927001953125, -0.3474311828613281, -0.327423095703125, -0.3074150085449219, -0.28740692138671875, -0.2673988342285156, -0.2473907470703125, -0.22738265991210938, -0.20737457275390625, -0.18736648559570312, -0.1673583984375, -0.14735031127929688, -0.12734222412109375, -0.10733413696289062, -0.0873260498046875, -0.06731796264648438, -0.04730987548828125, -0.027301788330078125, -0.007293701171875, 0.012714385986328125, 0.03272247314453125, 0.052730560302734375, 0.0727386474609375, 0.09274673461914062, 0.11275482177734375, 0.13276290893554688, 0.15277099609375, 0.17277908325195312, 0.19278717041015625, 0.21279525756835938, 0.2328033447265625, 0.2528114318847656, 0.27281951904296875, 0.2928276062011719, 0.312835693359375, 0.3328437805175781, 0.35285186767578125, 0.3728599548339844, 0.3928680419921875, 0.4128761291503906, 0.43288421630859375, 0.4528923034667969, 0.472900390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 11.0, 9.0, 18.0, 13.0, 27.0, 24.0, 41.0, 62.0, 84.0, 91.0, 145.0, 201.0, 282.0, 391.0, 609.0, 897.0, 1374.0, 2649.0, 5987.0, 19134.0, 4101665.0, 43373.0, 8800.0, 3402.0, 1735.0, 1022.0, 661.0, 446.0, 327.0, 199.0, 149.0, 125.0, 77.0, 65.0, 54.0, 35.0, 22.0, 21.0, 11.0, 14.0, 7.0, 4.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.021484375, -2.926116943359375, -2.83074951171875, -2.735382080078125, -2.6400146484375, -2.544647216796875, -2.44927978515625, -2.353912353515625, -2.258544921875, -2.163177490234375, -2.06781005859375, -1.972442626953125, -1.8770751953125, -1.781707763671875, -1.68634033203125, -1.590972900390625, -1.49560546875, -1.400238037109375, -1.30487060546875, -1.209503173828125, -1.1141357421875, -1.018768310546875, -0.92340087890625, -0.828033447265625, -0.732666015625, -0.637298583984375, -0.54193115234375, -0.446563720703125, -0.3511962890625, -0.255828857421875, -0.16046142578125, -0.065093994140625, 0.0302734375, 0.125640869140625, 0.22100830078125, 0.316375732421875, 0.4117431640625, 0.507110595703125, 0.60247802734375, 0.697845458984375, 0.793212890625, 0.888580322265625, 0.98394775390625, 1.079315185546875, 1.1746826171875, 1.270050048828125, 1.36541748046875, 1.460784912109375, 1.55615234375, 1.651519775390625, 1.74688720703125, 1.842254638671875, 1.9376220703125, 2.032989501953125, 2.12835693359375, 2.223724365234375, 2.319091796875, 2.414459228515625, 2.50982666015625, 2.605194091796875, 2.7005615234375, 2.795928955078125, 2.89129638671875, 2.986663818359375, 3.08203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 8.0, 5.0, 9.0, 26.0, 100.0, 3799.0, 58.0, 20.0, 16.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6826171875, -0.6615142822265625, -0.640411376953125, -0.6193084716796875, -0.59820556640625, -0.5771026611328125, -0.555999755859375, -0.5348968505859375, -0.5137939453125, -0.4926910400390625, -0.471588134765625, -0.4504852294921875, -0.42938232421875, -0.4082794189453125, -0.387176513671875, -0.3660736083984375, -0.344970703125, -0.3238677978515625, -0.302764892578125, -0.2816619873046875, -0.26055908203125, -0.2394561767578125, -0.218353271484375, -0.1972503662109375, -0.1761474609375, -0.1550445556640625, -0.133941650390625, -0.1128387451171875, -0.09173583984375, -0.0706329345703125, -0.049530029296875, -0.0284271240234375, -0.00732421875, 0.0137786865234375, 0.034881591796875, 0.0559844970703125, 0.07708740234375, 0.0981903076171875, 0.119293212890625, 0.1403961181640625, 0.1614990234375, 0.1826019287109375, 0.203704833984375, 0.2248077392578125, 0.24591064453125, 0.2670135498046875, 0.288116455078125, 0.3092193603515625, 0.330322265625, 0.3514251708984375, 0.372528076171875, 0.3936309814453125, 0.41473388671875, 0.4358367919921875, 0.456939697265625, 0.4780426025390625, 0.4991455078125, 0.5202484130859375, 0.541351318359375, 0.5624542236328125, 0.58355712890625, 0.6046600341796875, 0.625762939453125, 0.6468658447265625, 0.66796875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 11.0, 9.0, 34.0, 69.0, 108.0, 244.0, 277.0, 154.0, 55.0, 29.0, 15.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.771570205688477, -5.6543707847595215, -5.537170886993408, -5.419971466064453, -5.30277156829834, -5.185572147369385, -5.0683722496032715, -4.951172828674316, -4.833972930908203, -4.716773509979248, -4.599573612213135, -4.48237419128418, -4.365174293518066, -4.247974872589111, -4.130774974822998, -4.013575553894043, -3.896376132965088, -3.7791764736175537, -3.6619768142700195, -3.5447771549224854, -3.427577495574951, -3.310378074645996, -3.193178415298462, -3.0759787559509277, -2.9587790966033936, -2.8415794372558594, -2.724379777908325, -2.607180118560791, -2.489980697631836, -2.3727807998657227, -2.2555813789367676, -2.1383817195892334, -2.0211822986602783, -1.9039826393127441, -1.78678297996521, -1.6695834398269653, -1.5523837804794312, -1.435184121131897, -1.3179845809936523, -1.2007849216461182, -1.083585262298584, -0.9663856029510498, -0.8491860032081604, -0.731986403465271, -0.6147867441177368, -0.49758708477020264, -0.38038748502731323, -0.26318788528442383, -0.14598822593688965, -0.028788596391677856, 0.08841103315353394, 0.20561066269874573, 0.3228102922439575, 0.4400099515914917, 0.5572095513343811, 0.6744091510772705, 0.7916088104248047, 0.9088084697723389, 1.026008129119873, 1.1432076692581177, 1.2604073286056519, 1.377606987953186, 1.4948065280914307, 1.6120061874389648, 1.729205846786499]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 4.0, 13.0, 13.0, 9.0, 17.0, 23.0, 26.0, 33.0, 30.0, 39.0, 33.0, 47.0, 43.0, 43.0, 46.0, 51.0, 36.0, 44.0, 52.0, 43.0, 37.0, 47.0, 29.0, 32.0, 32.0, 36.0, 24.0, 20.0, 19.0, 18.0, 9.0, 12.0, 10.0, 10.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0555193424224854, -1.0179657936096191, -0.9804121255874634, -0.9428585767745972, -0.9053049683570862, -0.8677513599395752, -0.8301977515220642, -0.7926441431045532, -0.755090594291687, -0.717536985874176, -0.679983377456665, -0.6424298286437988, -0.6048762202262878, -0.5673226118087769, -0.5297690033912659, -0.49221542477607727, -0.4546617865562439, -0.4171081781387329, -0.3795545995235443, -0.3420009911060333, -0.3044474124908447, -0.26689380407333374, -0.22934019565582275, -0.19178661704063416, -0.15423300862312317, -0.11667941510677338, -0.07912581413984299, -0.0415722131729126, -0.004018619656562805, 0.03353497385978699, 0.07108858227729797, 0.10864216089248657, 0.14619576930999756, 0.18374936282634735, 0.22130295634269714, 0.25885656476020813, 0.29641014337539673, 0.3339637517929077, 0.3715173602104187, 0.4090709388256073, 0.4466245472431183, 0.4841781556606293, 0.5217317342758179, 0.5592853426933289, 0.5968389511108398, 0.634392499923706, 0.6719461679458618, 0.709499716758728, 0.747053325176239, 0.78460693359375, 0.822160542011261, 0.859714150428772, 0.8972676992416382, 0.9348213076591492, 0.9723749160766602, 1.0099284648895264, 1.0474821329116821, 1.0850356817245483, 1.122589349746704, 1.1601428985595703, 1.197696566581726, 1.2352501153945923, 1.272803783416748, 1.3103573322296143, 1.3479108810424805]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 1.0, 4.0, 8.0, 7.0, 18.0, 13.0, 28.0, 48.0, 61.0, 94.0, 140.0, 225.0, 352.0, 594.0, 1143.0, 2235.0, 4557.0, 9987.0, 25379.0, 76105.0, 303199.0, 449347.0, 114451.0, 35269.0, 13441.0, 5661.0, 2806.0, 1446.0, 784.0, 431.0, 245.0, 162.0, 114.0, 63.0, 48.0, 17.0, 26.0, 11.0, 9.0, 10.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.017578125, -1.95068359375, -1.8837890625, -1.81689453125, -1.75, -1.68310546875, -1.6162109375, -1.54931640625, -1.482421875, -1.41552734375, -1.3486328125, -1.28173828125, -1.21484375, -1.14794921875, -1.0810546875, -1.01416015625, -0.947265625, -0.88037109375, -0.8134765625, -0.74658203125, -0.6796875, -0.61279296875, -0.5458984375, -0.47900390625, -0.412109375, -0.34521484375, -0.2783203125, -0.21142578125, -0.14453125, -0.07763671875, -0.0107421875, 0.05615234375, 0.123046875, 0.18994140625, 0.2568359375, 0.32373046875, 0.390625, 0.45751953125, 0.5244140625, 0.59130859375, 0.658203125, 0.72509765625, 0.7919921875, 0.85888671875, 0.92578125, 0.99267578125, 1.0595703125, 1.12646484375, 1.193359375, 1.26025390625, 1.3271484375, 1.39404296875, 1.4609375, 1.52783203125, 1.5947265625, 1.66162109375, 1.728515625, 1.79541015625, 1.8623046875, 1.92919921875, 1.99609375, 2.06298828125, 2.1298828125, 2.19677734375, 2.263671875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 7.0, 1.0, 11.0, 12.0, 19.0, 18.0, 27.0, 34.0, 47.0, 53.0, 62.0, 48.0, 60.0, 62.0, 96.0, 57.0, 72.0, 64.0, 62.0, 40.0, 37.0, 25.0, 22.0, 17.0, 12.0, 12.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.794921875, -0.7746047973632812, -0.7542877197265625, -0.7339706420898438, -0.713653564453125, -0.6933364868164062, -0.6730194091796875, -0.6527023315429688, -0.63238525390625, -0.6120681762695312, -0.5917510986328125, -0.5714340209960938, -0.551116943359375, -0.5307998657226562, -0.5104827880859375, -0.49016571044921875, -0.4698486328125, -0.44953155517578125, -0.4292144775390625, -0.40889739990234375, -0.388580322265625, -0.36826324462890625, -0.3479461669921875, -0.32762908935546875, -0.30731201171875, -0.28699493408203125, -0.2666778564453125, -0.24636077880859375, -0.226043701171875, -0.20572662353515625, -0.1854095458984375, -0.16509246826171875, -0.144775390625, -0.12445831298828125, -0.1041412353515625, -0.08382415771484375, -0.063507080078125, -0.04319000244140625, -0.0228729248046875, -0.00255584716796875, 0.01776123046875, 0.03807830810546875, 0.0583953857421875, 0.07871246337890625, 0.099029541015625, 0.11934661865234375, 0.1396636962890625, 0.15998077392578125, 0.1802978515625, 0.20061492919921875, 0.2209320068359375, 0.24124908447265625, 0.261566162109375, 0.28188323974609375, 0.3022003173828125, 0.32251739501953125, 0.34283447265625, 0.36315155029296875, 0.3834686279296875, 0.40378570556640625, 0.424102783203125, 0.44441986083984375, 0.4647369384765625, 0.48505401611328125, 0.50537109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 6.0, 16.0, 17.0, 27.0, 36.0, 85.0, 98.0, 149.0, 294.0, 523.0, 953.0, 2032.0, 5184.0, 15470.0, 66025.0, 583324.0, 312444.0, 42767.0, 11543.0, 4028.0, 1659.0, 835.0, 409.0, 231.0, 131.0, 73.0, 60.0, 36.0, 36.0, 21.0, 13.0, 7.0, 12.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.841796875, -3.72491455078125, -3.6080322265625, -3.49114990234375, -3.374267578125, -3.25738525390625, -3.1405029296875, -3.02362060546875, -2.90673828125, -2.78985595703125, -2.6729736328125, -2.55609130859375, -2.439208984375, -2.32232666015625, -2.2054443359375, -2.08856201171875, -1.9716796875, -1.85479736328125, -1.7379150390625, -1.62103271484375, -1.504150390625, -1.38726806640625, -1.2703857421875, -1.15350341796875, -1.03662109375, -0.91973876953125, -0.8028564453125, -0.68597412109375, -0.569091796875, -0.45220947265625, -0.3353271484375, -0.21844482421875, -0.1015625, 0.01531982421875, 0.1322021484375, 0.24908447265625, 0.365966796875, 0.48284912109375, 0.5997314453125, 0.71661376953125, 0.83349609375, 0.95037841796875, 1.0672607421875, 1.18414306640625, 1.301025390625, 1.41790771484375, 1.5347900390625, 1.65167236328125, 1.7685546875, 1.88543701171875, 2.0023193359375, 2.11920166015625, 2.236083984375, 2.35296630859375, 2.4698486328125, 2.58673095703125, 2.70361328125, 2.82049560546875, 2.9373779296875, 3.05426025390625, 3.171142578125, 3.28802490234375, 3.4049072265625, 3.52178955078125, 3.638671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 7.0, 9.0, 5.0, 8.0, 12.0, 19.0, 20.0, 27.0, 29.0, 43.0, 41.0, 65.0, 52.0, 62.0, 74.0, 63.0, 57.0, 65.0, 62.0, 48.0, 48.0, 42.0, 34.0, 21.0, 24.0, 17.0, 10.0, 11.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.412109375, -3.266265869140625, -3.12042236328125, -2.974578857421875, -2.8287353515625, -2.682891845703125, -2.53704833984375, -2.391204833984375, -2.245361328125, -2.099517822265625, -1.95367431640625, -1.807830810546875, -1.6619873046875, -1.516143798828125, -1.37030029296875, -1.224456787109375, -1.07861328125, -0.932769775390625, -0.78692626953125, -0.641082763671875, -0.4952392578125, -0.349395751953125, -0.20355224609375, -0.057708740234375, 0.088134765625, 0.233978271484375, 0.37982177734375, 0.525665283203125, 0.6715087890625, 0.817352294921875, 0.96319580078125, 1.109039306640625, 1.2548828125, 1.400726318359375, 1.54656982421875, 1.692413330078125, 1.8382568359375, 1.984100341796875, 2.12994384765625, 2.275787353515625, 2.421630859375, 2.567474365234375, 2.71331787109375, 2.859161376953125, 3.0050048828125, 3.150848388671875, 3.29669189453125, 3.442535400390625, 3.58837890625, 3.734222412109375, 3.88006591796875, 4.025909423828125, 4.1717529296875, 4.317596435546875, 4.46343994140625, 4.609283447265625, 4.755126953125, 4.900970458984375, 5.04681396484375, 5.192657470703125, 5.3385009765625, 5.484344482421875, 5.63018798828125, 5.776031494140625, 5.921875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 8.0, 7.0, 10.0, 24.0, 40.0, 52.0, 72.0, 107.0, 188.0, 290.0, 488.0, 979.0, 2019.0, 5374.0, 21817.0, 297703.0, 675404.0, 32202.0, 6757.0, 2428.0, 1106.0, 587.0, 335.0, 197.0, 139.0, 52.0, 53.0, 31.0, 28.0, 13.0, 11.0, 10.0, 10.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.712890625, -2.6397705078125, -2.566650390625, -2.4935302734375, -2.42041015625, -2.3472900390625, -2.274169921875, -2.2010498046875, -2.1279296875, -2.0548095703125, -1.981689453125, -1.9085693359375, -1.83544921875, -1.7623291015625, -1.689208984375, -1.6160888671875, -1.54296875, -1.4698486328125, -1.396728515625, -1.3236083984375, -1.25048828125, -1.1773681640625, -1.104248046875, -1.0311279296875, -0.9580078125, -0.8848876953125, -0.811767578125, -0.7386474609375, -0.66552734375, -0.5924072265625, -0.519287109375, -0.4461669921875, -0.373046875, -0.2999267578125, -0.226806640625, -0.1536865234375, -0.08056640625, -0.0074462890625, 0.065673828125, 0.1387939453125, 0.2119140625, 0.2850341796875, 0.358154296875, 0.4312744140625, 0.50439453125, 0.5775146484375, 0.650634765625, 0.7237548828125, 0.796875, 0.8699951171875, 0.943115234375, 1.0162353515625, 1.08935546875, 1.1624755859375, 1.235595703125, 1.3087158203125, 1.3818359375, 1.4549560546875, 1.528076171875, 1.6011962890625, 1.67431640625, 1.7474365234375, 1.820556640625, 1.8936767578125, 1.966796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 11.0, 15.0, 37.0, 102.0, 219.0, 321.0, 163.0, 64.0, 29.0, 19.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00047588348388671875, -0.00046237558126449585, -0.00044886767864227295, -0.00043535977602005005, -0.00042185187339782715, -0.00040834397077560425, -0.00039483606815338135, -0.00038132816553115845, -0.00036782026290893555, -0.00035431236028671265, -0.00034080445766448975, -0.00032729655504226685, -0.00031378865242004395, -0.00030028074979782104, -0.00028677284717559814, -0.00027326494455337524, -0.00025975704193115234, -0.00024624913930892944, -0.00023274123668670654, -0.00021923333406448364, -0.00020572543144226074, -0.00019221752882003784, -0.00017870962619781494, -0.00016520172357559204, -0.00015169382095336914, -0.00013818591833114624, -0.00012467801570892334, -0.00011117011308670044, -9.766221046447754e-05, -8.415430784225464e-05, -7.064640522003174e-05, -5.713850259780884e-05, -4.363059997558594e-05, -3.0122697353363037e-05, -1.6614794731140137e-05, -3.1068921089172363e-06, 1.0401010513305664e-05, 2.3908913135528564e-05, 3.7416815757751465e-05, 5.0924718379974365e-05, 6.443262100219727e-05, 7.794052362442017e-05, 9.144842624664307e-05, 0.00010495632886886597, 0.00011846423149108887, 0.00013197213411331177, 0.00014548003673553467, 0.00015898793935775757, 0.00017249584197998047, 0.00018600374460220337, 0.00019951164722442627, 0.00021301954984664917, 0.00022652745246887207, 0.00024003535509109497, 0.00025354325771331787, 0.00026705116033554077, 0.00028055906295776367, 0.00029406696557998657, 0.00030757486820220947, 0.0003210827708244324, 0.0003345906734466553, 0.0003480985760688782, 0.0003616064786911011, 0.000375114381313324, 0.0003886222839355469]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 5.0, 12.0, 8.0, 12.0, 16.0, 29.0, 41.0, 41.0, 86.0, 115.0, 194.0, 315.0, 596.0, 1175.0, 2564.0, 6909.0, 26923.0, 236422.0, 701800.0, 53513.0, 10737.0, 3611.0, 1571.0, 750.0, 430.0, 239.0, 164.0, 89.0, 54.0, 34.0, 28.0, 18.0, 9.0, 8.0, 12.0, 7.0, 2.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.2932586669921875, -1.245697021484375, -1.1981353759765625, -1.15057373046875, -1.1030120849609375, -1.055450439453125, -1.0078887939453125, -0.9603271484375, -0.9127655029296875, -0.865203857421875, -0.8176422119140625, -0.77008056640625, -0.7225189208984375, -0.674957275390625, -0.6273956298828125, -0.579833984375, -0.5322723388671875, -0.484710693359375, -0.4371490478515625, -0.38958740234375, -0.3420257568359375, -0.294464111328125, -0.2469024658203125, -0.1993408203125, -0.1517791748046875, -0.104217529296875, -0.0566558837890625, -0.00909423828125, 0.0384674072265625, 0.086029052734375, 0.1335906982421875, 0.18115234375, 0.2287139892578125, 0.276275634765625, 0.3238372802734375, 0.37139892578125, 0.4189605712890625, 0.466522216796875, 0.5140838623046875, 0.5616455078125, 0.6092071533203125, 0.656768798828125, 0.7043304443359375, 0.75189208984375, 0.7994537353515625, 0.847015380859375, 0.8945770263671875, 0.942138671875, 0.9897003173828125, 1.037261962890625, 1.0848236083984375, 1.13238525390625, 1.1799468994140625, 1.227508544921875, 1.2750701904296875, 1.3226318359375, 1.3701934814453125, 1.417755126953125, 1.4653167724609375, 1.51287841796875, 1.5604400634765625, 1.608001708984375, 1.6555633544921875, 1.703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 5.0, 1.0, 2.0, 2.0, 6.0, 5.0, 7.0, 14.0, 13.0, 24.0, 27.0, 38.0, 50.0, 51.0, 103.0, 168.0, 121.0, 98.0, 64.0, 38.0, 35.0, 27.0, 30.0, 19.0, 15.0, 8.0, 9.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5205078125, -1.4639129638671875, -1.407318115234375, -1.3507232666015625, -1.29412841796875, -1.2375335693359375, -1.180938720703125, -1.1243438720703125, -1.0677490234375, -1.0111541748046875, -0.954559326171875, -0.8979644775390625, -0.84136962890625, -0.7847747802734375, -0.728179931640625, -0.6715850830078125, -0.614990234375, -0.5583953857421875, -0.501800537109375, -0.4452056884765625, -0.38861083984375, -0.3320159912109375, -0.275421142578125, -0.2188262939453125, -0.1622314453125, -0.1056365966796875, -0.049041748046875, 0.0075531005859375, 0.06414794921875, 0.1207427978515625, 0.177337646484375, 0.2339324951171875, 0.29052734375, 0.3471221923828125, 0.403717041015625, 0.4603118896484375, 0.51690673828125, 0.5735015869140625, 0.630096435546875, 0.6866912841796875, 0.7432861328125, 0.7998809814453125, 0.856475830078125, 0.9130706787109375, 0.96966552734375, 1.0262603759765625, 1.082855224609375, 1.1394500732421875, 1.196044921875, 1.2526397705078125, 1.309234619140625, 1.3658294677734375, 1.42242431640625, 1.4790191650390625, 1.535614013671875, 1.5922088623046875, 1.6488037109375, 1.7053985595703125, 1.761993408203125, 1.8185882568359375, 1.87518310546875, 1.9317779541015625, 1.988372802734375, 2.0449676513671875, 2.1015625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 15.0, 17.0, 23.0, 45.0, 58.0, 103.0, 155.0, 196.0, 137.0, 114.0, 55.0, 26.0, 20.0, 14.0, 9.0, 1.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.74540901184082, -29.62629508972168, -28.50718116760254, -27.3880672454834, -26.26895523071289, -25.14984130859375, -24.03072738647461, -22.91161346435547, -21.792499542236328, -20.673385620117188, -19.554271697998047, -18.435157775878906, -17.316043853759766, -16.196929931640625, -15.077817916870117, -13.958703994750977, -12.839590072631836, -11.720476150512695, -10.601362228393555, -9.48224925994873, -8.36313533782959, -7.244021415710449, -6.124907970428467, -5.005794525146484, -3.8866806030273438, -2.7675669193267822, -1.6484532356262207, -0.5293395519256592, 0.5897741317749023, 1.708888053894043, 2.8280014991760254, 3.947114944458008, 5.066226959228516, 6.185340881347656, 7.304454326629639, 8.423567771911621, 9.542681694030762, 10.661795616149902, 11.780908584594727, 12.900022506713867, 14.019136428833008, 15.138250350952148, 16.25736427307129, 17.37647819519043, 18.495590209960938, 19.614704132080078, 20.73381805419922, 21.85293197631836, 22.9720458984375, 24.09115982055664, 25.21027374267578, 26.329387664794922, 27.448501586914062, 28.567615509033203, 29.68672752380371, 30.80584144592285, 31.924955368041992, 33.0440673828125, 34.16318130493164, 35.28229522705078, 36.40140914916992, 37.52052307128906, 38.6396369934082, 39.758750915527344, 40.877864837646484]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 3.0, 10.0, 11.0, 11.0, 15.0, 18.0, 26.0, 26.0, 26.0, 45.0, 58.0, 55.0, 78.0, 62.0, 65.0, 75.0, 58.0, 47.0, 58.0, 34.0, 38.0, 30.0, 29.0, 18.0, 23.0, 12.0, 12.0, 11.0, 7.0, 8.0, 7.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.724720001220703, -28.909807205200195, -28.094894409179688, -27.279979705810547, -26.46506690979004, -25.65015411376953, -24.835241317749023, -24.020328521728516, -23.205413818359375, -22.390501022338867, -21.57558822631836, -20.76067352294922, -19.94576072692871, -19.130847930908203, -18.315935134887695, -17.501022338867188, -16.686107635498047, -15.871194839477539, -15.056281089782715, -14.241368293762207, -13.426454544067383, -12.611541748046875, -11.796628952026367, -10.981715202331543, -10.166803359985352, -9.351890563964844, -8.53697681427002, -7.722064018249512, -6.9071502685546875, -6.09223747253418, -5.277324199676514, -4.462410926818848, -3.6474971771240234, -2.8325839042663574, -2.0176706314086914, -1.2027575969696045, -0.3878443241119385, 0.42706871032714844, 1.2419819831848145, 2.0568952560424805, 2.8718085289001465, 3.6867218017578125, 4.5016350746154785, 5.3165483474731445, 6.131461143493652, 6.946374416351318, 7.761287689208984, 8.576200485229492, 9.391114234924316, 10.206027030944824, 11.020940780639648, 11.835853576660156, 12.65076732635498, 13.465680122375488, 14.280593872070312, 15.09550666809082, 15.910419464111328, 16.725332260131836, 17.540245056152344, 18.355159759521484, 19.170072555541992, 19.9849853515625, 20.799898147583008, 21.614810943603516, 22.429725646972656]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 5.0, 8.0, 2.0, 9.0, 9.0, 7.0, 13.0, 17.0, 25.0, 31.0, 23.0, 53.0, 91.0, 122.0, 207.0, 341.0, 598.0, 1179.0, 2676.0, 7419.0, 46596.0, 4108544.0, 17963.0, 4701.0, 1845.0, 849.0, 402.0, 216.0, 129.0, 72.0, 43.0, 25.0, 17.0, 15.0, 7.0, 7.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1796875, -7.96026611328125, -7.7408447265625, -7.52142333984375, -7.302001953125, -7.08258056640625, -6.8631591796875, -6.64373779296875, -6.42431640625, -6.20489501953125, -5.9854736328125, -5.76605224609375, -5.546630859375, -5.32720947265625, -5.1077880859375, -4.88836669921875, -4.6689453125, -4.44952392578125, -4.2301025390625, -4.01068115234375, -3.791259765625, -3.57183837890625, -3.3524169921875, -3.13299560546875, -2.91357421875, -2.69415283203125, -2.4747314453125, -2.25531005859375, -2.035888671875, -1.81646728515625, -1.5970458984375, -1.37762451171875, -1.158203125, -0.93878173828125, -0.7193603515625, -0.49993896484375, -0.280517578125, -0.06109619140625, 0.1583251953125, 0.37774658203125, 0.59716796875, 0.81658935546875, 1.0360107421875, 1.25543212890625, 1.474853515625, 1.69427490234375, 1.9136962890625, 2.13311767578125, 2.3525390625, 2.57196044921875, 2.7913818359375, 3.01080322265625, 3.230224609375, 3.44964599609375, 3.6690673828125, 3.88848876953125, 4.10791015625, 4.32733154296875, 4.5467529296875, 4.76617431640625, 4.985595703125, 5.20501708984375, 5.4244384765625, 5.64385986328125, 5.86328125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 2.0, 3.0, 6.0, 12.0, 12.0, 17.0, 25.0, 38.0, 50.0, 64.0, 93.0, 110.0, 107.0, 96.0, 90.0, 90.0, 62.0, 39.0, 19.0, 18.0, 13.0, 8.0, 6.0, 2.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3818359375, -1.34271240234375, -1.3035888671875, -1.26446533203125, -1.225341796875, -1.18621826171875, -1.1470947265625, -1.10797119140625, -1.06884765625, -1.02972412109375, -0.9906005859375, -0.95147705078125, -0.912353515625, -0.87322998046875, -0.8341064453125, -0.79498291015625, -0.755859375, -0.71673583984375, -0.6776123046875, -0.63848876953125, -0.599365234375, -0.56024169921875, -0.5211181640625, -0.48199462890625, -0.44287109375, -0.40374755859375, -0.3646240234375, -0.32550048828125, -0.286376953125, -0.24725341796875, -0.2081298828125, -0.16900634765625, -0.1298828125, -0.09075927734375, -0.0516357421875, -0.01251220703125, 0.026611328125, 0.06573486328125, 0.1048583984375, 0.14398193359375, 0.18310546875, 0.22222900390625, 0.2613525390625, 0.30047607421875, 0.339599609375, 0.37872314453125, 0.4178466796875, 0.45697021484375, 0.49609375, 0.53521728515625, 0.5743408203125, 0.61346435546875, 0.652587890625, 0.69171142578125, 0.7308349609375, 0.76995849609375, 0.80908203125, 0.84820556640625, 0.8873291015625, 0.92645263671875, 0.965576171875, 1.00469970703125, 1.0438232421875, 1.08294677734375, 1.1220703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 12.0, 13.0, 18.0, 17.0, 26.0, 39.0, 52.0, 74.0, 100.0, 113.0, 146.0, 216.0, 296.0, 432.0, 540.0, 820.0, 1245.0, 1816.0, 3049.0, 5212.0, 10296.0, 25688.0, 854346.0, 3239453.0, 25768.0, 10387.0, 5231.0, 3016.0, 1764.0, 1183.0, 795.0, 558.0, 386.0, 303.0, 184.0, 182.0, 131.0, 89.0, 69.0, 57.0, 39.0, 36.0, 21.0, 17.0, 14.0, 11.0, 10.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.9375, -5.76287841796875, -5.5882568359375, -5.41363525390625, -5.239013671875, -5.06439208984375, -4.8897705078125, -4.71514892578125, -4.54052734375, -4.36590576171875, -4.1912841796875, -4.01666259765625, -3.842041015625, -3.66741943359375, -3.4927978515625, -3.31817626953125, -3.1435546875, -2.96893310546875, -2.7943115234375, -2.61968994140625, -2.445068359375, -2.27044677734375, -2.0958251953125, -1.92120361328125, -1.74658203125, -1.57196044921875, -1.3973388671875, -1.22271728515625, -1.048095703125, -0.87347412109375, -0.6988525390625, -0.52423095703125, -0.349609375, -0.17498779296875, -0.0003662109375, 0.17425537109375, 0.348876953125, 0.52349853515625, 0.6981201171875, 0.87274169921875, 1.04736328125, 1.22198486328125, 1.3966064453125, 1.57122802734375, 1.745849609375, 1.92047119140625, 2.0950927734375, 2.26971435546875, 2.4443359375, 2.61895751953125, 2.7935791015625, 2.96820068359375, 3.142822265625, 3.31744384765625, 3.4920654296875, 3.66668701171875, 3.84130859375, 4.01593017578125, 4.1905517578125, 4.36517333984375, 4.539794921875, 4.71441650390625, 4.8890380859375, 5.06365966796875, 5.23828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 9.0, 10.0, 12.0, 12.0, 23.0, 71.0, 3711.0, 94.0, 40.0, 28.0, 15.0, 7.0, 11.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.203125, -2.137420654296875, -2.07171630859375, -2.006011962890625, -1.9403076171875, -1.874603271484375, -1.80889892578125, -1.743194580078125, -1.677490234375, -1.611785888671875, -1.54608154296875, -1.480377197265625, -1.4146728515625, -1.348968505859375, -1.28326416015625, -1.217559814453125, -1.15185546875, -1.086151123046875, -1.02044677734375, -0.954742431640625, -0.8890380859375, -0.823333740234375, -0.75762939453125, -0.691925048828125, -0.626220703125, -0.560516357421875, -0.49481201171875, -0.429107666015625, -0.3634033203125, -0.297698974609375, -0.23199462890625, -0.166290283203125, -0.1005859375, -0.034881591796875, 0.03082275390625, 0.096527099609375, 0.1622314453125, 0.227935791015625, 0.29364013671875, 0.359344482421875, 0.425048828125, 0.490753173828125, 0.55645751953125, 0.622161865234375, 0.6878662109375, 0.753570556640625, 0.81927490234375, 0.884979248046875, 0.95068359375, 1.016387939453125, 1.08209228515625, 1.147796630859375, 1.2135009765625, 1.279205322265625, 1.34490966796875, 1.410614013671875, 1.476318359375, 1.542022705078125, 1.60772705078125, 1.673431396484375, 1.7391357421875, 1.804840087890625, 1.87054443359375, 1.936248779296875, 2.001953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 10.0, 22.0, 18.0, 26.0, 36.0, 78.0, 91.0, 144.0, 144.0, 99.0, 105.0, 63.0, 47.0, 28.0, 23.0, 11.0, 17.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.044249534606934, -7.791569709777832, -7.538889408111572, -7.286209583282471, -7.033529281616211, -6.780849456787109, -6.528169631958008, -6.275489807128906, -6.0228095054626465, -5.770129680633545, -5.517449378967285, -5.264769554138184, -5.012089729309082, -4.759409427642822, -4.506729602813721, -4.254049301147461, -4.001369476318359, -3.7486894130706787, -3.496009349822998, -3.2433295249938965, -2.990649461746216, -2.737969398498535, -2.4852895736694336, -2.232609510421753, -1.9799294471740723, -1.7272493839263916, -1.4745694398880005, -1.2218894958496094, -0.9692094326019287, -0.716529369354248, -0.46384942531585693, -0.21116948127746582, 0.04150962829589844, 0.2941896319389343, 0.5468696355819702, 0.7995496392250061, 1.052229642868042, 1.3049097061157227, 1.5575896501541138, 1.8102695941925049, 2.0629496574401855, 2.315629720687866, 2.568309783935547, 2.8209896087646484, 3.073669672012329, 3.3263497352600098, 3.5790295600891113, 3.831709623336792, 4.084389686584473, 4.337069511413574, 4.589749813079834, 4.8424296379089355, 5.095109939575195, 5.347789764404297, 5.600469589233398, 5.8531494140625, 6.10582971572876, 6.358509540557861, 6.611189842224121, 6.863869667053223, 7.116549491882324, 7.369229793548584, 7.6219096183776855, 7.874589920043945, 8.127269744873047]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 3.0, 5.0, 6.0, 14.0, 8.0, 23.0, 16.0, 16.0, 16.0, 20.0, 14.0, 22.0, 25.0, 29.0, 32.0, 29.0, 33.0, 38.0, 49.0, 38.0, 43.0, 45.0, 39.0, 44.0, 43.0, 35.0, 38.0, 32.0, 35.0, 29.0, 26.0, 23.0, 25.0, 18.0, 12.0, 9.0, 12.0, 8.0, 11.0, 7.0, 5.0, 7.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.204047203063965, -5.041396141052246, -4.878745079040527, -4.716094017028809, -4.55344295501709, -4.390791893005371, -4.228140830993652, -4.065489768981934, -3.9028384685516357, -3.740187406539917, -3.5775363445281982, -3.4148852825164795, -3.2522339820861816, -3.089582920074463, -2.926931858062744, -2.7642807960510254, -2.6016297340393066, -2.438978672027588, -2.276327610015869, -2.1136765480041504, -1.951025366783142, -1.7883743047714233, -1.625723123550415, -1.4630720615386963, -1.3004209995269775, -1.1377699375152588, -0.9751188158988953, -0.8124676942825317, -0.649816632270813, -0.48716557025909424, -0.3245144486427307, -0.1618633270263672, 0.0007877349853515625, 0.1634388267993927, 0.32608991861343384, 0.488741010427475, 0.6513921022415161, 0.8140431642532349, 0.9766942858695984, 1.139345407485962, 1.3019964694976807, 1.4646475315093994, 1.6272985935211182, 1.7899497747421265, 1.9526008367538452, 2.1152520179748535, 2.2779030799865723, 2.440554141998291, 2.6032052040100098, 2.7658562660217285, 2.9285073280334473, 3.091158390045166, 3.2538094520568848, 3.4164605140686035, 3.5791118144989014, 3.74176287651062, 3.904413938522339, 4.067065238952637, 4.2297163009643555, 4.392367362976074, 4.555018424987793, 4.717669486999512, 4.8803205490112305, 5.042971611022949, 5.205622673034668]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 8.0, 10.0, 12.0, 10.0, 14.0, 25.0, 27.0, 40.0, 69.0, 76.0, 145.0, 188.0, 321.0, 508.0, 747.0, 1360.0, 2433.0, 4817.0, 10013.0, 23870.0, 68408.0, 266204.0, 474316.0, 126769.0, 38578.0, 14852.0, 6771.0, 3392.0, 1807.0, 1003.0, 616.0, 368.0, 259.0, 150.0, 94.0, 70.0, 69.0, 40.0, 27.0, 16.0, 19.0, 9.0, 12.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.166015625, -3.070770263671875, -2.97552490234375, -2.880279541015625, -2.7850341796875, -2.689788818359375, -2.59454345703125, -2.499298095703125, -2.404052734375, -2.308807373046875, -2.21356201171875, -2.118316650390625, -2.0230712890625, -1.927825927734375, -1.83258056640625, -1.737335205078125, -1.64208984375, -1.546844482421875, -1.45159912109375, -1.356353759765625, -1.2611083984375, -1.165863037109375, -1.07061767578125, -0.975372314453125, -0.880126953125, -0.784881591796875, -0.68963623046875, -0.594390869140625, -0.4991455078125, -0.403900146484375, -0.30865478515625, -0.213409423828125, -0.1181640625, -0.022918701171875, 0.07232666015625, 0.167572021484375, 0.2628173828125, 0.358062744140625, 0.45330810546875, 0.548553466796875, 0.643798828125, 0.739044189453125, 0.83428955078125, 0.929534912109375, 1.0247802734375, 1.120025634765625, 1.21527099609375, 1.310516357421875, 1.40576171875, 1.501007080078125, 1.59625244140625, 1.691497802734375, 1.7867431640625, 1.881988525390625, 1.97723388671875, 2.072479248046875, 2.167724609375, 2.262969970703125, 2.35821533203125, 2.453460693359375, 2.5487060546875, 2.643951416015625, 2.73919677734375, 2.834442138671875, 2.9296875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 7.0, 2.0, 4.0, 7.0, 16.0, 12.0, 17.0, 22.0, 35.0, 35.0, 47.0, 40.0, 69.0, 72.0, 99.0, 85.0, 87.0, 72.0, 50.0, 40.0, 49.0, 39.0, 33.0, 17.0, 14.0, 9.0, 9.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5146484375, -1.4702911376953125, -1.425933837890625, -1.3815765380859375, -1.33721923828125, -1.2928619384765625, -1.248504638671875, -1.2041473388671875, -1.1597900390625, -1.1154327392578125, -1.071075439453125, -1.0267181396484375, -0.98236083984375, -0.9380035400390625, -0.893646240234375, -0.8492889404296875, -0.804931640625, -0.7605743408203125, -0.716217041015625, -0.6718597412109375, -0.62750244140625, -0.5831451416015625, -0.538787841796875, -0.4944305419921875, -0.4500732421875, -0.4057159423828125, -0.361358642578125, -0.3170013427734375, -0.27264404296875, -0.2282867431640625, -0.183929443359375, -0.1395721435546875, -0.09521484375, -0.0508575439453125, -0.006500244140625, 0.0378570556640625, 0.08221435546875, 0.1265716552734375, 0.170928955078125, 0.2152862548828125, 0.2596435546875, 0.3040008544921875, 0.348358154296875, 0.3927154541015625, 0.43707275390625, 0.4814300537109375, 0.525787353515625, 0.5701446533203125, 0.614501953125, 0.6588592529296875, 0.703216552734375, 0.7475738525390625, 0.79193115234375, 0.8362884521484375, 0.880645751953125, 0.9250030517578125, 0.9693603515625, 1.0137176513671875, 1.058074951171875, 1.1024322509765625, 1.14678955078125, 1.1911468505859375, 1.235504150390625, 1.2798614501953125, 1.32421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 12.0, 8.0, 5.0, 26.0, 49.0, 54.0, 106.0, 196.0, 355.0, 742.0, 1703.0, 4871.0, 19662.0, 164109.0, 769441.0, 69662.0, 11596.0, 3437.0, 1235.0, 570.0, 297.0, 159.0, 100.0, 51.0, 40.0, 28.0, 11.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0703125, -7.795166015625, -7.52001953125, -7.244873046875, -6.9697265625, -6.694580078125, -6.41943359375, -6.144287109375, -5.869140625, -5.593994140625, -5.31884765625, -5.043701171875, -4.7685546875, -4.493408203125, -4.21826171875, -3.943115234375, -3.66796875, -3.392822265625, -3.11767578125, -2.842529296875, -2.5673828125, -2.292236328125, -2.01708984375, -1.741943359375, -1.466796875, -1.191650390625, -0.91650390625, -0.641357421875, -0.3662109375, -0.091064453125, 0.18408203125, 0.459228515625, 0.734375, 1.009521484375, 1.28466796875, 1.559814453125, 1.8349609375, 2.110107421875, 2.38525390625, 2.660400390625, 2.935546875, 3.210693359375, 3.48583984375, 3.760986328125, 4.0361328125, 4.311279296875, 4.58642578125, 4.861572265625, 5.13671875, 5.411865234375, 5.68701171875, 5.962158203125, 6.2373046875, 6.512451171875, 6.78759765625, 7.062744140625, 7.337890625, 7.613037109375, 7.88818359375, 8.163330078125, 8.4384765625, 8.713623046875, 8.98876953125, 9.263916015625, 9.5390625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 0.0, 2.0, 6.0, 5.0, 5.0, 6.0, 2.0, 8.0, 19.0, 12.0, 16.0, 23.0, 41.0, 47.0, 58.0, 47.0, 71.0, 84.0, 96.0, 75.0, 71.0, 49.0, 50.0, 43.0, 33.0, 37.0, 18.0, 22.0, 9.0, 13.0, 10.0, 10.0, 7.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6796875, -9.35302734375, -9.0263671875, -8.69970703125, -8.373046875, -8.04638671875, -7.7197265625, -7.39306640625, -7.06640625, -6.73974609375, -6.4130859375, -6.08642578125, -5.759765625, -5.43310546875, -5.1064453125, -4.77978515625, -4.453125, -4.12646484375, -3.7998046875, -3.47314453125, -3.146484375, -2.81982421875, -2.4931640625, -2.16650390625, -1.83984375, -1.51318359375, -1.1865234375, -0.85986328125, -0.533203125, -0.20654296875, 0.1201171875, 0.44677734375, 0.7734375, 1.10009765625, 1.4267578125, 1.75341796875, 2.080078125, 2.40673828125, 2.7333984375, 3.06005859375, 3.38671875, 3.71337890625, 4.0400390625, 4.36669921875, 4.693359375, 5.02001953125, 5.3466796875, 5.67333984375, 6.0, 6.32666015625, 6.6533203125, 6.97998046875, 7.306640625, 7.63330078125, 7.9599609375, 8.28662109375, 8.61328125, 8.93994140625, 9.2666015625, 9.59326171875, 9.919921875, 10.24658203125, 10.5732421875, 10.89990234375, 11.2265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 11.0, 4.0, 15.0, 14.0, 32.0, 59.0, 75.0, 141.0, 285.0, 751.0, 3179.0, 137673.0, 898530.0, 5919.0, 1046.0, 382.0, 163.0, 104.0, 58.0, 38.0, 30.0, 12.0, 14.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.162109375, -9.85546875, -9.548828125, -9.2421875, -8.935546875, -8.62890625, -8.322265625, -8.015625, -7.708984375, -7.40234375, -7.095703125, -6.7890625, -6.482421875, -6.17578125, -5.869140625, -5.5625, -5.255859375, -4.94921875, -4.642578125, -4.3359375, -4.029296875, -3.72265625, -3.416015625, -3.109375, -2.802734375, -2.49609375, -2.189453125, -1.8828125, -1.576171875, -1.26953125, -0.962890625, -0.65625, -0.349609375, -0.04296875, 0.263671875, 0.5703125, 0.876953125, 1.18359375, 1.490234375, 1.796875, 2.103515625, 2.41015625, 2.716796875, 3.0234375, 3.330078125, 3.63671875, 3.943359375, 4.25, 4.556640625, 4.86328125, 5.169921875, 5.4765625, 5.783203125, 6.08984375, 6.396484375, 6.703125, 7.009765625, 7.31640625, 7.623046875, 7.9296875, 8.236328125, 8.54296875, 8.849609375, 9.15625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 10.0, 14.0, 38.0, 65.0, 153.0, 278.0, 221.0, 126.0, 49.0, 25.0, 14.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006799697875976562, -0.0006571859121322632, -0.0006344020366668701, -0.000611618161201477, -0.000588834285736084, -0.0005660504102706909, -0.0005432665348052979, -0.0005204826593399048, -0.0004976987838745117, -0.00047491490840911865, -0.0004521310329437256, -0.0004293471574783325, -0.00040656328201293945, -0.0003837794065475464, -0.0003609955310821533, -0.00033821165561676025, -0.0003154277801513672, -0.0002926439046859741, -0.00026986002922058105, -0.000247076153755188, -0.00022429227828979492, -0.00020150840282440186, -0.0001787245273590088, -0.00015594065189361572, -0.00013315677642822266, -0.00011037290096282959, -8.758902549743652e-05, -6.480515003204346e-05, -4.202127456665039e-05, -1.9237399101257324e-05, 3.546476364135742e-06, 2.633035182952881e-05, 4.9114227294921875e-05, 7.189810276031494e-05, 9.468197822570801e-05, 0.00011746585369110107, 0.00014024972915649414, 0.0001630336046218872, 0.00018581748008728027, 0.00020860135555267334, 0.0002313852310180664, 0.00025416910648345947, 0.00027695298194885254, 0.0002997368574142456, 0.00032252073287963867, 0.00034530460834503174, 0.0003680884838104248, 0.00039087235927581787, 0.00041365623474121094, 0.000436440110206604, 0.00045922398567199707, 0.00048200786113739014, 0.0005047917366027832, 0.0005275756120681763, 0.0005503594875335693, 0.0005731433629989624, 0.0005959272384643555, 0.0006187111139297485, 0.0006414949893951416, 0.0006642788648605347, 0.0006870627403259277, 0.0007098466157913208, 0.0007326304912567139, 0.0007554143667221069, 0.0007781982421875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 6.0, 15.0, 19.0, 22.0, 47.0, 107.0, 168.0, 350.0, 827.0, 2188.0, 8513.0, 81563.0, 896578.0, 48473.0, 6427.0, 1879.0, 693.0, 303.0, 158.0, 81.0, 47.0, 30.0, 11.0, 9.0, 5.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.89453125, -4.7523193359375, -4.610107421875, -4.4678955078125, -4.32568359375, -4.1834716796875, -4.041259765625, -3.8990478515625, -3.7568359375, -3.6146240234375, -3.472412109375, -3.3302001953125, -3.18798828125, -3.0457763671875, -2.903564453125, -2.7613525390625, -2.619140625, -2.4769287109375, -2.334716796875, -2.1925048828125, -2.05029296875, -1.9080810546875, -1.765869140625, -1.6236572265625, -1.4814453125, -1.3392333984375, -1.197021484375, -1.0548095703125, -0.91259765625, -0.7703857421875, -0.628173828125, -0.4859619140625, -0.34375, -0.2015380859375, -0.059326171875, 0.0828857421875, 0.22509765625, 0.3673095703125, 0.509521484375, 0.6517333984375, 0.7939453125, 0.9361572265625, 1.078369140625, 1.2205810546875, 1.36279296875, 1.5050048828125, 1.647216796875, 1.7894287109375, 1.931640625, 2.0738525390625, 2.216064453125, 2.3582763671875, 2.50048828125, 2.6427001953125, 2.784912109375, 2.9271240234375, 3.0693359375, 3.2115478515625, 3.353759765625, 3.4959716796875, 3.63818359375, 3.7803955078125, 3.922607421875, 4.0648193359375, 4.20703125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 21.0, 23.0, 56.0, 144.0, 245.0, 243.0, 141.0, 61.0, 27.0, 10.0, 4.0, 8.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.703125, -5.4990234375, -5.294921875, -5.0908203125, -4.88671875, -4.6826171875, -4.478515625, -4.2744140625, -4.0703125, -3.8662109375, -3.662109375, -3.4580078125, -3.25390625, -3.0498046875, -2.845703125, -2.6416015625, -2.4375, -2.2333984375, -2.029296875, -1.8251953125, -1.62109375, -1.4169921875, -1.212890625, -1.0087890625, -0.8046875, -0.6005859375, -0.396484375, -0.1923828125, 0.01171875, 0.2158203125, 0.419921875, 0.6240234375, 0.828125, 1.0322265625, 1.236328125, 1.4404296875, 1.64453125, 1.8486328125, 2.052734375, 2.2568359375, 2.4609375, 2.6650390625, 2.869140625, 3.0732421875, 3.27734375, 3.4814453125, 3.685546875, 3.8896484375, 4.09375, 4.2978515625, 4.501953125, 4.7060546875, 4.91015625, 5.1142578125, 5.318359375, 5.5224609375, 5.7265625, 5.9306640625, 6.134765625, 6.3388671875, 6.54296875, 6.7470703125, 6.951171875, 7.1552734375, 7.359375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 9.0, 10.0, 5.0, 9.0, 22.0, 24.0, 32.0, 59.0, 65.0, 110.0, 118.0, 132.0, 112.0, 94.0, 72.0, 37.0, 32.0, 17.0, 16.0, 11.0, 10.0, 3.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-58.40155029296875, -56.9228630065918, -55.44417953491211, -53.965492248535156, -52.48680877685547, -51.008121490478516, -49.52943420410156, -48.050750732421875, -46.57206344604492, -45.09337615966797, -43.61469268798828, -42.13600540161133, -40.657318115234375, -39.17863464355469, -37.699947357177734, -36.22126007080078, -34.742576599121094, -33.26388931274414, -31.785205841064453, -30.3065185546875, -28.82783317565918, -27.34914779663086, -25.870460510253906, -24.391775131225586, -22.913089752197266, -21.434404373168945, -19.955718994140625, -18.477031707763672, -16.99834632873535, -15.519660949707031, -14.040974617004395, -12.562288284301758, -11.083602905273438, -9.604917526245117, -8.12623119354248, -6.647545337677002, -5.168859481811523, -3.690173625946045, -2.2114877700805664, -0.7328014373779297, 0.7458839416503906, 2.224569797515869, 3.7032556533813477, 5.181941509246826, 6.660627365112305, 8.139312744140625, 9.617999076843262, 11.096685409545898, 12.575370788574219, 14.054056167602539, 15.532742500305176, 17.011428833007812, 18.490114212036133, 19.968799591064453, 21.447486877441406, 22.926172256469727, 24.404857635498047, 25.883543014526367, 27.362228393554688, 28.84091567993164, 30.31960105895996, 31.79828643798828, 33.276973724365234, 34.75566101074219, 36.234344482421875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 10.0, 6.0, 10.0, 6.0, 11.0, 17.0, 15.0, 23.0, 23.0, 22.0, 36.0, 40.0, 44.0, 49.0, 59.0, 57.0, 71.0, 65.0, 58.0, 56.0, 47.0, 53.0, 55.0, 34.0, 22.0, 25.0, 13.0, 15.0, 14.0, 8.0, 7.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-52.012306213378906, -50.55244827270508, -49.09259033203125, -47.63273239135742, -46.172874450683594, -44.713016510009766, -43.25315856933594, -41.79330062866211, -40.33344268798828, -38.87358474731445, -37.413726806640625, -35.9538688659668, -34.49401092529297, -33.03415298461914, -31.574295043945312, -30.114437103271484, -28.654577255249023, -27.194719314575195, -25.734861373901367, -24.27500343322754, -22.81514549255371, -21.355287551879883, -19.895427703857422, -18.435569763183594, -16.975711822509766, -15.515853881835938, -14.05599594116211, -12.596138000488281, -11.136280059814453, -9.676422119140625, -8.21656322479248, -6.756705284118652, -5.296848297119141, -3.8369903564453125, -2.3771321773529053, -0.917273998260498, 0.5425839424133301, 2.002441883087158, 3.4623003005981445, 4.922158241271973, 6.382016181945801, 7.841874122619629, 9.301732063293457, 10.761590957641602, 12.22144889831543, 13.681306838989258, 15.141164779663086, 16.601022720336914, 18.060880661010742, 19.52073860168457, 20.9805965423584, 22.440454483032227, 23.900312423706055, 25.360170364379883, 26.820030212402344, 28.279888153076172, 29.73974609375, 31.199604034423828, 32.659461975097656, 34.119319915771484, 35.57917785644531, 37.03903579711914, 38.49889373779297, 39.9587516784668, 41.418609619140625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 9.0, 11.0, 8.0, 10.0, 17.0, 23.0, 45.0, 69.0, 106.0, 212.0, 399.0, 1073.0, 4646.0, 4179404.0, 6065.0, 1262.0, 440.0, 211.0, 103.0, 63.0, 35.0, 27.0, 10.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.890625, -28.177978515625, -27.46533203125, -26.752685546875, -26.0400390625, -25.327392578125, -24.61474609375, -23.902099609375, -23.189453125, -22.476806640625, -21.76416015625, -21.051513671875, -20.3388671875, -19.626220703125, -18.91357421875, -18.200927734375, -17.48828125, -16.775634765625, -16.06298828125, -15.350341796875, -14.6376953125, -13.925048828125, -13.21240234375, -12.499755859375, -11.787109375, -11.074462890625, -10.36181640625, -9.649169921875, -8.9365234375, -8.223876953125, -7.51123046875, -6.798583984375, -6.0859375, -5.373291015625, -4.66064453125, -3.947998046875, -3.2353515625, -2.522705078125, -1.81005859375, -1.097412109375, -0.384765625, 0.327880859375, 1.04052734375, 1.753173828125, 2.4658203125, 3.178466796875, 3.89111328125, 4.603759765625, 5.31640625, 6.029052734375, 6.74169921875, 7.454345703125, 8.1669921875, 8.879638671875, 9.59228515625, 10.304931640625, 11.017578125, 11.730224609375, 12.44287109375, 13.155517578125, 13.8681640625, 14.580810546875, 15.29345703125, 16.006103515625, 16.71875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 5.0, 6.0, 13.0, 15.0, 20.0, 38.0, 49.0, 81.0, 111.0, 152.0, 151.0, 128.0, 73.0, 45.0, 41.0, 21.0, 14.0, 5.0, 15.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.328125, -3.23248291015625, -3.1368408203125, -3.04119873046875, -2.945556640625, -2.84991455078125, -2.7542724609375, -2.65863037109375, -2.56298828125, -2.46734619140625, -2.3717041015625, -2.27606201171875, -2.180419921875, -2.08477783203125, -1.9891357421875, -1.89349365234375, -1.7978515625, -1.70220947265625, -1.6065673828125, -1.51092529296875, -1.415283203125, -1.31964111328125, -1.2239990234375, -1.12835693359375, -1.03271484375, -0.93707275390625, -0.8414306640625, -0.74578857421875, -0.650146484375, -0.55450439453125, -0.4588623046875, -0.36322021484375, -0.267578125, -0.17193603515625, -0.0762939453125, 0.01934814453125, 0.114990234375, 0.21063232421875, 0.3062744140625, 0.40191650390625, 0.49755859375, 0.59320068359375, 0.6888427734375, 0.78448486328125, 0.880126953125, 0.97576904296875, 1.0714111328125, 1.16705322265625, 1.2626953125, 1.35833740234375, 1.4539794921875, 1.54962158203125, 1.645263671875, 1.74090576171875, 1.8365478515625, 1.93218994140625, 2.02783203125, 2.12347412109375, 2.2191162109375, 2.31475830078125, 2.410400390625, 2.50604248046875, 2.6016845703125, 2.69732666015625, 2.79296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 5.0, 9.0, 12.0, 23.0, 33.0, 39.0, 37.0, 49.0, 83.0, 106.0, 149.0, 167.0, 237.0, 323.0, 462.0, 685.0, 1075.0, 2079.0, 7041.0, 4152728.0, 21295.0, 3340.0, 1452.0, 855.0, 560.0, 400.0, 295.0, 200.0, 137.0, 101.0, 73.0, 63.0, 44.0, 18.0, 24.0, 18.0, 18.0, 9.0, 10.0, 7.0, 4.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-19.375, -18.817138671875, -18.25927734375, -17.701416015625, -17.1435546875, -16.585693359375, -16.02783203125, -15.469970703125, -14.912109375, -14.354248046875, -13.79638671875, -13.238525390625, -12.6806640625, -12.122802734375, -11.56494140625, -11.007080078125, -10.44921875, -9.891357421875, -9.33349609375, -8.775634765625, -8.2177734375, -7.659912109375, -7.10205078125, -6.544189453125, -5.986328125, -5.428466796875, -4.87060546875, -4.312744140625, -3.7548828125, -3.197021484375, -2.63916015625, -2.081298828125, -1.5234375, -0.965576171875, -0.40771484375, 0.150146484375, 0.7080078125, 1.265869140625, 1.82373046875, 2.381591796875, 2.939453125, 3.497314453125, 4.05517578125, 4.613037109375, 5.1708984375, 5.728759765625, 6.28662109375, 6.844482421875, 7.40234375, 7.960205078125, 8.51806640625, 9.075927734375, 9.6337890625, 10.191650390625, 10.74951171875, 11.307373046875, 11.865234375, 12.423095703125, 12.98095703125, 13.538818359375, 14.0966796875, 14.654541015625, 15.21240234375, 15.770263671875, 16.328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 10.0, 10.0, 104.0, 3906.0, 30.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.78515625, -4.652984619140625, -4.52081298828125, -4.388641357421875, -4.2564697265625, -4.124298095703125, -3.99212646484375, -3.859954833984375, -3.727783203125, -3.595611572265625, -3.46343994140625, -3.331268310546875, -3.1990966796875, -3.066925048828125, -2.93475341796875, -2.802581787109375, -2.67041015625, -2.538238525390625, -2.40606689453125, -2.273895263671875, -2.1417236328125, -2.009552001953125, -1.87738037109375, -1.745208740234375, -1.613037109375, -1.480865478515625, -1.34869384765625, -1.216522216796875, -1.0843505859375, -0.952178955078125, -0.82000732421875, -0.687835693359375, -0.5556640625, -0.423492431640625, -0.29132080078125, -0.159149169921875, -0.0269775390625, 0.105194091796875, 0.23736572265625, 0.369537353515625, 0.501708984375, 0.633880615234375, 0.76605224609375, 0.898223876953125, 1.0303955078125, 1.162567138671875, 1.29473876953125, 1.426910400390625, 1.55908203125, 1.691253662109375, 1.82342529296875, 1.955596923828125, 2.0877685546875, 2.219940185546875, 2.35211181640625, 2.484283447265625, 2.616455078125, 2.748626708984375, 2.88079833984375, 3.012969970703125, 3.1451416015625, 3.277313232421875, 3.40948486328125, 3.541656494140625, 3.673828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 8.0, 5.0, 4.0, 3.0, 9.0, 15.0, 19.0, 27.0, 29.0, 33.0, 49.0, 62.0, 88.0, 123.0, 122.0, 121.0, 87.0, 56.0, 37.0, 31.0, 18.0, 19.0, 14.0, 9.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.563186645507812, -8.302862167358398, -8.042536735534668, -7.782212257385254, -7.521887302398682, -7.261562347412109, -7.001237869262695, -6.740912914276123, -6.480587959289551, -6.2202630043029785, -5.9599385261535645, -5.699613571166992, -5.43928861618042, -5.178963661193848, -4.918639183044434, -4.658314228057861, -4.397989749908447, -4.137664794921875, -3.877340078353882, -3.6170153617858887, -3.3566904067993164, -3.0963656902313232, -2.83604097366333, -2.575716018676758, -2.3153913021087646, -2.0550665855407715, -1.7947416305541992, -1.534416913986206, -1.2740920782089233, -1.0137672424316406, -0.7534425258636475, -0.49311769008636475, -0.23279285430908203, 0.027531951665878296, 0.2878567576408386, 0.5481815338134766, 0.8085063695907593, 1.068831205368042, 1.3291559219360352, 1.5894807577133179, 1.8498055934906006, 2.1101303100585938, 2.370455265045166, 2.630779981613159, 2.8911046981811523, 3.1514296531677246, 3.4117543697357178, 3.672079086303711, 3.932404041290283, 4.1927289962768555, 4.4530534744262695, 4.713378429412842, 4.973703384399414, 5.234027862548828, 5.4943528175354, 5.754677772521973, 6.015002250671387, 6.275327205657959, 6.535651683807373, 6.795976638793945, 7.056301593780518, 7.31662654876709, 7.576951026916504, 7.837275981903076, 8.097600936889648]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 7.0, 13.0, 4.0, 11.0, 15.0, 12.0, 17.0, 21.0, 19.0, 33.0, 28.0, 33.0, 42.0, 42.0, 42.0, 36.0, 47.0, 32.0, 39.0, 44.0, 43.0, 29.0, 48.0, 44.0, 29.0, 29.0, 35.0, 26.0, 27.0, 20.0, 30.0, 12.0, 19.0, 12.0, 12.0, 10.0, 7.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.181884288787842, -5.013457775115967, -4.84503173828125, -4.676605224609375, -4.5081787109375, -4.339752197265625, -4.17132568359375, -4.002899646759033, -3.834473133087158, -3.666046619415283, -3.4976203441619873, -3.3291940689086914, -3.1607675552368164, -2.9923410415649414, -2.8239147663116455, -2.6554884910583496, -2.4870619773864746, -2.3186354637145996, -2.1502091884613037, -1.9817827939987183, -1.8133563995361328, -1.6449300050735474, -1.476503610610962, -1.3080772161483765, -1.139650821685791, -0.9712244272232056, -0.8027980327606201, -0.6343716382980347, -0.4659452438354492, -0.29751884937286377, -0.12909245491027832, 0.03933393955230713, 0.20776081085205078, 0.37618720531463623, 0.5446135997772217, 0.7130399942398071, 0.8814663887023926, 1.049892783164978, 1.2183191776275635, 1.386745572090149, 1.5551719665527344, 1.7235983610153198, 1.8920247554779053, 2.060451030731201, 2.228877544403076, 2.397304058074951, 2.565730333328247, 2.734156608581543, 2.902583122253418, 3.071009635925293, 3.239435911178589, 3.4078621864318848, 3.5762887001037598, 3.7447152137756348, 3.9131414890289307, 4.081567764282227, 4.249994277954102, 4.418420791625977, 4.586847305297852, 4.755273342132568, 4.923699855804443, 5.092126369476318, 5.260552406311035, 5.42897891998291, 5.597405433654785]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 8.0, 11.0, 11.0, 16.0, 19.0, 25.0, 45.0, 65.0, 100.0, 117.0, 189.0, 286.0, 458.0, 745.0, 1236.0, 2125.0, 4062.0, 8860.0, 23143.0, 77170.0, 410671.0, 402437.0, 75388.0, 22773.0, 8931.0, 4200.0, 2113.0, 1178.0, 774.0, 473.0, 288.0, 199.0, 119.0, 93.0, 58.0, 45.0, 40.0, 24.0, 17.0, 9.0, 12.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-4.91015625, -4.77374267578125, -4.6373291015625, -4.50091552734375, -4.364501953125, -4.22808837890625, -4.0916748046875, -3.95526123046875, -3.81884765625, -3.68243408203125, -3.5460205078125, -3.40960693359375, -3.273193359375, -3.13677978515625, -3.0003662109375, -2.86395263671875, -2.7275390625, -2.59112548828125, -2.4547119140625, -2.31829833984375, -2.181884765625, -2.04547119140625, -1.9090576171875, -1.77264404296875, -1.63623046875, -1.49981689453125, -1.3634033203125, -1.22698974609375, -1.090576171875, -0.95416259765625, -0.8177490234375, -0.68133544921875, -0.544921875, -0.40850830078125, -0.2720947265625, -0.13568115234375, 0.000732421875, 0.13714599609375, 0.2735595703125, 0.40997314453125, 0.54638671875, 0.68280029296875, 0.8192138671875, 0.95562744140625, 1.092041015625, 1.22845458984375, 1.3648681640625, 1.50128173828125, 1.6376953125, 1.77410888671875, 1.9105224609375, 2.04693603515625, 2.183349609375, 2.31976318359375, 2.4561767578125, 2.59259033203125, 2.72900390625, 2.86541748046875, 3.0018310546875, 3.13824462890625, 3.274658203125, 3.41107177734375, 3.5474853515625, 3.68389892578125, 3.8203125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 3.0, 7.0, 12.0, 3.0, 12.0, 19.0, 12.0, 18.0, 35.0, 52.0, 56.0, 84.0, 83.0, 103.0, 119.0, 83.0, 72.0, 56.0, 50.0, 36.0, 18.0, 15.0, 17.0, 7.0, 6.0, 2.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.537109375, -2.459625244140625, -2.38214111328125, -2.304656982421875, -2.2271728515625, -2.149688720703125, -2.07220458984375, -1.994720458984375, -1.917236328125, -1.839752197265625, -1.76226806640625, -1.684783935546875, -1.6072998046875, -1.529815673828125, -1.45233154296875, -1.374847412109375, -1.29736328125, -1.219879150390625, -1.14239501953125, -1.064910888671875, -0.9874267578125, -0.909942626953125, -0.83245849609375, -0.754974365234375, -0.677490234375, -0.600006103515625, -0.52252197265625, -0.445037841796875, -0.3675537109375, -0.290069580078125, -0.21258544921875, -0.135101318359375, -0.0576171875, 0.019866943359375, 0.09735107421875, 0.174835205078125, 0.2523193359375, 0.329803466796875, 0.40728759765625, 0.484771728515625, 0.562255859375, 0.639739990234375, 0.71722412109375, 0.794708251953125, 0.8721923828125, 0.949676513671875, 1.02716064453125, 1.104644775390625, 1.18212890625, 1.259613037109375, 1.33709716796875, 1.414581298828125, 1.4920654296875, 1.569549560546875, 1.64703369140625, 1.724517822265625, 1.802001953125, 1.879486083984375, 1.95697021484375, 2.034454345703125, 2.1119384765625, 2.189422607421875, 2.26690673828125, 2.344390869140625, 2.421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 6.0, 6.0, 9.0, 8.0, 16.0, 18.0, 23.0, 47.0, 71.0, 103.0, 204.0, 289.0, 612.0, 1439.0, 4029.0, 14423.0, 80200.0, 713534.0, 196831.0, 26291.0, 6315.0, 2150.0, 893.0, 439.0, 246.0, 123.0, 88.0, 40.0, 44.0, 18.0, 18.0, 12.0, 6.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.6737060546875, -6.441162109375, -6.2086181640625, -5.97607421875, -5.7435302734375, -5.510986328125, -5.2784423828125, -5.0458984375, -4.8133544921875, -4.580810546875, -4.3482666015625, -4.11572265625, -3.8831787109375, -3.650634765625, -3.4180908203125, -3.185546875, -2.9530029296875, -2.720458984375, -2.4879150390625, -2.25537109375, -2.0228271484375, -1.790283203125, -1.5577392578125, -1.3251953125, -1.0926513671875, -0.860107421875, -0.6275634765625, -0.39501953125, -0.1624755859375, 0.070068359375, 0.3026123046875, 0.53515625, 0.7677001953125, 1.000244140625, 1.2327880859375, 1.46533203125, 1.6978759765625, 1.930419921875, 2.1629638671875, 2.3955078125, 2.6280517578125, 2.860595703125, 3.0931396484375, 3.32568359375, 3.5582275390625, 3.790771484375, 4.0233154296875, 4.255859375, 4.4884033203125, 4.720947265625, 4.9534912109375, 5.18603515625, 5.4185791015625, 5.651123046875, 5.8836669921875, 6.1162109375, 6.3487548828125, 6.581298828125, 6.8138427734375, 7.04638671875, 7.2789306640625, 7.511474609375, 7.7440185546875, 7.9765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 6.0, 7.0, 9.0, 15.0, 13.0, 22.0, 23.0, 27.0, 27.0, 37.0, 27.0, 47.0, 43.0, 53.0, 53.0, 58.0, 62.0, 48.0, 47.0, 49.0, 50.0, 45.0, 33.0, 41.0, 36.0, 26.0, 20.0, 17.0, 12.0, 8.0, 8.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1171875, -8.8265380859375, -8.535888671875, -8.2452392578125, -7.95458984375, -7.6639404296875, -7.373291015625, -7.0826416015625, -6.7919921875, -6.5013427734375, -6.210693359375, -5.9200439453125, -5.62939453125, -5.3387451171875, -5.048095703125, -4.7574462890625, -4.466796875, -4.1761474609375, -3.885498046875, -3.5948486328125, -3.30419921875, -3.0135498046875, -2.722900390625, -2.4322509765625, -2.1416015625, -1.8509521484375, -1.560302734375, -1.2696533203125, -0.97900390625, -0.6883544921875, -0.397705078125, -0.1070556640625, 0.18359375, 0.4742431640625, 0.764892578125, 1.0555419921875, 1.34619140625, 1.6368408203125, 1.927490234375, 2.2181396484375, 2.5087890625, 2.7994384765625, 3.090087890625, 3.3807373046875, 3.67138671875, 3.9620361328125, 4.252685546875, 4.5433349609375, 4.833984375, 5.1246337890625, 5.415283203125, 5.7059326171875, 5.99658203125, 6.2872314453125, 6.577880859375, 6.8685302734375, 7.1591796875, 7.4498291015625, 7.740478515625, 8.0311279296875, 8.32177734375, 8.6124267578125, 8.903076171875, 9.1937255859375, 9.484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 9.0, 20.0, 36.0, 35.0, 66.0, 147.0, 345.0, 2151.0, 138741.0, 901422.0, 4703.0, 482.0, 160.0, 89.0, 51.0, 33.0, 18.0, 10.0, 8.0, 6.0, 5.0, 2.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3828125, -12.0401611328125, -11.697509765625, -11.3548583984375, -11.01220703125, -10.6695556640625, -10.326904296875, -9.9842529296875, -9.6416015625, -9.2989501953125, -8.956298828125, -8.6136474609375, -8.27099609375, -7.9283447265625, -7.585693359375, -7.2430419921875, -6.900390625, -6.5577392578125, -6.215087890625, -5.8724365234375, -5.52978515625, -5.1871337890625, -4.844482421875, -4.5018310546875, -4.1591796875, -3.8165283203125, -3.473876953125, -3.1312255859375, -2.78857421875, -2.4459228515625, -2.103271484375, -1.7606201171875, -1.41796875, -1.0753173828125, -0.732666015625, -0.3900146484375, -0.04736328125, 0.2952880859375, 0.637939453125, 0.9805908203125, 1.3232421875, 1.6658935546875, 2.008544921875, 2.3511962890625, 2.69384765625, 3.0364990234375, 3.379150390625, 3.7218017578125, 4.064453125, 4.4071044921875, 4.749755859375, 5.0924072265625, 5.43505859375, 5.7777099609375, 6.120361328125, 6.4630126953125, 6.8056640625, 7.1483154296875, 7.490966796875, 7.8336181640625, 8.17626953125, 8.5189208984375, 8.861572265625, 9.2042236328125, 9.546875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 13.0, 35.0, 60.0, 174.0, 279.0, 238.0, 95.0, 48.0, 29.0, 12.0, 9.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003571510314941406, -0.0003290101885795593, -0.00030086934566497803, -0.00027272850275039673, -0.00024458765983581543, -0.00021644681692123413, -0.00018830597400665283, -0.00016016513109207153, -0.00013202428817749023, -0.00010388344526290894, -7.574260234832764e-05, -4.760175943374634e-05, -1.946091651916504e-05, 8.67992639541626e-06, 3.682076930999756e-05, 6.496161222457886e-05, 9.310245513916016e-05, 0.00012124329805374146, 0.00014938414096832275, 0.00017752498388290405, 0.00020566582679748535, 0.00023380666971206665, 0.00026194751262664795, 0.00029008835554122925, 0.00031822919845581055, 0.00034637004137039185, 0.00037451088428497314, 0.00040265172719955444, 0.00043079257011413574, 0.00045893341302871704, 0.00048707425594329834, 0.0005152150988578796, 0.0005433559417724609, 0.0005714967846870422, 0.0005996376276016235, 0.0006277784705162048, 0.0006559193134307861, 0.0006840601563453674, 0.0007122009992599487, 0.00074034184217453, 0.0007684826850891113, 0.0007966235280036926, 0.0008247643709182739, 0.0008529052138328552, 0.0008810460567474365, 0.0009091868996620178, 0.0009373277425765991, 0.0009654685854911804, 0.0009936094284057617, 0.001021750271320343, 0.0010498911142349243, 0.0010780319571495056, 0.001106172800064087, 0.0011343136429786682, 0.0011624544858932495, 0.0011905953288078308, 0.0012187361717224121, 0.0012468770146369934, 0.0012750178575515747, 0.001303158700466156, 0.0013312995433807373, 0.0013594403862953186, 0.0013875812292099, 0.0014157220721244812, 0.0014438629150390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 15.0, 6.0, 10.0, 24.0, 40.0, 73.0, 156.0, 350.0, 952.0, 3859.0, 32671.0, 845179.0, 152809.0, 9679.0, 1720.0, 551.0, 220.0, 95.0, 65.0, 27.0, 20.0, 14.0, 7.0, 8.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.749755859375, -5.59326171875, -5.436767578125, -5.2802734375, -5.123779296875, -4.96728515625, -4.810791015625, -4.654296875, -4.497802734375, -4.34130859375, -4.184814453125, -4.0283203125, -3.871826171875, -3.71533203125, -3.558837890625, -3.40234375, -3.245849609375, -3.08935546875, -2.932861328125, -2.7763671875, -2.619873046875, -2.46337890625, -2.306884765625, -2.150390625, -1.993896484375, -1.83740234375, -1.680908203125, -1.5244140625, -1.367919921875, -1.21142578125, -1.054931640625, -0.8984375, -0.741943359375, -0.58544921875, -0.428955078125, -0.2724609375, -0.115966796875, 0.04052734375, 0.197021484375, 0.353515625, 0.510009765625, 0.66650390625, 0.822998046875, 0.9794921875, 1.135986328125, 1.29248046875, 1.448974609375, 1.60546875, 1.761962890625, 1.91845703125, 2.074951171875, 2.2314453125, 2.387939453125, 2.54443359375, 2.700927734375, 2.857421875, 3.013916015625, 3.17041015625, 3.326904296875, 3.4833984375, 3.639892578125, 3.79638671875, 3.952880859375, 4.109375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 8.0, 6.0, 9.0, 16.0, 22.0, 34.0, 35.0, 55.0, 86.0, 107.0, 139.0, 141.0, 105.0, 52.0, 53.0, 37.0, 33.0, 19.0, 11.0, 15.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.912109375, -3.799957275390625, -3.68780517578125, -3.575653076171875, -3.4635009765625, -3.351348876953125, -3.23919677734375, -3.127044677734375, -3.014892578125, -2.902740478515625, -2.79058837890625, -2.678436279296875, -2.5662841796875, -2.454132080078125, -2.34197998046875, -2.229827880859375, -2.11767578125, -2.005523681640625, -1.89337158203125, -1.781219482421875, -1.6690673828125, -1.556915283203125, -1.44476318359375, -1.332611083984375, -1.220458984375, -1.108306884765625, -0.99615478515625, -0.884002685546875, -0.7718505859375, -0.659698486328125, -0.54754638671875, -0.435394287109375, -0.3232421875, -0.211090087890625, -0.09893798828125, 0.013214111328125, 0.1253662109375, 0.237518310546875, 0.34967041015625, 0.461822509765625, 0.573974609375, 0.686126708984375, 0.79827880859375, 0.910430908203125, 1.0225830078125, 1.134735107421875, 1.24688720703125, 1.359039306640625, 1.47119140625, 1.583343505859375, 1.69549560546875, 1.807647705078125, 1.9197998046875, 2.031951904296875, 2.14410400390625, 2.256256103515625, 2.368408203125, 2.480560302734375, 2.59271240234375, 2.704864501953125, 2.8170166015625, 2.929168701171875, 3.04132080078125, 3.153472900390625, 3.265625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 15.0, 19.0, 12.0, 38.0, 71.0, 120.0, 160.0, 162.0, 166.0, 107.0, 47.0, 37.0, 20.0, 11.0, 4.0, 3.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-84.06126403808594, -82.25242614746094, -80.44358825683594, -78.63475036621094, -76.82591247558594, -75.01707458496094, -73.20823669433594, -71.39939880371094, -69.59056091308594, -67.78172302246094, -65.97288513183594, -64.16404724121094, -62.35520935058594, -60.54637145996094, -58.73753356933594, -56.92869567871094, -55.1198616027832, -53.3110237121582, -51.5021858215332, -49.6933479309082, -47.8845100402832, -46.0756721496582, -44.26683807373047, -42.45800018310547, -40.64916229248047, -38.84032440185547, -37.03148651123047, -35.22264862060547, -33.41381072998047, -31.60497283935547, -29.7961368560791, -27.9872989654541, -26.17845916748047, -24.36962127685547, -22.56078338623047, -20.75194549560547, -18.94310760498047, -17.13426971435547, -15.325433731079102, -13.516595840454102, -11.707757949829102, -9.898920059204102, -8.090082168579102, -6.281245231628418, -4.472407341003418, -2.663569450378418, -0.8547325134277344, 0.9541053771972656, 2.7629432678222656, 4.571781158447266, 6.380618572235107, 8.18945598602295, 9.99829387664795, 11.80713176727295, 13.615968704223633, 15.424806594848633, 17.233644485473633, 19.042482376098633, 20.851320266723633, 22.66015625, 24.468994140625, 26.27783203125, 28.086669921875, 29.8955078125, 31.704345703125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 6.0, 15.0, 20.0, 21.0, 18.0, 22.0, 35.0, 41.0, 55.0, 66.0, 65.0, 66.0, 82.0, 91.0, 59.0, 55.0, 65.0, 44.0, 36.0, 26.0, 31.0, 19.0, 15.0, 13.0, 11.0, 12.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.64944839477539, -61.10551071166992, -59.56157302856445, -58.017635345458984, -56.473697662353516, -54.92975616455078, -53.38581848144531, -51.841880798339844, -50.297943115234375, -48.754005432128906, -47.21006774902344, -45.66613006591797, -44.1221923828125, -42.57825469970703, -41.03431701660156, -39.49037551879883, -37.946441650390625, -36.402503967285156, -34.85856628417969, -33.31462860107422, -31.770689010620117, -30.22675132751465, -28.68281364440918, -27.138874053955078, -25.59493637084961, -24.05099868774414, -22.507061004638672, -20.963123321533203, -19.4191837310791, -17.875246047973633, -16.331308364868164, -14.787369728088379, -13.243431091308594, -11.699493408203125, -10.15555477142334, -8.611617088317871, -7.067678928375244, -5.523740768432617, -3.9798030853271484, -2.4358644485473633, -0.8919267654418945, 0.6520112752914429, 2.1959493160247803, 3.739887237548828, 5.283825397491455, 6.827763557434082, 8.37170124053955, 9.915639877319336, 11.459577560424805, 13.003515243530273, 14.547453880310059, 16.091392517089844, 17.635330200195312, 19.17926788330078, 20.72320556640625, 22.26714324951172, 23.811080932617188, 25.355018615722656, 26.898956298828125, 28.442893981933594, 29.986833572387695, 31.530771255493164, 33.07470703125, 34.618648529052734, 36.1625862121582]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 3.0, 4.0, 6.0, 8.0, 8.0, 7.0, 17.0, 18.0, 25.0, 38.0, 63.0, 93.0, 151.0, 254.0, 493.0, 1264.0, 4178.0, 237030.0, 3943385.0, 4932.0, 1275.0, 484.0, 230.0, 128.0, 63.0, 48.0, 28.0, 14.0, 11.0, 2.0, 9.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-25.84375, -25.2696533203125, -24.695556640625, -24.1214599609375, -23.54736328125, -22.9732666015625, -22.399169921875, -21.8250732421875, -21.2509765625, -20.6768798828125, -20.102783203125, -19.5286865234375, -18.95458984375, -18.3804931640625, -17.806396484375, -17.2322998046875, -16.658203125, -16.0841064453125, -15.510009765625, -14.9359130859375, -14.36181640625, -13.7877197265625, -13.213623046875, -12.6395263671875, -12.0654296875, -11.4913330078125, -10.917236328125, -10.3431396484375, -9.76904296875, -9.1949462890625, -8.620849609375, -8.0467529296875, -7.47265625, -6.8985595703125, -6.324462890625, -5.7503662109375, -5.17626953125, -4.6021728515625, -4.028076171875, -3.4539794921875, -2.8798828125, -2.3057861328125, -1.731689453125, -1.1575927734375, -0.58349609375, -0.0093994140625, 0.564697265625, 1.1387939453125, 1.712890625, 2.2869873046875, 2.861083984375, 3.4351806640625, 4.00927734375, 4.5833740234375, 5.157470703125, 5.7315673828125, 6.3056640625, 6.8797607421875, 7.453857421875, 8.0279541015625, 8.60205078125, 9.1761474609375, 9.750244140625, 10.3243408203125, 10.8984375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 9.0, 14.0, 13.0, 18.0, 42.0, 97.0, 133.0, 206.0, 184.0, 129.0, 69.0, 36.0, 16.0, 12.0, 8.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5625, -6.41204833984375, -6.2615966796875, -6.11114501953125, -5.960693359375, -5.81024169921875, -5.6597900390625, -5.50933837890625, -5.35888671875, -5.20843505859375, -5.0579833984375, -4.90753173828125, -4.757080078125, -4.60662841796875, -4.4561767578125, -4.30572509765625, -4.1552734375, -4.00482177734375, -3.8543701171875, -3.70391845703125, -3.553466796875, -3.40301513671875, -3.2525634765625, -3.10211181640625, -2.95166015625, -2.80120849609375, -2.6507568359375, -2.50030517578125, -2.349853515625, -2.19940185546875, -2.0489501953125, -1.89849853515625, -1.748046875, -1.59759521484375, -1.4471435546875, -1.29669189453125, -1.146240234375, -0.99578857421875, -0.8453369140625, -0.69488525390625, -0.54443359375, -0.39398193359375, -0.2435302734375, -0.09307861328125, 0.057373046875, 0.20782470703125, 0.3582763671875, 0.50872802734375, 0.6591796875, 0.80963134765625, 0.9600830078125, 1.11053466796875, 1.260986328125, 1.41143798828125, 1.5618896484375, 1.71234130859375, 1.86279296875, 2.01324462890625, 2.1636962890625, 2.31414794921875, 2.464599609375, 2.61505126953125, 2.7655029296875, 2.91595458984375, 3.06640625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 4.0, 13.0, 12.0, 17.0, 22.0, 35.0, 25.0, 25.0, 39.0, 67.0, 95.0, 101.0, 127.0, 171.0, 275.0, 404.0, 587.0, 910.0, 1547.0, 2523.0, 4651.0, 9694.0, 34678.0, 4063449.0, 50742.0, 11156.0, 5144.0, 2781.0, 1749.0, 1058.0, 633.0, 430.0, 339.0, 195.0, 128.0, 112.0, 87.0, 74.0, 51.0, 26.0, 24.0, 17.0, 18.0, 9.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.5234375, -8.2447509765625, -7.966064453125, -7.6873779296875, -7.40869140625, -7.1300048828125, -6.851318359375, -6.5726318359375, -6.2939453125, -6.0152587890625, -5.736572265625, -5.4578857421875, -5.17919921875, -4.9005126953125, -4.621826171875, -4.3431396484375, -4.064453125, -3.7857666015625, -3.507080078125, -3.2283935546875, -2.94970703125, -2.6710205078125, -2.392333984375, -2.1136474609375, -1.8349609375, -1.5562744140625, -1.277587890625, -0.9989013671875, -0.72021484375, -0.4415283203125, -0.162841796875, 0.1158447265625, 0.39453125, 0.6732177734375, 0.951904296875, 1.2305908203125, 1.50927734375, 1.7879638671875, 2.066650390625, 2.3453369140625, 2.6240234375, 2.9027099609375, 3.181396484375, 3.4600830078125, 3.73876953125, 4.0174560546875, 4.296142578125, 4.5748291015625, 4.853515625, 5.1322021484375, 5.410888671875, 5.6895751953125, 5.96826171875, 6.2469482421875, 6.525634765625, 6.8043212890625, 7.0830078125, 7.3616943359375, 7.640380859375, 7.9190673828125, 8.19775390625, 8.4764404296875, 8.755126953125, 9.0338134765625, 9.3125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 6.0, 6.0, 10.0, 16.0, 34.0, 168.0, 3671.0, 68.0, 36.0, 15.0, 11.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125, -4.96649169921875, -4.8079833984375, -4.64947509765625, -4.490966796875, -4.33245849609375, -4.1739501953125, -4.01544189453125, -3.85693359375, -3.69842529296875, -3.5399169921875, -3.38140869140625, -3.222900390625, -3.06439208984375, -2.9058837890625, -2.74737548828125, -2.5888671875, -2.43035888671875, -2.2718505859375, -2.11334228515625, -1.954833984375, -1.79632568359375, -1.6378173828125, -1.47930908203125, -1.32080078125, -1.16229248046875, -1.0037841796875, -0.84527587890625, -0.686767578125, -0.52825927734375, -0.3697509765625, -0.21124267578125, -0.052734375, 0.10577392578125, 0.2642822265625, 0.42279052734375, 0.581298828125, 0.73980712890625, 0.8983154296875, 1.05682373046875, 1.21533203125, 1.37384033203125, 1.5323486328125, 1.69085693359375, 1.849365234375, 2.00787353515625, 2.1663818359375, 2.32489013671875, 2.4833984375, 2.64190673828125, 2.8004150390625, 2.95892333984375, 3.117431640625, 3.27593994140625, 3.4344482421875, 3.59295654296875, 3.75146484375, 3.90997314453125, 4.0684814453125, 4.22698974609375, 4.385498046875, 4.54400634765625, 4.7025146484375, 4.86102294921875, 5.01953125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 7.0, 4.0, 2.0, 6.0, 3.0, 3.0, 7.0, 9.0, 6.0, 10.0, 12.0, 19.0, 17.0, 27.0, 35.0, 47.0, 64.0, 78.0, 91.0, 96.0, 74.0, 72.0, 63.0, 62.0, 40.0, 30.0, 18.0, 12.0, 13.0, 20.0, 15.0, 11.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.592257499694824, -9.307798385620117, -9.023338317871094, -8.738879203796387, -8.454419136047363, -8.169960021972656, -7.885500431060791, -7.601040840148926, -7.3165812492370605, -7.032121658325195, -6.74766206741333, -6.463202476501465, -6.178743362426758, -5.894283294677734, -5.609824180603027, -5.325364589691162, -5.040904998779297, -4.756445407867432, -4.471985816955566, -4.187526226043701, -3.903066873550415, -3.61860728263855, -3.3341479301452637, -3.0496883392333984, -2.765228748321533, -2.480769157409668, -2.1963095664978027, -1.9118502140045166, -1.6273906230926514, -1.3429310321807861, -1.0584715604782104, -0.7740120887756348, -0.48955345153808594, -0.20509392023086548, 0.07936561107635498, 0.36382514238357544, 0.6482846736907959, 0.9327442646026611, 1.2172037363052368, 1.5016632080078125, 1.7861227989196777, 2.070582389831543, 2.355041980743408, 2.6395013332366943, 2.9239609241485596, 3.208420515060425, 3.492879867553711, 3.777339458465576, 4.061799049377441, 4.346258640289307, 4.630718231201172, 4.915177822113037, 5.199637413024902, 5.484096527099609, 5.768556118011475, 6.05301570892334, 6.337475299835205, 6.62193489074707, 6.9063944816589355, 7.190854072570801, 7.475313186645508, 7.759773254394531, 8.044232368469238, 8.328691482543945, 8.613151550292969]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 9.0, 9.0, 16.0, 10.0, 15.0, 27.0, 19.0, 24.0, 36.0, 39.0, 27.0, 46.0, 49.0, 40.0, 53.0, 56.0, 51.0, 58.0, 61.0, 48.0, 49.0, 36.0, 41.0, 34.0, 28.0, 29.0, 16.0, 14.0, 14.0, 12.0, 7.0, 7.0, 5.0, 2.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.650160789489746, -7.321600437164307, -6.993040084838867, -6.664480209350586, -6.3359198570251465, -6.007359504699707, -5.678799629211426, -5.350239276885986, -5.021678924560547, -4.693118572235107, -4.364558219909668, -4.035998344421387, -3.7074379920959473, -3.378877639770508, -3.0503175258636475, -2.721757411956787, -2.3931970596313477, -2.064636707305908, -1.7360765933990479, -1.407516360282898, -1.078956127166748, -0.7503958940505981, -0.42183566093444824, -0.09327554702758789, 0.23528480529785156, 0.5638450384140015, 0.8924052715301514, 1.2209655046463013, 1.5495257377624512, 1.878085970878601, 2.206646203994751, 2.5352063179016113, 2.863767623901367, 3.1923279762268066, 3.520888090133667, 3.8494482040405273, 4.178008556365967, 4.506568908691406, 4.8351287841796875, 5.163689136505127, 5.492249488830566, 5.820809841156006, 6.149370193481445, 6.477930068969727, 6.806490421295166, 7.1350507736206055, 7.463610649108887, 7.792171001434326, 8.120731353759766, 8.449291229248047, 8.777852058410645, 9.106411933898926, 9.434972763061523, 9.763532638549805, 10.092092514038086, 10.420652389526367, 10.749213218688965, 11.077773094177246, 11.406333923339844, 11.734893798828125, 12.063453674316406, 12.392014503479004, 12.720574378967285, 13.049135208129883, 13.377695083618164]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 16.0, 20.0, 24.0, 37.0, 75.0, 100.0, 141.0, 275.0, 440.0, 945.0, 2310.0, 6237.0, 24865.0, 175979.0, 716032.0, 96516.0, 16356.0, 4628.0, 1752.0, 782.0, 407.0, 226.0, 136.0, 83.0, 43.0, 31.0, 17.0, 23.0, 15.0, 7.0, 7.0, 7.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.671875, -8.3765869140625, -8.081298828125, -7.7860107421875, -7.49072265625, -7.1954345703125, -6.900146484375, -6.6048583984375, -6.3095703125, -6.0142822265625, -5.718994140625, -5.4237060546875, -5.12841796875, -4.8331298828125, -4.537841796875, -4.2425537109375, -3.947265625, -3.6519775390625, -3.356689453125, -3.0614013671875, -2.76611328125, -2.4708251953125, -2.175537109375, -1.8802490234375, -1.5849609375, -1.2896728515625, -0.994384765625, -0.6990966796875, -0.40380859375, -0.1085205078125, 0.186767578125, 0.4820556640625, 0.77734375, 1.0726318359375, 1.367919921875, 1.6632080078125, 1.95849609375, 2.2537841796875, 2.549072265625, 2.8443603515625, 3.1396484375, 3.4349365234375, 3.730224609375, 4.0255126953125, 4.32080078125, 4.6160888671875, 4.911376953125, 5.2066650390625, 5.501953125, 5.7972412109375, 6.092529296875, 6.3878173828125, 6.68310546875, 6.9783935546875, 7.273681640625, 7.5689697265625, 7.8642578125, 8.1595458984375, 8.454833984375, 8.7501220703125, 9.04541015625, 9.3406982421875, 9.635986328125, 9.9312744140625, 10.2265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 1.0, 8.0, 9.0, 19.0, 9.0, 38.0, 52.0, 60.0, 95.0, 111.0, 133.0, 118.0, 106.0, 86.0, 57.0, 34.0, 18.0, 16.0, 10.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.56640625, -4.453765869140625, -4.34112548828125, -4.228485107421875, -4.1158447265625, -4.003204345703125, -3.89056396484375, -3.777923583984375, -3.665283203125, -3.552642822265625, -3.44000244140625, -3.327362060546875, -3.2147216796875, -3.102081298828125, -2.98944091796875, -2.876800537109375, -2.76416015625, -2.651519775390625, -2.53887939453125, -2.426239013671875, -2.3135986328125, -2.200958251953125, -2.08831787109375, -1.975677490234375, -1.863037109375, -1.750396728515625, -1.63775634765625, -1.525115966796875, -1.4124755859375, -1.299835205078125, -1.18719482421875, -1.074554443359375, -0.9619140625, -0.849273681640625, -0.73663330078125, -0.623992919921875, -0.5113525390625, -0.398712158203125, -0.28607177734375, -0.173431396484375, -0.060791015625, 0.051849365234375, 0.16448974609375, 0.277130126953125, 0.3897705078125, 0.502410888671875, 0.61505126953125, 0.727691650390625, 0.84033203125, 0.952972412109375, 1.06561279296875, 1.178253173828125, 1.2908935546875, 1.403533935546875, 1.51617431640625, 1.628814697265625, 1.741455078125, 1.854095458984375, 1.96673583984375, 2.079376220703125, 2.1920166015625, 2.304656982421875, 2.41729736328125, 2.529937744140625, 2.642578125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 3.0, 14.0, 14.0, 22.0, 57.0, 64.0, 112.0, 188.0, 425.0, 971.0, 2596.0, 9127.0, 51313.0, 663415.0, 284894.0, 26185.0, 5811.0, 1858.0, 727.0, 312.0, 171.0, 110.0, 59.0, 25.0, 19.0, 23.0, 9.0, 8.0, 2.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2265625, -6.935546875, -6.64453125, -6.353515625, -6.0625, -5.771484375, -5.48046875, -5.189453125, -4.8984375, -4.607421875, -4.31640625, -4.025390625, -3.734375, -3.443359375, -3.15234375, -2.861328125, -2.5703125, -2.279296875, -1.98828125, -1.697265625, -1.40625, -1.115234375, -0.82421875, -0.533203125, -0.2421875, 0.048828125, 0.33984375, 0.630859375, 0.921875, 1.212890625, 1.50390625, 1.794921875, 2.0859375, 2.376953125, 2.66796875, 2.958984375, 3.25, 3.541015625, 3.83203125, 4.123046875, 4.4140625, 4.705078125, 4.99609375, 5.287109375, 5.578125, 5.869140625, 6.16015625, 6.451171875, 6.7421875, 7.033203125, 7.32421875, 7.615234375, 7.90625, 8.197265625, 8.48828125, 8.779296875, 9.0703125, 9.361328125, 9.65234375, 9.943359375, 10.234375, 10.525390625, 10.81640625, 11.107421875, 11.3984375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 5.0, 8.0, 6.0, 6.0, 14.0, 12.0, 13.0, 20.0, 24.0, 23.0, 29.0, 39.0, 51.0, 39.0, 53.0, 50.0, 52.0, 52.0, 49.0, 49.0, 37.0, 53.0, 48.0, 41.0, 49.0, 39.0, 18.0, 19.0, 15.0, 20.0, 9.0, 10.0, 6.0, 11.0, 8.0, 3.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.9140625, -7.65771484375, -7.4013671875, -7.14501953125, -6.888671875, -6.63232421875, -6.3759765625, -6.11962890625, -5.86328125, -5.60693359375, -5.3505859375, -5.09423828125, -4.837890625, -4.58154296875, -4.3251953125, -4.06884765625, -3.8125, -3.55615234375, -3.2998046875, -3.04345703125, -2.787109375, -2.53076171875, -2.2744140625, -2.01806640625, -1.76171875, -1.50537109375, -1.2490234375, -0.99267578125, -0.736328125, -0.47998046875, -0.2236328125, 0.03271484375, 0.2890625, 0.54541015625, 0.8017578125, 1.05810546875, 1.314453125, 1.57080078125, 1.8271484375, 2.08349609375, 2.33984375, 2.59619140625, 2.8525390625, 3.10888671875, 3.365234375, 3.62158203125, 3.8779296875, 4.13427734375, 4.390625, 4.64697265625, 4.9033203125, 5.15966796875, 5.416015625, 5.67236328125, 5.9287109375, 6.18505859375, 6.44140625, 6.69775390625, 6.9541015625, 7.21044921875, 7.466796875, 7.72314453125, 7.9794921875, 8.23583984375, 8.4921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 9.0, 6.0, 17.0, 38.0, 53.0, 113.0, 262.0, 679.0, 2848.0, 35391.0, 948779.0, 55400.0, 3633.0, 781.0, 257.0, 132.0, 65.0, 39.0, 19.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.388671875, -3.215423583984375, -3.04217529296875, -2.868927001953125, -2.6956787109375, -2.522430419921875, -2.34918212890625, -2.175933837890625, -2.002685546875, -1.829437255859375, -1.65618896484375, -1.482940673828125, -1.3096923828125, -1.136444091796875, -0.96319580078125, -0.789947509765625, -0.61669921875, -0.443450927734375, -0.27020263671875, -0.096954345703125, 0.0762939453125, 0.249542236328125, 0.42279052734375, 0.596038818359375, 0.769287109375, 0.942535400390625, 1.11578369140625, 1.289031982421875, 1.4622802734375, 1.635528564453125, 1.80877685546875, 1.982025146484375, 2.1552734375, 2.328521728515625, 2.50177001953125, 2.675018310546875, 2.8482666015625, 3.021514892578125, 3.19476318359375, 3.368011474609375, 3.541259765625, 3.714508056640625, 3.88775634765625, 4.061004638671875, 4.2342529296875, 4.407501220703125, 4.58074951171875, 4.753997802734375, 4.92724609375, 5.100494384765625, 5.27374267578125, 5.446990966796875, 5.6202392578125, 5.793487548828125, 5.96673583984375, 6.139984130859375, 6.313232421875, 6.486480712890625, 6.65972900390625, 6.832977294921875, 7.0062255859375, 7.179473876953125, 7.35272216796875, 7.525970458984375, 7.69921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 5.0, 10.0, 19.0, 27.0, 38.0, 72.0, 107.0, 168.0, 171.0, 153.0, 93.0, 50.0, 24.0, 25.0, 15.0, 11.0, 6.0, 5.0, 3.0, 2.0, 1.0], "bins": [-0.0009245872497558594, -0.0009065326303243637, -0.000888478010892868, -0.0008704233914613724, -0.0008523687720298767, -0.000834314152598381, -0.0008162595331668854, -0.0007982049137353897, -0.000780150294303894, -0.0007620956748723984, -0.0007440410554409027, -0.000725986436009407, -0.0007079318165779114, -0.0006898771971464157, -0.00067182257771492, -0.0006537679582834244, -0.0006357133388519287, -0.000617658719420433, -0.0005996040999889374, -0.0005815494805574417, -0.000563494861125946, -0.0005454402416944504, -0.0005273856222629547, -0.000509331002831459, -0.0004912763833999634, -0.0004732217639684677, -0.00045516714453697205, -0.0004371125251054764, -0.0004190579056739807, -0.00040100328624248505, -0.0003829486668109894, -0.0003648940473794937, -0.00034683942794799805, -0.0003287848085165024, -0.0003107301890850067, -0.00029267556965351105, -0.0002746209502220154, -0.0002565663307905197, -0.00023851171135902405, -0.00022045709192752838, -0.00020240247249603271, -0.00018434785306453705, -0.00016629323363304138, -0.00014823861420154572, -0.00013018399477005005, -0.00011212937533855438, -9.407475590705872e-05, -7.602013647556305e-05, -5.796551704406738e-05, -3.9910897612571716e-05, -2.185627818107605e-05, -3.8016587495803833e-06, 1.4252960681915283e-05, 3.230758011341095e-05, 5.0362199544906616e-05, 6.841681897640228e-05, 8.647143840789795e-05, 0.00010452605783939362, 0.00012258067727088928, 0.00014063529670238495, 0.00015868991613388062, 0.00017674453556537628, 0.00019479915499687195, 0.00021285377442836761, 0.00023090839385986328]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 5.0, 11.0, 13.0, 18.0, 49.0, 85.0, 151.0, 281.0, 660.0, 1852.0, 10784.0, 400015.0, 617954.0, 13158.0, 2134.0, 703.0, 286.0, 163.0, 88.0, 50.0, 32.0, 19.0, 13.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.09808349609375, -3.9344482421875, -3.77081298828125, -3.607177734375, -3.44354248046875, -3.2799072265625, -3.11627197265625, -2.95263671875, -2.78900146484375, -2.6253662109375, -2.46173095703125, -2.298095703125, -2.13446044921875, -1.9708251953125, -1.80718994140625, -1.6435546875, -1.47991943359375, -1.3162841796875, -1.15264892578125, -0.989013671875, -0.82537841796875, -0.6617431640625, -0.49810791015625, -0.33447265625, -0.17083740234375, -0.0072021484375, 0.15643310546875, 0.320068359375, 0.48370361328125, 0.6473388671875, 0.81097412109375, 0.974609375, 1.13824462890625, 1.3018798828125, 1.46551513671875, 1.629150390625, 1.79278564453125, 1.9564208984375, 2.12005615234375, 2.28369140625, 2.44732666015625, 2.6109619140625, 2.77459716796875, 2.938232421875, 3.10186767578125, 3.2655029296875, 3.42913818359375, 3.5927734375, 3.75640869140625, 3.9200439453125, 4.08367919921875, 4.247314453125, 4.41094970703125, 4.5745849609375, 4.73822021484375, 4.90185546875, 5.06549072265625, 5.2291259765625, 5.39276123046875, 5.556396484375, 5.72003173828125, 5.8836669921875, 6.04730224609375, 6.2109375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 11.0, 29.0, 44.0, 82.0, 143.0, 202.0, 192.0, 144.0, 70.0, 37.0, 20.0, 13.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.08319091796875, -3.9046630859375, -3.72613525390625, -3.547607421875, -3.36907958984375, -3.1905517578125, -3.01202392578125, -2.83349609375, -2.65496826171875, -2.4764404296875, -2.29791259765625, -2.119384765625, -1.94085693359375, -1.7623291015625, -1.58380126953125, -1.4052734375, -1.22674560546875, -1.0482177734375, -0.86968994140625, -0.691162109375, -0.51263427734375, -0.3341064453125, -0.15557861328125, 0.02294921875, 0.20147705078125, 0.3800048828125, 0.55853271484375, 0.737060546875, 0.91558837890625, 1.0941162109375, 1.27264404296875, 1.451171875, 1.62969970703125, 1.8082275390625, 1.98675537109375, 2.165283203125, 2.34381103515625, 2.5223388671875, 2.70086669921875, 2.87939453125, 3.05792236328125, 3.2364501953125, 3.41497802734375, 3.593505859375, 3.77203369140625, 3.9505615234375, 4.12908935546875, 4.3076171875, 4.48614501953125, 4.6646728515625, 4.84320068359375, 5.021728515625, 5.20025634765625, 5.3787841796875, 5.55731201171875, 5.73583984375, 5.91436767578125, 6.0928955078125, 6.27142333984375, 6.449951171875, 6.62847900390625, 6.8070068359375, 6.98553466796875, 7.1640625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 6.0, 19.0, 33.0, 92.0, 135.0, 223.0, 223.0, 137.0, 63.0, 30.0, 20.0, 13.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.38458251953125, -88.84367370605469, -86.30276489257812, -83.76185607910156, -81.220947265625, -78.68003845214844, -76.13912963867188, -73.59822082519531, -71.05731201171875, -68.51640319824219, -65.97549438476562, -63.43458557128906, -60.8936767578125, -58.35276794433594, -55.81186294555664, -53.27095413208008, -50.73004913330078, -48.18914031982422, -45.648231506347656, -43.107322692871094, -40.56641387939453, -38.02550506591797, -35.48460006713867, -32.94369125366211, -30.402782440185547, -27.861873626708984, -25.320964813232422, -22.780057907104492, -20.23914909362793, -17.698240280151367, -15.157332420349121, -12.616424560546875, -10.075515747070312, -7.534607410430908, -4.993699073791504, -2.4527907371520996, 0.08811759948730469, 2.629026412963867, 5.169934272766113, 7.710842132568359, 10.251750946044922, 12.792659759521484, 15.33356761932373, 17.874475479125977, 20.41538429260254, 22.9562931060791, 25.49720001220703, 28.038108825683594, 30.579017639160156, 33.11992645263672, 35.66083526611328, 38.201744079589844, 40.742652893066406, 43.28356170654297, 45.824466705322266, 48.36537551879883, 50.90628433227539, 53.44719314575195, 55.988101959228516, 58.52901077270508, 61.069915771484375, 63.61082458496094, 66.1517333984375, 68.69264221191406, 71.23355102539062]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 9.0, 9.0, 13.0, 9.0, 19.0, 21.0, 29.0, 22.0, 47.0, 30.0, 42.0, 35.0, 41.0, 60.0, 46.0, 64.0, 50.0, 56.0, 48.0, 40.0, 40.0, 36.0, 36.0, 27.0, 26.0, 22.0, 24.0, 16.0, 10.0, 10.0, 8.0, 9.0, 9.0, 3.0, 4.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.66944885253906, -32.45766830444336, -31.245887756347656, -30.034107208251953, -28.82232666015625, -27.610546112060547, -26.398767471313477, -25.186986923217773, -23.97520637512207, -22.763425827026367, -21.551645278930664, -20.33986473083496, -19.12808609008789, -17.916305541992188, -16.704524993896484, -15.492744445800781, -14.280963897705078, -13.069183349609375, -11.857402801513672, -10.645623207092285, -9.433842658996582, -8.222062110900879, -7.010282039642334, -5.798501968383789, -4.586721420288086, -3.374941110610962, -2.163160800933838, -0.9513804912567139, 0.26039981842041016, 1.4721803665161133, 2.683960437774658, 3.895740509033203, 5.107517242431641, 6.319297790527344, 7.531077861785889, 8.742857933044434, 9.954638481140137, 11.16641902923584, 12.378198623657227, 13.58997917175293, 14.801759719848633, 16.013540267944336, 17.22532081604004, 18.437101364135742, 19.648880004882812, 20.860660552978516, 22.07244110107422, 23.284221649169922, 24.496002197265625, 25.707782745361328, 26.91956329345703, 28.131343841552734, 29.343124389648438, 30.55490493774414, 31.76668357849121, 32.97846221923828, 34.19024658203125, 35.40202713012695, 36.613807678222656, 37.82558822631836, 39.03736877441406, 40.249149322509766, 41.46092987060547, 42.672706604003906, 43.88448715209961]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 3.0, 3.0, 3.0, 8.0, 10.0, 8.0, 20.0, 25.0, 33.0, 52.0, 64.0, 108.0, 139.0, 211.0, 321.0, 476.0, 753.0, 1224.0, 2244.0, 3945.0, 7834.0, 17937.0, 54871.0, 661695.0, 3295261.0, 98078.0, 26706.0, 10828.0, 5038.0, 2603.0, 1479.0, 854.0, 525.0, 298.0, 221.0, 156.0, 74.0, 51.0, 53.0, 20.0, 14.0, 14.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.99609375, -3.871917724609375, -3.74774169921875, -3.623565673828125, -3.4993896484375, -3.375213623046875, -3.25103759765625, -3.126861572265625, -3.002685546875, -2.878509521484375, -2.75433349609375, -2.630157470703125, -2.5059814453125, -2.381805419921875, -2.25762939453125, -2.133453369140625, -2.00927734375, -1.885101318359375, -1.76092529296875, -1.636749267578125, -1.5125732421875, -1.388397216796875, -1.26422119140625, -1.140045166015625, -1.015869140625, -0.891693115234375, -0.76751708984375, -0.643341064453125, -0.5191650390625, -0.394989013671875, -0.27081298828125, -0.146636962890625, -0.0224609375, 0.101715087890625, 0.22589111328125, 0.350067138671875, 0.4742431640625, 0.598419189453125, 0.72259521484375, 0.846771240234375, 0.970947265625, 1.095123291015625, 1.21929931640625, 1.343475341796875, 1.4676513671875, 1.591827392578125, 1.71600341796875, 1.840179443359375, 1.96435546875, 2.088531494140625, 2.21270751953125, 2.336883544921875, 2.4610595703125, 2.585235595703125, 2.70941162109375, 2.833587646484375, 2.957763671875, 3.081939697265625, 3.20611572265625, 3.330291748046875, 3.4544677734375, 3.578643798828125, 3.70281982421875, 3.826995849609375, 3.951171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 6.0, 8.0, 9.0, 10.0, 13.0, 12.0, 23.0, 19.0, 36.0, 35.0, 46.0, 57.0, 70.0, 48.0, 80.0, 81.0, 68.0, 61.0, 65.0, 50.0, 39.0, 33.0, 22.0, 24.0, 15.0, 15.0, 17.0, 9.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.56640625, -1.510955810546875, -1.45550537109375, -1.400054931640625, -1.3446044921875, -1.289154052734375, -1.23370361328125, -1.178253173828125, -1.122802734375, -1.067352294921875, -1.01190185546875, -0.956451416015625, -0.9010009765625, -0.845550537109375, -0.79010009765625, -0.734649658203125, -0.67919921875, -0.623748779296875, -0.56829833984375, -0.512847900390625, -0.4573974609375, -0.401947021484375, -0.34649658203125, -0.291046142578125, -0.235595703125, -0.180145263671875, -0.12469482421875, -0.069244384765625, -0.0137939453125, 0.041656494140625, 0.09710693359375, 0.152557373046875, 0.2080078125, 0.263458251953125, 0.31890869140625, 0.374359130859375, 0.4298095703125, 0.485260009765625, 0.54071044921875, 0.596160888671875, 0.651611328125, 0.707061767578125, 0.76251220703125, 0.817962646484375, 0.8734130859375, 0.928863525390625, 0.98431396484375, 1.039764404296875, 1.09521484375, 1.150665283203125, 1.20611572265625, 1.261566162109375, 1.3170166015625, 1.372467041015625, 1.42791748046875, 1.483367919921875, 1.538818359375, 1.594268798828125, 1.64971923828125, 1.705169677734375, 1.7606201171875, 1.816070556640625, 1.87152099609375, 1.926971435546875, 1.982421875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 7.0, 14.0, 24.0, 63.0, 120.0, 335.0, 909.0, 3276.0, 15390.0, 135555.0, 3893901.0, 125258.0, 14817.0, 3184.0, 848.0, 307.0, 138.0, 58.0, 38.0, 24.0, 6.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.6953125, -10.4375, -10.1796875, -9.921875, -9.6640625, -9.40625, -9.1484375, -8.890625, -8.6328125, -8.375, -8.1171875, -7.859375, -7.6015625, -7.34375, -7.0859375, -6.828125, -6.5703125, -6.3125, -6.0546875, -5.796875, -5.5390625, -5.28125, -5.0234375, -4.765625, -4.5078125, -4.25, -3.9921875, -3.734375, -3.4765625, -3.21875, -2.9609375, -2.703125, -2.4453125, -2.1875, -1.9296875, -1.671875, -1.4140625, -1.15625, -0.8984375, -0.640625, -0.3828125, -0.125, 0.1328125, 0.390625, 0.6484375, 0.90625, 1.1640625, 1.421875, 1.6796875, 1.9375, 2.1953125, 2.453125, 2.7109375, 2.96875, 3.2265625, 3.484375, 3.7421875, 4.0, 4.2578125, 4.515625, 4.7734375, 5.03125, 5.2890625, 5.546875, 5.8046875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 6.0, 5.0, 16.0, 29.0, 46.0, 43.0, 89.0, 141.0, 359.0, 1616.0, 1054.0, 274.0, 136.0, 74.0, 54.0, 35.0, 20.0, 21.0, 18.0, 9.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.75836181640625, -5.5440673828125, -5.32977294921875, -5.115478515625, -4.90118408203125, -4.6868896484375, -4.47259521484375, -4.25830078125, -4.04400634765625, -3.8297119140625, -3.61541748046875, -3.401123046875, -3.18682861328125, -2.9725341796875, -2.75823974609375, -2.5439453125, -2.32965087890625, -2.1153564453125, -1.90106201171875, -1.686767578125, -1.47247314453125, -1.2581787109375, -1.04388427734375, -0.82958984375, -0.61529541015625, -0.4010009765625, -0.18670654296875, 0.027587890625, 0.24188232421875, 0.4561767578125, 0.67047119140625, 0.884765625, 1.09906005859375, 1.3133544921875, 1.52764892578125, 1.741943359375, 1.95623779296875, 2.1705322265625, 2.38482666015625, 2.59912109375, 2.81341552734375, 3.0277099609375, 3.24200439453125, 3.456298828125, 3.67059326171875, 3.8848876953125, 4.09918212890625, 4.3134765625, 4.52777099609375, 4.7420654296875, 4.95635986328125, 5.170654296875, 5.38494873046875, 5.5992431640625, 5.81353759765625, 6.02783203125, 6.24212646484375, 6.4564208984375, 6.67071533203125, 6.885009765625, 7.09930419921875, 7.3135986328125, 7.52789306640625, 7.7421875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 13.0, 30.0, 37.0, 65.0, 138.0, 219.0, 175.0, 119.0, 72.0, 50.0, 23.0, 14.0, 5.0, 11.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.504051208496094, -51.117774963378906, -49.73149871826172, -48.34522247314453, -46.958946228027344, -45.572669982910156, -44.18639373779297, -42.80011749267578, -41.413841247558594, -40.027565002441406, -38.64128875732422, -37.25501251220703, -35.868736267089844, -34.482460021972656, -33.09618377685547, -31.70990753173828, -30.323633193969727, -28.93735694885254, -27.55108070373535, -26.164804458618164, -24.778528213500977, -23.39225196838379, -22.005977630615234, -20.619701385498047, -19.23342514038086, -17.847148895263672, -16.460872650146484, -15.074596405029297, -13.68832015991211, -12.302043914794922, -10.91576862335205, -9.529492378234863, -8.14321517944336, -6.756938934326172, -5.370662689208984, -3.984386920928955, -2.5981106758117676, -1.21183443069458, 0.17444133758544922, 1.5607175827026367, 2.946993827819824, 4.333270072937012, 5.719546318054199, 7.1058220863342285, 8.492097854614258, 9.878374099731445, 11.264650344848633, 12.65092658996582, 14.037202835083008, 15.423479080200195, 16.809755325317383, 18.19603157043457, 19.582307815551758, 20.968584060668945, 22.3548583984375, 23.741134643554688, 25.127410888671875, 26.513687133789062, 27.89996337890625, 29.286239624023438, 30.672515869140625, 32.05879211425781, 33.445068359375, 34.83134460449219, 36.217620849609375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 8.0, 7.0, 10.0, 18.0, 13.0, 23.0, 25.0, 28.0, 31.0, 26.0, 26.0, 49.0, 35.0, 39.0, 46.0, 50.0, 43.0, 57.0, 67.0, 28.0, 39.0, 36.0, 32.0, 31.0, 30.0, 26.0, 23.0, 24.0, 30.0, 12.0, 14.0, 14.0, 8.0, 9.0, 11.0, 6.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.306528091430664, -18.70243263244629, -18.09833526611328, -17.494239807128906, -16.89014434814453, -16.286046981811523, -15.681951522827148, -15.077855110168457, -14.473758697509766, -13.869662284851074, -13.265565872192383, -12.661470413208008, -12.057374000549316, -11.453277587890625, -10.84918212890625, -10.245085716247559, -9.640989303588867, -9.036892890930176, -8.432796478271484, -7.828701019287109, -7.224604606628418, -6.620508193969727, -6.016412258148193, -5.41231632232666, -4.808219909667969, -4.204123497009277, -3.600027561187744, -2.995931386947632, -2.3918352127075195, -1.7877390384674072, -1.183642864227295, -0.5795469284057617, 0.0245513916015625, 0.6286475658416748, 1.232743740081787, 1.8368399143218994, 2.4409360885620117, 3.045032262802124, 3.6491284370422363, 4.2532243728637695, 4.857320785522461, 5.461417198181152, 6.0655131340026855, 6.669609069824219, 7.27370548248291, 7.877801895141602, 8.481897354125977, 9.085993766784668, 9.69009017944336, 10.29418659210205, 10.898283004760742, 11.502378463745117, 12.106474876403809, 12.7105712890625, 13.314666748046875, 13.918763160705566, 14.522859573364258, 15.12695598602295, 15.73105239868164, 16.335147857666016, 16.93924331665039, 17.5433406829834, 18.147436141967773, 18.75153350830078, 19.355628967285156]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 13.0, 34.0, 52.0, 64.0, 120.0, 220.0, 396.0, 707.0, 1402.0, 2823.0, 6877.0, 19235.0, 66128.0, 303369.0, 492676.0, 108556.0, 28667.0, 9642.0, 3800.0, 1733.0, 940.0, 463.0, 248.0, 147.0, 77.0, 57.0, 35.0, 16.0, 15.0, 9.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16015625, -5.0091552734375, -4.858154296875, -4.7071533203125, -4.55615234375, -4.4051513671875, -4.254150390625, -4.1031494140625, -3.9521484375, -3.8011474609375, -3.650146484375, -3.4991455078125, -3.34814453125, -3.1971435546875, -3.046142578125, -2.8951416015625, -2.744140625, -2.5931396484375, -2.442138671875, -2.2911376953125, -2.14013671875, -1.9891357421875, -1.838134765625, -1.6871337890625, -1.5361328125, -1.3851318359375, -1.234130859375, -1.0831298828125, -0.93212890625, -0.7811279296875, -0.630126953125, -0.4791259765625, -0.328125, -0.1771240234375, -0.026123046875, 0.1248779296875, 0.27587890625, 0.4268798828125, 0.577880859375, 0.7288818359375, 0.8798828125, 1.0308837890625, 1.181884765625, 1.3328857421875, 1.48388671875, 1.6348876953125, 1.785888671875, 1.9368896484375, 2.087890625, 2.2388916015625, 2.389892578125, 2.5408935546875, 2.69189453125, 2.8428955078125, 2.993896484375, 3.1448974609375, 3.2958984375, 3.4468994140625, 3.597900390625, 3.7489013671875, 3.89990234375, 4.0509033203125, 4.201904296875, 4.3529052734375, 4.50390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 8.0, 5.0, 11.0, 16.0, 33.0, 34.0, 44.0, 42.0, 49.0, 66.0, 63.0, 83.0, 74.0, 76.0, 67.0, 66.0, 48.0, 46.0, 32.0, 30.0, 29.0, 21.0, 20.0, 11.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.767578125, -1.709686279296875, -1.65179443359375, -1.593902587890625, -1.5360107421875, -1.478118896484375, -1.42022705078125, -1.362335205078125, -1.304443359375, -1.246551513671875, -1.18865966796875, -1.130767822265625, -1.0728759765625, -1.014984130859375, -0.95709228515625, -0.899200439453125, -0.84130859375, -0.783416748046875, -0.72552490234375, -0.667633056640625, -0.6097412109375, -0.551849365234375, -0.49395751953125, -0.436065673828125, -0.378173828125, -0.320281982421875, -0.26239013671875, -0.204498291015625, -0.1466064453125, -0.088714599609375, -0.03082275390625, 0.027069091796875, 0.0849609375, 0.142852783203125, 0.20074462890625, 0.258636474609375, 0.3165283203125, 0.374420166015625, 0.43231201171875, 0.490203857421875, 0.548095703125, 0.605987548828125, 0.66387939453125, 0.721771240234375, 0.7796630859375, 0.837554931640625, 0.89544677734375, 0.953338623046875, 1.01123046875, 1.069122314453125, 1.12701416015625, 1.184906005859375, 1.2427978515625, 1.300689697265625, 1.35858154296875, 1.416473388671875, 1.474365234375, 1.532257080078125, 1.59014892578125, 1.648040771484375, 1.7059326171875, 1.763824462890625, 1.82171630859375, 1.879608154296875, 1.9375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 8.0, 15.0, 24.0, 26.0, 48.0, 56.0, 74.0, 134.0, 197.0, 401.0, 783.0, 1695.0, 4312.0, 15682.0, 103588.0, 765126.0, 130143.0, 17943.0, 4688.0, 1649.0, 839.0, 444.0, 228.0, 161.0, 96.0, 56.0, 43.0, 22.0, 19.0, 9.0, 10.0, 6.0, 5.0, 6.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.5234375, -7.32305908203125, -7.1226806640625, -6.92230224609375, -6.721923828125, -6.52154541015625, -6.3211669921875, -6.12078857421875, -5.92041015625, -5.72003173828125, -5.5196533203125, -5.31927490234375, -5.118896484375, -4.91851806640625, -4.7181396484375, -4.51776123046875, -4.3173828125, -4.11700439453125, -3.9166259765625, -3.71624755859375, -3.515869140625, -3.31549072265625, -3.1151123046875, -2.91473388671875, -2.71435546875, -2.51397705078125, -2.3135986328125, -2.11322021484375, -1.912841796875, -1.71246337890625, -1.5120849609375, -1.31170654296875, -1.111328125, -0.91094970703125, -0.7105712890625, -0.51019287109375, -0.309814453125, -0.10943603515625, 0.0909423828125, 0.29132080078125, 0.49169921875, 0.69207763671875, 0.8924560546875, 1.09283447265625, 1.293212890625, 1.49359130859375, 1.6939697265625, 1.89434814453125, 2.0947265625, 2.29510498046875, 2.4954833984375, 2.69586181640625, 2.896240234375, 3.09661865234375, 3.2969970703125, 3.49737548828125, 3.69775390625, 3.89813232421875, 4.0985107421875, 4.29888916015625, 4.499267578125, 4.69964599609375, 4.9000244140625, 5.10040283203125, 5.30078125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 11.0, 5.0, 10.0, 11.0, 22.0, 26.0, 20.0, 33.0, 42.0, 39.0, 53.0, 53.0, 59.0, 61.0, 62.0, 62.0, 53.0, 62.0, 58.0, 52.0, 38.0, 28.0, 23.0, 23.0, 15.0, 21.0, 13.0, 6.0, 8.0, 5.0, 5.0, 5.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.359375, -7.14306640625, -6.9267578125, -6.71044921875, -6.494140625, -6.27783203125, -6.0615234375, -5.84521484375, -5.62890625, -5.41259765625, -5.1962890625, -4.97998046875, -4.763671875, -4.54736328125, -4.3310546875, -4.11474609375, -3.8984375, -3.68212890625, -3.4658203125, -3.24951171875, -3.033203125, -2.81689453125, -2.6005859375, -2.38427734375, -2.16796875, -1.95166015625, -1.7353515625, -1.51904296875, -1.302734375, -1.08642578125, -0.8701171875, -0.65380859375, -0.4375, -0.22119140625, -0.0048828125, 0.21142578125, 0.427734375, 0.64404296875, 0.8603515625, 1.07666015625, 1.29296875, 1.50927734375, 1.7255859375, 1.94189453125, 2.158203125, 2.37451171875, 2.5908203125, 2.80712890625, 3.0234375, 3.23974609375, 3.4560546875, 3.67236328125, 3.888671875, 4.10498046875, 4.3212890625, 4.53759765625, 4.75390625, 4.97021484375, 5.1865234375, 5.40283203125, 5.619140625, 5.83544921875, 6.0517578125, 6.26806640625, 6.484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 10.0, 22.0, 15.0, 52.0, 60.0, 148.0, 324.0, 804.0, 2624.0, 17437.0, 835336.0, 180916.0, 8089.0, 1628.0, 566.0, 241.0, 110.0, 58.0, 37.0, 25.0, 10.0, 8.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.078125, -5.90362548828125, -5.7291259765625, -5.55462646484375, -5.380126953125, -5.20562744140625, -5.0311279296875, -4.85662841796875, -4.68212890625, -4.50762939453125, -4.3331298828125, -4.15863037109375, -3.984130859375, -3.80963134765625, -3.6351318359375, -3.46063232421875, -3.2861328125, -3.11163330078125, -2.9371337890625, -2.76263427734375, -2.588134765625, -2.41363525390625, -2.2391357421875, -2.06463623046875, -1.89013671875, -1.71563720703125, -1.5411376953125, -1.36663818359375, -1.192138671875, -1.01763916015625, -0.8431396484375, -0.66864013671875, -0.494140625, -0.31964111328125, -0.1451416015625, 0.02935791015625, 0.203857421875, 0.37835693359375, 0.5528564453125, 0.72735595703125, 0.90185546875, 1.07635498046875, 1.2508544921875, 1.42535400390625, 1.599853515625, 1.77435302734375, 1.9488525390625, 2.12335205078125, 2.2978515625, 2.47235107421875, 2.6468505859375, 2.82135009765625, 2.995849609375, 3.17034912109375, 3.3448486328125, 3.51934814453125, 3.69384765625, 3.86834716796875, 4.0428466796875, 4.21734619140625, 4.391845703125, 4.56634521484375, 4.7408447265625, 4.91534423828125, 5.08984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 3.0, 9.0, 10.0, 22.0, 38.0, 48.0, 69.0, 126.0, 172.0, 194.0, 112.0, 58.0, 48.0, 25.0, 21.0, 9.0, 8.0, 8.0, 1.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00043010711669921875, -0.00040959566831588745, -0.00038908421993255615, -0.00036857277154922485, -0.00034806132316589355, -0.00032754987478256226, -0.00030703842639923096, -0.00028652697801589966, -0.00026601552963256836, -0.00024550408124923706, -0.00022499263286590576, -0.00020448118448257446, -0.00018396973609924316, -0.00016345828771591187, -0.00014294683933258057, -0.00012243539094924927, -0.00010192394256591797, -8.141249418258667e-05, -6.090104579925537e-05, -4.038959741592407e-05, -1.9878149032592773e-05, 6.332993507385254e-07, 2.1144747734069824e-05, 4.165619611740112e-05, 6.216764450073242e-05, 8.267909288406372e-05, 0.00010319054126739502, 0.00012370198965072632, 0.00014421343803405762, 0.00016472488641738892, 0.00018523633480072021, 0.00020574778318405151, 0.0002262592315673828, 0.0002467706799507141, 0.0002672821283340454, 0.0002877935767173767, 0.000308305025100708, 0.0003288164734840393, 0.0003493279218673706, 0.0003698393702507019, 0.0003903508186340332, 0.0004108622670173645, 0.0004313737154006958, 0.0004518851637840271, 0.0004723966121673584, 0.0004929080605506897, 0.000513419508934021, 0.0005339309573173523, 0.0005544424057006836, 0.0005749538540840149, 0.0005954653024673462, 0.0006159767508506775, 0.0006364881992340088, 0.0006569996476173401, 0.0006775110960006714, 0.0006980225443840027, 0.000718533992767334, 0.0007390454411506653, 0.0007595568895339966, 0.0007800683379173279, 0.0008005797863006592, 0.0008210912346839905, 0.0008416026830673218, 0.0008621141314506531, 0.0008826255798339844]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 5.0, 5.0, 5.0, 6.0, 4.0, 15.0, 11.0, 41.0, 42.0, 56.0, 104.0, 191.0, 383.0, 904.0, 2487.0, 10165.0, 125963.0, 858724.0, 40952.0, 5546.0, 1589.0, 615.0, 280.0, 170.0, 100.0, 62.0, 39.0, 29.0, 17.0, 15.0, 9.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.18359375, -5.055023193359375, -4.92645263671875, -4.797882080078125, -4.6693115234375, -4.540740966796875, -4.41217041015625, -4.283599853515625, -4.155029296875, -4.026458740234375, -3.89788818359375, -3.769317626953125, -3.6407470703125, -3.512176513671875, -3.38360595703125, -3.255035400390625, -3.12646484375, -2.997894287109375, -2.86932373046875, -2.740753173828125, -2.6121826171875, -2.483612060546875, -2.35504150390625, -2.226470947265625, -2.097900390625, -1.969329833984375, -1.84075927734375, -1.712188720703125, -1.5836181640625, -1.455047607421875, -1.32647705078125, -1.197906494140625, -1.0693359375, -0.940765380859375, -0.81219482421875, -0.683624267578125, -0.5550537109375, -0.426483154296875, -0.29791259765625, -0.169342041015625, -0.040771484375, 0.087799072265625, 0.21636962890625, 0.344940185546875, 0.4735107421875, 0.602081298828125, 0.73065185546875, 0.859222412109375, 0.98779296875, 1.116363525390625, 1.24493408203125, 1.373504638671875, 1.5020751953125, 1.630645751953125, 1.75921630859375, 1.887786865234375, 2.016357421875, 2.144927978515625, 2.27349853515625, 2.402069091796875, 2.5306396484375, 2.659210205078125, 2.78778076171875, 2.916351318359375, 3.044921875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 6.0, 9.0, 8.0, 14.0, 25.0, 24.0, 32.0, 29.0, 55.0, 63.0, 96.0, 114.0, 115.0, 90.0, 87.0, 48.0, 38.0, 26.0, 25.0, 25.0, 15.0, 11.0, 9.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.830078125, -3.7394866943359375, -3.648895263671875, -3.5583038330078125, -3.46771240234375, -3.3771209716796875, -3.286529541015625, -3.1959381103515625, -3.1053466796875, -3.0147552490234375, -2.924163818359375, -2.8335723876953125, -2.74298095703125, -2.6523895263671875, -2.561798095703125, -2.4712066650390625, -2.380615234375, -2.2900238037109375, -2.199432373046875, -2.1088409423828125, -2.01824951171875, -1.9276580810546875, -1.837066650390625, -1.7464752197265625, -1.6558837890625, -1.5652923583984375, -1.474700927734375, -1.3841094970703125, -1.29351806640625, -1.2029266357421875, -1.112335205078125, -1.0217437744140625, -0.93115234375, -0.8405609130859375, -0.749969482421875, -0.6593780517578125, -0.56878662109375, -0.4781951904296875, -0.387603759765625, -0.2970123291015625, -0.2064208984375, -0.1158294677734375, -0.025238037109375, 0.0653533935546875, 0.15594482421875, 0.2465362548828125, 0.337127685546875, 0.4277191162109375, 0.518310546875, 0.6089019775390625, 0.699493408203125, 0.7900848388671875, 0.88067626953125, 0.9712677001953125, 1.061859130859375, 1.1524505615234375, 1.2430419921875, 1.3336334228515625, 1.424224853515625, 1.5148162841796875, 1.60540771484375, 1.6959991455078125, 1.786590576171875, 1.8771820068359375, 1.9677734375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 8.0, 8.0, 10.0, 34.0, 64.0, 141.0, 268.0, 246.0, 126.0, 55.0, 20.0, 14.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.88066101074219, -81.82772064208984, -79.77478790283203, -77.72184753417969, -75.66891479492188, -73.61597442626953, -71.56303405761719, -69.51010131835938, -67.45716094970703, -65.40422058105469, -63.351287841796875, -61.29834747314453, -59.24541091918945, -57.192474365234375, -55.13953399658203, -53.08659744262695, -51.033660888671875, -48.9807243347168, -46.92778778076172, -44.874847412109375, -42.8219108581543, -40.76897430419922, -38.716033935546875, -36.6630973815918, -34.61016082763672, -32.55722427368164, -30.50428581237793, -28.45134735107422, -26.39841079711914, -24.345474243164062, -22.29253578186035, -20.23959732055664, -18.18665313720703, -16.133716583251953, -14.080778121948242, -12.027840614318848, -9.974903106689453, -7.921965599060059, -5.869028091430664, -3.8160905838012695, -1.763153076171875, 0.28978443145751953, 2.342721939086914, 4.395659446716309, 6.448596954345703, 8.501534461975098, 10.554471969604492, 12.607409477233887, 14.660346984863281, 16.71328353881836, 18.76622200012207, 20.81916046142578, 22.87209701538086, 24.925033569335938, 26.97797203063965, 29.03091049194336, 31.083847045898438, 33.136783599853516, 35.189720153808594, 37.24266052246094, 39.295597076416016, 41.348533630371094, 43.40147399902344, 45.454410552978516, 47.507347106933594]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 10.0, 7.0, 10.0, 8.0, 30.0, 25.0, 24.0, 31.0, 38.0, 65.0, 62.0, 70.0, 79.0, 74.0, 66.0, 55.0, 58.0, 58.0, 49.0, 27.0, 30.0, 21.0, 24.0, 13.0, 16.0, 15.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-40.44575500488281, -39.4511604309082, -38.456565856933594, -37.46196746826172, -36.46737289428711, -35.4727783203125, -34.47818374633789, -33.48358917236328, -32.488990783691406, -31.494396209716797, -30.499799728393555, -29.505205154418945, -28.510608673095703, -27.516014099121094, -26.521419525146484, -25.526824951171875, -24.532230377197266, -23.537635803222656, -22.543039321899414, -21.548444747924805, -20.553848266601562, -19.559253692626953, -18.564659118652344, -17.570064544677734, -16.575468063354492, -15.580872535705566, -14.58627700805664, -13.591682434082031, -12.597086906433105, -11.60249137878418, -10.60789680480957, -9.613301277160645, -8.618705749511719, -7.624110221862793, -6.629515171051025, -5.634920120239258, -4.640324592590332, -3.6457290649414062, -2.6511340141296387, -1.656538963317871, -0.6619434356689453, 0.33265185356140137, 1.327247142791748, 2.3218424320220947, 3.3164377212524414, 4.311033248901367, 5.305628299713135, 6.300223350524902, 7.294818878173828, 8.289414405822754, 9.28400993347168, 10.278604507446289, 11.273200035095215, 12.26779556274414, 13.26239013671875, 14.256985664367676, 15.251581192016602, 16.24617576599121, 17.240772247314453, 18.235366821289062, 19.229961395263672, 20.224557876586914, 21.219152450561523, 22.213748931884766, 23.208343505859375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 13.0, 4.0, 9.0, 15.0, 12.0, 17.0, 37.0, 37.0, 56.0, 84.0, 111.0, 157.0, 226.0, 293.0, 471.0, 732.0, 1260.0, 2121.0, 4267.0, 8944.0, 22696.0, 97100.0, 3234350.0, 730437.0, 58387.0, 17422.0, 7313.0, 3389.0, 1766.0, 927.0, 618.0, 343.0, 206.0, 139.0, 96.0, 68.0, 39.0, 28.0, 25.0, 16.0, 13.0, 7.0, 11.0, 3.0, 1.0, 2.0, 7.0, 1.0, 2.0], "bins": [-3.44140625, -3.350433349609375, -3.25946044921875, -3.168487548828125, -3.0775146484375, -2.986541748046875, -2.89556884765625, -2.804595947265625, -2.713623046875, -2.622650146484375, -2.53167724609375, -2.440704345703125, -2.3497314453125, -2.258758544921875, -2.16778564453125, -2.076812744140625, -1.98583984375, -1.894866943359375, -1.80389404296875, -1.712921142578125, -1.6219482421875, -1.530975341796875, -1.44000244140625, -1.349029541015625, -1.258056640625, -1.167083740234375, -1.07611083984375, -0.985137939453125, -0.8941650390625, -0.803192138671875, -0.71221923828125, -0.621246337890625, -0.5302734375, -0.439300537109375, -0.34832763671875, -0.257354736328125, -0.1663818359375, -0.075408935546875, 0.01556396484375, 0.106536865234375, 0.197509765625, 0.288482666015625, 0.37945556640625, 0.470428466796875, 0.5614013671875, 0.652374267578125, 0.74334716796875, 0.834320068359375, 0.92529296875, 1.016265869140625, 1.10723876953125, 1.198211669921875, 1.2891845703125, 1.380157470703125, 1.47113037109375, 1.562103271484375, 1.653076171875, 1.744049072265625, 1.83502197265625, 1.925994873046875, 2.0169677734375, 2.107940673828125, 2.19891357421875, 2.289886474609375, 2.380859375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 10.0, 12.0, 16.0, 29.0, 54.0, 59.0, 82.0, 100.0, 95.0, 109.0, 114.0, 87.0, 59.0, 48.0, 41.0, 30.0, 20.0, 10.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.2507781982421875, -3.175384521484375, -3.0999908447265625, -3.02459716796875, -2.9492034912109375, -2.873809814453125, -2.7984161376953125, -2.7230224609375, -2.6476287841796875, -2.572235107421875, -2.4968414306640625, -2.42144775390625, -2.3460540771484375, -2.270660400390625, -2.1952667236328125, -2.119873046875, -2.0444793701171875, -1.969085693359375, -1.8936920166015625, -1.81829833984375, -1.7429046630859375, -1.667510986328125, -1.5921173095703125, -1.5167236328125, -1.4413299560546875, -1.365936279296875, -1.2905426025390625, -1.21514892578125, -1.1397552490234375, -1.064361572265625, -0.9889678955078125, -0.91357421875, -0.8381805419921875, -0.762786865234375, -0.6873931884765625, -0.61199951171875, -0.5366058349609375, -0.461212158203125, -0.3858184814453125, -0.3104248046875, -0.2350311279296875, -0.159637451171875, -0.0842437744140625, -0.00885009765625, 0.0665435791015625, 0.141937255859375, 0.2173309326171875, 0.292724609375, 0.3681182861328125, 0.443511962890625, 0.5189056396484375, 0.59429931640625, 0.6696929931640625, 0.745086669921875, 0.8204803466796875, 0.8958740234375, 0.9712677001953125, 1.046661376953125, 1.1220550537109375, 1.19744873046875, 1.2728424072265625, 1.348236083984375, 1.4236297607421875, 1.4990234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 5.0, 24.0, 26.0, 44.0, 62.0, 98.0, 161.0, 311.0, 590.0, 1159.0, 2337.0, 5161.0, 12445.0, 35346.0, 158156.0, 3372465.0, 510553.0, 63027.0, 18662.0, 7044.0, 3257.0, 1615.0, 761.0, 402.0, 240.0, 127.0, 80.0, 34.0, 32.0, 23.0, 10.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.505859375, -3.401885986328125, -3.29791259765625, -3.193939208984375, -3.0899658203125, -2.985992431640625, -2.88201904296875, -2.778045654296875, -2.674072265625, -2.570098876953125, -2.46612548828125, -2.362152099609375, -2.2581787109375, -2.154205322265625, -2.05023193359375, -1.946258544921875, -1.84228515625, -1.738311767578125, -1.63433837890625, -1.530364990234375, -1.4263916015625, -1.322418212890625, -1.21844482421875, -1.114471435546875, -1.010498046875, -0.906524658203125, -0.80255126953125, -0.698577880859375, -0.5946044921875, -0.490631103515625, -0.38665771484375, -0.282684326171875, -0.1787109375, -0.074737548828125, 0.02923583984375, 0.133209228515625, 0.2371826171875, 0.341156005859375, 0.44512939453125, 0.549102783203125, 0.653076171875, 0.757049560546875, 0.86102294921875, 0.964996337890625, 1.0689697265625, 1.172943115234375, 1.27691650390625, 1.380889892578125, 1.48486328125, 1.588836669921875, 1.69281005859375, 1.796783447265625, 1.9007568359375, 2.004730224609375, 2.10870361328125, 2.212677001953125, 2.316650390625, 2.420623779296875, 2.52459716796875, 2.628570556640625, 2.7325439453125, 2.836517333984375, 2.94049072265625, 3.044464111328125, 3.1484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 4.0, 8.0, 8.0, 10.0, 8.0, 9.0, 17.0, 12.0, 28.0, 34.0, 36.0, 52.0, 57.0, 150.0, 263.0, 605.0, 1218.0, 702.0, 343.0, 148.0, 98.0, 61.0, 49.0, 30.0, 32.0, 22.0, 8.0, 10.0, 9.0, 4.0, 4.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.193359375, -3.095367431640625, -2.99737548828125, -2.899383544921875, -2.8013916015625, -2.703399658203125, -2.60540771484375, -2.507415771484375, -2.409423828125, -2.311431884765625, -2.21343994140625, -2.115447998046875, -2.0174560546875, -1.919464111328125, -1.82147216796875, -1.723480224609375, -1.62548828125, -1.527496337890625, -1.42950439453125, -1.331512451171875, -1.2335205078125, -1.135528564453125, -1.03753662109375, -0.939544677734375, -0.841552734375, -0.743560791015625, -0.64556884765625, -0.547576904296875, -0.4495849609375, -0.351593017578125, -0.25360107421875, -0.155609130859375, -0.0576171875, 0.040374755859375, 0.13836669921875, 0.236358642578125, 0.3343505859375, 0.432342529296875, 0.53033447265625, 0.628326416015625, 0.726318359375, 0.824310302734375, 0.92230224609375, 1.020294189453125, 1.1182861328125, 1.216278076171875, 1.31427001953125, 1.412261962890625, 1.51025390625, 1.608245849609375, 1.70623779296875, 1.804229736328125, 1.9022216796875, 2.000213623046875, 2.09820556640625, 2.196197509765625, 2.294189453125, 2.392181396484375, 2.49017333984375, 2.588165283203125, 2.6861572265625, 2.784149169921875, 2.88214111328125, 2.980133056640625, 3.078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 12.0, 27.0, 61.0, 142.0, 248.0, 269.0, 122.0, 51.0, 22.0, 13.0, 9.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.43701934814453, -44.16937255859375, -42.901729583740234, -41.63408279418945, -40.36643981933594, -39.098793029785156, -37.831146240234375, -36.563499450683594, -35.29585647583008, -34.0282096862793, -32.76056671142578, -31.492919921875, -30.22527503967285, -28.957630157470703, -27.689983367919922, -26.422338485717773, -25.154693603515625, -23.887048721313477, -22.619403839111328, -21.351757049560547, -20.0841121673584, -18.81646728515625, -17.54882049560547, -16.28117561340332, -15.013530731201172, -13.745885848999023, -12.478240013122559, -11.210594177246094, -9.942949295043945, -8.675304412841797, -7.407658576965332, -6.140012741088867, -4.872364044189453, -3.6047186851501465, -2.33707332611084, -1.0694279670715332, 0.19821739196777344, 1.46586275100708, 2.7335081100463867, 4.001153945922852, 5.268798828125, 6.536444187164307, 7.804089546203613, 9.071735382080078, 10.339380264282227, 11.607025146484375, 12.87467098236084, 14.142316818237305, 15.409961700439453, 16.6776065826416, 17.94525146484375, 19.21289825439453, 20.48054313659668, 21.748188018798828, 23.01583480834961, 24.283479690551758, 25.551124572753906, 26.818769454956055, 28.086414337158203, 29.354061126708984, 30.621706008911133, 31.88935089111328, 33.15699768066406, 34.424644470214844, 35.69228744506836]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 2.0, 6.0, 12.0, 8.0, 14.0, 12.0, 12.0, 15.0, 18.0, 25.0, 15.0, 27.0, 33.0, 31.0, 28.0, 25.0, 32.0, 44.0, 49.0, 51.0, 39.0, 50.0, 44.0, 43.0, 34.0, 37.0, 29.0, 37.0, 37.0, 29.0, 17.0, 25.0, 10.0, 18.0, 17.0, 14.0, 8.0, 8.0, 5.0, 6.0, 7.0, 6.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-11.222179412841797, -10.851251602172852, -10.480324745178223, -10.109396934509277, -9.738469123840332, -9.367541313171387, -8.996614456176758, -8.625686645507812, -8.254758834838867, -7.88383150100708, -7.512903690338135, -7.141976356506348, -6.771048545837402, -6.400121212005615, -6.029193878173828, -5.658266067504883, -5.287338733673096, -4.916411399841309, -4.545483589172363, -4.174556255340576, -3.803628444671631, -3.4327011108398438, -3.0617735385894775, -2.6908459663391113, -2.319918394088745, -1.948990821838379, -1.5780632495880127, -1.207135796546936, -0.8362082242965698, -0.4652806520462036, -0.09435319900512695, 0.27657437324523926, 0.6475019454956055, 1.0184295177459717, 1.389357089996338, 1.7602845430374146, 2.1312122344970703, 2.5021395683288574, 2.8730671405792236, 3.24399471282959, 3.614922285079956, 3.9858498573303223, 4.356777191162109, 4.727705001831055, 5.098632335662842, 5.469560146331787, 5.840487480163574, 6.2114152908325195, 6.582342624664307, 6.953269958496094, 7.324197769165039, 7.695125102996826, 8.066052436828613, 8.436980247497559, 8.807908058166504, 9.178834915161133, 9.549762725830078, 9.920690536499023, 10.291617393493652, 10.662545204162598, 11.033473014831543, 11.404400825500488, 11.775327682495117, 12.146255493164062, 12.517183303833008]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 7.0, 12.0, 11.0, 18.0, 32.0, 50.0, 51.0, 79.0, 120.0, 202.0, 270.0, 454.0, 690.0, 1187.0, 2099.0, 4123.0, 9196.0, 23504.0, 68653.0, 239542.0, 472439.0, 149015.0, 45895.0, 16540.0, 6794.0, 3165.0, 1706.0, 1022.0, 579.0, 344.0, 224.0, 155.0, 120.0, 71.0, 49.0, 38.0, 34.0, 19.0, 17.0, 9.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.361328125, -3.25732421875, -3.1533203125, -3.04931640625, -2.9453125, -2.84130859375, -2.7373046875, -2.63330078125, -2.529296875, -2.42529296875, -2.3212890625, -2.21728515625, -2.11328125, -2.00927734375, -1.9052734375, -1.80126953125, -1.697265625, -1.59326171875, -1.4892578125, -1.38525390625, -1.28125, -1.17724609375, -1.0732421875, -0.96923828125, -0.865234375, -0.76123046875, -0.6572265625, -0.55322265625, -0.44921875, -0.34521484375, -0.2412109375, -0.13720703125, -0.033203125, 0.07080078125, 0.1748046875, 0.27880859375, 0.3828125, 0.48681640625, 0.5908203125, 0.69482421875, 0.798828125, 0.90283203125, 1.0068359375, 1.11083984375, 1.21484375, 1.31884765625, 1.4228515625, 1.52685546875, 1.630859375, 1.73486328125, 1.8388671875, 1.94287109375, 2.046875, 2.15087890625, 2.2548828125, 2.35888671875, 2.462890625, 2.56689453125, 2.6708984375, 2.77490234375, 2.87890625, 2.98291015625, 3.0869140625, 3.19091796875, 3.294921875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 6.0, 8.0, 6.0, 11.0, 10.0, 31.0, 35.0, 30.0, 51.0, 56.0, 73.0, 75.0, 71.0, 75.0, 73.0, 75.0, 57.0, 49.0, 39.0, 37.0, 42.0, 28.0, 14.0, 20.0, 11.0, 7.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9340972900390625, -1.877960205078125, -1.8218231201171875, -1.76568603515625, -1.7095489501953125, -1.653411865234375, -1.5972747802734375, -1.5411376953125, -1.4850006103515625, -1.428863525390625, -1.3727264404296875, -1.31658935546875, -1.2604522705078125, -1.204315185546875, -1.1481781005859375, -1.092041015625, -1.0359039306640625, -0.979766845703125, -0.9236297607421875, -0.86749267578125, -0.8113555908203125, -0.755218505859375, -0.6990814208984375, -0.6429443359375, -0.5868072509765625, -0.530670166015625, -0.4745330810546875, -0.41839599609375, -0.3622589111328125, -0.306121826171875, -0.2499847412109375, -0.19384765625, -0.1377105712890625, -0.081573486328125, -0.0254364013671875, 0.03070068359375, 0.0868377685546875, 0.142974853515625, 0.1991119384765625, 0.2552490234375, 0.3113861083984375, 0.367523193359375, 0.4236602783203125, 0.47979736328125, 0.5359344482421875, 0.592071533203125, 0.6482086181640625, 0.704345703125, 0.7604827880859375, 0.816619873046875, 0.8727569580078125, 0.92889404296875, 0.9850311279296875, 1.041168212890625, 1.0973052978515625, 1.1534423828125, 1.2095794677734375, 1.265716552734375, 1.3218536376953125, 1.37799072265625, 1.4341278076171875, 1.490264892578125, 1.5464019775390625, 1.6025390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 9.0, 16.0, 24.0, 56.0, 71.0, 126.0, 227.0, 424.0, 963.0, 2951.0, 13287.0, 120502.0, 806950.0, 87760.0, 10877.0, 2563.0, 852.0, 417.0, 189.0, 105.0, 60.0, 36.0, 31.0, 13.0, 11.0, 6.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.66766357421875, -6.4486083984375, -6.22955322265625, -6.010498046875, -5.79144287109375, -5.5723876953125, -5.35333251953125, -5.13427734375, -4.91522216796875, -4.6961669921875, -4.47711181640625, -4.258056640625, -4.03900146484375, -3.8199462890625, -3.60089111328125, -3.3818359375, -3.16278076171875, -2.9437255859375, -2.72467041015625, -2.505615234375, -2.28656005859375, -2.0675048828125, -1.84844970703125, -1.62939453125, -1.41033935546875, -1.1912841796875, -0.97222900390625, -0.753173828125, -0.53411865234375, -0.3150634765625, -0.09600830078125, 0.123046875, 0.34210205078125, 0.5611572265625, 0.78021240234375, 0.999267578125, 1.21832275390625, 1.4373779296875, 1.65643310546875, 1.87548828125, 2.09454345703125, 2.3135986328125, 2.53265380859375, 2.751708984375, 2.97076416015625, 3.1898193359375, 3.40887451171875, 3.6279296875, 3.84698486328125, 4.0660400390625, 4.28509521484375, 4.504150390625, 4.72320556640625, 4.9422607421875, 5.16131591796875, 5.38037109375, 5.59942626953125, 5.8184814453125, 6.03753662109375, 6.256591796875, 6.47564697265625, 6.6947021484375, 6.91375732421875, 7.1328125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 1.0, 5.0, 8.0, 6.0, 5.0, 14.0, 9.0, 19.0, 25.0, 21.0, 26.0, 24.0, 30.0, 43.0, 42.0, 43.0, 45.0, 48.0, 63.0, 65.0, 41.0, 48.0, 41.0, 46.0, 31.0, 42.0, 42.0, 22.0, 23.0, 22.0, 20.0, 10.0, 13.0, 12.0, 11.0, 10.0, 5.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1171875, -3.97186279296875, -3.8265380859375, -3.68121337890625, -3.535888671875, -3.39056396484375, -3.2452392578125, -3.09991455078125, -2.95458984375, -2.80926513671875, -2.6639404296875, -2.51861572265625, -2.373291015625, -2.22796630859375, -2.0826416015625, -1.93731689453125, -1.7919921875, -1.64666748046875, -1.5013427734375, -1.35601806640625, -1.210693359375, -1.06536865234375, -0.9200439453125, -0.77471923828125, -0.62939453125, -0.48406982421875, -0.3387451171875, -0.19342041015625, -0.048095703125, 0.09722900390625, 0.2425537109375, 0.38787841796875, 0.533203125, 0.67852783203125, 0.8238525390625, 0.96917724609375, 1.114501953125, 1.25982666015625, 1.4051513671875, 1.55047607421875, 1.69580078125, 1.84112548828125, 1.9864501953125, 2.13177490234375, 2.277099609375, 2.42242431640625, 2.5677490234375, 2.71307373046875, 2.8583984375, 3.00372314453125, 3.1490478515625, 3.29437255859375, 3.439697265625, 3.58502197265625, 3.7303466796875, 3.87567138671875, 4.02099609375, 4.16632080078125, 4.3116455078125, 4.45697021484375, 4.602294921875, 4.74761962890625, 4.8929443359375, 5.03826904296875, 5.18359375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 4.0, 9.0, 6.0, 11.0, 14.0, 22.0, 59.0, 116.0, 236.0, 546.0, 1882.0, 11894.0, 307544.0, 703347.0, 19082.0, 2533.0, 672.0, 262.0, 117.0, 75.0, 37.0, 32.0, 14.0, 8.0, 3.0, 10.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.76171875, -3.660308837890625, -3.55889892578125, -3.457489013671875, -3.3560791015625, -3.254669189453125, -3.15325927734375, -3.051849365234375, -2.950439453125, -2.849029541015625, -2.74761962890625, -2.646209716796875, -2.5447998046875, -2.443389892578125, -2.34197998046875, -2.240570068359375, -2.13916015625, -2.037750244140625, -1.93634033203125, -1.834930419921875, -1.7335205078125, -1.632110595703125, -1.53070068359375, -1.429290771484375, -1.327880859375, -1.226470947265625, -1.12506103515625, -1.023651123046875, -0.9222412109375, -0.820831298828125, -0.71942138671875, -0.618011474609375, -0.5166015625, -0.415191650390625, -0.31378173828125, -0.212371826171875, -0.1109619140625, -0.009552001953125, 0.09185791015625, 0.193267822265625, 0.294677734375, 0.396087646484375, 0.49749755859375, 0.598907470703125, 0.7003173828125, 0.801727294921875, 0.90313720703125, 1.004547119140625, 1.10595703125, 1.207366943359375, 1.30877685546875, 1.410186767578125, 1.5115966796875, 1.613006591796875, 1.71441650390625, 1.815826416015625, 1.917236328125, 2.018646240234375, 2.12005615234375, 2.221466064453125, 2.3228759765625, 2.424285888671875, 2.52569580078125, 2.627105712890625, 2.728515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 14.0, 10.0, 18.0, 36.0, 34.0, 47.0, 58.0, 78.0, 113.0, 118.0, 111.0, 95.0, 63.0, 62.0, 34.0, 34.0, 15.0, 13.0, 14.0, 11.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00027108192443847656, -0.0002601146697998047, -0.0002491474151611328, -0.00023818016052246094, -0.00022721290588378906, -0.0002162456512451172, -0.0002052783966064453, -0.00019431114196777344, -0.00018334388732910156, -0.0001723766326904297, -0.0001614093780517578, -0.00015044212341308594, -0.00013947486877441406, -0.0001285076141357422, -0.00011754035949707031, -0.00010657310485839844, -9.560585021972656e-05, -8.463859558105469e-05, -7.367134094238281e-05, -6.270408630371094e-05, -5.173683166503906e-05, -4.076957702636719e-05, -2.9802322387695312e-05, -1.8835067749023438e-05, -7.867813110351562e-06, 3.0994415283203125e-06, 1.4066696166992188e-05, 2.5033950805664062e-05, 3.600120544433594e-05, 4.696846008300781e-05, 5.793571472167969e-05, 6.890296936035156e-05, 7.987022399902344e-05, 9.083747863769531e-05, 0.00010180473327636719, 0.00011277198791503906, 0.00012373924255371094, 0.0001347064971923828, 0.0001456737518310547, 0.00015664100646972656, 0.00016760826110839844, 0.0001785755157470703, 0.0001895427703857422, 0.00020051002502441406, 0.00021147727966308594, 0.0002224445343017578, 0.0002334117889404297, 0.00024437904357910156, 0.00025534629821777344, 0.0002663135528564453, 0.0002772808074951172, 0.00028824806213378906, 0.00029921531677246094, 0.0003101825714111328, 0.0003211498260498047, 0.00033211708068847656, 0.00034308433532714844, 0.0003540515899658203, 0.0003650188446044922, 0.00037598609924316406, 0.00038695335388183594, 0.0003979206085205078, 0.0004088878631591797, 0.00041985511779785156, 0.00043082237243652344]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 8.0, 12.0, 12.0, 16.0, 31.0, 42.0, 67.0, 113.0, 173.0, 327.0, 613.0, 1368.0, 4021.0, 18452.0, 171825.0, 767641.0, 68746.0, 10161.0, 2721.0, 1061.0, 460.0, 270.0, 167.0, 87.0, 53.0, 26.0, 23.0, 16.0, 16.0, 7.0, 10.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8828125, -1.818603515625, -1.75439453125, -1.690185546875, -1.6259765625, -1.561767578125, -1.49755859375, -1.433349609375, -1.369140625, -1.304931640625, -1.24072265625, -1.176513671875, -1.1123046875, -1.048095703125, -0.98388671875, -0.919677734375, -0.85546875, -0.791259765625, -0.72705078125, -0.662841796875, -0.5986328125, -0.534423828125, -0.47021484375, -0.406005859375, -0.341796875, -0.277587890625, -0.21337890625, -0.149169921875, -0.0849609375, -0.020751953125, 0.04345703125, 0.107666015625, 0.171875, 0.236083984375, 0.30029296875, 0.364501953125, 0.4287109375, 0.492919921875, 0.55712890625, 0.621337890625, 0.685546875, 0.749755859375, 0.81396484375, 0.878173828125, 0.9423828125, 1.006591796875, 1.07080078125, 1.135009765625, 1.19921875, 1.263427734375, 1.32763671875, 1.391845703125, 1.4560546875, 1.520263671875, 1.58447265625, 1.648681640625, 1.712890625, 1.777099609375, 1.84130859375, 1.905517578125, 1.9697265625, 2.033935546875, 2.09814453125, 2.162353515625, 2.2265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 8.0, 3.0, 9.0, 16.0, 16.0, 30.0, 33.0, 40.0, 35.0, 61.0, 56.0, 76.0, 98.0, 78.0, 76.0, 68.0, 63.0, 39.0, 40.0, 35.0, 16.0, 20.0, 24.0, 11.0, 4.0, 7.0, 10.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.9248046875, -1.8764495849609375, -1.828094482421875, -1.7797393798828125, -1.73138427734375, -1.6830291748046875, -1.634674072265625, -1.5863189697265625, -1.5379638671875, -1.4896087646484375, -1.441253662109375, -1.3928985595703125, -1.34454345703125, -1.2961883544921875, -1.247833251953125, -1.1994781494140625, -1.151123046875, -1.1027679443359375, -1.054412841796875, -1.0060577392578125, -0.95770263671875, -0.9093475341796875, -0.860992431640625, -0.8126373291015625, -0.7642822265625, -0.7159271240234375, -0.667572021484375, -0.6192169189453125, -0.57086181640625, -0.5225067138671875, -0.474151611328125, -0.4257965087890625, -0.37744140625, -0.3290863037109375, -0.280731201171875, -0.2323760986328125, -0.18402099609375, -0.1356658935546875, -0.087310791015625, -0.0389556884765625, 0.0093994140625, 0.0577545166015625, 0.106109619140625, 0.1544647216796875, 0.20281982421875, 0.2511749267578125, 0.299530029296875, 0.3478851318359375, 0.396240234375, 0.4445953369140625, 0.492950439453125, 0.5413055419921875, 0.58966064453125, 0.6380157470703125, 0.686370849609375, 0.7347259521484375, 0.7830810546875, 0.8314361572265625, 0.879791259765625, 0.9281463623046875, 0.97650146484375, 1.0248565673828125, 1.073211669921875, 1.1215667724609375, 1.169921875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 8.0, 14.0, 53.0, 131.0, 345.0, 291.0, 113.0, 30.0, 15.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.91323852539062, -71.73523712158203, -69.5572280883789, -67.37922668457031, -65.20121765136719, -63.023216247558594, -60.845211029052734, -58.667205810546875, -56.48920440673828, -54.31119918823242, -52.13319396972656, -49.95519256591797, -47.77718734741211, -45.59918212890625, -43.42117691040039, -41.24317169189453, -39.06516647338867, -36.88716125488281, -34.70915603637695, -32.531150817871094, -30.3531494140625, -28.17514419555664, -25.99713897705078, -23.819133758544922, -21.641130447387695, -19.463125228881836, -17.28512191772461, -15.10711669921875, -12.929112434387207, -10.751108169555664, -8.573102951049805, -6.395098686218262, -4.217094421386719, -2.0390899181365967, 0.1389145851135254, 2.3169193267822266, 4.4949235916137695, 6.6729278564453125, 8.850933074951172, 11.028937339782715, 13.206941604614258, 15.3849458694458, 17.562950134277344, 19.740955352783203, 21.918960571289062, 24.09696388244629, 26.27496910095215, 28.452972412109375, 30.630977630615234, 32.808982849121094, 34.98698806762695, 37.16499328613281, 39.342994689941406, 41.520999908447266, 43.699005126953125, 45.877010345458984, 48.055015563964844, 50.2330207824707, 52.41102600097656, 54.589027404785156, 56.767032623291016, 58.945037841796875, 61.123043060302734, 63.301048278808594, 65.47904968261719]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 8.0, 9.0, 10.0, 9.0, 15.0, 23.0, 22.0, 16.0, 31.0, 28.0, 31.0, 29.0, 41.0, 46.0, 62.0, 68.0, 69.0, 59.0, 64.0, 37.0, 30.0, 51.0, 36.0, 43.0, 31.0, 21.0, 21.0, 24.0, 15.0, 13.0, 7.0, 4.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.756563186645508, -21.063051223754883, -20.369537353515625, -19.676025390625, -18.982513427734375, -18.288999557495117, -17.595487594604492, -16.901973724365234, -16.20846176147461, -15.514948844909668, -14.821435928344727, -14.127923965454102, -13.43441104888916, -12.740898132324219, -12.047386169433594, -11.353873252868652, -10.660360336303711, -9.96684741973877, -9.273334503173828, -8.579822540283203, -7.886309623718262, -7.19279670715332, -6.499284267425537, -5.805771827697754, -5.1122589111328125, -4.418745994567871, -3.725233554840088, -3.0317208766937256, -2.3382081985473633, -1.644695520401001, -0.9511828422546387, -0.25767040252685547, 0.43584442138671875, 1.129357099533081, 1.8228697776794434, 2.5163824558258057, 3.209895133972168, 3.9034078121185303, 4.596920490264893, 5.290432929992676, 5.983945846557617, 6.677458763122559, 7.370971202850342, 8.064483642578125, 8.757996559143066, 9.451509475708008, 10.145021438598633, 10.838534355163574, 11.532047271728516, 12.225560188293457, 12.919073104858398, 13.612585067749023, 14.306097984313965, 14.999610900878906, 15.693122863769531, 16.386634826660156, 17.080148696899414, 17.77366065979004, 18.467174530029297, 19.160686492919922, 19.854198455810547, 20.547712326049805, 21.24122428894043, 21.934738159179688, 22.628250122070312]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 8.0, 15.0, 9.0, 20.0, 25.0, 32.0, 49.0, 76.0, 131.0, 250.0, 419.0, 823.0, 1640.0, 3729.0, 9186.0, 26044.0, 103478.0, 1071102.0, 2673471.0, 233502.0, 45767.0, 14388.0, 5687.0, 2334.0, 1089.0, 480.0, 258.0, 118.0, 77.0, 31.0, 14.0, 10.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62109375, -2.5604248046875, -2.499755859375, -2.4390869140625, -2.37841796875, -2.3177490234375, -2.257080078125, -2.1964111328125, -2.1357421875, -2.0750732421875, -2.014404296875, -1.9537353515625, -1.89306640625, -1.8323974609375, -1.771728515625, -1.7110595703125, -1.650390625, -1.5897216796875, -1.529052734375, -1.4683837890625, -1.40771484375, -1.3470458984375, -1.286376953125, -1.2257080078125, -1.1650390625, -1.1043701171875, -1.043701171875, -0.9830322265625, -0.92236328125, -0.8616943359375, -0.801025390625, -0.7403564453125, -0.6796875, -0.6190185546875, -0.558349609375, -0.4976806640625, -0.43701171875, -0.3763427734375, -0.315673828125, -0.2550048828125, -0.1943359375, -0.1336669921875, -0.072998046875, -0.0123291015625, 0.04833984375, 0.1090087890625, 0.169677734375, 0.2303466796875, 0.291015625, 0.3516845703125, 0.412353515625, 0.4730224609375, 0.53369140625, 0.5943603515625, 0.655029296875, 0.7156982421875, 0.7763671875, 0.8370361328125, 0.897705078125, 0.9583740234375, 1.01904296875, 1.0797119140625, 1.140380859375, 1.2010498046875, 1.26171875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 10.0, 16.0, 16.0, 22.0, 34.0, 34.0, 63.0, 66.0, 67.0, 79.0, 75.0, 88.0, 84.0, 65.0, 78.0, 52.0, 41.0, 33.0, 23.0, 24.0, 18.0, 9.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6484375, -2.5921859741210938, -2.5359344482421875, -2.4796829223632812, -2.423431396484375, -2.3671798706054688, -2.3109283447265625, -2.2546768188476562, -2.19842529296875, -2.1421737670898438, -2.0859222412109375, -2.0296707153320312, -1.973419189453125, -1.9171676635742188, -1.8609161376953125, -1.8046646118164062, -1.7484130859375, -1.6921615600585938, -1.6359100341796875, -1.5796585083007812, -1.523406982421875, -1.4671554565429688, -1.4109039306640625, -1.3546524047851562, -1.29840087890625, -1.2421493530273438, -1.1858978271484375, -1.1296463012695312, -1.073394775390625, -1.0171432495117188, -0.9608917236328125, -0.9046401977539062, -0.848388671875, -0.7921371459960938, -0.7358856201171875, -0.6796340942382812, -0.623382568359375, -0.5671310424804688, -0.5108795166015625, -0.45462799072265625, -0.39837646484375, -0.34212493896484375, -0.2858734130859375, -0.22962188720703125, -0.173370361328125, -0.11711883544921875, -0.0608673095703125, -0.00461578369140625, 0.0516357421875, 0.10788726806640625, 0.1641387939453125, 0.22039031982421875, 0.276641845703125, 0.33289337158203125, 0.3891448974609375, 0.44539642333984375, 0.50164794921875, 0.5578994750976562, 0.6141510009765625, 0.6704025268554688, 0.726654052734375, 0.7829055786132812, 0.8391571044921875, 0.8954086303710938, 0.95166015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 12.0, 16.0, 13.0, 21.0, 44.0, 39.0, 96.0, 144.0, 251.0, 441.0, 953.0, 2061.0, 5204.0, 15182.0, 55558.0, 343458.0, 3334046.0, 344052.0, 61234.0, 18282.0, 6875.0, 2989.0, 1388.0, 763.0, 430.0, 246.0, 163.0, 98.0, 66.0, 39.0, 31.0, 22.0, 11.0, 10.0, 8.0, 7.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.662109375, -2.57757568359375, -2.4930419921875, -2.40850830078125, -2.323974609375, -2.23944091796875, -2.1549072265625, -2.07037353515625, -1.98583984375, -1.90130615234375, -1.8167724609375, -1.73223876953125, -1.647705078125, -1.56317138671875, -1.4786376953125, -1.39410400390625, -1.3095703125, -1.22503662109375, -1.1405029296875, -1.05596923828125, -0.971435546875, -0.88690185546875, -0.8023681640625, -0.71783447265625, -0.63330078125, -0.54876708984375, -0.4642333984375, -0.37969970703125, -0.295166015625, -0.21063232421875, -0.1260986328125, -0.04156494140625, 0.04296875, 0.12750244140625, 0.2120361328125, 0.29656982421875, 0.381103515625, 0.46563720703125, 0.5501708984375, 0.63470458984375, 0.71923828125, 0.80377197265625, 0.8883056640625, 0.97283935546875, 1.057373046875, 1.14190673828125, 1.2264404296875, 1.31097412109375, 1.3955078125, 1.48004150390625, 1.5645751953125, 1.64910888671875, 1.733642578125, 1.81817626953125, 1.9027099609375, 1.98724365234375, 2.07177734375, 2.15631103515625, 2.2408447265625, 2.32537841796875, 2.409912109375, 2.49444580078125, 2.5789794921875, 2.66351318359375, 2.748046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 0.0, 8.0, 9.0, 6.0, 15.0, 9.0, 19.0, 19.0, 28.0, 45.0, 47.0, 74.0, 87.0, 172.0, 225.0, 412.0, 764.0, 744.0, 455.0, 256.0, 160.0, 105.0, 102.0, 74.0, 36.0, 40.0, 31.0, 23.0, 19.0, 14.0, 10.0, 16.0, 12.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.169921875, -2.086669921875, -2.00341796875, -1.920166015625, -1.8369140625, -1.753662109375, -1.67041015625, -1.587158203125, -1.50390625, -1.420654296875, -1.33740234375, -1.254150390625, -1.1708984375, -1.087646484375, -1.00439453125, -0.921142578125, -0.837890625, -0.754638671875, -0.67138671875, -0.588134765625, -0.5048828125, -0.421630859375, -0.33837890625, -0.255126953125, -0.171875, -0.088623046875, -0.00537109375, 0.077880859375, 0.1611328125, 0.244384765625, 0.32763671875, 0.410888671875, 0.494140625, 0.577392578125, 0.66064453125, 0.743896484375, 0.8271484375, 0.910400390625, 0.99365234375, 1.076904296875, 1.16015625, 1.243408203125, 1.32666015625, 1.409912109375, 1.4931640625, 1.576416015625, 1.65966796875, 1.742919921875, 1.826171875, 1.909423828125, 1.99267578125, 2.075927734375, 2.1591796875, 2.242431640625, 2.32568359375, 2.408935546875, 2.4921875, 2.575439453125, 2.65869140625, 2.741943359375, 2.8251953125, 2.908447265625, 2.99169921875, 3.074951171875, 3.158203125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 43.0, 134.0, 329.0, 294.0, 107.0, 38.0, 11.0, 11.0, 8.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.229286193847656, -28.30753517150879, -26.385784149169922, -24.464035034179688, -22.542282104492188, -20.620532989501953, -18.698781967163086, -16.77703094482422, -14.855279922485352, -12.933528900146484, -11.011777877807617, -9.090027809143066, -7.168276786804199, -5.246525764465332, -3.3247756958007812, -1.403024673461914, 0.5187263488769531, 2.440477132797241, 4.362227916717529, 6.283978462219238, 8.205729484558105, 10.127480506896973, 12.049230575561523, 13.97098159790039, 15.892732620239258, 17.814483642578125, 19.736234664916992, 21.65798568725586, 23.579734802246094, 25.501487731933594, 27.423236846923828, 29.344987869262695, 31.266738891601562, 33.1884880065918, 35.1102409362793, 37.03199005126953, 38.95374298095703, 40.875492095947266, 42.7972412109375, 44.718994140625, 46.6407470703125, 48.562496185302734, 50.484249114990234, 52.40599822998047, 54.32775115966797, 56.2495002746582, 58.17124938964844, 60.09300231933594, 62.01475143432617, 63.936500549316406, 65.8582534790039, 67.7800064086914, 69.70175170898438, 71.62350463867188, 73.54525756835938, 75.46701049804688, 77.38875579833984, 79.31050872802734, 81.23225402832031, 83.15400695800781, 85.07575988769531, 86.99751281738281, 88.91925811767578, 90.84101104736328, 92.76276397705078]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 9.0, 8.0, 9.0, 15.0, 15.0, 26.0, 33.0, 48.0, 34.0, 66.0, 61.0, 67.0, 54.0, 59.0, 62.0, 56.0, 61.0, 63.0, 46.0, 34.0, 27.0, 30.0, 22.0, 24.0, 17.0, 14.0, 11.0, 6.0, 4.0, 8.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.80950927734375, -16.142671585083008, -15.475834846496582, -14.808998107910156, -14.142160415649414, -13.475323677062988, -12.808486938476562, -12.14164924621582, -11.474812507629395, -10.807975769042969, -10.141138076782227, -9.4743013381958, -8.807464599609375, -8.140626907348633, -7.473790168762207, -6.806952953338623, -6.140115737915039, -5.473278522491455, -4.806441307067871, -4.139604568481445, -3.4727673530578613, -2.8059301376342773, -2.1390933990478516, -1.4722561836242676, -0.8054189682006836, -0.13858187198638916, 0.5282552242279053, 1.1950922012329102, 1.8619294166564941, 2.528766632080078, 3.195603370666504, 3.862440586090088, 4.529279708862305, 5.196116924285889, 5.862954139709473, 6.529790878295898, 7.196628093719482, 7.863465309143066, 8.530302047729492, 9.197139739990234, 9.86397647857666, 10.530813217163086, 11.197650909423828, 11.864487648010254, 12.53132438659668, 13.198162078857422, 13.864998817443848, 14.531835556030273, 15.198673248291016, 15.865509986877441, 16.532346725463867, 17.19918441772461, 17.86602210998535, 18.532859802246094, 19.199695587158203, 19.866533279418945, 20.533370971679688, 21.20020866394043, 21.86704444885254, 22.53388214111328, 23.200719833374023, 23.867557525634766, 24.534393310546875, 25.201231002807617, 25.868066787719727]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 7.0, 6.0, 15.0, 14.0, 35.0, 43.0, 57.0, 78.0, 116.0, 175.0, 293.0, 441.0, 803.0, 1429.0, 2742.0, 5090.0, 10122.0, 21371.0, 46154.0, 103427.0, 244941.0, 338307.0, 148890.0, 64969.0, 29868.0, 14309.0, 6758.0, 3563.0, 1820.0, 1088.0, 607.0, 356.0, 218.0, 131.0, 108.0, 53.0, 45.0, 36.0, 17.0, 13.0, 14.0, 6.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.30078125, -2.2293701171875, -2.157958984375, -2.0865478515625, -2.01513671875, -1.9437255859375, -1.872314453125, -1.8009033203125, -1.7294921875, -1.6580810546875, -1.586669921875, -1.5152587890625, -1.44384765625, -1.3724365234375, -1.301025390625, -1.2296142578125, -1.158203125, -1.0867919921875, -1.015380859375, -0.9439697265625, -0.87255859375, -0.8011474609375, -0.729736328125, -0.6583251953125, -0.5869140625, -0.5155029296875, -0.444091796875, -0.3726806640625, -0.30126953125, -0.2298583984375, -0.158447265625, -0.0870361328125, -0.015625, 0.0557861328125, 0.127197265625, 0.1986083984375, 0.27001953125, 0.3414306640625, 0.412841796875, 0.4842529296875, 0.5556640625, 0.6270751953125, 0.698486328125, 0.7698974609375, 0.84130859375, 0.9127197265625, 0.984130859375, 1.0555419921875, 1.126953125, 1.1983642578125, 1.269775390625, 1.3411865234375, 1.41259765625, 1.4840087890625, 1.555419921875, 1.6268310546875, 1.6982421875, 1.7696533203125, 1.841064453125, 1.9124755859375, 1.98388671875, 2.0552978515625, 2.126708984375, 2.1981201171875, 2.26953125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 5.0, 3.0, 8.0, 20.0, 8.0, 12.0, 15.0, 14.0, 22.0, 36.0, 30.0, 37.0, 29.0, 32.0, 33.0, 34.0, 40.0, 46.0, 47.0, 42.0, 51.0, 50.0, 36.0, 39.0, 42.0, 40.0, 21.0, 25.0, 30.0, 14.0, 16.0, 14.0, 17.0, 18.0, 11.0, 6.0, 12.0, 10.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.9296875, -0.9017715454101562, -0.8738555908203125, -0.8459396362304688, -0.818023681640625, -0.7901077270507812, -0.7621917724609375, -0.7342758178710938, -0.70635986328125, -0.6784439086914062, -0.6505279541015625, -0.6226119995117188, -0.594696044921875, -0.5667800903320312, -0.5388641357421875, -0.5109481811523438, -0.4830322265625, -0.45511627197265625, -0.4272003173828125, -0.39928436279296875, -0.371368408203125, -0.34345245361328125, -0.3155364990234375, -0.28762054443359375, -0.25970458984375, -0.23178863525390625, -0.2038726806640625, -0.17595672607421875, -0.148040771484375, -0.12012481689453125, -0.0922088623046875, -0.06429290771484375, -0.036376953125, -0.00846099853515625, 0.0194549560546875, 0.04737091064453125, 0.075286865234375, 0.10320281982421875, 0.1311187744140625, 0.15903472900390625, 0.18695068359375, 0.21486663818359375, 0.2427825927734375, 0.27069854736328125, 0.298614501953125, 0.32653045654296875, 0.3544464111328125, 0.38236236572265625, 0.4102783203125, 0.43819427490234375, 0.4661102294921875, 0.49402618408203125, 0.521942138671875, 0.5498580932617188, 0.5777740478515625, 0.6056900024414062, 0.63360595703125, 0.6615219116210938, 0.6894378662109375, 0.7173538208007812, 0.745269775390625, 0.7731857299804688, 0.8011016845703125, 0.8290176391601562, 0.85693359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 8.0, 6.0, 8.0, 10.0, 12.0, 17.0, 24.0, 31.0, 40.0, 53.0, 85.0, 125.0, 152.0, 206.0, 331.0, 528.0, 805.0, 1306.0, 2348.0, 4733.0, 12647.0, 48594.0, 259469.0, 593513.0, 89179.0, 20119.0, 6637.0, 3007.0, 1655.0, 974.0, 623.0, 408.0, 251.0, 187.0, 125.0, 98.0, 53.0, 52.0, 37.0, 33.0, 24.0, 11.0, 10.0, 5.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.537109375, -3.4237060546875, -3.310302734375, -3.1968994140625, -3.08349609375, -2.9700927734375, -2.856689453125, -2.7432861328125, -2.6298828125, -2.5164794921875, -2.403076171875, -2.2896728515625, -2.17626953125, -2.0628662109375, -1.949462890625, -1.8360595703125, -1.72265625, -1.6092529296875, -1.495849609375, -1.3824462890625, -1.26904296875, -1.1556396484375, -1.042236328125, -0.9288330078125, -0.8154296875, -0.7020263671875, -0.588623046875, -0.4752197265625, -0.36181640625, -0.2484130859375, -0.135009765625, -0.0216064453125, 0.091796875, 0.2052001953125, 0.318603515625, 0.4320068359375, 0.54541015625, 0.6588134765625, 0.772216796875, 0.8856201171875, 0.9990234375, 1.1124267578125, 1.225830078125, 1.3392333984375, 1.45263671875, 1.5660400390625, 1.679443359375, 1.7928466796875, 1.90625, 2.0196533203125, 2.133056640625, 2.2464599609375, 2.35986328125, 2.4732666015625, 2.586669921875, 2.7000732421875, 2.8134765625, 2.9268798828125, 3.040283203125, 3.1536865234375, 3.26708984375, 3.3804931640625, 3.493896484375, 3.6072998046875, 3.720703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 9.0, 16.0, 7.0, 14.0, 17.0, 20.0, 29.0, 31.0, 38.0, 39.0, 47.0, 60.0, 48.0, 59.0, 60.0, 60.0, 64.0, 56.0, 42.0, 36.0, 33.0, 33.0, 30.0, 19.0, 27.0, 22.0, 20.0, 11.0, 10.0, 8.0, 10.0, 6.0, 6.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.484375, -5.32757568359375, -5.1707763671875, -5.01397705078125, -4.857177734375, -4.70037841796875, -4.5435791015625, -4.38677978515625, -4.22998046875, -4.07318115234375, -3.9163818359375, -3.75958251953125, -3.602783203125, -3.44598388671875, -3.2891845703125, -3.13238525390625, -2.9755859375, -2.81878662109375, -2.6619873046875, -2.50518798828125, -2.348388671875, -2.19158935546875, -2.0347900390625, -1.87799072265625, -1.72119140625, -1.56439208984375, -1.4075927734375, -1.25079345703125, -1.093994140625, -0.93719482421875, -0.7803955078125, -0.62359619140625, -0.466796875, -0.30999755859375, -0.1531982421875, 0.00360107421875, 0.160400390625, 0.31719970703125, 0.4739990234375, 0.63079833984375, 0.78759765625, 0.94439697265625, 1.1011962890625, 1.25799560546875, 1.414794921875, 1.57159423828125, 1.7283935546875, 1.88519287109375, 2.0419921875, 2.19879150390625, 2.3555908203125, 2.51239013671875, 2.669189453125, 2.82598876953125, 2.9827880859375, 3.13958740234375, 3.29638671875, 3.45318603515625, 3.6099853515625, 3.76678466796875, 3.923583984375, 4.08038330078125, 4.2371826171875, 4.39398193359375, 4.55078125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 14.0, 15.0, 41.0, 75.0, 166.0, 549.0, 2456.0, 32285.0, 958304.0, 50620.0, 3067.0, 581.0, 209.0, 95.0, 26.0, 22.0, 7.0, 3.0, 8.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.482879638671875, -2.38177490234375, -2.280670166015625, -2.1795654296875, -2.078460693359375, -1.97735595703125, -1.876251220703125, -1.775146484375, -1.674041748046875, -1.57293701171875, -1.471832275390625, -1.3707275390625, -1.269622802734375, -1.16851806640625, -1.067413330078125, -0.96630859375, -0.865203857421875, -0.76409912109375, -0.662994384765625, -0.5618896484375, -0.460784912109375, -0.35968017578125, -0.258575439453125, -0.157470703125, -0.056365966796875, 0.04473876953125, 0.145843505859375, 0.2469482421875, 0.348052978515625, 0.44915771484375, 0.550262451171875, 0.6513671875, 0.752471923828125, 0.85357666015625, 0.954681396484375, 1.0557861328125, 1.156890869140625, 1.25799560546875, 1.359100341796875, 1.460205078125, 1.561309814453125, 1.66241455078125, 1.763519287109375, 1.8646240234375, 1.965728759765625, 2.06683349609375, 2.167938232421875, 2.26904296875, 2.370147705078125, 2.47125244140625, 2.572357177734375, 2.6734619140625, 2.774566650390625, 2.87567138671875, 2.976776123046875, 3.077880859375, 3.178985595703125, 3.28009033203125, 3.381195068359375, 3.4822998046875, 3.583404541015625, 3.68450927734375, 3.785614013671875, 3.88671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 12.0, 24.0, 20.0, 34.0, 52.0, 72.0, 125.0, 163.0, 140.0, 103.0, 78.0, 54.0, 39.0, 24.0, 11.0, 9.0, 12.0, 6.0, 7.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006084442138671875, -0.0005939304828643799, -0.0005794167518615723, -0.0005649030208587646, -0.000550389289855957, -0.0005358755588531494, -0.0005213618278503418, -0.0005068480968475342, -0.0004923343658447266, -0.00047782063484191895, -0.00046330690383911133, -0.0004487931728363037, -0.0004342794418334961, -0.0004197657108306885, -0.00040525197982788086, -0.00039073824882507324, -0.0003762245178222656, -0.000361710786819458, -0.0003471970558166504, -0.0003326833248138428, -0.00031816959381103516, -0.00030365586280822754, -0.0002891421318054199, -0.0002746284008026123, -0.0002601146697998047, -0.00024560093879699707, -0.00023108720779418945, -0.00021657347679138184, -0.00020205974578857422, -0.0001875460147857666, -0.00017303228378295898, -0.00015851855278015137, -0.00014400482177734375, -0.00012949109077453613, -0.00011497735977172852, -0.0001004636287689209, -8.594989776611328e-05, -7.143616676330566e-05, -5.692243576049805e-05, -4.240870475769043e-05, -2.7894973754882812e-05, -1.3381242752075195e-05, 1.1324882507324219e-06, 1.564621925354004e-05, 3.0159950256347656e-05, 4.4673681259155273e-05, 5.918741226196289e-05, 7.370114326477051e-05, 8.821487426757812e-05, 0.00010272860527038574, 0.00011724233627319336, 0.00013175606727600098, 0.0001462697982788086, 0.0001607835292816162, 0.00017529726028442383, 0.00018981099128723145, 0.00020432472229003906, 0.00021883845329284668, 0.0002333521842956543, 0.0002478659152984619, 0.00026237964630126953, 0.00027689337730407715, 0.00029140710830688477, 0.0003059208393096924, 0.0003204345703125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 3.0, 7.0, 10.0, 18.0, 20.0, 21.0, 36.0, 57.0, 90.0, 121.0, 131.0, 220.0, 335.0, 543.0, 952.0, 1760.0, 3531.0, 8749.0, 27526.0, 140490.0, 669361.0, 148433.0, 29300.0, 8741.0, 3652.0, 1728.0, 997.0, 571.0, 344.0, 237.0, 148.0, 100.0, 78.0, 57.0, 48.0, 29.0, 26.0, 11.0, 21.0, 11.0, 7.0, 6.0, 10.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.97802734375, -0.9459762573242188, -0.9139251708984375, -0.8818740844726562, -0.849822998046875, -0.8177719116210938, -0.7857208251953125, -0.7536697387695312, -0.72161865234375, -0.6895675659179688, -0.6575164794921875, -0.6254653930664062, -0.593414306640625, -0.5613632202148438, -0.5293121337890625, -0.49726104736328125, -0.4652099609375, -0.43315887451171875, -0.4011077880859375, -0.36905670166015625, -0.337005615234375, -0.30495452880859375, -0.2729034423828125, -0.24085235595703125, -0.20880126953125, -0.17675018310546875, -0.1446990966796875, -0.11264801025390625, -0.080596923828125, -0.04854583740234375, -0.0164947509765625, 0.01555633544921875, 0.047607421875, 0.07965850830078125, 0.1117095947265625, 0.14376068115234375, 0.175811767578125, 0.20786285400390625, 0.2399139404296875, 0.27196502685546875, 0.30401611328125, 0.33606719970703125, 0.3681182861328125, 0.40016937255859375, 0.432220458984375, 0.46427154541015625, 0.4963226318359375, 0.5283737182617188, 0.5604248046875, 0.5924758911132812, 0.6245269775390625, 0.6565780639648438, 0.688629150390625, 0.7206802368164062, 0.7527313232421875, 0.7847824096679688, 0.81683349609375, 0.8488845825195312, 0.8809356689453125, 0.9129867553710938, 0.945037841796875, 0.9770889282226562, 1.0091400146484375, 1.0411911010742188, 1.0732421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 6.0, 4.0, 8.0, 6.0, 8.0, 8.0, 12.0, 22.0, 18.0, 36.0, 30.0, 37.0, 42.0, 56.0, 54.0, 59.0, 63.0, 66.0, 71.0, 62.0, 46.0, 46.0, 31.0, 49.0, 29.0, 29.0, 30.0, 14.0, 16.0, 8.0, 3.0, 8.0, 4.0, 3.0, 7.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0380859375, -1.0048675537109375, -0.971649169921875, -0.9384307861328125, -0.90521240234375, -0.8719940185546875, -0.838775634765625, -0.8055572509765625, -0.7723388671875, -0.7391204833984375, -0.705902099609375, -0.6726837158203125, -0.63946533203125, -0.6062469482421875, -0.573028564453125, -0.5398101806640625, -0.506591796875, -0.4733734130859375, -0.440155029296875, -0.4069366455078125, -0.37371826171875, -0.3404998779296875, -0.307281494140625, -0.2740631103515625, -0.2408447265625, -0.2076263427734375, -0.174407958984375, -0.1411895751953125, -0.10797119140625, -0.0747528076171875, -0.041534423828125, -0.0083160400390625, 0.02490234375, 0.0581207275390625, 0.091339111328125, 0.1245574951171875, 0.15777587890625, 0.1909942626953125, 0.224212646484375, 0.2574310302734375, 0.2906494140625, 0.3238677978515625, 0.357086181640625, 0.3903045654296875, 0.42352294921875, 0.4567413330078125, 0.489959716796875, 0.5231781005859375, 0.556396484375, 0.5896148681640625, 0.622833251953125, 0.6560516357421875, 0.68927001953125, 0.7224884033203125, 0.755706787109375, 0.7889251708984375, 0.8221435546875, 0.8553619384765625, 0.888580322265625, 0.9217987060546875, 0.95501708984375, 0.9882354736328125, 1.021453857421875, 1.0546722412109375, 1.087890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 4.0, 16.0, 22.0, 35.0, 66.0, 89.0, 126.0, 248.0, 138.0, 94.0, 51.0, 41.0, 21.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.20698165893555, -35.37528610229492, -34.54359436035156, -33.71189880371094, -32.88020324707031, -32.04851150512695, -31.216815948486328, -30.385122299194336, -29.553428649902344, -28.72173500061035, -27.890039443969727, -27.058345794677734, -26.226652145385742, -25.39495849609375, -24.563262939453125, -23.731569290161133, -22.899873733520508, -22.068180084228516, -21.23648452758789, -20.4047908782959, -19.573097229003906, -18.74140167236328, -17.90970802307129, -17.078014373779297, -16.246318817138672, -15.414624214172363, -14.582930564880371, -13.751235961914062, -12.91954231262207, -12.087847709655762, -11.256153106689453, -10.424459457397461, -9.592767715454102, -8.761073112487793, -7.929379463195801, -7.097684860229492, -6.265990734100342, -5.434296607971191, -4.602602005004883, -3.7709078788757324, -2.939213752746582, -2.1075196266174316, -1.2758252620697021, -0.44413089752197266, 0.38756322860717773, 1.2192573547363281, 2.0509519577026367, 2.882646083831787, 3.7143402099609375, 4.546034336090088, 5.377728462219238, 6.209423065185547, 7.041117191314697, 7.872811317443848, 8.704505920410156, 9.536199569702148, 10.367894172668457, 11.199588775634766, 12.031282424926758, 12.862977027893066, 13.694671630859375, 14.526365280151367, 15.358059883117676, 16.189754486083984, 17.021448135375977]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 11.0, 5.0, 6.0, 16.0, 12.0, 12.0, 18.0, 24.0, 28.0, 26.0, 18.0, 32.0, 38.0, 34.0, 48.0, 62.0, 73.0, 74.0, 73.0, 41.0, 33.0, 41.0, 45.0, 30.0, 33.0, 30.0, 17.0, 19.0, 17.0, 20.0, 10.0, 8.0, 10.0, 7.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.68695068359375, -16.132951736450195, -15.57895278930664, -15.02495288848877, -14.470953941345215, -13.91695499420166, -13.362955093383789, -12.808956146240234, -12.25495719909668, -11.700958251953125, -11.14695930480957, -10.5929594039917, -10.038960456848145, -9.48496150970459, -8.930961608886719, -8.376962661743164, -7.822963714599609, -7.268964767456055, -6.714965343475342, -6.160965919494629, -5.606966972351074, -5.0529680252075195, -4.498968601226807, -3.944969415664673, -3.390970230102539, -2.8369710445404053, -2.2829718589782715, -1.7289726734161377, -1.174973487854004, -0.6209743022918701, -0.06697511672973633, 0.48702406883239746, 1.0410232543945312, 1.595022439956665, 2.149021625518799, 2.7030208110809326, 3.2570199966430664, 3.8110191822052, 4.365018367767334, 4.919017791748047, 5.473016738891602, 6.027015686035156, 6.581015110015869, 7.135014533996582, 7.689013481140137, 8.243012428283691, 8.797012329101562, 9.351011276245117, 9.905010223388672, 10.459009170532227, 11.013008117675781, 11.567008018493652, 12.121006965637207, 12.675005912780762, 13.229005813598633, 13.783004760742188, 14.337003707885742, 14.891002655029297, 15.445001602172852, 15.999001502990723, 16.553001403808594, 17.10700035095215, 17.660999298095703, 18.214998245239258, 18.768997192382812]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 10.0, 13.0, 17.0, 39.0, 53.0, 70.0, 108.0, 183.0, 309.0, 557.0, 986.0, 1872.0, 3613.0, 7145.0, 15603.0, 39884.0, 145500.0, 955857.0, 2497802.0, 398509.0, 77882.0, 26307.0, 11134.0, 5103.0, 2590.0, 1338.0, 759.0, 417.0, 217.0, 154.0, 95.0, 60.0, 21.0, 21.0, 18.0, 9.0, 11.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5, -1.4586639404296875, -1.417327880859375, -1.3759918212890625, -1.33465576171875, -1.2933197021484375, -1.251983642578125, -1.2106475830078125, -1.1693115234375, -1.1279754638671875, -1.086639404296875, -1.0453033447265625, -1.00396728515625, -0.9626312255859375, -0.921295166015625, -0.8799591064453125, -0.838623046875, -0.7972869873046875, -0.755950927734375, -0.7146148681640625, -0.67327880859375, -0.6319427490234375, -0.590606689453125, -0.5492706298828125, -0.5079345703125, -0.4665985107421875, -0.425262451171875, -0.3839263916015625, -0.34259033203125, -0.3012542724609375, -0.259918212890625, -0.2185821533203125, -0.17724609375, -0.1359100341796875, -0.094573974609375, -0.0532379150390625, -0.01190185546875, 0.0294342041015625, 0.070770263671875, 0.1121063232421875, 0.1534423828125, 0.1947784423828125, 0.236114501953125, 0.2774505615234375, 0.31878662109375, 0.3601226806640625, 0.401458740234375, 0.4427947998046875, 0.484130859375, 0.5254669189453125, 0.566802978515625, 0.6081390380859375, 0.64947509765625, 0.6908111572265625, 0.732147216796875, 0.7734832763671875, 0.8148193359375, 0.8561553955078125, 0.897491455078125, 0.9388275146484375, 0.98016357421875, 1.0214996337890625, 1.062835693359375, 1.1041717529296875, 1.1455078125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 7.0, 4.0, 5.0, 11.0, 11.0, 13.0, 17.0, 12.0, 9.0, 26.0, 23.0, 24.0, 36.0, 35.0, 39.0, 42.0, 39.0, 39.0, 43.0, 47.0, 43.0, 49.0, 30.0, 55.0, 36.0, 48.0, 34.0, 29.0, 23.0, 26.0, 22.0, 15.0, 23.0, 16.0, 13.0, 7.0, 10.0, 3.0, 11.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8193359375, -0.791656494140625, -0.76397705078125, -0.736297607421875, -0.7086181640625, -0.680938720703125, -0.65325927734375, -0.625579833984375, -0.597900390625, -0.570220947265625, -0.54254150390625, -0.514862060546875, -0.4871826171875, -0.459503173828125, -0.43182373046875, -0.404144287109375, -0.37646484375, -0.348785400390625, -0.32110595703125, -0.293426513671875, -0.2657470703125, -0.238067626953125, -0.21038818359375, -0.182708740234375, -0.155029296875, -0.127349853515625, -0.09967041015625, -0.071990966796875, -0.0443115234375, -0.016632080078125, 0.01104736328125, 0.038726806640625, 0.06640625, 0.094085693359375, 0.12176513671875, 0.149444580078125, 0.1771240234375, 0.204803466796875, 0.23248291015625, 0.260162353515625, 0.287841796875, 0.315521240234375, 0.34320068359375, 0.370880126953125, 0.3985595703125, 0.426239013671875, 0.45391845703125, 0.481597900390625, 0.50927734375, 0.536956787109375, 0.56463623046875, 0.592315673828125, 0.6199951171875, 0.647674560546875, 0.67535400390625, 0.703033447265625, 0.730712890625, 0.758392333984375, 0.78607177734375, 0.813751220703125, 0.8414306640625, 0.869110107421875, 0.89678955078125, 0.924468994140625, 0.9521484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 5.0, 10.0, 15.0, 10.0, 19.0, 30.0, 52.0, 69.0, 99.0, 126.0, 214.0, 403.0, 730.0, 1248.0, 2516.0, 5627.0, 14633.0, 46800.0, 213970.0, 2914582.0, 848451.0, 101392.0, 26944.0, 8954.0, 3493.0, 1684.0, 871.0, 497.0, 292.0, 181.0, 118.0, 67.0, 54.0, 35.0, 24.0, 22.0, 14.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 5.0, 0.0, 3.0, 1.0], "bins": [-2.115234375, -2.054412841796875, -1.99359130859375, -1.932769775390625, -1.8719482421875, -1.811126708984375, -1.75030517578125, -1.689483642578125, -1.628662109375, -1.567840576171875, -1.50701904296875, -1.446197509765625, -1.3853759765625, -1.324554443359375, -1.26373291015625, -1.202911376953125, -1.14208984375, -1.081268310546875, -1.02044677734375, -0.959625244140625, -0.8988037109375, -0.837982177734375, -0.77716064453125, -0.716339111328125, -0.655517578125, -0.594696044921875, -0.53387451171875, -0.473052978515625, -0.4122314453125, -0.351409912109375, -0.29058837890625, -0.229766845703125, -0.1689453125, -0.108123779296875, -0.04730224609375, 0.013519287109375, 0.0743408203125, 0.135162353515625, 0.19598388671875, 0.256805419921875, 0.317626953125, 0.378448486328125, 0.43927001953125, 0.500091552734375, 0.5609130859375, 0.621734619140625, 0.68255615234375, 0.743377685546875, 0.80419921875, 0.865020751953125, 0.92584228515625, 0.986663818359375, 1.0474853515625, 1.108306884765625, 1.16912841796875, 1.229949951171875, 1.290771484375, 1.351593017578125, 1.41241455078125, 1.473236083984375, 1.5340576171875, 1.594879150390625, 1.65570068359375, 1.716522216796875, 1.77734375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 12.0, 5.0, 8.0, 8.0, 19.0, 15.0, 36.0, 44.0, 65.0, 91.0, 167.0, 313.0, 598.0, 1049.0, 732.0, 345.0, 190.0, 143.0, 65.0, 37.0, 42.0, 23.0, 22.0, 17.0, 11.0, 9.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.689453125, -3.596405029296875, -3.50335693359375, -3.410308837890625, -3.3172607421875, -3.224212646484375, -3.13116455078125, -3.038116455078125, -2.945068359375, -2.852020263671875, -2.75897216796875, -2.665924072265625, -2.5728759765625, -2.479827880859375, -2.38677978515625, -2.293731689453125, -2.20068359375, -2.107635498046875, -2.01458740234375, -1.921539306640625, -1.8284912109375, -1.735443115234375, -1.64239501953125, -1.549346923828125, -1.456298828125, -1.363250732421875, -1.27020263671875, -1.177154541015625, -1.0841064453125, -0.991058349609375, -0.89801025390625, -0.804962158203125, -0.7119140625, -0.618865966796875, -0.52581787109375, -0.432769775390625, -0.3397216796875, -0.246673583984375, -0.15362548828125, -0.060577392578125, 0.032470703125, 0.125518798828125, 0.21856689453125, 0.311614990234375, 0.4046630859375, 0.497711181640625, 0.59075927734375, 0.683807373046875, 0.77685546875, 0.869903564453125, 0.96295166015625, 1.055999755859375, 1.1490478515625, 1.242095947265625, 1.33514404296875, 1.428192138671875, 1.521240234375, 1.614288330078125, 1.70733642578125, 1.800384521484375, 1.8934326171875, 1.986480712890625, 2.07952880859375, 2.172576904296875, 2.265625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 17.0, 61.0, 367.0, 435.0, 87.0, 15.0, 7.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.178726196289062, -24.17584800720215, -22.172969818115234, -20.170089721679688, -18.167211532592773, -16.16433334350586, -14.161454200744629, -12.158575057983398, -10.155696868896484, -8.15281867980957, -6.14993953704834, -4.147060871124268, -2.1441822052001953, -0.14130401611328125, 1.8615751266479492, 3.8644542694091797, 5.867332458496094, 7.870211124420166, 9.873089790344238, 11.875968933105469, 13.878847122192383, 15.881725311279297, 17.884605407714844, 19.887483596801758, 21.890361785888672, 23.893239974975586, 25.8961181640625, 27.898998260498047, 29.90187644958496, 31.904754638671875, 33.90763473510742, 35.91051483154297, 37.91338348388672, 39.916263580322266, 41.91913986206055, 43.922019958496094, 45.924896240234375, 47.92777633666992, 49.93065643310547, 51.93353271484375, 53.9364128112793, 55.939292907714844, 57.942169189453125, 59.94504928588867, 61.94792938232422, 63.9508056640625, 65.95368194580078, 67.9565658569336, 69.95944213867188, 71.96231842041016, 73.96520233154297, 75.96807861328125, 77.97095489501953, 79.97383117675781, 81.97671508789062, 83.9795913696289, 85.98246765136719, 87.98534393310547, 89.98822784423828, 91.99110412597656, 93.99398040771484, 95.99685668945312, 97.99974060058594, 100.00261688232422, 102.00550079345703]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 11.0, 16.0, 16.0, 28.0, 25.0, 36.0, 42.0, 37.0, 55.0, 44.0, 58.0, 62.0, 72.0, 78.0, 58.0, 50.0, 55.0, 48.0, 35.0, 37.0, 23.0, 26.0, 20.0, 10.0, 10.0, 7.0, 9.0, 2.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.574365615844727, -12.098608016967773, -11.622849464416504, -11.14709186553955, -10.671334266662598, -10.195575714111328, -9.719818115234375, -9.244060516357422, -8.768301963806152, -8.2925443649292, -7.816786289215088, -7.341028213500977, -6.865270137786865, -6.389512062072754, -5.913754463195801, -5.4379963874816895, -4.962238788604736, -4.486480712890625, -4.010723114013672, -3.5349650382995605, -3.059206962585449, -2.583449125289917, -2.1076912879943848, -1.6319332122802734, -1.1561753749847412, -0.6804174184799194, -0.20465952157974243, 0.27109837532043457, 0.7468563318252563, 1.2226142883300781, 1.6983721256256104, 2.1741302013397217, 2.649888038635254, 3.125645875930786, 3.6014039516448975, 4.07716178894043, 4.552919864654541, 5.028677940368652, 5.5044355392456055, 5.980193614959717, 6.455951690673828, 6.9317097663879395, 7.407467365264893, 7.883225440979004, 8.358983039855957, 8.834741592407227, 9.31049919128418, 9.786256790161133, 10.262014389038086, 10.737771987915039, 11.213530540466309, 11.689288139343262, 12.165045738220215, 12.640804290771484, 13.116561889648438, 13.59231948852539, 14.06807804107666, 14.543835639953613, 15.019594192504883, 15.495351791381836, 15.971109390258789, 16.446866989135742, 16.922626495361328, 17.39838409423828, 17.874141693115234]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 1.0, 16.0, 18.0, 26.0, 38.0, 61.0, 66.0, 163.0, 212.0, 369.0, 697.0, 1173.0, 2101.0, 3955.0, 8593.0, 19633.0, 49657.0, 133344.0, 348405.0, 298588.0, 108529.0, 41061.0, 16600.0, 7399.0, 3526.0, 1832.0, 992.0, 568.0, 341.0, 222.0, 126.0, 83.0, 55.0, 38.0, 19.0, 23.0, 8.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.357421875, -2.2857666015625, -2.214111328125, -2.1424560546875, -2.07080078125, -1.9991455078125, -1.927490234375, -1.8558349609375, -1.7841796875, -1.7125244140625, -1.640869140625, -1.5692138671875, -1.49755859375, -1.4259033203125, -1.354248046875, -1.2825927734375, -1.2109375, -1.1392822265625, -1.067626953125, -0.9959716796875, -0.92431640625, -0.8526611328125, -0.781005859375, -0.7093505859375, -0.6376953125, -0.5660400390625, -0.494384765625, -0.4227294921875, -0.35107421875, -0.2794189453125, -0.207763671875, -0.1361083984375, -0.064453125, 0.0072021484375, 0.078857421875, 0.1505126953125, 0.22216796875, 0.2938232421875, 0.365478515625, 0.4371337890625, 0.5087890625, 0.5804443359375, 0.652099609375, 0.7237548828125, 0.79541015625, 0.8670654296875, 0.938720703125, 1.0103759765625, 1.08203125, 1.1536865234375, 1.225341796875, 1.2969970703125, 1.36865234375, 1.4403076171875, 1.511962890625, 1.5836181640625, 1.6552734375, 1.7269287109375, 1.798583984375, 1.8702392578125, 1.94189453125, 2.0135498046875, 2.085205078125, 2.1568603515625, 2.228515625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 4.0, 6.0, 9.0, 8.0, 15.0, 12.0, 12.0, 15.0, 18.0, 22.0, 19.0, 30.0, 35.0, 30.0, 33.0, 45.0, 37.0, 44.0, 37.0, 35.0, 47.0, 44.0, 39.0, 46.0, 38.0, 36.0, 29.0, 43.0, 25.0, 23.0, 22.0, 18.0, 10.0, 20.0, 9.0, 12.0, 19.0, 5.0, 11.0, 4.0, 6.0, 5.0, 5.0, 3.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.775390625, -0.7483978271484375, -0.721405029296875, -0.6944122314453125, -0.66741943359375, -0.6404266357421875, -0.613433837890625, -0.5864410400390625, -0.5594482421875, -0.5324554443359375, -0.505462646484375, -0.4784698486328125, -0.45147705078125, -0.4244842529296875, -0.397491455078125, -0.3704986572265625, -0.343505859375, -0.3165130615234375, -0.289520263671875, -0.2625274658203125, -0.23553466796875, -0.2085418701171875, -0.181549072265625, -0.1545562744140625, -0.1275634765625, -0.1005706787109375, -0.073577880859375, -0.0465850830078125, -0.01959228515625, 0.0074005126953125, 0.034393310546875, 0.0613861083984375, 0.08837890625, 0.1153717041015625, 0.142364501953125, 0.1693572998046875, 0.19635009765625, 0.2233428955078125, 0.250335693359375, 0.2773284912109375, 0.3043212890625, 0.3313140869140625, 0.358306884765625, 0.3852996826171875, 0.41229248046875, 0.4392852783203125, 0.466278076171875, 0.4932708740234375, 0.520263671875, 0.5472564697265625, 0.574249267578125, 0.6012420654296875, 0.62823486328125, 0.6552276611328125, 0.682220458984375, 0.7092132568359375, 0.7362060546875, 0.7631988525390625, 0.790191650390625, 0.8171844482421875, 0.84417724609375, 0.8711700439453125, 0.898162841796875, 0.9251556396484375, 0.9521484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 9.0, 5.0, 12.0, 9.0, 19.0, 28.0, 38.0, 57.0, 77.0, 107.0, 163.0, 270.0, 415.0, 765.0, 1464.0, 3052.0, 8798.0, 40557.0, 352553.0, 574170.0, 49101.0, 9931.0, 3376.0, 1510.0, 757.0, 467.0, 259.0, 171.0, 141.0, 76.0, 45.0, 33.0, 35.0, 18.0, 13.0, 17.0, 14.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-4.6328125, -4.500640869140625, -4.36846923828125, -4.236297607421875, -4.1041259765625, -3.971954345703125, -3.83978271484375, -3.707611083984375, -3.575439453125, -3.443267822265625, -3.31109619140625, -3.178924560546875, -3.0467529296875, -2.914581298828125, -2.78240966796875, -2.650238037109375, -2.51806640625, -2.385894775390625, -2.25372314453125, -2.121551513671875, -1.9893798828125, -1.857208251953125, -1.72503662109375, -1.592864990234375, -1.460693359375, -1.328521728515625, -1.19635009765625, -1.064178466796875, -0.9320068359375, -0.799835205078125, -0.66766357421875, -0.535491943359375, -0.4033203125, -0.271148681640625, -0.13897705078125, -0.006805419921875, 0.1253662109375, 0.257537841796875, 0.38970947265625, 0.521881103515625, 0.654052734375, 0.786224365234375, 0.91839599609375, 1.050567626953125, 1.1827392578125, 1.314910888671875, 1.44708251953125, 1.579254150390625, 1.71142578125, 1.843597412109375, 1.97576904296875, 2.107940673828125, 2.2401123046875, 2.372283935546875, 2.50445556640625, 2.636627197265625, 2.768798828125, 2.900970458984375, 3.03314208984375, 3.165313720703125, 3.2974853515625, 3.429656982421875, 3.56182861328125, 3.694000244140625, 3.826171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 9.0, 16.0, 17.0, 19.0, 40.0, 31.0, 49.0, 52.0, 65.0, 80.0, 63.0, 62.0, 55.0, 72.0, 67.0, 46.0, 56.0, 47.0, 34.0, 20.0, 25.0, 16.0, 12.0, 11.0, 9.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.75390625, -3.58203125, -3.41015625, -3.23828125, -3.06640625, -2.89453125, -2.72265625, -2.55078125, -2.37890625, -2.20703125, -2.03515625, -1.86328125, -1.69140625, -1.51953125, -1.34765625, -1.17578125, -1.00390625, -0.83203125, -0.66015625, -0.48828125, -0.31640625, -0.14453125, 0.02734375, 0.19921875, 0.37109375, 0.54296875, 0.71484375, 0.88671875, 1.05859375, 1.23046875, 1.40234375, 1.57421875, 1.74609375, 1.91796875, 2.08984375, 2.26171875, 2.43359375, 2.60546875, 2.77734375, 2.94921875, 3.12109375, 3.29296875, 3.46484375, 3.63671875, 3.80859375, 3.98046875, 4.15234375, 4.32421875, 4.49609375, 4.66796875, 4.83984375, 5.01171875, 5.18359375, 5.35546875, 5.52734375, 5.69921875, 5.87109375, 6.04296875, 6.21484375, 6.38671875, 6.55859375, 6.73046875, 6.90234375, 7.07421875, 7.24609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 6.0, 7.0, 10.0, 11.0, 17.0, 17.0, 38.0, 58.0, 72.0, 117.0, 204.0, 430.0, 928.0, 2449.0, 9781.0, 73085.0, 785000.0, 154532.0, 15834.0, 3560.0, 1225.0, 464.0, 289.0, 133.0, 85.0, 67.0, 39.0, 23.0, 16.0, 16.0, 3.0, 7.0, 3.0, 5.0, 5.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.423828125, -1.3788299560546875, -1.333831787109375, -1.2888336181640625, -1.24383544921875, -1.1988372802734375, -1.153839111328125, -1.1088409423828125, -1.0638427734375, -1.0188446044921875, -0.973846435546875, -0.9288482666015625, -0.88385009765625, -0.8388519287109375, -0.793853759765625, -0.7488555908203125, -0.703857421875, -0.6588592529296875, -0.613861083984375, -0.5688629150390625, -0.52386474609375, -0.4788665771484375, -0.433868408203125, -0.3888702392578125, -0.3438720703125, -0.2988739013671875, -0.253875732421875, -0.2088775634765625, -0.16387939453125, -0.1188812255859375, -0.073883056640625, -0.0288848876953125, 0.01611328125, 0.0611114501953125, 0.106109619140625, 0.1511077880859375, 0.19610595703125, 0.2411041259765625, 0.286102294921875, 0.3311004638671875, 0.3760986328125, 0.4210968017578125, 0.466094970703125, 0.5110931396484375, 0.55609130859375, 0.6010894775390625, 0.646087646484375, 0.6910858154296875, 0.736083984375, 0.7810821533203125, 0.826080322265625, 0.8710784912109375, 0.91607666015625, 0.9610748291015625, 1.006072998046875, 1.0510711669921875, 1.0960693359375, 1.1410675048828125, 1.186065673828125, 1.2310638427734375, 1.27606201171875, 1.3210601806640625, 1.366058349609375, 1.4110565185546875, 1.4560546875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 5.0, 4.0, 8.0, 13.0, 16.0, 10.0, 18.0, 18.0, 38.0, 29.0, 54.0, 49.0, 72.0, 94.0, 98.0, 110.0, 82.0, 65.0, 45.0, 44.0, 30.0, 22.0, 14.0, 9.0, 11.0, 3.0, 12.0, 6.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002732276916503906, -0.0002643391489982605, -0.00025545060634613037, -0.00024656206369400024, -0.00023767352104187012, -0.00022878497838974, -0.00021989643573760986, -0.00021100789308547974, -0.0002021193504333496, -0.00019323080778121948, -0.00018434226512908936, -0.00017545372247695923, -0.0001665651798248291, -0.00015767663717269897, -0.00014878809452056885, -0.00013989955186843872, -0.0001310110092163086, -0.00012212246656417847, -0.00011323392391204834, -0.00010434538125991821, -9.545683860778809e-05, -8.656829595565796e-05, -7.767975330352783e-05, -6.87912106513977e-05, -5.990266799926758e-05, -5.101412534713745e-05, -4.2125582695007324e-05, -3.32370400428772e-05, -2.434849739074707e-05, -1.5459954738616943e-05, -6.571412086486816e-06, 2.3171305656433105e-06, 1.1205673217773438e-05, 2.0094215869903564e-05, 2.898275852203369e-05, 3.787130117416382e-05, 4.6759843826293945e-05, 5.564838647842407e-05, 6.45369291305542e-05, 7.342547178268433e-05, 8.231401443481445e-05, 9.120255708694458e-05, 0.00010009109973907471, 0.00010897964239120483, 0.00011786818504333496, 0.0001267567276954651, 0.00013564527034759521, 0.00014453381299972534, 0.00015342235565185547, 0.0001623108983039856, 0.00017119944095611572, 0.00018008798360824585, 0.00018897652626037598, 0.0001978650689125061, 0.00020675361156463623, 0.00021564215421676636, 0.00022453069686889648, 0.0002334192395210266, 0.00024230778217315674, 0.00025119632482528687, 0.000260084867477417, 0.0002689734101295471, 0.00027786195278167725, 0.0002867504954338074, 0.0002956390380859375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 7.0, 5.0, 11.0, 8.0, 18.0, 17.0, 36.0, 38.0, 78.0, 154.0, 274.0, 566.0, 1312.0, 3571.0, 16881.0, 219435.0, 750982.0, 45001.0, 6542.0, 1949.0, 831.0, 357.0, 212.0, 116.0, 48.0, 34.0, 24.0, 21.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.576171875, -1.5314178466796875, -1.486663818359375, -1.4419097900390625, -1.39715576171875, -1.3524017333984375, -1.307647705078125, -1.2628936767578125, -1.2181396484375, -1.1733856201171875, -1.128631591796875, -1.0838775634765625, -1.03912353515625, -0.9943695068359375, -0.949615478515625, -0.9048614501953125, -0.860107421875, -0.8153533935546875, -0.770599365234375, -0.7258453369140625, -0.68109130859375, -0.6363372802734375, -0.591583251953125, -0.5468292236328125, -0.5020751953125, -0.4573211669921875, -0.412567138671875, -0.3678131103515625, -0.32305908203125, -0.2783050537109375, -0.233551025390625, -0.1887969970703125, -0.14404296875, -0.0992889404296875, -0.054534912109375, -0.0097808837890625, 0.03497314453125, 0.0797271728515625, 0.124481201171875, 0.1692352294921875, 0.2139892578125, 0.2587432861328125, 0.303497314453125, 0.3482513427734375, 0.39300537109375, 0.4377593994140625, 0.482513427734375, 0.5272674560546875, 0.572021484375, 0.6167755126953125, 0.661529541015625, 0.7062835693359375, 0.75103759765625, 0.7957916259765625, 0.840545654296875, 0.8852996826171875, 0.9300537109375, 0.9748077392578125, 1.019561767578125, 1.0643157958984375, 1.10906982421875, 1.1538238525390625, 1.198577880859375, 1.2433319091796875, 1.2880859375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 8.0, 8.0, 15.0, 17.0, 25.0, 42.0, 51.0, 72.0, 93.0, 104.0, 121.0, 110.0, 104.0, 80.0, 52.0, 27.0, 27.0, 25.0, 15.0, 3.0, 7.0, 0.0, 3.0, 1.0, 2.0], "bins": [-2.451171875, -2.401702880859375, -2.35223388671875, -2.302764892578125, -2.2532958984375, -2.203826904296875, -2.15435791015625, -2.104888916015625, -2.055419921875, -2.005950927734375, -1.95648193359375, -1.907012939453125, -1.8575439453125, -1.808074951171875, -1.75860595703125, -1.709136962890625, -1.65966796875, -1.610198974609375, -1.56072998046875, -1.511260986328125, -1.4617919921875, -1.412322998046875, -1.36285400390625, -1.313385009765625, -1.263916015625, -1.214447021484375, -1.16497802734375, -1.115509033203125, -1.0660400390625, -1.016571044921875, -0.96710205078125, -0.917633056640625, -0.8681640625, -0.818695068359375, -0.76922607421875, -0.719757080078125, -0.6702880859375, -0.620819091796875, -0.57135009765625, -0.521881103515625, -0.472412109375, -0.422943115234375, -0.37347412109375, -0.324005126953125, -0.2745361328125, -0.225067138671875, -0.17559814453125, -0.126129150390625, -0.07666015625, -0.027191162109375, 0.02227783203125, 0.071746826171875, 0.1212158203125, 0.170684814453125, 0.22015380859375, 0.269622802734375, 0.319091796875, 0.368560791015625, 0.41802978515625, 0.467498779296875, 0.5169677734375, 0.566436767578125, 0.61590576171875, 0.665374755859375, 0.71484375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 10.0, 8.0, 8.0, 8.0, 13.0, 30.0, 52.0, 117.0, 189.0, 276.0, 125.0, 77.0, 41.0, 20.0, 11.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.426483154296875, -24.557722091674805, -23.688961029052734, -22.820199966430664, -21.951438903808594, -21.08267593383789, -20.21391487121582, -19.34515380859375, -18.47639274597168, -17.60763168334961, -16.73887062072754, -15.870108604431152, -15.001347541809082, -14.132586479187012, -13.263824462890625, -12.395063400268555, -11.526302337646484, -10.657541275024414, -9.788780212402344, -8.920018196105957, -8.051257133483887, -7.182496070861816, -6.313734531402588, -5.444972991943359, -4.576211929321289, -3.7074506282806396, -2.8386893272399902, -1.9699280261993408, -1.1011667251586914, -0.2324056625366211, 0.6363558769226074, 1.505117416381836, 2.373880386352539, 3.2426416873931885, 4.111402988433838, 4.980164527893066, 5.848925590515137, 6.717686653137207, 7.5864481925964355, 8.455209732055664, 9.323970794677734, 10.192731857299805, 11.061492919921875, 11.930254936218262, 12.799015998840332, 13.667777061462402, 14.536539077758789, 15.40530014038086, 16.27406120300293, 17.142822265625, 18.01158332824707, 18.88034439086914, 19.749107360839844, 20.61786651611328, 21.486629486083984, 22.355390548706055, 23.224151611328125, 24.092912673950195, 24.961673736572266, 25.830434799194336, 26.699195861816406, 27.56795883178711, 28.43671989440918, 29.30548095703125, 30.17424201965332]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 9.0, 5.0, 10.0, 12.0, 8.0, 14.0, 18.0, 11.0, 21.0, 20.0, 25.0, 27.0, 25.0, 22.0, 32.0, 42.0, 45.0, 63.0, 66.0, 67.0, 58.0, 61.0, 43.0, 39.0, 33.0, 31.0, 22.0, 22.0, 18.0, 16.0, 12.0, 18.0, 6.0, 13.0, 16.0, 10.0, 6.0, 6.0, 4.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.952184677124023, -13.482481956481934, -13.01278018951416, -12.54307746887207, -12.073375701904297, -11.603672981262207, -11.133970260620117, -10.664268493652344, -10.19456672668457, -9.72486400604248, -9.255162239074707, -8.785459518432617, -8.315757751464844, -7.846055030822754, -7.376352787017822, -6.906650543212891, -6.436947822570801, -5.967245578765869, -5.4975433349609375, -5.027840614318848, -4.558138847351074, -4.088436126708984, -3.6187338829040527, -3.149031639099121, -2.6793293952941895, -2.209627151489258, -1.7399247884750366, -1.2702224254608154, -0.8005201816558838, -0.33081793785095215, 0.1388845443725586, 0.6085867881774902, 1.0782890319824219, 1.5479912757873535, 2.017693519592285, 2.487396001815796, 2.9570982456207275, 3.426800489425659, 3.89650297164917, 4.366205215454102, 4.835907459259033, 5.305609703063965, 5.7753119468688965, 6.245014190673828, 6.714716911315918, 7.184418678283691, 7.654121398925781, 8.123823165893555, 8.593525886535645, 9.063228607177734, 9.532930374145508, 10.002633094787598, 10.472334861755371, 10.942037582397461, 11.411739349365234, 11.881442070007324, 12.351144790649414, 12.820847511291504, 13.290549278259277, 13.760251998901367, 14.22995376586914, 14.69965648651123, 15.16935920715332, 15.639060974121094, 16.108762741088867]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 5.0, 7.0, 11.0, 10.0, 17.0, 26.0, 42.0, 43.0, 100.0, 99.0, 143.0, 255.0, 355.0, 617.0, 1229.0, 2360.0, 4830.0, 11125.0, 32768.0, 185089.0, 2107797.0, 1657682.0, 142503.0, 27958.0, 9977.0, 4261.0, 2161.0, 1069.0, 632.0, 383.0, 225.0, 163.0, 85.0, 77.0, 50.0, 33.0, 27.0, 11.0, 6.0, 10.0, 8.0, 6.0, 4.0, 10.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.34765625, -1.304107666015625, -1.26055908203125, -1.217010498046875, -1.1734619140625, -1.129913330078125, -1.08636474609375, -1.042816162109375, -0.999267578125, -0.955718994140625, -0.91217041015625, -0.868621826171875, -0.8250732421875, -0.781524658203125, -0.73797607421875, -0.694427490234375, -0.65087890625, -0.607330322265625, -0.56378173828125, -0.520233154296875, -0.4766845703125, -0.433135986328125, -0.38958740234375, -0.346038818359375, -0.302490234375, -0.258941650390625, -0.21539306640625, -0.171844482421875, -0.1282958984375, -0.084747314453125, -0.04119873046875, 0.002349853515625, 0.0458984375, 0.089447021484375, 0.13299560546875, 0.176544189453125, 0.2200927734375, 0.263641357421875, 0.30718994140625, 0.350738525390625, 0.394287109375, 0.437835693359375, 0.48138427734375, 0.524932861328125, 0.5684814453125, 0.612030029296875, 0.65557861328125, 0.699127197265625, 0.74267578125, 0.786224365234375, 0.82977294921875, 0.873321533203125, 0.9168701171875, 0.960418701171875, 1.00396728515625, 1.047515869140625, 1.091064453125, 1.134613037109375, 1.17816162109375, 1.221710205078125, 1.2652587890625, 1.308807373046875, 1.35235595703125, 1.395904541015625, 1.439453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 1.0, 2.0, 10.0, 6.0, 5.0, 14.0, 12.0, 12.0, 18.0, 28.0, 23.0, 28.0, 30.0, 33.0, 41.0, 38.0, 47.0, 38.0, 31.0, 41.0, 38.0, 41.0, 43.0, 50.0, 40.0, 39.0, 37.0, 31.0, 26.0, 37.0, 19.0, 26.0, 15.0, 19.0, 10.0, 15.0, 15.0, 10.0, 9.0, 7.0, 2.0, 7.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.8642578125, -0.8381881713867188, -0.8121185302734375, -0.7860488891601562, -0.759979248046875, -0.7339096069335938, -0.7078399658203125, -0.6817703247070312, -0.65570068359375, -0.6296310424804688, -0.6035614013671875, -0.5774917602539062, -0.551422119140625, -0.5253524780273438, -0.4992828369140625, -0.47321319580078125, -0.4471435546875, -0.42107391357421875, -0.3950042724609375, -0.36893463134765625, -0.342864990234375, -0.31679534912109375, -0.2907257080078125, -0.26465606689453125, -0.23858642578125, -0.21251678466796875, -0.1864471435546875, -0.16037750244140625, -0.134307861328125, -0.10823822021484375, -0.0821685791015625, -0.05609893798828125, -0.030029296875, -0.00395965576171875, 0.0221099853515625, 0.04817962646484375, 0.074249267578125, 0.10031890869140625, 0.1263885498046875, 0.15245819091796875, 0.17852783203125, 0.20459747314453125, 0.2306671142578125, 0.25673675537109375, 0.282806396484375, 0.30887603759765625, 0.3349456787109375, 0.36101531982421875, 0.3870849609375, 0.41315460205078125, 0.4392242431640625, 0.46529388427734375, 0.491363525390625, 0.5174331665039062, 0.5435028076171875, 0.5695724487304688, 0.59564208984375, 0.6217117309570312, 0.6477813720703125, 0.6738510131835938, 0.699920654296875, 0.7259902954101562, 0.7520599365234375, 0.7781295776367188, 0.80419921875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 15.0, 13.0, 21.0, 32.0, 58.0, 116.0, 220.0, 499.0, 1294.0, 4324.0, 20560.0, 244331.0, 3795917.0, 107968.0, 13534.0, 3279.0, 1156.0, 463.0, 224.0, 101.0, 61.0, 39.0, 18.0, 15.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.958984375, -3.858428955078125, -3.75787353515625, -3.657318115234375, -3.5567626953125, -3.456207275390625, -3.35565185546875, -3.255096435546875, -3.154541015625, -3.053985595703125, -2.95343017578125, -2.852874755859375, -2.7523193359375, -2.651763916015625, -2.55120849609375, -2.450653076171875, -2.35009765625, -2.249542236328125, -2.14898681640625, -2.048431396484375, -1.9478759765625, -1.847320556640625, -1.74676513671875, -1.646209716796875, -1.545654296875, -1.445098876953125, -1.34454345703125, -1.243988037109375, -1.1434326171875, -1.042877197265625, -0.94232177734375, -0.841766357421875, -0.7412109375, -0.640655517578125, -0.54010009765625, -0.439544677734375, -0.3389892578125, -0.238433837890625, -0.13787841796875, -0.037322998046875, 0.063232421875, 0.163787841796875, 0.26434326171875, 0.364898681640625, 0.4654541015625, 0.566009521484375, 0.66656494140625, 0.767120361328125, 0.86767578125, 0.968231201171875, 1.06878662109375, 1.169342041015625, 1.2698974609375, 1.370452880859375, 1.47100830078125, 1.571563720703125, 1.672119140625, 1.772674560546875, 1.87322998046875, 1.973785400390625, 2.0743408203125, 2.174896240234375, 2.27545166015625, 2.376007080078125, 2.4765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 5.0, 9.0, 16.0, 12.0, 22.0, 36.0, 55.0, 90.0, 132.0, 323.0, 692.0, 1145.0, 792.0, 309.0, 153.0, 94.0, 57.0, 30.0, 24.0, 20.0, 15.0, 9.0, 10.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.76171875, -2.676788330078125, -2.59185791015625, -2.506927490234375, -2.4219970703125, -2.337066650390625, -2.25213623046875, -2.167205810546875, -2.082275390625, -1.997344970703125, -1.91241455078125, -1.827484130859375, -1.7425537109375, -1.657623291015625, -1.57269287109375, -1.487762451171875, -1.40283203125, -1.317901611328125, -1.23297119140625, -1.148040771484375, -1.0631103515625, -0.978179931640625, -0.89324951171875, -0.808319091796875, -0.723388671875, -0.638458251953125, -0.55352783203125, -0.468597412109375, -0.3836669921875, -0.298736572265625, -0.21380615234375, -0.128875732421875, -0.0439453125, 0.040985107421875, 0.12591552734375, 0.210845947265625, 0.2957763671875, 0.380706787109375, 0.46563720703125, 0.550567626953125, 0.635498046875, 0.720428466796875, 0.80535888671875, 0.890289306640625, 0.9752197265625, 1.060150146484375, 1.14508056640625, 1.230010986328125, 1.31494140625, 1.399871826171875, 1.48480224609375, 1.569732666015625, 1.6546630859375, 1.739593505859375, 1.82452392578125, 1.909454345703125, 1.994384765625, 2.079315185546875, 2.16424560546875, 2.249176025390625, 2.3341064453125, 2.419036865234375, 2.50396728515625, 2.588897705078125, 2.673828125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 20.0, 46.0, 215.0, 394.0, 224.0, 52.0, 12.0, 13.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.07345962524414, -15.891817092895508, -14.710174560546875, -13.528532028198242, -12.34688949584961, -11.165246963500977, -9.983604431152344, -8.801961898803711, -7.620319366455078, -6.438676834106445, -5.2570343017578125, -4.07539176940918, -2.893749237060547, -1.712106704711914, -0.5304641723632812, 0.6511783599853516, 1.8328208923339844, 3.014463424682617, 4.19610595703125, 5.377748489379883, 6.559391021728516, 7.741033554077148, 8.922676086425781, 10.104318618774414, 11.285961151123047, 12.46760368347168, 13.649246215820312, 14.830888748168945, 16.012531280517578, 17.19417381286621, 18.375816345214844, 19.557458877563477, 20.739105224609375, 21.920747756958008, 23.10239028930664, 24.284032821655273, 25.465675354003906, 26.64731788635254, 27.828960418701172, 29.010602951049805, 30.192245483398438, 31.37388801574707, 32.5555305480957, 33.73717498779297, 34.91881561279297, 36.10045623779297, 37.282100677490234, 38.4637451171875, 39.6453857421875, 40.8270263671875, 42.008670806884766, 43.19031524658203, 44.37195587158203, 45.55359649658203, 46.7352409362793, 47.91688537597656, 49.09852600097656, 50.28016662597656, 51.46181106567383, 52.643455505371094, 53.825096130371094, 55.006736755371094, 56.18838119506836, 57.370025634765625, 58.551666259765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 8.0, 9.0, 10.0, 20.0, 26.0, 23.0, 25.0, 36.0, 31.0, 55.0, 57.0, 65.0, 74.0, 45.0, 56.0, 61.0, 60.0, 66.0, 44.0, 39.0, 42.0, 31.0, 23.0, 32.0, 18.0, 15.0, 14.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.715545654296875, -11.338780403137207, -10.962014198303223, -10.585248947143555, -10.20848274230957, -9.831717491149902, -9.454952239990234, -9.07818603515625, -8.701420783996582, -8.324655532836914, -7.94788932800293, -7.571124076843262, -7.1943583488464355, -6.817592620849609, -6.440827369689941, -6.064061641693115, -5.687295913696289, -5.310530185699463, -4.933764457702637, -4.556999206542969, -4.180233478546143, -3.8034677505493164, -3.4267022609710693, -3.0499367713928223, -2.673171043395996, -2.29640531539917, -1.9196398258209229, -1.5428742170333862, -1.1661086082458496, -0.789342999458313, -0.41257739067077637, -0.0358119010925293, 0.3409538269042969, 0.7177194356918335, 1.0944850444793701, 1.4712506532669067, 1.8480162620544434, 2.2247819900512695, 2.6015474796295166, 2.9783129692077637, 3.35507869720459, 3.731844425201416, 4.108610153198242, 4.48537540435791, 4.862141132354736, 5.2389068603515625, 5.6156721115112305, 5.992437839508057, 6.369203567504883, 6.745969295501709, 7.122735023498535, 7.499500274658203, 7.876266002655029, 8.253031730651855, 8.629796981811523, 9.006563186645508, 9.383328437805176, 9.760093688964844, 10.136859893798828, 10.513625144958496, 10.890390396118164, 11.267156600952148, 11.643921852111816, 12.020687103271484, 12.397453308105469]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 7.0, 24.0, 26.0, 48.0, 65.0, 99.0, 144.0, 238.0, 361.0, 585.0, 994.0, 1726.0, 3041.0, 6079.0, 12941.0, 30511.0, 74703.0, 184718.0, 343298.0, 226165.0, 93869.0, 37533.0, 15621.0, 7269.0, 3674.0, 1977.0, 1103.0, 619.0, 417.0, 256.0, 158.0, 97.0, 55.0, 51.0, 26.0, 11.0, 11.0, 9.0, 7.0, 7.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4287109375, -1.376983642578125, -1.32525634765625, -1.273529052734375, -1.2218017578125, -1.170074462890625, -1.11834716796875, -1.066619873046875, -1.014892578125, -0.963165283203125, -0.91143798828125, -0.859710693359375, -0.8079833984375, -0.756256103515625, -0.70452880859375, -0.652801513671875, -0.60107421875, -0.549346923828125, -0.49761962890625, -0.445892333984375, -0.3941650390625, -0.342437744140625, -0.29071044921875, -0.238983154296875, -0.187255859375, -0.135528564453125, -0.08380126953125, -0.032073974609375, 0.0196533203125, 0.071380615234375, 0.12310791015625, 0.174835205078125, 0.2265625, 0.278289794921875, 0.33001708984375, 0.381744384765625, 0.4334716796875, 0.485198974609375, 0.53692626953125, 0.588653564453125, 0.640380859375, 0.692108154296875, 0.74383544921875, 0.795562744140625, 0.8472900390625, 0.899017333984375, 0.95074462890625, 1.002471923828125, 1.05419921875, 1.105926513671875, 1.15765380859375, 1.209381103515625, 1.2611083984375, 1.312835693359375, 1.36456298828125, 1.416290283203125, 1.468017578125, 1.519744873046875, 1.57147216796875, 1.623199462890625, 1.6749267578125, 1.726654052734375, 1.77838134765625, 1.830108642578125, 1.8818359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 13.0, 11.0, 6.0, 11.0, 20.0, 16.0, 21.0, 29.0, 38.0, 26.0, 33.0, 33.0, 42.0, 31.0, 42.0, 33.0, 38.0, 40.0, 40.0, 41.0, 44.0, 56.0, 37.0, 40.0, 23.0, 22.0, 19.0, 27.0, 27.0, 20.0, 15.0, 19.0, 18.0, 5.0, 16.0, 5.0, 9.0, 10.0, 4.0, 3.0, 5.0, 3.0, 1.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.85009765625, -0.82452392578125, -0.7989501953125, -0.77337646484375, -0.747802734375, -0.72222900390625, -0.6966552734375, -0.67108154296875, -0.6455078125, -0.61993408203125, -0.5943603515625, -0.56878662109375, -0.543212890625, -0.51763916015625, -0.4920654296875, -0.46649169921875, -0.44091796875, -0.41534423828125, -0.3897705078125, -0.36419677734375, -0.338623046875, -0.31304931640625, -0.2874755859375, -0.26190185546875, -0.236328125, -0.21075439453125, -0.1851806640625, -0.15960693359375, -0.134033203125, -0.10845947265625, -0.0828857421875, -0.05731201171875, -0.03173828125, -0.00616455078125, 0.0194091796875, 0.04498291015625, 0.070556640625, 0.09613037109375, 0.1217041015625, 0.14727783203125, 0.1728515625, 0.19842529296875, 0.2239990234375, 0.24957275390625, 0.275146484375, 0.30072021484375, 0.3262939453125, 0.35186767578125, 0.37744140625, 0.40301513671875, 0.4285888671875, 0.45416259765625, 0.479736328125, 0.50531005859375, 0.5308837890625, 0.55645751953125, 0.58203125, 0.60760498046875, 0.6331787109375, 0.65875244140625, 0.684326171875, 0.70989990234375, 0.7354736328125, 0.76104736328125, 0.78662109375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 8.0, 10.0, 11.0, 18.0, 29.0, 21.0, 28.0, 32.0, 79.0, 109.0, 199.0, 313.0, 610.0, 1442.0, 3994.0, 14153.0, 65017.0, 446367.0, 430308.0, 64650.0, 14088.0, 4072.0, 1492.0, 602.0, 310.0, 174.0, 120.0, 69.0, 53.0, 41.0, 40.0, 26.0, 19.0, 14.0, 10.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.396484375, -2.3138427734375, -2.231201171875, -2.1485595703125, -2.06591796875, -1.9832763671875, -1.900634765625, -1.8179931640625, -1.7353515625, -1.6527099609375, -1.570068359375, -1.4874267578125, -1.40478515625, -1.3221435546875, -1.239501953125, -1.1568603515625, -1.07421875, -0.9915771484375, -0.908935546875, -0.8262939453125, -0.74365234375, -0.6610107421875, -0.578369140625, -0.4957275390625, -0.4130859375, -0.3304443359375, -0.247802734375, -0.1651611328125, -0.08251953125, 0.0001220703125, 0.082763671875, 0.1654052734375, 0.248046875, 0.3306884765625, 0.413330078125, 0.4959716796875, 0.57861328125, 0.6612548828125, 0.743896484375, 0.8265380859375, 0.9091796875, 0.9918212890625, 1.074462890625, 1.1571044921875, 1.23974609375, 1.3223876953125, 1.405029296875, 1.4876708984375, 1.5703125, 1.6529541015625, 1.735595703125, 1.8182373046875, 1.90087890625, 1.9835205078125, 2.066162109375, 2.1488037109375, 2.2314453125, 2.3140869140625, 2.396728515625, 2.4793701171875, 2.56201171875, 2.6446533203125, 2.727294921875, 2.8099365234375, 2.892578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 10.0, 12.0, 15.0, 16.0, 22.0, 22.0, 26.0, 42.0, 35.0, 37.0, 48.0, 47.0, 53.0, 57.0, 51.0, 62.0, 50.0, 43.0, 50.0, 50.0, 43.0, 29.0, 38.0, 19.0, 21.0, 20.0, 15.0, 15.0, 11.0, 5.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.328125, -3.224029541015625, -3.11993408203125, -3.015838623046875, -2.9117431640625, -2.807647705078125, -2.70355224609375, -2.599456787109375, -2.495361328125, -2.391265869140625, -2.28717041015625, -2.183074951171875, -2.0789794921875, -1.974884033203125, -1.87078857421875, -1.766693115234375, -1.66259765625, -1.558502197265625, -1.45440673828125, -1.350311279296875, -1.2462158203125, -1.142120361328125, -1.03802490234375, -0.933929443359375, -0.829833984375, -0.725738525390625, -0.62164306640625, -0.517547607421875, -0.4134521484375, -0.309356689453125, -0.20526123046875, -0.101165771484375, 0.0029296875, 0.107025146484375, 0.21112060546875, 0.315216064453125, 0.4193115234375, 0.523406982421875, 0.62750244140625, 0.731597900390625, 0.835693359375, 0.939788818359375, 1.04388427734375, 1.147979736328125, 1.2520751953125, 1.356170654296875, 1.46026611328125, 1.564361572265625, 1.66845703125, 1.772552490234375, 1.87664794921875, 1.980743408203125, 2.0848388671875, 2.188934326171875, 2.29302978515625, 2.397125244140625, 2.501220703125, 2.605316162109375, 2.70941162109375, 2.813507080078125, 2.9176025390625, 3.021697998046875, 3.12579345703125, 3.229888916015625, 3.333984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 5.0, 22.0, 18.0, 24.0, 48.0, 82.0, 164.0, 294.0, 660.0, 1821.0, 5890.0, 27403.0, 182467.0, 702981.0, 103218.0, 16943.0, 4056.0, 1351.0, 505.0, 258.0, 147.0, 71.0, 43.0, 20.0, 18.0, 10.0, 11.0, 5.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79638671875, -0.7683029174804688, -0.7402191162109375, -0.7121353149414062, -0.684051513671875, -0.6559677124023438, -0.6278839111328125, -0.5998001098632812, -0.57171630859375, -0.5436325073242188, -0.5155487060546875, -0.48746490478515625, -0.459381103515625, -0.43129730224609375, -0.4032135009765625, -0.37512969970703125, -0.3470458984375, -0.31896209716796875, -0.2908782958984375, -0.26279449462890625, -0.234710693359375, -0.20662689208984375, -0.1785430908203125, -0.15045928955078125, -0.12237548828125, -0.09429168701171875, -0.0662078857421875, -0.03812408447265625, -0.010040283203125, 0.01804351806640625, 0.0461273193359375, 0.07421112060546875, 0.102294921875, 0.13037872314453125, 0.1584625244140625, 0.18654632568359375, 0.214630126953125, 0.24271392822265625, 0.2707977294921875, 0.29888153076171875, 0.32696533203125, 0.35504913330078125, 0.3831329345703125, 0.41121673583984375, 0.439300537109375, 0.46738433837890625, 0.4954681396484375, 0.5235519409179688, 0.5516357421875, 0.5797195434570312, 0.6078033447265625, 0.6358871459960938, 0.663970947265625, 0.6920547485351562, 0.7201385498046875, 0.7482223510742188, 0.77630615234375, 0.8043899536132812, 0.8324737548828125, 0.8605575561523438, 0.888641357421875, 0.9167251586914062, 0.9448089599609375, 0.9728927612304688, 1.0009765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 5.0, 9.0, 8.0, 15.0, 19.0, 24.0, 38.0, 58.0, 80.0, 107.0, 132.0, 124.0, 119.0, 92.0, 49.0, 32.0, 21.0, 13.0, 15.0, 13.0, 7.0, 4.0, 2.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031828880310058594, -0.0003085993230342865, -0.00029890984296798706, -0.0002892203629016876, -0.0002795308828353882, -0.00026984140276908875, -0.0002601519227027893, -0.00025046244263648987, -0.00024077296257019043, -0.000231083482503891, -0.00022139400243759155, -0.00021170452237129211, -0.00020201504230499268, -0.00019232556223869324, -0.0001826360821723938, -0.00017294660210609436, -0.00016325712203979492, -0.00015356764197349548, -0.00014387816190719604, -0.0001341886818408966, -0.00012449920177459717, -0.00011480972170829773, -0.00010512024164199829, -9.543076157569885e-05, -8.574128150939941e-05, -7.605180144309998e-05, -6.636232137680054e-05, -5.66728413105011e-05, -4.698336124420166e-05, -3.729388117790222e-05, -2.7604401111602783e-05, -1.7914921045303345e-05, -8.225440979003906e-06, 1.4640390872955322e-06, 1.115351915359497e-05, 2.084299921989441e-05, 3.053247928619385e-05, 4.0221959352493286e-05, 4.9911439418792725e-05, 5.960091948509216e-05, 6.92903995513916e-05, 7.897987961769104e-05, 8.866935968399048e-05, 9.835883975028992e-05, 0.00010804831981658936, 0.0001177377998828888, 0.00012742727994918823, 0.00013711676001548767, 0.0001468062400817871, 0.00015649572014808655, 0.00016618520021438599, 0.00017587468028068542, 0.00018556416034698486, 0.0001952536404132843, 0.00020494312047958374, 0.00021463260054588318, 0.00022432208061218262, 0.00023401156067848206, 0.0002437010407447815, 0.00025339052081108093, 0.00026308000087738037, 0.0002727694809436798, 0.00028245896100997925, 0.0002921484410762787, 0.0003018379211425781]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 16.0, 12.0, 19.0, 38.0, 55.0, 138.0, 316.0, 837.0, 2704.0, 12402.0, 95218.0, 759548.0, 153990.0, 17957.0, 3542.0, 1015.0, 394.0, 164.0, 72.0, 43.0, 28.0, 19.0, 4.0, 8.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2538299560546875, -1.219573974609375, -1.1853179931640625, -1.15106201171875, -1.1168060302734375, -1.082550048828125, -1.0482940673828125, -1.0140380859375, -0.9797821044921875, -0.945526123046875, -0.9112701416015625, -0.87701416015625, -0.8427581787109375, -0.808502197265625, -0.7742462158203125, -0.739990234375, -0.7057342529296875, -0.671478271484375, -0.6372222900390625, -0.60296630859375, -0.5687103271484375, -0.534454345703125, -0.5001983642578125, -0.4659423828125, -0.4316864013671875, -0.397430419921875, -0.3631744384765625, -0.32891845703125, -0.2946624755859375, -0.260406494140625, -0.2261505126953125, -0.19189453125, -0.1576385498046875, -0.123382568359375, -0.0891265869140625, -0.05487060546875, -0.0206146240234375, 0.013641357421875, 0.0478973388671875, 0.0821533203125, 0.1164093017578125, 0.150665283203125, 0.1849212646484375, 0.21917724609375, 0.2534332275390625, 0.287689208984375, 0.3219451904296875, 0.356201171875, 0.3904571533203125, 0.424713134765625, 0.4589691162109375, 0.49322509765625, 0.5274810791015625, 0.561737060546875, 0.5959930419921875, 0.6302490234375, 0.6645050048828125, 0.698760986328125, 0.7330169677734375, 0.76727294921875, 0.8015289306640625, 0.835784912109375, 0.8700408935546875, 0.904296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 5.0, 13.0, 15.0, 32.0, 20.0, 33.0, 49.0, 48.0, 62.0, 69.0, 82.0, 98.0, 89.0, 75.0, 63.0, 54.0, 46.0, 24.0, 33.0, 21.0, 21.0, 12.0, 8.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8984375, -0.8707733154296875, -0.843109130859375, -0.8154449462890625, -0.78778076171875, -0.7601165771484375, -0.732452392578125, -0.7047882080078125, -0.6771240234375, -0.6494598388671875, -0.621795654296875, -0.5941314697265625, -0.56646728515625, -0.5388031005859375, -0.511138916015625, -0.4834747314453125, -0.455810546875, -0.4281463623046875, -0.400482177734375, -0.3728179931640625, -0.34515380859375, -0.3174896240234375, -0.289825439453125, -0.2621612548828125, -0.2344970703125, -0.2068328857421875, -0.179168701171875, -0.1515045166015625, -0.12384033203125, -0.0961761474609375, -0.068511962890625, -0.0408477783203125, -0.01318359375, 0.0144805908203125, 0.042144775390625, 0.0698089599609375, 0.09747314453125, 0.1251373291015625, 0.152801513671875, 0.1804656982421875, 0.2081298828125, 0.2357940673828125, 0.263458251953125, 0.2911224365234375, 0.31878662109375, 0.3464508056640625, 0.374114990234375, 0.4017791748046875, 0.429443359375, 0.4571075439453125, 0.484771728515625, 0.5124359130859375, 0.54010009765625, 0.5677642822265625, 0.595428466796875, 0.6230926513671875, 0.6507568359375, 0.6784210205078125, 0.706085205078125, 0.7337493896484375, 0.76141357421875, 0.7890777587890625, 0.816741943359375, 0.8444061279296875, 0.8720703125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 7.0, 16.0, 13.0, 36.0, 54.0, 79.0, 128.0, 217.0, 157.0, 93.0, 51.0, 54.0, 34.0, 18.0, 10.0, 5.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.331497192382812, -12.849333763122559, -12.367170333862305, -11.885005950927734, -11.40284252166748, -10.920679092407227, -10.438515663146973, -9.956352233886719, -9.474187850952148, -8.992024421691895, -8.50986099243164, -8.02769660949707, -7.545533180236816, -7.0633697509765625, -6.581206321716309, -6.099042892456055, -5.616879463195801, -5.134716033935547, -4.652552127838135, -4.170388698577881, -3.688225030899048, -3.206061363220215, -2.723897933959961, -2.241734266281128, -1.759570598602295, -1.277406930923462, -0.7952433824539185, -0.313079833984375, 0.169083833694458, 0.651247501373291, 1.133410930633545, 1.615574598312378, 2.097738265991211, 2.579901933670044, 3.062065601348877, 3.544229030609131, 4.026392936706543, 4.508556365966797, 4.990719795227051, 5.472883224487305, 5.955047130584717, 6.437210559844971, 6.919374465942383, 7.401537895202637, 7.883701324462891, 8.365865707397461, 8.848028182983398, 9.330192565917969, 9.812355995178223, 10.294519424438477, 10.77668285369873, 11.258846282958984, 11.741010665893555, 12.223174095153809, 12.705337524414062, 13.187500953674316, 13.66966438293457, 14.151827812194824, 14.633991241455078, 15.116155624389648, 15.598319053649902, 16.080482482910156, 16.562644958496094, 17.044809341430664, 17.526973724365234]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 2.0, 4.0, 4.0, 8.0, 7.0, 9.0, 8.0, 7.0, 12.0, 7.0, 14.0, 18.0, 26.0, 18.0, 27.0, 25.0, 27.0, 31.0, 39.0, 50.0, 46.0, 63.0, 76.0, 65.0, 54.0, 49.0, 29.0, 24.0, 22.0, 26.0, 25.0, 23.0, 22.0, 16.0, 24.0, 16.0, 13.0, 18.0, 5.0, 8.0, 6.0, 5.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.22567367553711, -9.891401290893555, -9.55712890625, -9.222856521606445, -8.88858413696289, -8.554311752319336, -8.220039367675781, -7.885766983032227, -7.551494598388672, -7.217222213745117, -6.8829498291015625, -6.548677444458008, -6.214405059814453, -5.880132675170898, -5.545860290527344, -5.211587905883789, -4.877315044403076, -4.5430426597595215, -4.208770275115967, -3.874497890472412, -3.5402255058288574, -3.2059531211853027, -2.871680498123169, -2.5374081134796143, -2.2031357288360596, -1.8688633441925049, -1.5345909595489502, -1.200318455696106, -0.8660460710525513, -0.5317736864089966, -0.19750118255615234, 0.13677120208740234, 0.47104358673095703, 0.8053159713745117, 1.1395883560180664, 1.4738608598709106, 1.8081332445144653, 2.1424055099487305, 2.4766781330108643, 2.810950517654419, 3.1452229022979736, 3.4794952869415283, 3.813767671585083, 4.148040294647217, 4.4823126792907715, 4.816585063934326, 5.150857448577881, 5.4851298332214355, 5.81940221786499, 6.153674602508545, 6.4879469871521, 6.822219371795654, 7.156491756439209, 7.490764141082764, 7.825037002563477, 8.159309387207031, 8.493581771850586, 8.82785415649414, 9.162126541137695, 9.49639892578125, 9.830671310424805, 10.16494369506836, 10.499216079711914, 10.833488464355469, 11.167760848999023]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 12.0, 21.0, 33.0, 40.0, 54.0, 72.0, 95.0, 135.0, 229.0, 314.0, 544.0, 942.0, 1663.0, 3237.0, 6765.0, 16306.0, 56966.0, 357909.0, 2612663.0, 973137.0, 117845.0, 25971.0, 9667.0, 4363.0, 2145.0, 1252.0, 722.0, 366.0, 259.0, 179.0, 87.0, 61.0, 54.0, 43.0, 33.0, 27.0, 16.0, 10.0, 12.0, 6.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.009765625, -0.9733428955078125, -0.936920166015625, -0.9004974365234375, -0.86407470703125, -0.8276519775390625, -0.791229248046875, -0.7548065185546875, -0.7183837890625, -0.6819610595703125, -0.645538330078125, -0.6091156005859375, -0.57269287109375, -0.5362701416015625, -0.499847412109375, -0.4634246826171875, -0.427001953125, -0.3905792236328125, -0.354156494140625, -0.3177337646484375, -0.28131103515625, -0.2448883056640625, -0.208465576171875, -0.1720428466796875, -0.1356201171875, -0.0991973876953125, -0.062774658203125, -0.0263519287109375, 0.01007080078125, 0.0464935302734375, 0.082916259765625, 0.1193389892578125, 0.15576171875, 0.1921844482421875, 0.228607177734375, 0.2650299072265625, 0.30145263671875, 0.3378753662109375, 0.374298095703125, 0.4107208251953125, 0.4471435546875, 0.4835662841796875, 0.519989013671875, 0.5564117431640625, 0.59283447265625, 0.6292572021484375, 0.665679931640625, 0.7021026611328125, 0.738525390625, 0.7749481201171875, 0.811370849609375, 0.8477935791015625, 0.88421630859375, 0.9206390380859375, 0.957061767578125, 0.9934844970703125, 1.0299072265625, 1.0663299560546875, 1.102752685546875, 1.1391754150390625, 1.17559814453125, 1.2120208740234375, 1.248443603515625, 1.2848663330078125, 1.3212890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 6.0, 7.0, 9.0, 6.0, 5.0, 10.0, 10.0, 11.0, 12.0, 19.0, 20.0, 31.0, 26.0, 31.0, 36.0, 43.0, 34.0, 41.0, 32.0, 31.0, 33.0, 47.0, 35.0, 53.0, 49.0, 39.0, 49.0, 32.0, 32.0, 25.0, 30.0, 20.0, 22.0, 20.0, 17.0, 18.0, 14.0, 10.0, 8.0, 5.0, 3.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7724609375, -0.7482147216796875, -0.723968505859375, -0.6997222900390625, -0.67547607421875, -0.6512298583984375, -0.626983642578125, -0.6027374267578125, -0.5784912109375, -0.5542449951171875, -0.529998779296875, -0.5057525634765625, -0.48150634765625, -0.4572601318359375, -0.433013916015625, -0.4087677001953125, -0.384521484375, -0.3602752685546875, -0.336029052734375, -0.3117828369140625, -0.28753662109375, -0.2632904052734375, -0.239044189453125, -0.2147979736328125, -0.1905517578125, -0.1663055419921875, -0.142059326171875, -0.1178131103515625, -0.09356689453125, -0.0693206787109375, -0.045074462890625, -0.0208282470703125, 0.00341796875, 0.0276641845703125, 0.051910400390625, 0.0761566162109375, 0.10040283203125, 0.1246490478515625, 0.148895263671875, 0.1731414794921875, 0.1973876953125, 0.2216339111328125, 0.245880126953125, 0.2701263427734375, 0.29437255859375, 0.3186187744140625, 0.342864990234375, 0.3671112060546875, 0.391357421875, 0.4156036376953125, 0.439849853515625, 0.4640960693359375, 0.48834228515625, 0.5125885009765625, 0.536834716796875, 0.5610809326171875, 0.5853271484375, 0.6095733642578125, 0.633819580078125, 0.6580657958984375, 0.68231201171875, 0.7065582275390625, 0.730804443359375, 0.7550506591796875, 0.779296875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 5.0, 2.0, 18.0, 23.0, 28.0, 44.0, 57.0, 125.0, 299.0, 693.0, 2051.0, 7706.0, 46313.0, 2200385.0, 1882987.0, 42966.0, 7302.0, 1976.0, 645.0, 290.0, 141.0, 74.0, 42.0, 28.0, 29.0, 15.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.984375, -2.899078369140625, -2.81378173828125, -2.728485107421875, -2.6431884765625, -2.557891845703125, -2.47259521484375, -2.387298583984375, -2.302001953125, -2.216705322265625, -2.13140869140625, -2.046112060546875, -1.9608154296875, -1.875518798828125, -1.79022216796875, -1.704925537109375, -1.61962890625, -1.534332275390625, -1.44903564453125, -1.363739013671875, -1.2784423828125, -1.193145751953125, -1.10784912109375, -1.022552490234375, -0.937255859375, -0.851959228515625, -0.76666259765625, -0.681365966796875, -0.5960693359375, -0.510772705078125, -0.42547607421875, -0.340179443359375, -0.2548828125, -0.169586181640625, -0.08428955078125, 0.001007080078125, 0.0863037109375, 0.171600341796875, 0.25689697265625, 0.342193603515625, 0.427490234375, 0.512786865234375, 0.59808349609375, 0.683380126953125, 0.7686767578125, 0.853973388671875, 0.93927001953125, 1.024566650390625, 1.10986328125, 1.195159912109375, 1.28045654296875, 1.365753173828125, 1.4510498046875, 1.536346435546875, 1.62164306640625, 1.706939697265625, 1.792236328125, 1.877532958984375, 1.96282958984375, 2.048126220703125, 2.1334228515625, 2.218719482421875, 2.30401611328125, 2.389312744140625, 2.474609375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 7.0, 3.0, 10.0, 26.0, 17.0, 23.0, 47.0, 68.0, 103.0, 212.0, 469.0, 979.0, 1059.0, 517.0, 218.0, 119.0, 63.0, 45.0, 23.0, 22.0, 8.0, 11.0, 4.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9892578125, -1.9129791259765625, -1.836700439453125, -1.7604217529296875, -1.68414306640625, -1.6078643798828125, -1.531585693359375, -1.4553070068359375, -1.3790283203125, -1.3027496337890625, -1.226470947265625, -1.1501922607421875, -1.07391357421875, -0.9976348876953125, -0.921356201171875, -0.8450775146484375, -0.768798828125, -0.6925201416015625, -0.616241455078125, -0.5399627685546875, -0.46368408203125, -0.3874053955078125, -0.311126708984375, -0.2348480224609375, -0.1585693359375, -0.0822906494140625, -0.006011962890625, 0.0702667236328125, 0.14654541015625, 0.2228240966796875, 0.299102783203125, 0.3753814697265625, 0.45166015625, 0.5279388427734375, 0.604217529296875, 0.6804962158203125, 0.75677490234375, 0.8330535888671875, 0.909332275390625, 0.9856109619140625, 1.0618896484375, 1.1381683349609375, 1.214447021484375, 1.2907257080078125, 1.36700439453125, 1.4432830810546875, 1.519561767578125, 1.5958404541015625, 1.672119140625, 1.7483978271484375, 1.824676513671875, 1.9009552001953125, 1.97723388671875, 2.0535125732421875, 2.129791259765625, 2.2060699462890625, 2.2823486328125, 2.3586273193359375, 2.434906005859375, 2.5111846923828125, 2.58746337890625, 2.6637420654296875, 2.740020751953125, 2.8162994384765625, 2.892578125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 5.0, 15.0, 22.0, 47.0, 85.0, 167.0, 257.0, 192.0, 93.0, 62.0, 24.0, 13.0, 6.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.713455200195312, -20.100908279418945, -19.48836326599121, -18.875816345214844, -18.26327133178711, -17.650724411010742, -17.038177490234375, -16.42563247680664, -15.813085556030273, -15.200539588928223, -14.587993621826172, -13.975446701049805, -13.362900733947754, -12.750354766845703, -12.137808799743652, -11.525262832641602, -10.91271686553955, -10.3001708984375, -9.68762493133545, -9.075078964233398, -8.462532043457031, -7.8499860763549805, -7.23744010925293, -6.624893665313721, -6.01234769821167, -5.399801731109619, -4.78725528717041, -4.174709320068359, -3.5621631145477295, -2.9496169090270996, -2.337070941925049, -1.7245244979858398, -1.111978530883789, -0.49943238496780396, 0.11311376094818115, 0.7256598472595215, 1.3382060527801514, 1.9507522583007812, 2.563298225402832, 3.175844669342041, 3.788390636444092, 4.400936603546143, 5.013483047485352, 5.626029014587402, 6.238574981689453, 6.851121425628662, 7.463667392730713, 8.076213836669922, 8.688759803771973, 9.301305770874023, 9.913851737976074, 10.526397705078125, 11.138944625854492, 11.751490592956543, 12.364036560058594, 12.976583480834961, 13.589128494262695, 14.201674461364746, 14.814220428466797, 15.426767349243164, 16.0393123626709, 16.651859283447266, 17.264404296875, 17.876951217651367, 18.489498138427734]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 4.0, 13.0, 17.0, 14.0, 13.0, 18.0, 19.0, 24.0, 32.0, 26.0, 45.0, 44.0, 42.0, 49.0, 52.0, 45.0, 57.0, 42.0, 66.0, 35.0, 44.0, 46.0, 31.0, 43.0, 29.0, 31.0, 24.0, 14.0, 16.0, 11.0, 14.0, 9.0, 9.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.31397819519043, -9.049446105957031, -8.784913063049316, -8.520380973815918, -8.255847930908203, -7.991315841674805, -7.726783275604248, -7.462250709533691, -7.197718143463135, -6.933185577392578, -6.6686530113220215, -6.404120445251465, -6.139588356018066, -5.875055313110352, -5.610523223876953, -5.3459906578063965, -5.08145809173584, -4.816925525665283, -4.552392959594727, -4.28786039352417, -4.023327827453613, -3.7587954998016357, -3.494263172149658, -3.2297306060791016, -2.965198040008545, -2.7006654739379883, -2.4361329078674316, -2.171600580215454, -1.9070680141448975, -1.6425354480743408, -1.3780030012130737, -1.1134705543518066, -0.8489370346069336, -0.5844045281410217, -0.31987202167510986, -0.055339515209198, 0.20919299125671387, 0.4737255573272705, 0.7382580041885376, 1.0027904510498047, 1.2673230171203613, 1.531855583190918, 1.796388030052185, 2.060920476913452, 2.325453042984009, 2.5899856090545654, 2.854517936706543, 3.1190505027770996, 3.3835830688476562, 3.648115634918213, 3.9126482009887695, 4.177180767059326, 4.441713333129883, 4.706245422363281, 4.970777988433838, 5.2353105545043945, 5.499843120574951, 5.764375686645508, 6.0289082527160645, 6.293440818786621, 6.5579729080200195, 6.822505950927734, 7.087038040161133, 7.3515706062316895, 7.616103172302246]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 10.0, 9.0, 18.0, 23.0, 37.0, 54.0, 76.0, 114.0, 175.0, 206.0, 333.0, 520.0, 805.0, 1312.0, 2234.0, 3750.0, 6773.0, 12748.0, 25508.0, 54246.0, 122987.0, 276508.0, 291662.0, 132540.0, 57889.0, 27259.0, 13629.0, 7072.0, 3866.0, 2334.0, 1352.0, 850.0, 534.0, 375.0, 231.0, 168.0, 107.0, 77.0, 41.0, 36.0, 23.0, 22.0, 10.0, 5.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.134124755859375, -1.09637451171875, -1.058624267578125, -1.0208740234375, -0.983123779296875, -0.94537353515625, -0.907623291015625, -0.869873046875, -0.832122802734375, -0.79437255859375, -0.756622314453125, -0.7188720703125, -0.681121826171875, -0.64337158203125, -0.605621337890625, -0.56787109375, -0.530120849609375, -0.49237060546875, -0.454620361328125, -0.4168701171875, -0.379119873046875, -0.34136962890625, -0.303619384765625, -0.265869140625, -0.228118896484375, -0.19036865234375, -0.152618408203125, -0.1148681640625, -0.077117919921875, -0.03936767578125, -0.001617431640625, 0.0361328125, 0.073883056640625, 0.11163330078125, 0.149383544921875, 0.1871337890625, 0.224884033203125, 0.26263427734375, 0.300384521484375, 0.338134765625, 0.375885009765625, 0.41363525390625, 0.451385498046875, 0.4891357421875, 0.526885986328125, 0.56463623046875, 0.602386474609375, 0.64013671875, 0.677886962890625, 0.71563720703125, 0.753387451171875, 0.7911376953125, 0.828887939453125, 0.86663818359375, 0.904388427734375, 0.942138671875, 0.979888916015625, 1.01763916015625, 1.055389404296875, 1.0931396484375, 1.130889892578125, 1.16864013671875, 1.206390380859375, 1.244140625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 3.0, 7.0, 15.0, 10.0, 15.0, 13.0, 11.0, 15.0, 15.0, 32.0, 32.0, 21.0, 29.0, 36.0, 29.0, 40.0, 35.0, 35.0, 38.0, 51.0, 42.0, 37.0, 34.0, 48.0, 37.0, 43.0, 35.0, 30.0, 27.0, 15.0, 26.0, 22.0, 24.0, 23.0, 15.0, 11.0, 11.0, 6.0, 7.0, 5.0, 1.0, 7.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.71044921875, -0.68707275390625, -0.6636962890625, -0.64031982421875, -0.616943359375, -0.59356689453125, -0.5701904296875, -0.54681396484375, -0.5234375, -0.50006103515625, -0.4766845703125, -0.45330810546875, -0.429931640625, -0.40655517578125, -0.3831787109375, -0.35980224609375, -0.33642578125, -0.31304931640625, -0.2896728515625, -0.26629638671875, -0.242919921875, -0.21954345703125, -0.1961669921875, -0.17279052734375, -0.1494140625, -0.12603759765625, -0.1026611328125, -0.07928466796875, -0.055908203125, -0.03253173828125, -0.0091552734375, 0.01422119140625, 0.03759765625, 0.06097412109375, 0.0843505859375, 0.10772705078125, 0.131103515625, 0.15447998046875, 0.1778564453125, 0.20123291015625, 0.224609375, 0.24798583984375, 0.2713623046875, 0.29473876953125, 0.318115234375, 0.34149169921875, 0.3648681640625, 0.38824462890625, 0.41162109375, 0.43499755859375, 0.4583740234375, 0.48175048828125, 0.505126953125, 0.52850341796875, 0.5518798828125, 0.57525634765625, 0.5986328125, 0.62200927734375, 0.6453857421875, 0.66876220703125, 0.692138671875, 0.71551513671875, 0.7388916015625, 0.76226806640625, 0.78564453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 8.0, 7.0, 9.0, 10.0, 17.0, 33.0, 38.0, 40.0, 75.0, 127.0, 146.0, 224.0, 432.0, 711.0, 1320.0, 2794.0, 7078.0, 24227.0, 114454.0, 689434.0, 160329.0, 31500.0, 8855.0, 3260.0, 1444.0, 759.0, 432.0, 266.0, 160.0, 117.0, 76.0, 40.0, 35.0, 25.0, 19.0, 19.0, 7.0, 6.0, 5.0, 6.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.326171875, -2.2589263916015625, -2.191680908203125, -2.1244354248046875, -2.05718994140625, -1.9899444580078125, -1.922698974609375, -1.8554534912109375, -1.7882080078125, -1.7209625244140625, -1.653717041015625, -1.5864715576171875, -1.51922607421875, -1.4519805908203125, -1.384735107421875, -1.3174896240234375, -1.250244140625, -1.1829986572265625, -1.115753173828125, -1.0485076904296875, -0.98126220703125, -0.9140167236328125, -0.846771240234375, -0.7795257568359375, -0.7122802734375, -0.6450347900390625, -0.577789306640625, -0.5105438232421875, -0.44329833984375, -0.3760528564453125, -0.308807373046875, -0.2415618896484375, -0.17431640625, -0.1070709228515625, -0.039825439453125, 0.0274200439453125, 0.09466552734375, 0.1619110107421875, 0.229156494140625, 0.2964019775390625, 0.3636474609375, 0.4308929443359375, 0.498138427734375, 0.5653839111328125, 0.63262939453125, 0.6998748779296875, 0.767120361328125, 0.8343658447265625, 0.901611328125, 0.9688568115234375, 1.036102294921875, 1.1033477783203125, 1.17059326171875, 1.2378387451171875, 1.305084228515625, 1.3723297119140625, 1.4395751953125, 1.5068206787109375, 1.574066162109375, 1.6413116455078125, 1.70855712890625, 1.7758026123046875, 1.843048095703125, 1.9102935791015625, 1.9775390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 3.0, 6.0, 9.0, 12.0, 9.0, 24.0, 30.0, 29.0, 41.0, 50.0, 53.0, 53.0, 59.0, 62.0, 66.0, 62.0, 53.0, 52.0, 48.0, 56.0, 46.0, 30.0, 30.0, 32.0, 19.0, 13.0, 15.0, 7.0, 1.0, 6.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.2265625, -4.115997314453125, -4.00543212890625, -3.894866943359375, -3.7843017578125, -3.673736572265625, -3.56317138671875, -3.452606201171875, -3.342041015625, -3.231475830078125, -3.12091064453125, -3.010345458984375, -2.8997802734375, -2.789215087890625, -2.67864990234375, -2.568084716796875, -2.45751953125, -2.346954345703125, -2.23638916015625, -2.125823974609375, -2.0152587890625, -1.904693603515625, -1.79412841796875, -1.683563232421875, -1.572998046875, -1.462432861328125, -1.35186767578125, -1.241302490234375, -1.1307373046875, -1.020172119140625, -0.90960693359375, -0.799041748046875, -0.6884765625, -0.577911376953125, -0.46734619140625, -0.356781005859375, -0.2462158203125, -0.135650634765625, -0.02508544921875, 0.085479736328125, 0.196044921875, 0.306610107421875, 0.41717529296875, 0.527740478515625, 0.6383056640625, 0.748870849609375, 0.85943603515625, 0.970001220703125, 1.08056640625, 1.191131591796875, 1.30169677734375, 1.412261962890625, 1.5228271484375, 1.633392333984375, 1.74395751953125, 1.854522705078125, 1.965087890625, 2.075653076171875, 2.18621826171875, 2.296783447265625, 2.4073486328125, 2.517913818359375, 2.62847900390625, 2.739044189453125, 2.849609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 5.0, 6.0, 9.0, 11.0, 10.0, 16.0, 26.0, 46.0, 65.0, 108.0, 181.0, 341.0, 703.0, 1593.0, 4422.0, 15898.0, 81536.0, 753646.0, 153973.0, 25429.0, 6518.0, 2120.0, 904.0, 420.0, 204.0, 120.0, 70.0, 63.0, 48.0, 23.0, 13.0, 9.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7001953125, -0.6773529052734375, -0.654510498046875, -0.6316680908203125, -0.60882568359375, -0.5859832763671875, -0.563140869140625, -0.5402984619140625, -0.5174560546875, -0.4946136474609375, -0.471771240234375, -0.4489288330078125, -0.42608642578125, -0.4032440185546875, -0.380401611328125, -0.3575592041015625, -0.334716796875, -0.3118743896484375, -0.289031982421875, -0.2661895751953125, -0.24334716796875, -0.2205047607421875, -0.197662353515625, -0.1748199462890625, -0.1519775390625, -0.1291351318359375, -0.106292724609375, -0.0834503173828125, -0.06060791015625, -0.0377655029296875, -0.014923095703125, 0.0079193115234375, 0.03076171875, 0.0536041259765625, 0.076446533203125, 0.0992889404296875, 0.12213134765625, 0.1449737548828125, 0.167816162109375, 0.1906585693359375, 0.2135009765625, 0.2363433837890625, 0.259185791015625, 0.2820281982421875, 0.30487060546875, 0.3277130126953125, 0.350555419921875, 0.3733978271484375, 0.396240234375, 0.4190826416015625, 0.441925048828125, 0.4647674560546875, 0.48760986328125, 0.5104522705078125, 0.533294677734375, 0.5561370849609375, 0.5789794921875, 0.6018218994140625, 0.624664306640625, 0.6475067138671875, 0.67034912109375, 0.6931915283203125, 0.716033935546875, 0.7388763427734375, 0.76171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 9.0, 2.0, 8.0, 16.0, 12.0, 17.0, 22.0, 31.0, 35.0, 61.0, 40.0, 66.0, 95.0, 123.0, 111.0, 65.0, 58.0, 44.0, 39.0, 24.0, 21.0, 20.0, 12.0, 12.0, 8.0, 3.0, 9.0, 4.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014162063598632812, -0.000136692076921463, -0.0001317635178565979, -0.0001268349587917328, -0.00012190639972686768, -0.00011697784066200256, -0.00011204928159713745, -0.00010712072253227234, -0.00010219216346740723, -9.726360440254211e-05, -9.2335045337677e-05, -8.740648627281189e-05, -8.247792720794678e-05, -7.754936814308167e-05, -7.262080907821655e-05, -6.769225001335144e-05, -6.276369094848633e-05, -5.7835131883621216e-05, -5.2906572818756104e-05, -4.797801375389099e-05, -4.304945468902588e-05, -3.8120895624160767e-05, -3.3192336559295654e-05, -2.8263777494430542e-05, -2.333521842956543e-05, -1.8406659364700317e-05, -1.3478100299835205e-05, -8.549541234970093e-06, -3.6209821701049805e-06, 1.3075768947601318e-06, 6.236135959625244e-06, 1.1164695024490356e-05, 1.609325408935547e-05, 2.102181315422058e-05, 2.5950372219085693e-05, 3.0878931283950806e-05, 3.580749034881592e-05, 4.073604941368103e-05, 4.566460847854614e-05, 5.0593167543411255e-05, 5.552172660827637e-05, 6.045028567314148e-05, 6.537884473800659e-05, 7.03074038028717e-05, 7.523596286773682e-05, 8.016452193260193e-05, 8.509308099746704e-05, 9.002164006233215e-05, 9.495019912719727e-05, 9.987875819206238e-05, 0.00010480731725692749, 0.0001097358763217926, 0.00011466443538665771, 0.00011959299445152283, 0.00012452155351638794, 0.00012945011258125305, 0.00013437867164611816, 0.00013930723071098328, 0.0001442357897758484, 0.0001491643488407135, 0.0001540929079055786, 0.00015902146697044373, 0.00016395002603530884, 0.00016887858510017395, 0.00017380714416503906]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 8.0, 4.0, 1.0, 7.0, 5.0, 10.0, 18.0, 20.0, 43.0, 56.0, 123.0, 257.0, 411.0, 868.0, 2144.0, 6215.0, 26524.0, 232395.0, 715770.0, 49013.0, 9515.0, 2799.0, 1137.0, 541.0, 279.0, 153.0, 84.0, 48.0, 30.0, 25.0, 20.0, 6.0, 3.0, 5.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.791015625, -0.7664260864257812, -0.7418365478515625, -0.7172470092773438, -0.692657470703125, -0.6680679321289062, -0.6434783935546875, -0.6188888549804688, -0.59429931640625, -0.5697097778320312, -0.5451202392578125, -0.5205307006835938, -0.495941162109375, -0.47135162353515625, -0.4467620849609375, -0.42217254638671875, -0.3975830078125, -0.37299346923828125, -0.3484039306640625, -0.32381439208984375, -0.299224853515625, -0.27463531494140625, -0.2500457763671875, -0.22545623779296875, -0.20086669921875, -0.17627716064453125, -0.1516876220703125, -0.12709808349609375, -0.102508544921875, -0.07791900634765625, -0.0533294677734375, -0.02873992919921875, -0.004150390625, 0.02043914794921875, 0.0450286865234375, 0.06961822509765625, 0.094207763671875, 0.11879730224609375, 0.1433868408203125, 0.16797637939453125, 0.19256591796875, 0.21715545654296875, 0.2417449951171875, 0.26633453369140625, 0.290924072265625, 0.31551361083984375, 0.3401031494140625, 0.36469268798828125, 0.3892822265625, 0.41387176513671875, 0.4384613037109375, 0.46305084228515625, 0.487640380859375, 0.5122299194335938, 0.5368194580078125, 0.5614089965820312, 0.58599853515625, 0.6105880737304688, 0.6351776123046875, 0.6597671508789062, 0.684356689453125, 0.7089462280273438, 0.7335357666015625, 0.7581253051757812, 0.78271484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 15.0, 13.0, 37.0, 57.0, 85.0, 140.0, 180.0, 148.0, 105.0, 71.0, 41.0, 35.0, 22.0, 19.0, 6.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1689453125, -1.1321258544921875, -1.095306396484375, -1.0584869384765625, -1.02166748046875, -0.9848480224609375, -0.948028564453125, -0.9112091064453125, -0.8743896484375, -0.8375701904296875, -0.800750732421875, -0.7639312744140625, -0.72711181640625, -0.6902923583984375, -0.653472900390625, -0.6166534423828125, -0.579833984375, -0.5430145263671875, -0.506195068359375, -0.4693756103515625, -0.43255615234375, -0.3957366943359375, -0.358917236328125, -0.3220977783203125, -0.2852783203125, -0.2484588623046875, -0.211639404296875, -0.1748199462890625, -0.13800048828125, -0.1011810302734375, -0.064361572265625, -0.0275421142578125, 0.00927734375, 0.0460968017578125, 0.082916259765625, 0.1197357177734375, 0.15655517578125, 0.1933746337890625, 0.230194091796875, 0.2670135498046875, 0.3038330078125, 0.3406524658203125, 0.377471923828125, 0.4142913818359375, 0.45111083984375, 0.4879302978515625, 0.524749755859375, 0.5615692138671875, 0.598388671875, 0.6352081298828125, 0.672027587890625, 0.7088470458984375, 0.74566650390625, 0.7824859619140625, 0.819305419921875, 0.8561248779296875, 0.8929443359375, 0.9297637939453125, 0.966583251953125, 1.0034027099609375, 1.04022216796875, 1.0770416259765625, 1.113861083984375, 1.1506805419921875, 1.1875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 16.0, 21.0, 30.0, 55.0, 87.0, 148.0, 264.0, 126.0, 83.0, 54.0, 28.0, 22.0, 21.0, 11.0, 6.0, 6.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-16.689308166503906, -16.253013610839844, -15.816718101501465, -15.380422592163086, -14.944127082824707, -14.507831573486328, -14.071537017822266, -13.635241508483887, -13.198945999145508, -12.762650489807129, -12.326355934143066, -11.890060424804688, -11.453764915466309, -11.01746940612793, -10.581174850463867, -10.144879341125488, -9.70858383178711, -9.27228832244873, -8.835993766784668, -8.399698257446289, -7.96340274810791, -7.5271077156066895, -7.090812683105469, -6.65451717376709, -6.218222618103027, -5.781927585601807, -5.345632076263428, -4.909337043762207, -4.473041534423828, -4.036746501922607, -3.6004512310028076, -3.164155960083008, -2.727860450744629, -2.291565179824829, -1.8552699089050293, -1.418974757194519, -0.9826794862747192, -0.546384334564209, -0.11008906364440918, 0.3262062072753906, 0.7625014781951904, 1.1987967491149902, 1.63509202003479, 2.07138729095459, 2.5076823234558105, 2.9439775943756104, 3.38027286529541, 3.81656813621521, 4.25286340713501, 4.6891584396362305, 5.125453948974609, 5.56174898147583, 5.998044490814209, 6.43433952331543, 6.870635032653809, 7.306930065155029, 7.74322509765625, 8.179520606994629, 8.615815162658691, 9.05211067199707, 9.48840618133545, 9.924701690673828, 10.36099624633789, 10.79729175567627, 11.233587265014648]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 6.0, 10.0, 10.0, 11.0, 15.0, 31.0, 15.0, 28.0, 23.0, 23.0, 36.0, 42.0, 45.0, 54.0, 60.0, 116.0, 93.0, 49.0, 44.0, 39.0, 30.0, 27.0, 28.0, 31.0, 22.0, 13.0, 8.0, 12.0, 14.0, 14.0, 8.0, 11.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-13.936079025268555, -13.544151306152344, -13.152223587036133, -12.760295867919922, -12.368367195129395, -11.976439476013184, -11.584511756896973, -11.192584037780762, -10.800655364990234, -10.408727645874023, -10.016799926757812, -9.624872207641602, -9.232943534851074, -8.841015815734863, -8.449088096618652, -8.057160377502441, -7.6652326583862305, -7.2733049392700195, -6.88137674331665, -6.4894490242004395, -6.09752082824707, -5.705593109130859, -5.313665390014648, -4.9217376708984375, -4.529809474945068, -4.137881755828857, -3.7459535598754883, -3.3540258407592773, -2.9620978832244873, -2.5701699256896973, -2.1782422065734863, -1.7863142490386963, -1.3943853378295898, -1.0024573802947998, -0.6105295419692993, -0.21860170364379883, 0.1733262538909912, 0.5652542114257812, 0.9571819305419922, 1.3491098880767822, 1.7410378456115723, 2.1329658031463623, 2.5248937606811523, 2.9168214797973633, 3.3087494373321533, 3.7006773948669434, 4.092605113983154, 4.484533309936523, 4.876461029052734, 5.268388748168945, 5.6603169441223145, 6.052244663238525, 6.4441728591918945, 6.8361005783081055, 7.228028297424316, 7.619956016540527, 8.011884689331055, 8.403812408447266, 8.795740127563477, 9.187667846679688, 9.579596519470215, 9.971524238586426, 10.363451957702637, 10.755379676818848, 11.147307395935059]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 18.0, 14.0, 27.0, 27.0, 52.0, 73.0, 123.0, 190.0, 335.0, 597.0, 1075.0, 2230.0, 5053.0, 14265.0, 58412.0, 451304.0, 2717467.0, 816972.0, 94100.0, 19588.0, 6541.0, 2811.0, 1307.0, 659.0, 368.0, 227.0, 137.0, 82.0, 56.0, 57.0, 34.0, 20.0, 17.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.111328125, -1.073822021484375, -1.03631591796875, -0.998809814453125, -0.9613037109375, -0.923797607421875, -0.88629150390625, -0.848785400390625, -0.811279296875, -0.773773193359375, -0.73626708984375, -0.698760986328125, -0.6612548828125, -0.623748779296875, -0.58624267578125, -0.548736572265625, -0.51123046875, -0.473724365234375, -0.43621826171875, -0.398712158203125, -0.3612060546875, -0.323699951171875, -0.28619384765625, -0.248687744140625, -0.211181640625, -0.173675537109375, -0.13616943359375, -0.098663330078125, -0.0611572265625, -0.023651123046875, 0.01385498046875, 0.051361083984375, 0.0888671875, 0.126373291015625, 0.16387939453125, 0.201385498046875, 0.2388916015625, 0.276397705078125, 0.31390380859375, 0.351409912109375, 0.388916015625, 0.426422119140625, 0.46392822265625, 0.501434326171875, 0.5389404296875, 0.576446533203125, 0.61395263671875, 0.651458740234375, 0.68896484375, 0.726470947265625, 0.76397705078125, 0.801483154296875, 0.8389892578125, 0.876495361328125, 0.91400146484375, 0.951507568359375, 0.989013671875, 1.026519775390625, 1.06402587890625, 1.101531982421875, 1.1390380859375, 1.176544189453125, 1.21405029296875, 1.251556396484375, 1.2890625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 8.0, 14.0, 11.0, 14.0, 13.0, 17.0, 22.0, 17.0, 25.0, 33.0, 24.0, 34.0, 36.0, 45.0, 40.0, 28.0, 47.0, 52.0, 53.0, 40.0, 33.0, 37.0, 39.0, 39.0, 34.0, 39.0, 35.0, 24.0, 26.0, 23.0, 25.0, 17.0, 9.0, 7.0, 5.0, 7.0, 7.0, 3.0, 9.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.814453125, -0.7899246215820312, -0.7653961181640625, -0.7408676147460938, -0.716339111328125, -0.6918106079101562, -0.6672821044921875, -0.6427536010742188, -0.61822509765625, -0.5936965942382812, -0.5691680908203125, -0.5446395874023438, -0.520111083984375, -0.49558258056640625, -0.4710540771484375, -0.44652557373046875, -0.4219970703125, -0.39746856689453125, -0.3729400634765625, -0.34841156005859375, -0.323883056640625, -0.29935455322265625, -0.2748260498046875, -0.25029754638671875, -0.22576904296875, -0.20124053955078125, -0.1767120361328125, -0.15218353271484375, -0.127655029296875, -0.10312652587890625, -0.0785980224609375, -0.05406951904296875, -0.029541015625, -0.00501251220703125, 0.0195159912109375, 0.04404449462890625, 0.068572998046875, 0.09310150146484375, 0.1176300048828125, 0.14215850830078125, 0.16668701171875, 0.19121551513671875, 0.2157440185546875, 0.24027252197265625, 0.264801025390625, 0.28932952880859375, 0.3138580322265625, 0.33838653564453125, 0.3629150390625, 0.38744354248046875, 0.4119720458984375, 0.43650054931640625, 0.461029052734375, 0.48555755615234375, 0.5100860595703125, 0.5346145629882812, 0.55914306640625, 0.5836715698242188, 0.6082000732421875, 0.6327285766601562, 0.657257080078125, 0.6817855834960938, 0.7063140869140625, 0.7308425903320312, 0.75537109375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 0.0, 4.0, 4.0, 3.0, 2.0, 12.0, 7.0, 12.0, 29.0, 34.0, 42.0, 79.0, 161.0, 294.0, 664.0, 2158.0, 7947.0, 48523.0, 2216296.0, 1861102.0, 45454.0, 7820.0, 2184.0, 734.0, 319.0, 137.0, 85.0, 46.0, 45.0, 25.0, 21.0, 17.0, 7.0, 6.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.484375, -2.4090576171875, -2.333740234375, -2.2584228515625, -2.18310546875, -2.1077880859375, -2.032470703125, -1.9571533203125, -1.8818359375, -1.8065185546875, -1.731201171875, -1.6558837890625, -1.58056640625, -1.5052490234375, -1.429931640625, -1.3546142578125, -1.279296875, -1.2039794921875, -1.128662109375, -1.0533447265625, -0.97802734375, -0.9027099609375, -0.827392578125, -0.7520751953125, -0.6767578125, -0.6014404296875, -0.526123046875, -0.4508056640625, -0.37548828125, -0.3001708984375, -0.224853515625, -0.1495361328125, -0.07421875, 0.0010986328125, 0.076416015625, 0.1517333984375, 0.22705078125, 0.3023681640625, 0.377685546875, 0.4530029296875, 0.5283203125, 0.6036376953125, 0.678955078125, 0.7542724609375, 0.82958984375, 0.9049072265625, 0.980224609375, 1.0555419921875, 1.130859375, 1.2061767578125, 1.281494140625, 1.3568115234375, 1.43212890625, 1.5074462890625, 1.582763671875, 1.6580810546875, 1.7333984375, 1.8087158203125, 1.884033203125, 1.9593505859375, 2.03466796875, 2.1099853515625, 2.185302734375, 2.2606201171875, 2.3359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 6.0, 0.0, 3.0, 6.0, 6.0, 11.0, 18.0, 24.0, 39.0, 57.0, 96.0, 144.0, 281.0, 598.0, 1003.0, 839.0, 392.0, 218.0, 119.0, 74.0, 35.0, 22.0, 23.0, 21.0, 9.0, 7.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.544921875, -2.475738525390625, -2.40655517578125, -2.337371826171875, -2.2681884765625, -2.199005126953125, -2.12982177734375, -2.060638427734375, -1.991455078125, -1.922271728515625, -1.85308837890625, -1.783905029296875, -1.7147216796875, -1.645538330078125, -1.57635498046875, -1.507171630859375, -1.43798828125, -1.368804931640625, -1.29962158203125, -1.230438232421875, -1.1612548828125, -1.092071533203125, -1.02288818359375, -0.953704833984375, -0.884521484375, -0.815338134765625, -0.74615478515625, -0.676971435546875, -0.6077880859375, -0.538604736328125, -0.46942138671875, -0.400238037109375, -0.3310546875, -0.261871337890625, -0.19268798828125, -0.123504638671875, -0.0543212890625, 0.014862060546875, 0.08404541015625, 0.153228759765625, 0.222412109375, 0.291595458984375, 0.36077880859375, 0.429962158203125, 0.4991455078125, 0.568328857421875, 0.63751220703125, 0.706695556640625, 0.77587890625, 0.845062255859375, 0.91424560546875, 0.983428955078125, 1.0526123046875, 1.121795654296875, 1.19097900390625, 1.260162353515625, 1.329345703125, 1.398529052734375, 1.46771240234375, 1.536895751953125, 1.6060791015625, 1.675262451171875, 1.74444580078125, 1.813629150390625, 1.8828125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 43.0, 99.0, 284.0, 321.0, 158.0, 40.0, 21.0, 9.0, 11.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.12636947631836, -35.36076354980469, -34.59516143798828, -33.829559326171875, -33.0639533996582, -32.29834747314453, -31.532745361328125, -30.767141342163086, -30.001537322998047, -29.235933303833008, -28.47032928466797, -27.70472526550293, -26.93912124633789, -26.17351722717285, -25.407913208007812, -24.642309188842773, -23.876705169677734, -23.111101150512695, -22.345497131347656, -21.579893112182617, -20.814289093017578, -20.04868507385254, -19.2830810546875, -18.51747703552246, -17.751873016357422, -16.986268997192383, -16.220664978027344, -15.455060958862305, -14.689456939697266, -13.923852920532227, -13.158248901367188, -12.392644882202148, -11.62704086303711, -10.86143684387207, -10.095832824707031, -9.330228805541992, -8.564624786376953, -7.799020767211914, -7.033416748046875, -6.267812728881836, -5.502208709716797, -4.736604690551758, -3.9710006713867188, -3.2053966522216797, -2.4397926330566406, -1.6741886138916016, -0.9085845947265625, -0.14298057556152344, 0.6226234436035156, 1.3882274627685547, 2.1538314819335938, 2.919435501098633, 3.685039520263672, 4.450643539428711, 5.21624755859375, 5.981851577758789, 6.747455596923828, 7.513059616088867, 8.278663635253906, 9.044267654418945, 9.809871673583984, 10.575475692749023, 11.341079711914062, 12.106683731079102, 12.87228775024414]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 6.0, 9.0, 15.0, 11.0, 11.0, 16.0, 18.0, 24.0, 18.0, 28.0, 37.0, 39.0, 48.0, 31.0, 41.0, 48.0, 51.0, 51.0, 54.0, 45.0, 43.0, 38.0, 44.0, 31.0, 31.0, 34.0, 20.0, 15.0, 25.0, 22.0, 10.0, 7.0, 14.0, 10.0, 9.0, 7.0, 3.0, 3.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-6.457266807556152, -6.251025199890137, -6.044783592224121, -5.838541507720947, -5.632299900054932, -5.426058292388916, -5.219816207885742, -5.013574600219727, -4.807332992553711, -4.601091384887695, -4.39484977722168, -4.188607692718506, -3.9823660850524902, -3.7761244773864746, -3.56988263130188, -3.363640785217285, -3.1573991775512695, -2.951157569885254, -2.744915723800659, -2.5386738777160645, -2.332432270050049, -2.126190662384033, -1.9199488162994385, -1.7137070894241333, -1.5074653625488281, -1.301223635673523, -1.0949819087982178, -0.8887401819229126, -0.6824984550476074, -0.47625672817230225, -0.27001500129699707, -0.0637732744216919, 0.14246892929077148, 0.34871065616607666, 0.5549523830413818, 0.761194109916687, 0.9674358367919922, 1.1736775636672974, 1.3799192905426025, 1.5861610174179077, 1.792402744293213, 1.998644471168518, 2.2048861980438232, 2.411128044128418, 2.6173696517944336, 2.823611259460449, 3.029853105545044, 3.2360949516296387, 3.4423365592956543, 3.64857816696167, 3.8548200130462646, 4.061061859130859, 4.267303466796875, 4.473545074462891, 4.679786682128906, 4.88602876663208, 5.092270374298096, 5.298511981964111, 5.504754066467285, 5.710995674133301, 5.917237281799316, 6.123478889465332, 6.329720497131348, 6.5359625816345215, 6.742204189300537]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 7.0, 13.0, 20.0, 26.0, 32.0, 61.0, 102.0, 111.0, 174.0, 250.0, 370.0, 531.0, 898.0, 1415.0, 2227.0, 3727.0, 6667.0, 12690.0, 27454.0, 67152.0, 187711.0, 420290.0, 190945.0, 68009.0, 28087.0, 12918.0, 6560.0, 3861.0, 2214.0, 1353.0, 848.0, 615.0, 367.0, 266.0, 198.0, 120.0, 82.0, 66.0, 32.0, 35.0, 14.0, 9.0, 8.0, 5.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.59375, -1.5431671142578125, -1.492584228515625, -1.4420013427734375, -1.39141845703125, -1.3408355712890625, -1.290252685546875, -1.2396697998046875, -1.1890869140625, -1.1385040283203125, -1.087921142578125, -1.0373382568359375, -0.98675537109375, -0.9361724853515625, -0.885589599609375, -0.8350067138671875, -0.784423828125, -0.7338409423828125, -0.683258056640625, -0.6326751708984375, -0.58209228515625, -0.5315093994140625, -0.480926513671875, -0.4303436279296875, -0.3797607421875, -0.3291778564453125, -0.278594970703125, -0.2280120849609375, -0.17742919921875, -0.1268463134765625, -0.076263427734375, -0.0256805419921875, 0.02490234375, 0.0754852294921875, 0.126068115234375, 0.1766510009765625, 0.22723388671875, 0.2778167724609375, 0.328399658203125, 0.3789825439453125, 0.4295654296875, 0.4801483154296875, 0.530731201171875, 0.5813140869140625, 0.63189697265625, 0.6824798583984375, 0.733062744140625, 0.7836456298828125, 0.834228515625, 0.8848114013671875, 0.935394287109375, 0.9859771728515625, 1.03656005859375, 1.0871429443359375, 1.137725830078125, 1.1883087158203125, 1.2388916015625, 1.2894744873046875, 1.340057373046875, 1.3906402587890625, 1.44122314453125, 1.4918060302734375, 1.542388916015625, 1.5929718017578125, 1.6435546875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 5.0, 6.0, 8.0, 5.0, 8.0, 15.0, 13.0, 20.0, 17.0, 25.0, 22.0, 34.0, 29.0, 33.0, 39.0, 30.0, 34.0, 55.0, 50.0, 39.0, 53.0, 45.0, 38.0, 37.0, 33.0, 40.0, 36.0, 35.0, 35.0, 27.0, 27.0, 22.0, 20.0, 21.0, 11.0, 7.0, 6.0, 7.0, 1.0, 8.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7744140625, -0.7486953735351562, -0.7229766845703125, -0.6972579956054688, -0.671539306640625, -0.6458206176757812, -0.6201019287109375, -0.5943832397460938, -0.56866455078125, -0.5429458618164062, -0.5172271728515625, -0.49150848388671875, -0.465789794921875, -0.44007110595703125, -0.4143524169921875, -0.38863372802734375, -0.3629150390625, -0.33719635009765625, -0.3114776611328125, -0.28575897216796875, -0.260040283203125, -0.23432159423828125, -0.2086029052734375, -0.18288421630859375, -0.15716552734375, -0.13144683837890625, -0.1057281494140625, -0.08000946044921875, -0.054290771484375, -0.02857208251953125, -0.0028533935546875, 0.02286529541015625, 0.048583984375, 0.07430267333984375, 0.1000213623046875, 0.12574005126953125, 0.151458740234375, 0.17717742919921875, 0.2028961181640625, 0.22861480712890625, 0.25433349609375, 0.28005218505859375, 0.3057708740234375, 0.33148956298828125, 0.357208251953125, 0.38292694091796875, 0.4086456298828125, 0.43436431884765625, 0.4600830078125, 0.48580169677734375, 0.5115203857421875, 0.5372390747070312, 0.562957763671875, 0.5886764526367188, 0.6143951416015625, 0.6401138305664062, 0.66583251953125, 0.6915512084960938, 0.7172698974609375, 0.7429885864257812, 0.768707275390625, 0.7944259643554688, 0.8201446533203125, 0.8458633422851562, 0.87158203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 1.0, 1.0, 5.0, 11.0, 10.0, 11.0, 20.0, 20.0, 16.0, 22.0, 47.0, 54.0, 78.0, 110.0, 140.0, 189.0, 269.0, 370.0, 616.0, 1104.0, 2334.0, 5411.0, 17139.0, 78631.0, 747940.0, 152626.0, 26924.0, 7830.0, 2967.0, 1407.0, 767.0, 485.0, 282.0, 171.0, 140.0, 95.0, 76.0, 47.0, 44.0, 44.0, 25.0, 16.0, 15.0, 12.0, 7.0, 9.0, 5.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.564453125, -2.490478515625, -2.41650390625, -2.342529296875, -2.2685546875, -2.194580078125, -2.12060546875, -2.046630859375, -1.97265625, -1.898681640625, -1.82470703125, -1.750732421875, -1.6767578125, -1.602783203125, -1.52880859375, -1.454833984375, -1.380859375, -1.306884765625, -1.23291015625, -1.158935546875, -1.0849609375, -1.010986328125, -0.93701171875, -0.863037109375, -0.7890625, -0.715087890625, -0.64111328125, -0.567138671875, -0.4931640625, -0.419189453125, -0.34521484375, -0.271240234375, -0.197265625, -0.123291015625, -0.04931640625, 0.024658203125, 0.0986328125, 0.172607421875, 0.24658203125, 0.320556640625, 0.39453125, 0.468505859375, 0.54248046875, 0.616455078125, 0.6904296875, 0.764404296875, 0.83837890625, 0.912353515625, 0.986328125, 1.060302734375, 1.13427734375, 1.208251953125, 1.2822265625, 1.356201171875, 1.43017578125, 1.504150390625, 1.578125, 1.652099609375, 1.72607421875, 1.800048828125, 1.8740234375, 1.947998046875, 2.02197265625, 2.095947265625, 2.169921875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 10.0, 5.0, 8.0, 14.0, 10.0, 22.0, 24.0, 17.0, 22.0, 22.0, 32.0, 30.0, 32.0, 42.0, 40.0, 45.0, 63.0, 49.0, 63.0, 55.0, 46.0, 43.0, 38.0, 33.0, 25.0, 25.0, 20.0, 24.0, 23.0, 23.0, 10.0, 10.0, 12.0, 8.0, 18.0, 5.0, 8.0, 5.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.078125, -2.9903564453125, -2.902587890625, -2.8148193359375, -2.72705078125, -2.6392822265625, -2.551513671875, -2.4637451171875, -2.3759765625, -2.2882080078125, -2.200439453125, -2.1126708984375, -2.02490234375, -1.9371337890625, -1.849365234375, -1.7615966796875, -1.673828125, -1.5860595703125, -1.498291015625, -1.4105224609375, -1.32275390625, -1.2349853515625, -1.147216796875, -1.0594482421875, -0.9716796875, -0.8839111328125, -0.796142578125, -0.7083740234375, -0.62060546875, -0.5328369140625, -0.445068359375, -0.3572998046875, -0.26953125, -0.1817626953125, -0.093994140625, -0.0062255859375, 0.08154296875, 0.1693115234375, 0.257080078125, 0.3448486328125, 0.4326171875, 0.5203857421875, 0.608154296875, 0.6959228515625, 0.78369140625, 0.8714599609375, 0.959228515625, 1.0469970703125, 1.134765625, 1.2225341796875, 1.310302734375, 1.3980712890625, 1.48583984375, 1.5736083984375, 1.661376953125, 1.7491455078125, 1.8369140625, 1.9246826171875, 2.012451171875, 2.1002197265625, 2.18798828125, 2.2757568359375, 2.363525390625, 2.4512939453125, 2.5390625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 7.0, 3.0, 7.0, 19.0, 20.0, 23.0, 29.0, 59.0, 95.0, 135.0, 238.0, 380.0, 730.0, 1425.0, 3273.0, 9755.0, 39766.0, 282590.0, 639683.0, 51249.0, 11790.0, 3851.0, 1565.0, 795.0, 376.0, 239.0, 149.0, 97.0, 47.0, 34.0, 30.0, 19.0, 18.0, 8.0, 7.0, 11.0, 5.0, 4.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.598419189453125, -0.57916259765625, -0.559906005859375, -0.5406494140625, -0.521392822265625, -0.50213623046875, -0.482879638671875, -0.463623046875, -0.444366455078125, -0.42510986328125, -0.405853271484375, -0.3865966796875, -0.367340087890625, -0.34808349609375, -0.328826904296875, -0.3095703125, -0.290313720703125, -0.27105712890625, -0.251800537109375, -0.2325439453125, -0.213287353515625, -0.19403076171875, -0.174774169921875, -0.155517578125, -0.136260986328125, -0.11700439453125, -0.097747802734375, -0.0784912109375, -0.059234619140625, -0.03997802734375, -0.020721435546875, -0.00146484375, 0.017791748046875, 0.03704833984375, 0.056304931640625, 0.0755615234375, 0.094818115234375, 0.11407470703125, 0.133331298828125, 0.152587890625, 0.171844482421875, 0.19110107421875, 0.210357666015625, 0.2296142578125, 0.248870849609375, 0.26812744140625, 0.287384033203125, 0.306640625, 0.325897216796875, 0.34515380859375, 0.364410400390625, 0.3836669921875, 0.402923583984375, 0.42218017578125, 0.441436767578125, 0.460693359375, 0.479949951171875, 0.49920654296875, 0.518463134765625, 0.5377197265625, 0.556976318359375, 0.57623291015625, 0.595489501953125, 0.61474609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 7.0, 11.0, 14.0, 14.0, 28.0, 35.0, 61.0, 92.0, 124.0, 145.0, 149.0, 88.0, 62.0, 50.0, 34.0, 29.0, 11.0, 8.0, 12.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00028777122497558594, -0.00028052181005477905, -0.00027327239513397217, -0.0002660229802131653, -0.0002587735652923584, -0.0002515241503715515, -0.00024427473545074463, -0.00023702532052993774, -0.00022977590560913086, -0.00022252649068832397, -0.0002152770757675171, -0.0002080276608467102, -0.00020077824592590332, -0.00019352883100509644, -0.00018627941608428955, -0.00017903000116348267, -0.00017178058624267578, -0.0001645311713218689, -0.000157281756401062, -0.00015003234148025513, -0.00014278292655944824, -0.00013553351163864136, -0.00012828409671783447, -0.00012103468179702759, -0.0001137852668762207, -0.00010653585195541382, -9.928643703460693e-05, -9.203702211380005e-05, -8.478760719299316e-05, -7.753819227218628e-05, -7.02887773513794e-05, -6.303936243057251e-05, -5.5789947509765625e-05, -4.854053258895874e-05, -4.1291117668151855e-05, -3.404170274734497e-05, -2.6792287826538086e-05, -1.95428729057312e-05, -1.2293457984924316e-05, -5.044043064117432e-06, 2.205371856689453e-06, 9.454786777496338e-06, 1.6704201698303223e-05, 2.3953616619110107e-05, 3.120303153991699e-05, 3.845244646072388e-05, 4.570186138153076e-05, 5.2951276302337646e-05, 6.020069122314453e-05, 6.745010614395142e-05, 7.46995210647583e-05, 8.194893598556519e-05, 8.919835090637207e-05, 9.644776582717896e-05, 0.00010369718074798584, 0.00011094659566879272, 0.00011819601058959961, 0.0001254454255104065, 0.00013269484043121338, 0.00013994425535202026, 0.00014719367027282715, 0.00015444308519363403, 0.00016169250011444092, 0.0001689419150352478, 0.0001761913299560547]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 5.0, 3.0, 7.0, 10.0, 8.0, 15.0, 8.0, 30.0, 35.0, 49.0, 62.0, 89.0, 128.0, 222.0, 364.0, 635.0, 1458.0, 3490.0, 10073.0, 43685.0, 429673.0, 497415.0, 44367.0, 10202.0, 3483.0, 1340.0, 649.0, 380.0, 216.0, 126.0, 96.0, 58.0, 49.0, 30.0, 23.0, 21.0, 11.0, 13.0, 13.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.5947265625, -0.5767059326171875, -0.558685302734375, -0.5406646728515625, -0.52264404296875, -0.5046234130859375, -0.486602783203125, -0.4685821533203125, -0.4505615234375, -0.4325408935546875, -0.414520263671875, -0.3964996337890625, -0.37847900390625, -0.3604583740234375, -0.342437744140625, -0.3244171142578125, -0.306396484375, -0.2883758544921875, -0.270355224609375, -0.2523345947265625, -0.23431396484375, -0.2162933349609375, -0.198272705078125, -0.1802520751953125, -0.1622314453125, -0.1442108154296875, -0.126190185546875, -0.1081695556640625, -0.09014892578125, -0.0721282958984375, -0.054107666015625, -0.0360870361328125, -0.01806640625, -4.57763671875e-05, 0.017974853515625, 0.0359954833984375, 0.05401611328125, 0.0720367431640625, 0.090057373046875, 0.1080780029296875, 0.1260986328125, 0.1441192626953125, 0.162139892578125, 0.1801605224609375, 0.19818115234375, 0.2162017822265625, 0.234222412109375, 0.2522430419921875, 0.270263671875, 0.2882843017578125, 0.306304931640625, 0.3243255615234375, 0.34234619140625, 0.3603668212890625, 0.378387451171875, 0.3964080810546875, 0.4144287109375, 0.4324493408203125, 0.450469970703125, 0.4684906005859375, 0.48651123046875, 0.5045318603515625, 0.522552490234375, 0.5405731201171875, 0.55859375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 1.0, 8.0, 13.0, 12.0, 18.0, 15.0, 16.0, 26.0, 32.0, 37.0, 43.0, 55.0, 53.0, 59.0, 74.0, 60.0, 63.0, 67.0, 64.0, 38.0, 39.0, 33.0, 31.0, 18.0, 23.0, 14.0, 9.0, 12.0, 9.0, 14.0, 3.0, 4.0, 5.0, 0.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.4462890625, -0.43256378173828125, -0.4188385009765625, -0.40511322021484375, -0.391387939453125, -0.37766265869140625, -0.3639373779296875, -0.35021209716796875, -0.33648681640625, -0.32276153564453125, -0.3090362548828125, -0.29531097412109375, -0.281585693359375, -0.26786041259765625, -0.2541351318359375, -0.24040985107421875, -0.2266845703125, -0.21295928955078125, -0.1992340087890625, -0.18550872802734375, -0.171783447265625, -0.15805816650390625, -0.1443328857421875, -0.13060760498046875, -0.11688232421875, -0.10315704345703125, -0.0894317626953125, -0.07570648193359375, -0.061981201171875, -0.04825592041015625, -0.0345306396484375, -0.02080535888671875, -0.007080078125, 0.00664520263671875, 0.0203704833984375, 0.03409576416015625, 0.047821044921875, 0.06154632568359375, 0.0752716064453125, 0.08899688720703125, 0.10272216796875, 0.11644744873046875, 0.1301727294921875, 0.14389801025390625, 0.157623291015625, 0.17134857177734375, 0.1850738525390625, 0.19879913330078125, 0.2125244140625, 0.22624969482421875, 0.2399749755859375, 0.25370025634765625, 0.267425537109375, 0.28115081787109375, 0.2948760986328125, 0.30860137939453125, 0.32232666015625, 0.33605194091796875, 0.3497772216796875, 0.36350250244140625, 0.377227783203125, 0.39095306396484375, 0.4046783447265625, 0.41840362548828125, 0.43212890625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 11.0, 11.0, 23.0, 49.0, 97.0, 331.0, 227.0, 112.0, 53.0, 39.0, 25.0, 12.0, 7.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.293344497680664, -12.657795906066895, -12.022247314453125, -11.386699676513672, -10.751151084899902, -10.115602493286133, -9.48005485534668, -8.84450626373291, -8.20895767211914, -7.573409080505371, -6.93786096572876, -6.302312850952148, -5.666764259338379, -5.031215667724609, -4.395667552947998, -3.7601194381713867, -3.124570846557617, -2.4890224933624268, -1.8534741401672363, -1.217925786972046, -0.5823774337768555, 0.05317091941833496, 0.6887192726135254, 1.3242673873901367, 1.9598159790039062, 2.5953643321990967, 3.230912685394287, 3.8664610385894775, 4.502009391784668, 5.1375579833984375, 5.773106098175049, 6.40865421295166, 7.0442047119140625, 7.679753303527832, 8.315301895141602, 8.950849533081055, 9.586398124694824, 10.221946716308594, 10.857494354248047, 11.493042945861816, 12.128591537475586, 12.764140129089355, 13.399688720703125, 14.035236358642578, 14.670784950256348, 15.306333541870117, 15.94188117980957, 16.577430725097656, 17.21297836303711, 17.848526000976562, 18.48407554626465, 19.1196231842041, 19.755172729492188, 20.39072036743164, 21.026268005371094, 21.661815643310547, 22.297365188598633, 22.932912826538086, 23.568462371826172, 24.204010009765625, 24.839557647705078, 25.475107192993164, 26.110654830932617, 26.746204376220703, 27.381752014160156]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 4.0, 7.0, 8.0, 9.0, 7.0, 14.0, 13.0, 18.0, 12.0, 19.0, 19.0, 21.0, 20.0, 25.0, 30.0, 39.0, 35.0, 39.0, 68.0, 86.0, 128.0, 88.0, 42.0, 33.0, 28.0, 23.0, 14.0, 23.0, 17.0, 17.0, 19.0, 11.0, 9.0, 11.0, 9.0, 7.0, 5.0, 4.0, 2.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-9.808591842651367, -9.52204418182373, -9.235495567321777, -8.94894790649414, -8.662399291992188, -8.37585163116455, -8.089303970336914, -7.802755832672119, -7.516207695007324, -7.229659557342529, -6.943111419677734, -6.656563758850098, -6.370015621185303, -6.083467483520508, -5.796919822692871, -5.510371685028076, -5.223823547363281, -4.937275409698486, -4.650727272033691, -4.364179611206055, -4.07763147354126, -3.791083335876465, -3.504535436630249, -3.217987537384033, -2.9314393997192383, -2.6448912620544434, -2.3583433628082275, -2.0717954635620117, -1.7852473258972168, -1.4986993074417114, -1.212151288986206, -0.9256033897399902, -0.6390552520751953, -0.35250723361968994, -0.06595921516418457, 0.2205888032913208, 0.5071368217468262, 0.7936848402023315, 1.080232858657837, 1.3667807579040527, 1.6533288955688477, 1.939876914024353, 2.2264249324798584, 2.512972831726074, 2.799520969390869, 3.086069107055664, 3.37261700630188, 3.6591649055480957, 3.9457130432128906, 4.2322611808776855, 4.5188093185424805, 4.805356979370117, 5.091905117034912, 5.378453254699707, 5.665000915527344, 5.951549053192139, 6.238097190856934, 6.5246453285217285, 6.811193466186523, 7.09774112701416, 7.384289264678955, 7.67083740234375, 7.957385063171387, 8.243932723999023, 8.530481338500977]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 18.0, 31.0, 25.0, 51.0, 79.0, 107.0, 173.0, 266.0, 458.0, 827.0, 1513.0, 3283.0, 8334.0, 27599.0, 136975.0, 1365623.0, 2345134.0, 244145.0, 39880.0, 11158.0, 4269.0, 1904.0, 968.0, 558.0, 345.0, 178.0, 135.0, 69.0, 44.0, 38.0, 25.0, 18.0, 16.0, 11.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.98114013671875, -1.9154052734375, -1.84967041015625, -1.783935546875, -1.71820068359375, -1.6524658203125, -1.58673095703125, -1.52099609375, -1.45526123046875, -1.3895263671875, -1.32379150390625, -1.258056640625, -1.19232177734375, -1.1265869140625, -1.06085205078125, -0.9951171875, -0.92938232421875, -0.8636474609375, -0.79791259765625, -0.732177734375, -0.66644287109375, -0.6007080078125, -0.53497314453125, -0.46923828125, -0.40350341796875, -0.3377685546875, -0.27203369140625, -0.206298828125, -0.14056396484375, -0.0748291015625, -0.00909423828125, 0.056640625, 0.12237548828125, 0.1881103515625, 0.25384521484375, 0.319580078125, 0.38531494140625, 0.4510498046875, 0.51678466796875, 0.58251953125, 0.64825439453125, 0.7139892578125, 0.77972412109375, 0.845458984375, 0.91119384765625, 0.9769287109375, 1.04266357421875, 1.1083984375, 1.17413330078125, 1.2398681640625, 1.30560302734375, 1.371337890625, 1.43707275390625, 1.5028076171875, 1.56854248046875, 1.63427734375, 1.70001220703125, 1.7657470703125, 1.83148193359375, 1.897216796875, 1.96295166015625, 2.0286865234375, 2.09442138671875, 2.16015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 5.0, 8.0, 15.0, 9.0, 15.0, 23.0, 26.0, 29.0, 22.0, 26.0, 51.0, 41.0, 38.0, 43.0, 32.0, 53.0, 65.0, 54.0, 52.0, 37.0, 42.0, 35.0, 30.0, 35.0, 34.0, 28.0, 25.0, 23.0, 24.0, 16.0, 15.0, 9.0, 6.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.767578125, -0.7418289184570312, -0.7160797119140625, -0.6903305053710938, -0.664581298828125, -0.6388320922851562, -0.6130828857421875, -0.5873336791992188, -0.56158447265625, -0.5358352661132812, -0.5100860595703125, -0.48433685302734375, -0.458587646484375, -0.43283843994140625, -0.4070892333984375, -0.38134002685546875, -0.3555908203125, -0.32984161376953125, -0.3040924072265625, -0.27834320068359375, -0.252593994140625, -0.22684478759765625, -0.2010955810546875, -0.17534637451171875, -0.14959716796875, -0.12384796142578125, -0.0980987548828125, -0.07234954833984375, -0.046600341796875, -0.02085113525390625, 0.0048980712890625, 0.03064727783203125, 0.056396484375, 0.08214569091796875, 0.1078948974609375, 0.13364410400390625, 0.159393310546875, 0.18514251708984375, 0.2108917236328125, 0.23664093017578125, 0.26239013671875, 0.28813934326171875, 0.3138885498046875, 0.33963775634765625, 0.365386962890625, 0.39113616943359375, 0.4168853759765625, 0.44263458251953125, 0.4683837890625, 0.49413299560546875, 0.5198822021484375, 0.5456314086914062, 0.571380615234375, 0.5971298217773438, 0.6228790283203125, 0.6486282348632812, 0.67437744140625, 0.7001266479492188, 0.7258758544921875, 0.7516250610351562, 0.777374267578125, 0.8031234741210938, 0.8288726806640625, 0.8546218872070312, 0.88037109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 2.0, 6.0, 7.0, 12.0, 15.0, 16.0, 26.0, 38.0, 64.0, 90.0, 153.0, 259.0, 462.0, 959.0, 2372.0, 7865.0, 66454.0, 3787899.0, 305348.0, 15811.0, 3670.0, 1310.0, 615.0, 307.0, 175.0, 108.0, 75.0, 55.0, 40.0, 20.0, 15.0, 7.0, 6.0, 4.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-5.1640625, -5.027099609375, -4.89013671875, -4.753173828125, -4.6162109375, -4.479248046875, -4.34228515625, -4.205322265625, -4.068359375, -3.931396484375, -3.79443359375, -3.657470703125, -3.5205078125, -3.383544921875, -3.24658203125, -3.109619140625, -2.97265625, -2.835693359375, -2.69873046875, -2.561767578125, -2.4248046875, -2.287841796875, -2.15087890625, -2.013916015625, -1.876953125, -1.739990234375, -1.60302734375, -1.466064453125, -1.3291015625, -1.192138671875, -1.05517578125, -0.918212890625, -0.78125, -0.644287109375, -0.50732421875, -0.370361328125, -0.2333984375, -0.096435546875, 0.04052734375, 0.177490234375, 0.314453125, 0.451416015625, 0.58837890625, 0.725341796875, 0.8623046875, 0.999267578125, 1.13623046875, 1.273193359375, 1.41015625, 1.547119140625, 1.68408203125, 1.821044921875, 1.9580078125, 2.094970703125, 2.23193359375, 2.368896484375, 2.505859375, 2.642822265625, 2.77978515625, 2.916748046875, 3.0537109375, 3.190673828125, 3.32763671875, 3.464599609375, 3.6015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 6.0, 7.0, 8.0, 18.0, 27.0, 26.0, 40.0, 68.0, 77.0, 143.0, 228.0, 392.0, 591.0, 825.0, 588.0, 332.0, 226.0, 153.0, 87.0, 82.0, 51.0, 35.0, 22.0, 7.0, 10.0, 12.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.712890625, -2.610626220703125, -2.50836181640625, -2.406097412109375, -2.3038330078125, -2.201568603515625, -2.09930419921875, -1.997039794921875, -1.894775390625, -1.792510986328125, -1.69024658203125, -1.587982177734375, -1.4857177734375, -1.383453369140625, -1.28118896484375, -1.178924560546875, -1.07666015625, -0.974395751953125, -0.87213134765625, -0.769866943359375, -0.6676025390625, -0.565338134765625, -0.46307373046875, -0.360809326171875, -0.258544921875, -0.156280517578125, -0.05401611328125, 0.048248291015625, 0.1505126953125, 0.252777099609375, 0.35504150390625, 0.457305908203125, 0.5595703125, 0.661834716796875, 0.76409912109375, 0.866363525390625, 0.9686279296875, 1.070892333984375, 1.17315673828125, 1.275421142578125, 1.377685546875, 1.479949951171875, 1.58221435546875, 1.684478759765625, 1.7867431640625, 1.889007568359375, 1.99127197265625, 2.093536376953125, 2.19580078125, 2.298065185546875, 2.40032958984375, 2.502593994140625, 2.6048583984375, 2.707122802734375, 2.80938720703125, 2.911651611328125, 3.013916015625, 3.116180419921875, 3.21844482421875, 3.320709228515625, 3.4229736328125, 3.525238037109375, 3.62750244140625, 3.729766845703125, 3.83203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 11.0, 16.0, 27.0, 33.0, 83.0, 151.0, 212.0, 198.0, 116.0, 52.0, 38.0, 18.0, 13.0, 7.0, 5.0, 0.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.202171325683594, -34.131813049316406, -33.06145477294922, -31.99109649658203, -30.920738220214844, -29.850379943847656, -28.78002166748047, -27.70966339111328, -26.639305114746094, -25.568946838378906, -24.49858856201172, -23.42823028564453, -22.357872009277344, -21.287513732910156, -20.21715545654297, -19.14679718017578, -18.076440811157227, -17.00608253479004, -15.935724258422852, -14.865365982055664, -13.795007705688477, -12.724649429321289, -11.654292106628418, -10.58393383026123, -9.513575553894043, -8.443217277526855, -7.372859001159668, -6.302501201629639, -5.232142925262451, -4.161784648895264, -3.0914268493652344, -2.021068572998047, -0.9507102966308594, 0.11964786052703857, 1.1900060176849365, 2.260364055633545, 3.3307223320007324, 4.40108060836792, 5.471438407897949, 6.541796684265137, 7.612154960632324, 8.682513236999512, 9.7528715133667, 10.82322883605957, 11.893587112426758, 12.963945388793945, 14.034303665161133, 15.10466194152832, 16.175020217895508, 17.245378494262695, 18.315736770629883, 19.38609504699707, 20.456453323364258, 21.526811599731445, 22.59716796875, 23.667526245117188, 24.737884521484375, 25.808242797851562, 26.87860107421875, 27.948959350585938, 29.019317626953125, 30.089675903320312, 31.1600341796875, 32.23039245605469, 33.300750732421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 7.0, 9.0, 6.0, 13.0, 15.0, 15.0, 18.0, 24.0, 20.0, 33.0, 32.0, 45.0, 35.0, 42.0, 48.0, 57.0, 58.0, 61.0, 60.0, 53.0, 46.0, 40.0, 43.0, 31.0, 37.0, 17.0, 22.0, 16.0, 28.0, 7.0, 17.0, 9.0, 7.0, 6.0, 9.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.340259552001953, -14.857845306396484, -14.375432014465332, -13.893017768859863, -13.410604476928711, -12.928190231323242, -12.445775985717773, -11.963362693786621, -11.480949401855469, -10.99853515625, -10.516121864318848, -10.033707618713379, -9.551294326782227, -9.068880081176758, -8.586465835571289, -8.104052543640137, -7.621638298034668, -7.139224529266357, -6.656810760498047, -6.174396514892578, -5.691983222961426, -5.209568977355957, -4.7271552085876465, -4.244741439819336, -3.7623276710510254, -3.279913902282715, -2.7975001335144043, -2.3150861263275146, -1.832672357559204, -1.3502585887908936, -0.8678445816040039, -0.38543081283569336, 0.0969839096069336, 0.5793977379798889, 1.0618115663528442, 1.5442254543304443, 2.026639223098755, 2.5090529918670654, 2.991466999053955, 3.4738807678222656, 3.956294536590576, 4.438708305358887, 4.921122074127197, 5.403535842895508, 5.885950088500977, 6.368363380432129, 6.850777626037598, 7.333191394805908, 7.815605163574219, 8.298019409179688, 8.78043270111084, 9.262846946716309, 9.745260238647461, 10.22767448425293, 10.710088729858398, 11.19250202178955, 11.674915313720703, 12.157329559326172, 12.639742851257324, 13.122157096862793, 13.604570388793945, 14.086984634399414, 14.569398880004883, 15.051812171936035, 15.534226417541504]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 11.0, 11.0, 21.0, 35.0, 41.0, 52.0, 73.0, 111.0, 177.0, 244.0, 429.0, 655.0, 1116.0, 1935.0, 3375.0, 5853.0, 11200.0, 22545.0, 52054.0, 150481.0, 535166.0, 159386.0, 54057.0, 23466.0, 11501.0, 6023.0, 3445.0, 2039.0, 1147.0, 647.0, 422.0, 284.0, 183.0, 107.0, 81.0, 49.0, 31.0, 29.0, 19.0, 11.0, 10.0, 9.0, 2.0, 6.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0], "bins": [-1.35546875, -1.315032958984375, -1.27459716796875, -1.234161376953125, -1.1937255859375, -1.153289794921875, -1.11285400390625, -1.072418212890625, -1.031982421875, -0.991546630859375, -0.95111083984375, -0.910675048828125, -0.8702392578125, -0.829803466796875, -0.78936767578125, -0.748931884765625, -0.70849609375, -0.668060302734375, -0.62762451171875, -0.587188720703125, -0.5467529296875, -0.506317138671875, -0.46588134765625, -0.425445556640625, -0.385009765625, -0.344573974609375, -0.30413818359375, -0.263702392578125, -0.2232666015625, -0.182830810546875, -0.14239501953125, -0.101959228515625, -0.0615234375, -0.021087646484375, 0.01934814453125, 0.059783935546875, 0.1002197265625, 0.140655517578125, 0.18109130859375, 0.221527099609375, 0.261962890625, 0.302398681640625, 0.34283447265625, 0.383270263671875, 0.4237060546875, 0.464141845703125, 0.50457763671875, 0.545013427734375, 0.58544921875, 0.625885009765625, 0.66632080078125, 0.706756591796875, 0.7471923828125, 0.787628173828125, 0.82806396484375, 0.868499755859375, 0.908935546875, 0.949371337890625, 0.98980712890625, 1.030242919921875, 1.0706787109375, 1.111114501953125, 1.15155029296875, 1.191986083984375, 1.232421875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 9.0, 9.0, 15.0, 14.0, 14.0, 22.0, 18.0, 25.0, 30.0, 39.0, 39.0, 40.0, 50.0, 74.0, 49.0, 54.0, 72.0, 61.0, 51.0, 34.0, 51.0, 33.0, 27.0, 37.0, 30.0, 29.0, 20.0, 11.0, 14.0, 12.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.193359375, -1.157928466796875, -1.12249755859375, -1.087066650390625, -1.0516357421875, -1.016204833984375, -0.98077392578125, -0.945343017578125, -0.909912109375, -0.874481201171875, -0.83905029296875, -0.803619384765625, -0.7681884765625, -0.732757568359375, -0.69732666015625, -0.661895751953125, -0.62646484375, -0.591033935546875, -0.55560302734375, -0.520172119140625, -0.4847412109375, -0.449310302734375, -0.41387939453125, -0.378448486328125, -0.343017578125, -0.307586669921875, -0.27215576171875, -0.236724853515625, -0.2012939453125, -0.165863037109375, -0.13043212890625, -0.095001220703125, -0.0595703125, -0.024139404296875, 0.01129150390625, 0.046722412109375, 0.0821533203125, 0.117584228515625, 0.15301513671875, 0.188446044921875, 0.223876953125, 0.259307861328125, 0.29473876953125, 0.330169677734375, 0.3656005859375, 0.401031494140625, 0.43646240234375, 0.471893310546875, 0.50732421875, 0.542755126953125, 0.57818603515625, 0.613616943359375, 0.6490478515625, 0.684478759765625, 0.71990966796875, 0.755340576171875, 0.790771484375, 0.826202392578125, 0.86163330078125, 0.897064208984375, 0.9324951171875, 0.967926025390625, 1.00335693359375, 1.038787841796875, 1.07421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 10.0, 6.0, 7.0, 18.0, 30.0, 44.0, 57.0, 114.0, 189.0, 336.0, 765.0, 2146.0, 9174.0, 142000.0, 872407.0, 16223.0, 3057.0, 1038.0, 433.0, 203.0, 111.0, 53.0, 34.0, 31.0, 21.0, 18.0, 10.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-5.59765625, -5.464813232421875, -5.33197021484375, -5.199127197265625, -5.0662841796875, -4.933441162109375, -4.80059814453125, -4.667755126953125, -4.534912109375, -4.402069091796875, -4.26922607421875, -4.136383056640625, -4.0035400390625, -3.870697021484375, -3.73785400390625, -3.605010986328125, -3.47216796875, -3.339324951171875, -3.20648193359375, -3.073638916015625, -2.9407958984375, -2.807952880859375, -2.67510986328125, -2.542266845703125, -2.409423828125, -2.276580810546875, -2.14373779296875, -2.010894775390625, -1.8780517578125, -1.745208740234375, -1.61236572265625, -1.479522705078125, -1.3466796875, -1.213836669921875, -1.08099365234375, -0.948150634765625, -0.8153076171875, -0.682464599609375, -0.54962158203125, -0.416778564453125, -0.283935546875, -0.151092529296875, -0.01824951171875, 0.114593505859375, 0.2474365234375, 0.380279541015625, 0.51312255859375, 0.645965576171875, 0.77880859375, 0.911651611328125, 1.04449462890625, 1.177337646484375, 1.3101806640625, 1.443023681640625, 1.57586669921875, 1.708709716796875, 1.841552734375, 1.974395751953125, 2.10723876953125, 2.240081787109375, 2.3729248046875, 2.505767822265625, 2.63861083984375, 2.771453857421875, 2.904296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 3.0, 5.0, 11.0, 24.0, 24.0, 16.0, 24.0, 27.0, 25.0, 39.0, 60.0, 56.0, 98.0, 118.0, 88.0, 67.0, 51.0, 48.0, 37.0, 31.0, 33.0, 16.0, 18.0, 11.0, 9.0, 11.0, 8.0, 6.0, 4.0, 6.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.73828125, -5.56707763671875, -5.3958740234375, -5.22467041015625, -5.053466796875, -4.88226318359375, -4.7110595703125, -4.53985595703125, -4.36865234375, -4.19744873046875, -4.0262451171875, -3.85504150390625, -3.683837890625, -3.51263427734375, -3.3414306640625, -3.17022705078125, -2.9990234375, -2.82781982421875, -2.6566162109375, -2.48541259765625, -2.314208984375, -2.14300537109375, -1.9718017578125, -1.80059814453125, -1.62939453125, -1.45819091796875, -1.2869873046875, -1.11578369140625, -0.944580078125, -0.77337646484375, -0.6021728515625, -0.43096923828125, -0.259765625, -0.08856201171875, 0.0826416015625, 0.25384521484375, 0.425048828125, 0.59625244140625, 0.7674560546875, 0.93865966796875, 1.10986328125, 1.28106689453125, 1.4522705078125, 1.62347412109375, 1.794677734375, 1.96588134765625, 2.1370849609375, 2.30828857421875, 2.4794921875, 2.65069580078125, 2.8218994140625, 2.99310302734375, 3.164306640625, 3.33551025390625, 3.5067138671875, 3.67791748046875, 3.84912109375, 4.02032470703125, 4.1915283203125, 4.36273193359375, 4.533935546875, 4.70513916015625, 4.8763427734375, 5.04754638671875, 5.21875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 10.0, 6.0, 10.0, 12.0, 16.0, 21.0, 38.0, 80.0, 96.0, 149.0, 211.0, 334.0, 620.0, 1133.0, 2423.0, 6551.0, 23424.0, 168384.0, 792187.0, 37347.0, 9012.0, 3178.0, 1446.0, 706.0, 400.0, 233.0, 167.0, 121.0, 75.0, 49.0, 27.0, 21.0, 16.0, 5.0, 6.0, 5.0, 5.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.56591796875, -0.5498161315917969, -0.5337142944335938, -0.5176124572753906, -0.5015106201171875, -0.4854087829589844, -0.46930694580078125, -0.4532051086425781, -0.437103271484375, -0.4210014343261719, -0.40489959716796875, -0.3887977600097656, -0.3726959228515625, -0.3565940856933594, -0.34049224853515625, -0.3243904113769531, -0.30828857421875, -0.2921867370605469, -0.27608489990234375, -0.2599830627441406, -0.2438812255859375, -0.22777938842773438, -0.21167755126953125, -0.19557571411132812, -0.179473876953125, -0.16337203979492188, -0.14727020263671875, -0.13116836547851562, -0.1150665283203125, -0.09896469116210938, -0.08286285400390625, -0.06676101684570312, -0.0506591796875, -0.034557342529296875, -0.01845550537109375, -0.002353668212890625, 0.0137481689453125, 0.029850006103515625, 0.04595184326171875, 0.062053680419921875, 0.078155517578125, 0.09425735473632812, 0.11035919189453125, 0.12646102905273438, 0.1425628662109375, 0.15866470336914062, 0.17476654052734375, 0.19086837768554688, 0.20697021484375, 0.22307205200195312, 0.23917388916015625, 0.2552757263183594, 0.2713775634765625, 0.2874794006347656, 0.30358123779296875, 0.3196830749511719, 0.335784912109375, 0.3518867492675781, 0.36798858642578125, 0.3840904235839844, 0.4001922607421875, 0.4162940979003906, 0.43239593505859375, 0.4484977722167969, 0.464599609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 11.0, 25.0, 19.0, 27.0, 40.0, 66.0, 105.0, 188.0, 167.0, 132.0, 63.0, 45.0, 26.0, 25.0, 15.0, 17.0, 5.0, 7.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00026535987854003906, -0.0002579987049102783, -0.0002506375312805176, -0.00024327635765075684, -0.0002359151840209961, -0.00022855401039123535, -0.0002211928367614746, -0.00021383166313171387, -0.00020647048950195312, -0.00019910931587219238, -0.00019174814224243164, -0.0001843869686126709, -0.00017702579498291016, -0.00016966462135314941, -0.00016230344772338867, -0.00015494227409362793, -0.0001475811004638672, -0.00014021992683410645, -0.0001328587532043457, -0.00012549757957458496, -0.00011813640594482422, -0.00011077523231506348, -0.00010341405868530273, -9.605288505554199e-05, -8.869171142578125e-05, -8.133053779602051e-05, -7.396936416625977e-05, -6.660819053649902e-05, -5.924701690673828e-05, -5.188584327697754e-05, -4.45246696472168e-05, -3.7163496017456055e-05, -2.9802322387695312e-05, -2.244114875793457e-05, -1.5079975128173828e-05, -7.718801498413086e-06, -3.5762786865234375e-07, 7.0035457611083984e-06, 1.436471939086914e-05, 2.1725893020629883e-05, 2.9087066650390625e-05, 3.644824028015137e-05, 4.380941390991211e-05, 5.117058753967285e-05, 5.8531761169433594e-05, 6.589293479919434e-05, 7.325410842895508e-05, 8.061528205871582e-05, 8.797645568847656e-05, 9.53376293182373e-05, 0.00010269880294799805, 0.00011005997657775879, 0.00011742115020751953, 0.00012478232383728027, 0.00013214349746704102, 0.00013950467109680176, 0.0001468658447265625, 0.00015422701835632324, 0.00016158819198608398, 0.00016894936561584473, 0.00017631053924560547, 0.0001836717128753662, 0.00019103288650512695, 0.0001983940601348877, 0.00020575523376464844]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 11.0, 6.0, 14.0, 15.0, 30.0, 46.0, 72.0, 94.0, 161.0, 298.0, 485.0, 933.0, 2152.0, 5285.0, 17101.0, 84366.0, 836735.0, 75606.0, 15860.0, 5082.0, 2115.0, 927.0, 463.0, 280.0, 144.0, 86.0, 52.0, 32.0, 35.0, 11.0, 10.0, 9.0, 13.0, 9.0, 3.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477294921875, -0.4645576477050781, -0.45182037353515625, -0.4390830993652344, -0.4263458251953125, -0.4136085510253906, -0.40087127685546875, -0.3881340026855469, -0.375396728515625, -0.3626594543457031, -0.34992218017578125, -0.3371849060058594, -0.3244476318359375, -0.3117103576660156, -0.29897308349609375, -0.2862358093261719, -0.27349853515625, -0.2607612609863281, -0.24802398681640625, -0.23528671264648438, -0.2225494384765625, -0.20981216430664062, -0.19707489013671875, -0.18433761596679688, -0.171600341796875, -0.15886306762695312, -0.14612579345703125, -0.13338851928710938, -0.1206512451171875, -0.10791397094726562, -0.09517669677734375, -0.08243942260742188, -0.0697021484375, -0.056964874267578125, -0.04422760009765625, -0.031490325927734375, -0.0187530517578125, -0.006015777587890625, 0.00672149658203125, 0.019458770751953125, 0.032196044921875, 0.044933319091796875, 0.05767059326171875, 0.07040786743164062, 0.0831451416015625, 0.09588241577148438, 0.10861968994140625, 0.12135696411132812, 0.13409423828125, 0.14683151245117188, 0.15956878662109375, 0.17230606079101562, 0.1850433349609375, 0.19778060913085938, 0.21051788330078125, 0.22325515747070312, 0.235992431640625, 0.24872970581054688, 0.26146697998046875, 0.2742042541503906, 0.2869415283203125, 0.2996788024902344, 0.31241607666015625, 0.3251533508300781, 0.337890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 5.0, 5.0, 11.0, 10.0, 5.0, 10.0, 14.0, 23.0, 27.0, 35.0, 74.0, 142.0, 196.0, 197.0, 77.0, 42.0, 38.0, 20.0, 19.0, 10.0, 9.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0498046875, -1.0218505859375, -0.993896484375, -0.9659423828125, -0.93798828125, -0.9100341796875, -0.882080078125, -0.8541259765625, -0.826171875, -0.7982177734375, -0.770263671875, -0.7423095703125, -0.71435546875, -0.6864013671875, -0.658447265625, -0.6304931640625, -0.6025390625, -0.5745849609375, -0.546630859375, -0.5186767578125, -0.49072265625, -0.4627685546875, -0.434814453125, -0.4068603515625, -0.37890625, -0.3509521484375, -0.322998046875, -0.2950439453125, -0.26708984375, -0.2391357421875, -0.211181640625, -0.1832275390625, -0.1552734375, -0.1273193359375, -0.099365234375, -0.0714111328125, -0.04345703125, -0.0155029296875, 0.012451171875, 0.0404052734375, 0.068359375, 0.0963134765625, 0.124267578125, 0.1522216796875, 0.18017578125, 0.2081298828125, 0.236083984375, 0.2640380859375, 0.2919921875, 0.3199462890625, 0.347900390625, 0.3758544921875, 0.40380859375, 0.4317626953125, 0.459716796875, 0.4876708984375, 0.515625, 0.5435791015625, 0.571533203125, 0.5994873046875, 0.62744140625, 0.6553955078125, 0.683349609375, 0.7113037109375, 0.7392578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 11.0, 25.0, 44.0, 149.0, 574.0, 112.0, 44.0, 28.0, 10.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.82303810119629, -29.77545166015625, -28.727863311767578, -27.68027687072754, -26.6326904296875, -25.58510398864746, -24.537517547607422, -23.48992919921875, -22.44234275817871, -21.394756317138672, -20.34716796875, -19.29958152770996, -18.251995086669922, -17.204408645629883, -16.156822204589844, -15.109233856201172, -14.061647415161133, -13.014060974121094, -11.966473579406738, -10.918886184692383, -9.871299743652344, -8.823713302612305, -7.776125907897949, -6.728538990020752, -5.680952072143555, -4.633365154266357, -3.58577823638916, -2.538191318511963, -1.4906044006347656, -0.44301748275756836, 0.6045694351196289, 1.6521563529968262, 2.6997451782226562, 3.7473320960998535, 4.794919013977051, 5.842505931854248, 6.890092849731445, 7.937679767608643, 8.98526668548584, 10.032854080200195, 11.080440521240234, 12.128026962280273, 13.175614356994629, 14.223201751708984, 15.270788192749023, 16.318374633789062, 17.365962982177734, 18.413549423217773, 19.461135864257812, 20.50872230529785, 21.55630874633789, 22.603897094726562, 23.6514835357666, 24.69906997680664, 25.746658325195312, 26.79424476623535, 27.84183120727539, 28.88941764831543, 29.93700408935547, 30.98459243774414, 32.03218078613281, 33.07976531982422, 34.12735366821289, 35.1749382019043, 36.22252655029297]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 0.0, 4.0, 8.0, 7.0, 9.0, 10.0, 7.0, 22.0, 12.0, 18.0, 19.0, 22.0, 21.0, 30.0, 45.0, 110.0, 165.0, 143.0, 109.0, 39.0, 26.0, 25.0, 17.0, 18.0, 18.0, 10.0, 11.0, 11.0, 17.0, 13.0, 4.0, 4.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.334632873535156, -11.94738483428955, -11.560136795043945, -11.17288875579834, -10.785640716552734, -10.398392677307129, -10.011144638061523, -9.623896598815918, -9.236648559570312, -8.849400520324707, -8.462152481079102, -8.074904441833496, -7.687656402587891, -7.300408363342285, -6.91316032409668, -6.525912284851074, -6.1386637687683105, -5.751415729522705, -5.3641676902771, -4.976919651031494, -4.589671611785889, -4.202423572540283, -3.8151752948760986, -3.427927255630493, -3.0406792163848877, -2.6534311771392822, -2.2661831378936768, -1.8789349794387817, -1.4916869401931763, -1.1044389009475708, -0.7171907424926758, -0.3299427032470703, 0.057305335998535156, 0.444553405046463, 0.8318014740943909, 1.2190495729446411, 1.6062976121902466, 1.993545651435852, 2.380793809890747, 2.7680418491363525, 3.155289888381958, 3.5425379276275635, 3.929785966873169, 4.3170342445373535, 4.704282283782959, 5.0915303230285645, 5.47877836227417, 5.866026401519775, 6.253274440765381, 6.640522480010986, 7.027770519256592, 7.415018558502197, 7.802266597747803, 8.189515113830566, 8.576763153076172, 8.964011192321777, 9.351259231567383, 9.738507270812988, 10.125755310058594, 10.5130033493042, 10.900251388549805, 11.28749942779541, 11.674747467041016, 12.061995506286621, 12.449243545532227]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 9.0, 11.0, 9.0, 10.0, 12.0, 12.0, 18.0, 29.0, 17.0, 33.0, 34.0, 34.0, 55.0, 123.0, 250.0, 66.0, 33.0, 28.0, 25.0, 28.0, 19.0, 17.0, 14.0, 16.0, 15.0, 10.0, 10.0, 9.0, 6.0, 7.0, 3.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.078125, -1.0498580932617188, -1.0215911865234375, -0.9933242797851562, -0.965057373046875, -0.9367904663085938, -0.9085235595703125, -0.8802566528320312, -0.85198974609375, -0.8237228393554688, -0.7954559326171875, -0.7671890258789062, -0.738922119140625, -0.7106552124023438, -0.6823883056640625, -0.6541213989257812, -0.6258544921875, -0.5975875854492188, -0.5693206787109375, -0.5410537719726562, -0.512786865234375, -0.48451995849609375, -0.4562530517578125, -0.42798614501953125, -0.39971923828125, -0.37145233154296875, -0.3431854248046875, -0.31491851806640625, -0.286651611328125, -0.25838470458984375, -0.2301177978515625, -0.20185089111328125, -0.173583984375, -0.14531707763671875, -0.1170501708984375, -0.08878326416015625, -0.060516357421875, -0.03224945068359375, -0.0039825439453125, 0.02428436279296875, 0.05255126953125, 0.08081817626953125, 0.1090850830078125, 0.13735198974609375, 0.165618896484375, 0.19388580322265625, 0.2221527099609375, 0.25041961669921875, 0.2786865234375, 0.30695343017578125, 0.3352203369140625, 0.36348724365234375, 0.391754150390625, 0.42002105712890625, 0.4482879638671875, 0.47655487060546875, 0.50482177734375, 0.5330886840820312, 0.5613555908203125, 0.5896224975585938, 0.617889404296875, 0.6461563110351562, 0.6744232177734375, 0.7026901245117188, 0.73095703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 7.0, 18.0, 15.0, 27.0, 48.0, 99.0, 284.0, 1242.0, 9081.0, 8364688.0, 11113.0, 1319.0, 344.0, 145.0, 48.0, 31.0, 19.0, 5.0, 5.0, 11.0, 16.0, 11.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0], "bins": [-14.428406715393066, -13.922683715820312, -13.416961669921875, -12.911238670349121, -12.405515670776367, -11.89979362487793, -11.394070625305176, -10.888347625732422, -10.382625579833984, -9.87690258026123, -9.371180534362793, -8.865457534790039, -8.359735488891602, -7.854012489318848, -7.348289489746094, -6.842566967010498, -6.336844444274902, -5.831121921539307, -5.325399398803711, -4.819676399230957, -4.313953876495361, -3.8082313537597656, -3.302508592605591, -2.796785831451416, -2.2910633087158203, -1.785340666770935, -1.2796180248260498, -0.7738953828811646, -0.2681727409362793, 0.2375497817993164, 0.7432725429534912, 1.248995304107666, 1.7547187805175781, 2.260441303253174, 2.7661640644073486, 3.2718868255615234, 3.777609348297119, 4.283331871032715, 4.789054870605469, 5.2947773933410645, 5.80049991607666, 6.306222438812256, 6.811944961547852, 7.3176679611206055, 7.823390483856201, 8.329113006591797, 8.83483600616455, 9.340559005737305, 9.846281051635742, 10.352004051208496, 10.857726097106934, 11.363449096679688, 11.869171142578125, 12.374894142150879, 12.880617141723633, 13.38633918762207, 13.892062187194824, 14.397785186767578, 14.903507232666016, 15.40923023223877, 15.914953231811523, 16.42067527770996, 16.9263973236084, 17.43212127685547, 17.937843322753906]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 4.0, 2.0, 12.0, 8.0, 11.0, 4.0, 6.0, 7.0, 4.0, 10.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.34786033630371, -17.9002742767334, -17.45269012451172, -17.005104064941406, -16.557518005371094, -16.10993194580078, -15.662347793579102, -15.214761734008789, -14.767176628112793, -14.319591522216797, -13.872005462646484, -13.424420356750488, -12.976835250854492, -12.52924919128418, -12.081664085388184, -11.634078979492188, -11.186492919921875, -10.738907814025879, -10.291321754455566, -9.84373664855957, -9.396150588989258, -8.948565483093262, -8.500980377197266, -8.053394317626953, -7.605809211730957, -7.158223628997803, -6.710638046264648, -6.263052940368652, -5.815467357635498, -5.367881774902344, -4.920296669006348, -4.472711086273193, -4.025124549865723, -3.5775389671325684, -3.129953622817993, -2.682368278503418, -2.2347826957702637, -1.7871971130371094, -1.3396117687225342, -0.892026424407959, -0.4444408416748047, 0.0031446218490600586, 0.4507300853729248, 0.8983155488967896, 1.3459010124206543, 1.7934865951538086, 2.241071939468384, 2.688657283782959, 3.1362428665161133, 3.5838284492492676, 4.031414031982422, 4.478999137878418, 4.926584720611572, 5.374170303344727, 5.821755409240723, 6.269340991973877, 6.716926574707031, 7.1645121574401855, 7.61209774017334, 8.059682846069336, 8.507268905639648, 8.954854011535645, 9.40243911743164, 9.850025177001953, 10.29761028289795]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 10.0, 4.0, 11.0, 11.0, 16.0, 19.0, 27.0, 37.0, 52.0, 80.0, 132.0, 231.0, 402.0, 860.0, 1823.0, 3979.0, 10163.0, 28252.0, 90381.0, 212254.0, 117146.0, 36323.0, 12858.0, 4962.0, 2153.0, 957.0, 468.0, 268.0, 136.0, 69.0, 73.0, 24.0, 26.0, 19.0, 14.0, 6.0, 6.0, 2.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.984375, -7.76019287109375, -7.5360107421875, -7.31182861328125, -7.087646484375, -6.86346435546875, -6.6392822265625, -6.41510009765625, -6.19091796875, -5.96673583984375, -5.7425537109375, -5.51837158203125, -5.294189453125, -5.07000732421875, -4.8458251953125, -4.62164306640625, -4.3974609375, -4.17327880859375, -3.9490966796875, -3.72491455078125, -3.500732421875, -3.27655029296875, -3.0523681640625, -2.82818603515625, -2.60400390625, -2.37982177734375, -2.1556396484375, -1.93145751953125, -1.707275390625, -1.48309326171875, -1.2589111328125, -1.03472900390625, -0.810546875, -0.58636474609375, -0.3621826171875, -0.13800048828125, 0.086181640625, 0.31036376953125, 0.5345458984375, 0.75872802734375, 0.98291015625, 1.20709228515625, 1.4312744140625, 1.65545654296875, 1.879638671875, 2.10382080078125, 2.3280029296875, 2.55218505859375, 2.7763671875, 3.00054931640625, 3.2247314453125, 3.44891357421875, 3.673095703125, 3.89727783203125, 4.1214599609375, 4.34564208984375, 4.56982421875, 4.79400634765625, 5.0181884765625, 5.24237060546875, 5.466552734375, 5.69073486328125, 5.9149169921875, 6.13909912109375, 6.36328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 5.0, 8.0, 10.0, 9.0, 19.0, 23.0, 23.0, 33.0, 46.0, 49.0, 56.0, 59.0, 55.0, 71.0, 93.0, 84.0, 71.0, 60.0, 53.0, 33.0, 27.0, 21.0, 22.0, 17.0, 14.0, 6.0, 8.0, 7.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4912109375, -1.4498443603515625, -1.408477783203125, -1.3671112060546875, -1.32574462890625, -1.2843780517578125, -1.243011474609375, -1.2016448974609375, -1.1602783203125, -1.1189117431640625, -1.077545166015625, -1.0361785888671875, -0.99481201171875, -0.9534454345703125, -0.912078857421875, -0.8707122802734375, -0.829345703125, -0.7879791259765625, -0.746612548828125, -0.7052459716796875, -0.66387939453125, -0.6225128173828125, -0.581146240234375, -0.5397796630859375, -0.4984130859375, -0.4570465087890625, -0.415679931640625, -0.3743133544921875, -0.33294677734375, -0.2915802001953125, -0.250213623046875, -0.2088470458984375, -0.16748046875, -0.1261138916015625, -0.084747314453125, -0.0433807373046875, -0.00201416015625, 0.0393524169921875, 0.080718994140625, 0.1220855712890625, 0.1634521484375, 0.2048187255859375, 0.246185302734375, 0.2875518798828125, 0.32891845703125, 0.3702850341796875, 0.411651611328125, 0.4530181884765625, 0.494384765625, 0.5357513427734375, 0.577117919921875, 0.6184844970703125, 0.65985107421875, 0.7012176513671875, 0.742584228515625, 0.7839508056640625, 0.8253173828125, 0.8666839599609375, 0.908050537109375, 0.9494171142578125, 0.99078369140625, 1.0321502685546875, 1.073516845703125, 1.1148834228515625, 1.15625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 13.0, 4.0, 11.0, 21.0, 35.0, 62.0, 144.0, 121.0, 43.0, 15.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.673454284667969, -9.242777824401855, -8.812101364135742, -8.381423950195312, -7.950747489929199, -7.520071029663086, -7.089394569396973, -6.658718109130859, -6.228041172027588, -5.797364711761475, -5.366687774658203, -4.93601131439209, -4.505334854125977, -4.074657917022705, -3.643981456756592, -3.2133047580718994, -2.782628059387207, -2.3519513607025146, -1.9212747812271118, -1.490598201751709, -1.0599215030670166, -0.6292448043823242, -0.19856834411621094, 0.23210835456848145, 0.6627850532531738, 1.0934617519378662, 1.524138331413269, 1.9548149108886719, 2.3854916095733643, 2.8161683082580566, 3.24684476852417, 3.6775214672088623, 4.108198165893555, 4.538874626159668, 4.9695515632629395, 5.400228023529053, 5.830904960632324, 6.2615814208984375, 6.692257881164551, 7.122934341430664, 7.5536112785339355, 7.984287738800049, 8.41496467590332, 8.845641136169434, 9.276317596435547, 9.706995010375977, 10.137670516967773, 10.568347930908203, 10.999024391174316, 11.42970085144043, 11.860377311706543, 12.291053771972656, 12.721731185913086, 13.1524076461792, 13.583084106445312, 14.013760566711426, 14.444437026977539, 14.875113487243652, 15.305789947509766, 15.736467361450195, 16.167142868041992, 16.597820281982422, 17.02849578857422, 17.45917320251465, 17.889850616455078]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 1.0, 5.0, 9.0, 9.0, 9.0, 11.0, 20.0, 48.0, 66.0, 90.0, 73.0, 46.0, 31.0, 18.0, 5.0, 4.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.619020462036133, -6.4260993003845215, -6.23317813873291, -6.040256977081299, -5.8473358154296875, -5.654414176940918, -5.461493015289307, -5.268571853637695, -5.075650691986084, -4.882729530334473, -4.689808368682861, -4.49688720703125, -4.3039655685424805, -4.111044406890869, -3.918123245239258, -3.7252020835876465, -3.532280921936035, -3.339359760284424, -3.1464385986328125, -2.953517198562622, -2.7605960369110107, -2.5676748752593994, -2.374753475189209, -2.1818323135375977, -1.9889111518859863, -1.795989990234375, -1.6030687093734741, -1.4101474285125732, -1.217226266860962, -1.0243051052093506, -0.8313838243484497, -0.6384625434875488, -0.4455413818359375, -0.2526201605796814, -0.05969893932342529, 0.1332222819328308, 0.3261435031890869, 0.519064724445343, 0.7119859457015991, 0.9049072265625, 1.0978283882141113, 1.2907495498657227, 1.4836708307266235, 1.6765921115875244, 1.8695132732391357, 2.062434434890747, 2.2553558349609375, 2.448276996612549, 2.64119815826416, 2.8341193199157715, 3.027040481567383, 3.2199618816375732, 3.4128830432891846, 3.605804204940796, 3.7987256050109863, 3.9916467666625977, 4.184567928314209, 4.37748908996582, 4.570410251617432, 4.763331413269043, 4.9562530517578125, 5.149174213409424, 5.342095375061035, 5.5350165367126465, 5.727937698364258]}, "eval/loss": 4.745861530303955, "eval/wer": 1.976279254264181, "eval/runtime": 966.758, "eval/samples_per_second": 2.733, "eval/steps_per_second": 0.342, "train/train_runtime": 8574.3703, "train/train_samples_per_second": 3.328, "train/train_steps_per_second": 0.208, "train/total_flos": 0.0, "train/train_loss": 4.819954753590272} \ No newline at end of file