{"train/loss": 6.632, "train/learning_rate": 0.0002982, "train/epoch": 0.49, "train/global_step": 500, "_runtime": 2357, "_timestamp": 1646259834, "_step": 499, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 7.0, 11.0, 21.0, 48.0, 206.0, 453.0, 126.0, 65.0, 23.0, 21.0, 7.0, 4.0, 4.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-165.7322998046875, -145.85516357421875, -125.97804260253906, -106.10090637207031, -86.2237777709961, -66.34664916992188, -46.469512939453125, -26.592391967773438, -6.7152557373046875, 13.161874771118164, 33.039005279541016, 52.9161376953125, 72.79326629638672, 92.67039489746094, 112.54753112792969, 132.42465209960938, 152.30178833007812, 172.17892456054688, 192.05604553222656, 211.9331817626953, 231.810302734375, 251.68743896484375, 271.5645751953125, 291.44171142578125, 311.31884765625, 331.19598388671875, 351.0731201171875, 370.95025634765625, 390.8273620605469, 410.7044982910156, 430.5816345214844, 450.458740234375, 470.33587646484375, 490.2130126953125, 510.09014892578125, 529.96728515625, 549.8444213867188, 569.7215576171875, 589.5986328125, 609.4757690429688, 629.3529052734375, 649.2300415039062, 669.107177734375, 688.9843139648438, 708.8614501953125, 728.738525390625, 748.61572265625, 768.4927978515625, 788.3699951171875, 808.2471313476562, 828.124267578125, 848.0014038085938, 867.8785400390625, 887.755615234375, 907.6328125, 927.5098876953125, 947.3870239257812, 967.26416015625, 987.1412963867188, 1007.0184326171875, 1026.8955078125, 1046.772705078125, 1066.6497802734375, 1086.5269775390625, 1106.404052734375]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 5.0, 4.0, 9.0, 7.0, 5.0, 12.0, 13.0, 10.0, 15.0, 13.0, 17.0, 21.0, 23.0, 22.0, 28.0, 24.0, 26.0, 43.0, 67.0, 106.0, 124.0, 91.0, 41.0, 32.0, 34.0, 29.0, 24.0, 29.0, 19.0, 13.0, 12.0, 11.0, 15.0, 10.0, 11.0, 4.0, 5.0, 3.0, 3.0, 8.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-919.1222534179688, -892.2859497070312, -865.44970703125, -838.6134033203125, -811.7771606445312, -784.9408569335938, -758.1046142578125, -731.268310546875, -704.4320068359375, -677.595703125, -650.7594604492188, -623.9231567382812, -597.0869140625, -570.2506103515625, -543.414306640625, -516.5780639648438, -489.7417907714844, -462.905517578125, -436.0692443847656, -409.23297119140625, -382.39666748046875, -355.5603942871094, -328.72412109375, -301.8878173828125, -275.05157470703125, -248.21530151367188, -221.37901306152344, -194.54273986816406, -167.70645141601562, -140.87017822265625, -114.03390502929688, -87.19761657714844, -60.361328125, -33.525047302246094, -6.688770294189453, 20.147506713867188, 46.983787536621094, 73.820068359375, 100.65634155273438, 127.49263000488281, 154.3289031982422, 181.16517639160156, 208.00146484375, 234.83773803710938, 261.67401123046875, 288.51031494140625, 315.3465576171875, 342.182861328125, 369.0191345214844, 395.85540771484375, 422.6916809082031, 449.5279541015625, 476.3642578125, 503.2005310058594, 530.0368041992188, 556.8731079101562, 583.7093505859375, 610.545654296875, 637.3818969726562, 664.2182006835938, 691.054443359375, 717.8907470703125, 744.72705078125, 771.5632934570312, 798.3995971679688]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 6.0, 3.0, 11.0, 7.0, 8.0, 6.0, 14.0, 14.0, 15.0, 8.0, 23.0, 22.0, 28.0, 24.0, 25.0, 33.0, 39.0, 64.0, 94.0, 125.0, 99.0, 54.0, 36.0, 34.0, 29.0, 31.0, 29.0, 18.0, 12.0, 11.0, 16.0, 15.0, 11.0, 5.0, 4.0, 6.0, 2.0, 8.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.484375, -25.708251953125, -24.93212890625, -24.156005859375, -23.3798828125, -22.603759765625, -21.82763671875, -21.051513671875, -20.275390625, -19.499267578125, -18.72314453125, -17.947021484375, -17.1708984375, -16.394775390625, -15.61865234375, -14.842529296875, -14.06640625, -13.290283203125, -12.51416015625, -11.738037109375, -10.9619140625, -10.185791015625, -9.40966796875, -8.633544921875, -7.857421875, -7.081298828125, -6.30517578125, -5.529052734375, -4.7529296875, -3.976806640625, -3.20068359375, -2.424560546875, -1.6484375, -0.872314453125, -0.09619140625, 0.679931640625, 1.4560546875, 2.232177734375, 3.00830078125, 3.784423828125, 4.560546875, 5.336669921875, 6.11279296875, 6.888916015625, 7.6650390625, 8.441162109375, 9.21728515625, 9.993408203125, 10.76953125, 11.545654296875, 12.32177734375, 13.097900390625, 13.8740234375, 14.650146484375, 15.42626953125, 16.202392578125, 16.978515625, 17.754638671875, 18.53076171875, 19.306884765625, 20.0830078125, 20.859130859375, 21.63525390625, 22.411376953125, 23.1875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 8.0, 7.0, 9.0, 11.0, 21.0, 18.0, 35.0, 38.0, 55.0, 56.0, 82.0, 128.0, 154.0, 203.0, 316.0, 456.0, 715.0, 1075.0, 1847.0, 3663.0, 8482.0, 24284.0, 407340.0, 3681098.0, 42518.0, 11499.0, 4491.0, 2157.0, 1182.0, 729.0, 470.0, 320.0, 195.0, 166.0, 134.0, 73.0, 63.0, 35.0, 24.0, 35.0, 19.0, 23.0, 14.0, 11.0, 3.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-174.125, -169.033203125, -163.94140625, -158.849609375, -153.7578125, -148.666015625, -143.57421875, -138.482421875, -133.390625, -128.298828125, -123.20703125, -118.115234375, -113.0234375, -107.931640625, -102.83984375, -97.748046875, -92.65625, -87.564453125, -82.47265625, -77.380859375, -72.2890625, -67.197265625, -62.10546875, -57.013671875, -51.921875, -46.830078125, -41.73828125, -36.646484375, -31.5546875, -26.462890625, -21.37109375, -16.279296875, -11.1875, -6.095703125, -1.00390625, 4.087890625, 9.1796875, 14.271484375, 19.36328125, 24.455078125, 29.546875, 34.638671875, 39.73046875, 44.822265625, 49.9140625, 55.005859375, 60.09765625, 65.189453125, 70.28125, 75.373046875, 80.46484375, 85.556640625, 90.6484375, 95.740234375, 100.83203125, 105.923828125, 111.015625, 116.107421875, 121.19921875, 126.291015625, 131.3828125, 136.474609375, 141.56640625, 146.658203125, 151.75]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 5.0, 9.0, 15.0, 12.0, 19.0, 21.0, 24.0, 24.0, 29.0, 36.0, 33.0, 43.0, 64.0, 82.0, 132.0, 197.0, 413.0, 1017.0, 878.0, 402.0, 161.0, 107.0, 56.0, 60.0, 39.0, 34.0, 27.0, 19.0, 20.0, 3.0, 16.0, 12.0, 13.0, 9.0, 9.0, 2.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-91.5625, -89.01171875, -86.4609375, -83.91015625, -81.359375, -78.80859375, -76.2578125, -73.70703125, -71.15625, -68.60546875, -66.0546875, -63.50390625, -60.953125, -58.40234375, -55.8515625, -53.30078125, -50.75, -48.19921875, -45.6484375, -43.09765625, -40.546875, -37.99609375, -35.4453125, -32.89453125, -30.34375, -27.79296875, -25.2421875, -22.69140625, -20.140625, -17.58984375, -15.0390625, -12.48828125, -9.9375, -7.38671875, -4.8359375, -2.28515625, 0.265625, 2.81640625, 5.3671875, 7.91796875, 10.46875, 13.01953125, 15.5703125, 18.12109375, 20.671875, 23.22265625, 25.7734375, 28.32421875, 30.875, 33.42578125, 35.9765625, 38.52734375, 41.078125, 43.62890625, 46.1796875, 48.73046875, 51.28125, 53.83203125, 56.3828125, 58.93359375, 61.484375, 64.03515625, 66.5859375, 69.13671875, 71.6875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 2.0, 10.0, 9.0, 11.0, 17.0, 20.0, 24.0, 33.0, 46.0, 59.0, 64.0, 69.0, 77.0, 111.0, 135.0, 201.0, 368.0, 919.0, 3283.0, 19238.0, 270568.0, 3833671.0, 54853.0, 7303.0, 1623.0, 555.0, 270.0, 157.0, 120.0, 85.0, 67.0, 52.0, 48.0, 48.0, 33.0, 33.0, 25.0, 14.0, 15.0, 7.0, 13.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-262.0, -254.1171875, -246.234375, -238.3515625, -230.46875, -222.5859375, -214.703125, -206.8203125, -198.9375, -191.0546875, -183.171875, -175.2890625, -167.40625, -159.5234375, -151.640625, -143.7578125, -135.875, -127.9921875, -120.109375, -112.2265625, -104.34375, -96.4609375, -88.578125, -80.6953125, -72.8125, -64.9296875, -57.046875, -49.1640625, -41.28125, -33.3984375, -25.515625, -17.6328125, -9.75, -1.8671875, 6.015625, 13.8984375, 21.78125, 29.6640625, 37.546875, 45.4296875, 53.3125, 61.1953125, 69.078125, 76.9609375, 84.84375, 92.7265625, 100.609375, 108.4921875, 116.375, 124.2578125, 132.140625, 140.0234375, 147.90625, 155.7890625, 163.671875, 171.5546875, 179.4375, 187.3203125, 195.203125, 203.0859375, 210.96875, 218.8515625, 226.734375, 234.6171875, 242.5]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 6.0, 13.0, 214.0, 748.0, 29.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-401.31201171875, -346.63958740234375, -291.9671936035156, -237.29478454589844, -182.62237548828125, -127.949951171875, -73.27755737304688, -18.60516357421875, 36.0672607421875, 90.73966979980469, 145.41207885742188, 200.08448791503906, 254.75689697265625, 309.4293212890625, 364.1017150878906, 418.77410888671875, 473.446533203125, 528.1189575195312, 582.7913818359375, 637.4637451171875, 692.1361694335938, 746.80859375, 801.48095703125, 856.1533813476562, 910.8258056640625, 965.4982299804688, 1020.170654296875, 1074.843017578125, 1129.515380859375, 1184.1878662109375, 1238.8602294921875, 1293.53271484375, 1348.205078125, 1402.87744140625, 1457.5499267578125, 1512.2222900390625, 1566.894775390625, 1621.567138671875, 1676.239501953125, 1730.911865234375, 1785.5843505859375, 1840.2567138671875, 1894.92919921875, 1949.6015625, 2004.27392578125, 2058.9462890625, 2113.618896484375, 2168.291259765625, 2222.963623046875, 2277.635986328125, 2332.308349609375, 2386.98095703125, 2441.6533203125, 2496.32568359375, 2550.998046875, 2605.67041015625, 2660.3427734375, 2715.01513671875, 2769.6875, 2824.360107421875, 2879.032470703125, 2933.704833984375, 2988.377197265625, 3043.049560546875, 3097.72216796875]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 5.0, 13.0, 12.0, 15.0, 16.0, 17.0, 14.0, 30.0, 33.0, 25.0, 34.0, 45.0, 41.0, 44.0, 29.0, 44.0, 48.0, 31.0, 47.0, 45.0, 44.0, 36.0, 40.0, 32.0, 31.0, 23.0, 29.0, 28.0, 30.0, 25.0, 16.0, 10.0, 14.0, 12.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-349.6394958496094, -338.2491455078125, -326.8587951660156, -315.46844482421875, -304.0780944824219, -292.687744140625, -281.29742431640625, -269.9070739746094, -258.5167236328125, -247.12637329101562, -235.73602294921875, -224.34567260742188, -212.95533752441406, -201.5649871826172, -190.1746368408203, -178.7843017578125, -167.39393615722656, -156.0035858154297, -144.6132354736328, -133.222900390625, -121.83255004882812, -110.44219970703125, -99.05184936523438, -87.66150665283203, -76.27115631103516, -64.88080596923828, -53.49046325683594, -42.10011291503906, -30.709766387939453, -19.319419860839844, -7.929069519042969, 3.461273193359375, 14.85162353515625, 26.24197006225586, 37.63231658935547, 49.022666931152344, 60.41301345825195, 71.80335998535156, 83.19371032714844, 94.58405303955078, 105.97440338134766, 117.36475372314453, 128.75509643554688, 140.14544677734375, 151.53579711914062, 162.9261474609375, 174.31649780273438, 185.7068328857422, 197.09718322753906, 208.48753356933594, 219.8778839111328, 231.26821899414062, 242.6585693359375, 254.04891967773438, 265.43927001953125, 276.8296203613281, 288.219970703125, 299.6103210449219, 311.00067138671875, 322.3910217285156, 333.7813720703125, 345.17169189453125, 356.56207275390625, 367.952392578125, 379.3427429199219]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 6.0, 9.0, 12.0, 10.0, 13.0, 14.0, 13.0, 20.0, 20.0, 30.0, 29.0, 23.0, 46.0, 44.0, 48.0, 82.0, 76.0, 75.0, 67.0, 55.0, 63.0, 45.0, 32.0, 28.0, 22.0, 18.0, 17.0, 10.0, 10.0, 7.0, 11.0, 8.0, 4.0, 5.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.078125, -27.263671875, -26.44921875, -25.634765625, -24.8203125, -24.005859375, -23.19140625, -22.376953125, -21.5625, -20.748046875, -19.93359375, -19.119140625, -18.3046875, -17.490234375, -16.67578125, -15.861328125, -15.046875, -14.232421875, -13.41796875, -12.603515625, -11.7890625, -10.974609375, -10.16015625, -9.345703125, -8.53125, -7.716796875, -6.90234375, -6.087890625, -5.2734375, -4.458984375, -3.64453125, -2.830078125, -2.015625, -1.201171875, -0.38671875, 0.427734375, 1.2421875, 2.056640625, 2.87109375, 3.685546875, 4.5, 5.314453125, 6.12890625, 6.943359375, 7.7578125, 8.572265625, 9.38671875, 10.201171875, 11.015625, 11.830078125, 12.64453125, 13.458984375, 14.2734375, 15.087890625, 15.90234375, 16.716796875, 17.53125, 18.345703125, 19.16015625, 19.974609375, 20.7890625, 21.603515625, 22.41796875, 23.232421875, 24.046875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 10.0, 10.0, 16.0, 18.0, 32.0, 38.0, 58.0, 85.0, 127.0, 186.0, 256.0, 379.0, 573.0, 859.0, 1300.0, 1987.0, 3040.0, 4692.0, 7300.0, 11860.0, 19714.0, 36127.0, 73939.0, 197245.0, 446154.0, 120518.0, 52516.0, 27280.0, 15588.0, 9426.0, 5990.0, 3783.0, 2518.0, 1681.0, 1033.0, 706.0, 505.0, 314.0, 222.0, 135.0, 100.0, 70.0, 50.0, 39.0, 29.0, 15.0, 10.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0], "bins": [-1.0771484375, -1.0457229614257812, -1.0142974853515625, -0.9828720092773438, -0.951446533203125, -0.9200210571289062, -0.8885955810546875, -0.8571701049804688, -0.82574462890625, -0.7943191528320312, -0.7628936767578125, -0.7314682006835938, -0.700042724609375, -0.6686172485351562, -0.6371917724609375, -0.6057662963867188, -0.5743408203125, -0.5429153442382812, -0.5114898681640625, -0.48006439208984375, -0.448638916015625, -0.41721343994140625, -0.3857879638671875, -0.35436248779296875, -0.32293701171875, -0.29151153564453125, -0.2600860595703125, -0.22866058349609375, -0.197235107421875, -0.16580963134765625, -0.1343841552734375, -0.10295867919921875, -0.071533203125, -0.04010772705078125, -0.0086822509765625, 0.02274322509765625, 0.054168701171875, 0.08559417724609375, 0.1170196533203125, 0.14844512939453125, 0.17987060546875, 0.21129608154296875, 0.2427215576171875, 0.27414703369140625, 0.305572509765625, 0.33699798583984375, 0.3684234619140625, 0.39984893798828125, 0.4312744140625, 0.46269989013671875, 0.4941253662109375, 0.5255508422851562, 0.556976318359375, 0.5884017944335938, 0.6198272705078125, 0.6512527465820312, 0.68267822265625, 0.7141036987304688, 0.7455291748046875, 0.7769546508789062, 0.808380126953125, 0.8398056030273438, 0.8712310791015625, 0.9026565551757812, 0.93408203125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 4.0, 5.0, 2.0, 5.0, 4.0, 6.0, 3.0, 11.0, 8.0, 15.0, 20.0, 10.0, 31.0, 24.0, 21.0, 23.0, 23.0, 23.0, 27.0, 37.0, 38.0, 33.0, 43.0, 34.0, 44.0, 1064.0, 33.0, 40.0, 37.0, 43.0, 29.0, 33.0, 24.0, 20.0, 19.0, 27.0, 19.0, 17.0, 25.0, 27.0, 14.0, 16.0, 10.0, 10.0, 5.0, 4.0, 5.0, 7.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.8671875, -11.5162353515625, -11.165283203125, -10.8143310546875, -10.46337890625, -10.1124267578125, -9.761474609375, -9.4105224609375, -9.0595703125, -8.7086181640625, -8.357666015625, -8.0067138671875, -7.65576171875, -7.3048095703125, -6.953857421875, -6.6029052734375, -6.251953125, -5.9010009765625, -5.550048828125, -5.1990966796875, -4.84814453125, -4.4971923828125, -4.146240234375, -3.7952880859375, -3.4443359375, -3.0933837890625, -2.742431640625, -2.3914794921875, -2.04052734375, -1.6895751953125, -1.338623046875, -0.9876708984375, -0.63671875, -0.2857666015625, 0.065185546875, 0.4161376953125, 0.76708984375, 1.1180419921875, 1.468994140625, 1.8199462890625, 2.1708984375, 2.5218505859375, 2.872802734375, 3.2237548828125, 3.57470703125, 3.9256591796875, 4.276611328125, 4.6275634765625, 4.978515625, 5.3294677734375, 5.680419921875, 6.0313720703125, 6.38232421875, 6.7332763671875, 7.084228515625, 7.4351806640625, 7.7861328125, 8.1370849609375, 8.488037109375, 8.8389892578125, 9.18994140625, 9.5408935546875, 9.891845703125, 10.2427978515625, 10.59375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 11.0, 23.0, 24.0, 42.0, 77.0, 87.0, 114.0, 140.0, 239.0, 326.0, 448.0, 640.0, 959.0, 1384.0, 2031.0, 2996.0, 4145.0, 6323.0, 9218.0, 13765.0, 20089.0, 29807.0, 44978.0, 72009.0, 126919.0, 1352300.0, 163740.0, 85476.0, 52719.0, 34147.0, 22826.0, 15752.0, 10620.0, 7122.0, 4794.0, 3310.0, 2277.0, 1617.0, 1118.0, 759.0, 533.0, 357.0, 262.0, 173.0, 121.0, 87.0, 68.0, 47.0, 34.0, 24.0, 13.0, 12.0, 9.0, 7.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.475830078125, -0.4608039855957031, -0.44577789306640625, -0.4307518005371094, -0.4157257080078125, -0.4006996154785156, -0.38567352294921875, -0.3706474304199219, -0.355621337890625, -0.3405952453613281, -0.32556915283203125, -0.3105430603027344, -0.2955169677734375, -0.2804908752441406, -0.26546478271484375, -0.2504386901855469, -0.23541259765625, -0.22038650512695312, -0.20536041259765625, -0.19033432006835938, -0.1753082275390625, -0.16028213500976562, -0.14525604248046875, -0.13022994995117188, -0.115203857421875, -0.10017776489257812, -0.08515167236328125, -0.07012557983398438, -0.0550994873046875, -0.040073394775390625, -0.02504730224609375, -0.010021209716796875, 0.0050048828125, 0.020030975341796875, 0.03505706787109375, 0.050083160400390625, 0.0651092529296875, 0.08013534545898438, 0.09516143798828125, 0.11018753051757812, 0.125213623046875, 0.14023971557617188, 0.15526580810546875, 0.17029190063476562, 0.1853179931640625, 0.20034408569335938, 0.21537017822265625, 0.23039627075195312, 0.24542236328125, 0.2604484558105469, 0.27547454833984375, 0.2905006408691406, 0.3055267333984375, 0.3205528259277344, 0.33557891845703125, 0.3506050109863281, 0.365631103515625, 0.3806571960449219, 0.39568328857421875, 0.4107093811035156, 0.4257354736328125, 0.4407615661621094, 0.45578765869140625, 0.4708137512207031, 0.48583984375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 2.0, 2.0, 4.0, 5.0, 8.0, 9.0, 15.0, 10.0, 12.0, 9.0, 16.0, 26.0, 37.0, 36.0, 62.0, 82.0, 130.0, 164.0, 77.0, 69.0, 42.0, 33.0, 25.0, 25.0, 23.0, 15.0, 9.0, 9.0, 5.0, 6.0, 5.0, 7.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.594160079956055e-05, -3.456044942140579e-05, -3.317929804325104e-05, -3.179814666509628e-05, -3.041699528694153e-05, -2.9035843908786774e-05, -2.765469253063202e-05, -2.6273541152477264e-05, -2.489238977432251e-05, -2.3511238396167755e-05, -2.2130087018013e-05, -2.0748935639858246e-05, -1.936778426170349e-05, -1.7986632883548737e-05, -1.6605481505393982e-05, -1.5224330127239227e-05, -1.3843178749084473e-05, -1.2462027370929718e-05, -1.1080875992774963e-05, -9.699724614620209e-06, -8.318573236465454e-06, -6.9374218583106995e-06, -5.556270480155945e-06, -4.17511910200119e-06, -2.7939677238464355e-06, -1.412816345691681e-06, -3.166496753692627e-08, 1.3494864106178284e-06, 2.730637788772583e-06, 4.111789166927338e-06, 5.492940545082092e-06, 6.874091923236847e-06, 8.255243301391602e-06, 9.636394679546356e-06, 1.101754605770111e-05, 1.2398697435855865e-05, 1.377984881401062e-05, 1.5161000192165375e-05, 1.654215157032013e-05, 1.7923302948474884e-05, 1.930445432662964e-05, 2.0685605704784393e-05, 2.2066757082939148e-05, 2.3447908461093903e-05, 2.4829059839248657e-05, 2.6210211217403412e-05, 2.7591362595558167e-05, 2.897251397371292e-05, 3.0353665351867676e-05, 3.173481673002243e-05, 3.3115968108177185e-05, 3.449711948633194e-05, 3.5878270864486694e-05, 3.725942224264145e-05, 3.8640573620796204e-05, 4.002172499895096e-05, 4.140287637710571e-05, 4.278402775526047e-05, 4.416517913341522e-05, 4.554633051156998e-05, 4.692748188972473e-05, 4.8308633267879486e-05, 4.968978464603424e-05, 5.1070936024188995e-05, 5.245208740234375e-05]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 9.0, 13.0, 12.0, 15.0, 9.0, 11.0, 29.0, 24.0, 40.0, 46.0, 50.0, 53.0, 103.0, 134.0, 175.0, 349.0, 960.0, 1021326.0, 23734.0, 525.0, 280.0, 169.0, 99.0, 86.0, 71.0, 49.0, 35.0, 30.0, 23.0, 16.0, 17.0, 18.0, 10.0, 8.0, 8.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008249282836914062, -0.0007972493767738342, -0.0007695704698562622, -0.0007418915629386902, -0.0007142126560211182, -0.0006865337491035461, -0.0006588548421859741, -0.0006311759352684021, -0.0006034970283508301, -0.0005758181214332581, -0.000548139214515686, -0.000520460307598114, -0.000492781400680542, -0.00046510249376296997, -0.00043742358684539795, -0.00040974467992782593, -0.0003820657730102539, -0.0003543868660926819, -0.00032670795917510986, -0.00029902905225753784, -0.0002713501453399658, -0.0002436712384223938, -0.00021599233150482178, -0.00018831342458724976, -0.00016063451766967773, -0.0001329556107521057, -0.00010527670383453369, -7.759779691696167e-05, -4.991888999938965e-05, -2.2239983081817627e-05, 5.4389238357543945e-06, 3.3117830753326416e-05, 6.079673767089844e-05, 8.847564458847046e-05, 0.00011615455150604248, 0.0001438334584236145, 0.00017151236534118652, 0.00019919127225875854, 0.00022687017917633057, 0.0002545490860939026, 0.0002822279930114746, 0.00030990689992904663, 0.00033758580684661865, 0.0003652647137641907, 0.0003929436206817627, 0.0004206225275993347, 0.00044830143451690674, 0.00047598034143447876, 0.0005036592483520508, 0.0005313381552696228, 0.0005590170621871948, 0.0005866959691047668, 0.0006143748760223389, 0.0006420537829399109, 0.0006697326898574829, 0.0006974115967750549, 0.000725090503692627, 0.000752769410610199, 0.000780448317527771, 0.000808127224445343, 0.000835806131362915, 0.0008634850382804871, 0.0008911639451980591, 0.0009188428521156311, 0.0009465217590332031]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 17.0, 68.0, 340.0, 489.0, 69.0, 21.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.718855340499431e-05, -7.561613892903551e-05, -7.404372445307672e-05, -7.247131725307554e-05, -7.089890277711675e-05, -6.932648830115795e-05, -6.775407382519916e-05, -6.618165934924036e-05, -6.460925214923918e-05, -6.303683767328039e-05, -6.14644231973216e-05, -5.9892012359341606e-05, -5.831960152136162e-05, -5.6747187045402825e-05, -5.517477256944403e-05, -5.360236173146404e-05, -5.202994725550525e-05, -5.0457532779546455e-05, -4.888512194156647e-05, -4.731270746560767e-05, -4.5740296627627686e-05, -4.416788215166889e-05, -4.2595471313688904e-05, -4.102305683773011e-05, -3.9450642361771315e-05, -3.787822788581252e-05, -3.6305817047832534e-05, -3.473340257187374e-05, -3.316099173389375e-05, -3.158857725793496e-05, -3.0016164600965567e-05, -2.8443751943996176e-05, -2.6871339287026785e-05, -2.5298926630057395e-05, -2.3726513973088004e-05, -2.2154101316118613e-05, -2.058168684015982e-05, -1.900927600217983e-05, -1.7436861526221037e-05, -1.5864448869251646e-05, -1.4292036212282255e-05, -1.2719623555312864e-05, -1.1147210898343474e-05, -9.574797331879381e-06, -8.00238467490999e-06, -6.4299720179405995e-06, -4.857558451476507e-06, -3.285145794507116e-06, -1.7127331375377253e-06, -1.4032025319465902e-07, 1.4320926311484072e-06, 3.004505742865149e-06, 4.57691839983454e-06, 6.1493310568039306e-06, 7.721744623268023e-06, 9.294157280237414e-06, 1.0866569937206805e-05, 1.2438982594176196e-05, 1.4011395251145586e-05, 1.558380972710438e-05, 1.7156220565084368e-05, 1.8728635041043162e-05, 2.0301047698012553e-05, 2.1873460354981944e-05, 2.3445873011951335e-05]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 7.0, 9.0, 8.0, 14.0, 11.0, 7.0, 16.0, 16.0, 24.0, 32.0, 26.0, 32.0, 38.0, 33.0, 44.0, 44.0, 55.0, 49.0, 36.0, 48.0, 32.0, 51.0, 50.0, 37.0, 33.0, 44.0, 34.0, 23.0, 31.0, 22.0, 18.0, 16.0, 18.0, 11.0, 3.0, 5.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.1159648895263672e-05, -2.0544975996017456e-05, -1.993030309677124e-05, -1.9315630197525024e-05, -1.870095729827881e-05, -1.8086284399032593e-05, -1.7471611499786377e-05, -1.685693860054016e-05, -1.6242265701293945e-05, -1.562759280204773e-05, -1.5012919902801514e-05, -1.4398247003555298e-05, -1.3783574104309082e-05, -1.3168901205062866e-05, -1.255422830581665e-05, -1.1939555406570435e-05, -1.1324882507324219e-05, -1.0710209608078003e-05, -1.0095536708831787e-05, -9.480863809585571e-06, -8.866190910339355e-06, -8.25151801109314e-06, -7.636845111846924e-06, -7.022172212600708e-06, -6.407499313354492e-06, -5.792826414108276e-06, -5.1781535148620605e-06, -4.563480615615845e-06, -3.948807716369629e-06, -3.334134817123413e-06, -2.7194619178771973e-06, -2.1047890186309814e-06, -1.4901161193847656e-06, -8.754432201385498e-07, -2.60770320892334e-07, 3.5390257835388184e-07, 9.685754776000977e-07, 1.5832483768463135e-06, 2.1979212760925293e-06, 2.812594175338745e-06, 3.427267074584961e-06, 4.041939973831177e-06, 4.656612873077393e-06, 5.271285772323608e-06, 5.885958671569824e-06, 6.50063157081604e-06, 7.115304470062256e-06, 7.729977369308472e-06, 8.344650268554688e-06, 8.959323167800903e-06, 9.573996067047119e-06, 1.0188668966293335e-05, 1.080334186553955e-05, 1.1418014764785767e-05, 1.2032687664031982e-05, 1.2647360563278198e-05, 1.3262033462524414e-05, 1.387670636177063e-05, 1.4491379261016846e-05, 1.5106052160263062e-05, 1.5720725059509277e-05, 1.6335397958755493e-05, 1.695007085800171e-05, 1.7564743757247925e-05, 1.817941665649414e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 6.0, 9.0, 12.0, 10.0, 13.0, 14.0, 13.0, 20.0, 20.0, 30.0, 29.0, 23.0, 46.0, 44.0, 48.0, 82.0, 76.0, 75.0, 67.0, 55.0, 63.0, 45.0, 32.0, 28.0, 22.0, 18.0, 17.0, 10.0, 10.0, 7.0, 11.0, 8.0, 4.0, 5.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.078125, -27.263671875, -26.44921875, -25.634765625, -24.8203125, -24.005859375, -23.19140625, -22.376953125, -21.5625, -20.748046875, -19.93359375, -19.119140625, -18.3046875, -17.490234375, -16.67578125, -15.861328125, -15.046875, -14.232421875, -13.41796875, -12.603515625, -11.7890625, -10.974609375, -10.16015625, -9.345703125, -8.53125, -7.716796875, -6.90234375, -6.087890625, -5.2734375, -4.458984375, -3.64453125, -2.830078125, -2.015625, -1.201171875, -0.38671875, 0.427734375, 1.2421875, 2.056640625, 2.87109375, 3.685546875, 4.5, 5.314453125, 6.12890625, 6.943359375, 7.7578125, 8.572265625, 9.38671875, 10.201171875, 11.015625, 11.830078125, 12.64453125, 13.458984375, 14.2734375, 15.087890625, 15.90234375, 16.716796875, 17.53125, 18.345703125, 19.16015625, 19.974609375, 20.7890625, 21.603515625, 22.41796875, 23.232421875, 24.046875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 12.0, 10.0, 17.0, 19.0, 23.0, 28.0, 45.0, 60.0, 74.0, 111.0, 144.0, 249.0, 345.0, 455.0, 692.0, 1119.0, 1711.0, 2874.0, 5180.0, 10881.0, 29415.0, 133848.0, 728061.0, 88757.0, 23246.0, 9248.0, 4606.0, 2543.0, 1627.0, 1038.0, 647.0, 427.0, 318.0, 201.0, 164.0, 96.0, 60.0, 55.0, 36.0, 36.0, 28.0, 12.0, 13.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-104.5625, -101.5224609375, -98.482421875, -95.4423828125, -92.40234375, -89.3623046875, -86.322265625, -83.2822265625, -80.2421875, -77.2021484375, -74.162109375, -71.1220703125, -68.08203125, -65.0419921875, -62.001953125, -58.9619140625, -55.921875, -52.8818359375, -49.841796875, -46.8017578125, -43.76171875, -40.7216796875, -37.681640625, -34.6416015625, -31.6015625, -28.5615234375, -25.521484375, -22.4814453125, -19.44140625, -16.4013671875, -13.361328125, -10.3212890625, -7.28125, -4.2412109375, -1.201171875, 1.8388671875, 4.87890625, 7.9189453125, 10.958984375, 13.9990234375, 17.0390625, 20.0791015625, 23.119140625, 26.1591796875, 29.19921875, 32.2392578125, 35.279296875, 38.3193359375, 41.359375, 44.3994140625, 47.439453125, 50.4794921875, 53.51953125, 56.5595703125, 59.599609375, 62.6396484375, 65.6796875, 68.7197265625, 71.759765625, 74.7998046875, 77.83984375, 80.8798828125, 83.919921875, 86.9599609375, 90.0]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 11.0, 10.0, 11.0, 13.0, 14.0, 24.0, 30.0, 30.0, 30.0, 44.0, 33.0, 49.0, 54.0, 59.0, 94.0, 221.0, 1651.0, 153.0, 59.0, 61.0, 43.0, 36.0, 34.0, 32.0, 37.0, 36.0, 28.0, 28.0, 23.0, 8.0, 11.0, 15.0, 16.0, 4.0, 9.0, 9.0, 1.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-86.0, -83.5673828125, -81.134765625, -78.7021484375, -76.26953125, -73.8369140625, -71.404296875, -68.9716796875, -66.5390625, -64.1064453125, -61.673828125, -59.2412109375, -56.80859375, -54.3759765625, -51.943359375, -49.5107421875, -47.078125, -44.6455078125, -42.212890625, -39.7802734375, -37.34765625, -34.9150390625, -32.482421875, -30.0498046875, -27.6171875, -25.1845703125, -22.751953125, -20.3193359375, -17.88671875, -15.4541015625, -13.021484375, -10.5888671875, -8.15625, -5.7236328125, -3.291015625, -0.8583984375, 1.57421875, 4.0068359375, 6.439453125, 8.8720703125, 11.3046875, 13.7373046875, 16.169921875, 18.6025390625, 21.03515625, 23.4677734375, 25.900390625, 28.3330078125, 30.765625, 33.1982421875, 35.630859375, 38.0634765625, 40.49609375, 42.9287109375, 45.361328125, 47.7939453125, 50.2265625, 52.6591796875, 55.091796875, 57.5244140625, 59.95703125, 62.3896484375, 64.822265625, 67.2548828125, 69.6875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 7.0, 6.0, 16.0, 16.0, 9.0, 7.0, 18.0, 23.0, 28.0, 28.0, 31.0, 39.0, 45.0, 71.0, 157.0, 321.0, 1366.0, 30238.0, 3100125.0, 11588.0, 900.0, 239.0, 111.0, 70.0, 42.0, 38.0, 27.0, 29.0, 19.0, 24.0, 10.0, 10.0, 10.0, 8.0, 9.0, 4.0, 5.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-340.25, -328.265625, -316.28125, -304.296875, -292.3125, -280.328125, -268.34375, -256.359375, -244.375, -232.390625, -220.40625, -208.421875, -196.4375, -184.453125, -172.46875, -160.484375, -148.5, -136.515625, -124.53125, -112.546875, -100.5625, -88.578125, -76.59375, -64.609375, -52.625, -40.640625, -28.65625, -16.671875, -4.6875, 7.296875, 19.28125, 31.265625, 43.25, 55.234375, 67.21875, 79.203125, 91.1875, 103.171875, 115.15625, 127.140625, 139.125, 151.109375, 163.09375, 175.078125, 187.0625, 199.046875, 211.03125, 223.015625, 235.0, 246.984375, 258.96875, 270.953125, 282.9375, 294.921875, 306.90625, 318.890625, 330.875, 342.859375, 354.84375, 366.828125, 378.8125, 390.796875, 402.78125, 414.765625, 426.75]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 14.0, 208.0, 707.0, 78.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-808.6544189453125, -781.9524536132812, -755.25048828125, -728.5485229492188, -701.8465576171875, -675.1445922851562, -648.442626953125, -621.7406616210938, -595.0386962890625, -568.3367309570312, -541.634765625, -514.9328002929688, -488.2308349609375, -461.52886962890625, -434.826904296875, -408.12493896484375, -381.4229736328125, -354.72100830078125, -328.01904296875, -301.31707763671875, -274.6151123046875, -247.91314697265625, -221.211181640625, -194.50921630859375, -167.8072509765625, -141.10528564453125, -114.4033203125, -87.70135498046875, -60.9993896484375, -34.29742431640625, -7.595458984375, 19.10650634765625, 45.80841064453125, 72.5103759765625, 99.21234130859375, 125.914306640625, 152.61627197265625, 179.3182373046875, 206.02020263671875, 232.72216796875, 259.42413330078125, 286.1260986328125, 312.82806396484375, 339.530029296875, 366.23199462890625, 392.9339599609375, 419.63592529296875, 446.337890625, 473.03985595703125, 499.7418212890625, 526.4437866210938, 553.145751953125, 579.8477172851562, 606.5496826171875, 633.2516479492188, 659.95361328125, 686.6555786132812, 713.3575439453125, 740.0595092773438, 766.761474609375, 793.4634399414062, 820.1654052734375, 846.8673706054688, 873.5693359375, 900.2713012695312]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 4.0, 5.0, 5.0, 7.0, 6.0, 5.0, 14.0, 7.0, 13.0, 16.0, 10.0, 21.0, 20.0, 25.0, 29.0, 30.0, 29.0, 18.0, 35.0, 22.0, 21.0, 33.0, 39.0, 39.0, 34.0, 34.0, 30.0, 26.0, 39.0, 37.0, 15.0, 28.0, 29.0, 24.0, 31.0, 24.0, 27.0, 20.0, 17.0, 16.0, 22.0, 14.0, 9.0, 13.0, 10.0, 8.0, 10.0, 4.0, 10.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 4.0], "bins": [-201.40931701660156, -195.08128356933594, -188.75326538085938, -182.42523193359375, -176.09719848632812, -169.76918029785156, -163.44114685058594, -157.11312866210938, -150.78509521484375, -144.45706176757812, -138.12904357910156, -131.80101013183594, -125.47298431396484, -119.14495849609375, -112.81692504882812, -106.48889923095703, -100.16087341308594, -93.83284759521484, -87.50482177734375, -81.17678833007812, -74.84876251220703, -68.52073669433594, -62.19270706176758, -55.86467742919922, -49.536651611328125, -43.20862579345703, -36.88059616088867, -30.552568435668945, -24.22454071044922, -17.896512985229492, -11.568485260009766, -5.240455627441406, 1.087554931640625, 7.415582656860352, 13.743610382080078, 20.071638107299805, 26.39966583251953, 32.727691650390625, 39.055721282958984, 45.383750915527344, 51.71177673339844, 58.03980255126953, 64.36782836914062, 70.69586181640625, 77.02388763427734, 83.35191345214844, 89.67994689941406, 96.00797271728516, 102.33599853515625, 108.66402435302734, 114.99205017089844, 121.32008361816406, 127.64810943603516, 133.97613525390625, 140.30416870117188, 146.6322021484375, 152.96022033691406, 159.2882537841797, 165.61627197265625, 171.94430541992188, 178.2723388671875, 184.60035705566406, 190.9283905029297, 197.25640869140625, 203.58444213867188]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 7.0, 7.0, 2.0, 11.0, 8.0, 12.0, 9.0, 14.0, 13.0, 18.0, 9.0, 32.0, 26.0, 26.0, 45.0, 35.0, 51.0, 54.0, 59.0, 91.0, 51.0, 65.0, 67.0, 58.0, 42.0, 32.0, 25.0, 21.0, 15.0, 15.0, 15.0, 10.0, 7.0, 15.0, 7.0, 6.0, 4.0, 4.0, 1.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-29.78125, -28.9599609375, -28.138671875, -27.3173828125, -26.49609375, -25.6748046875, -24.853515625, -24.0322265625, -23.2109375, -22.3896484375, -21.568359375, -20.7470703125, -19.92578125, -19.1044921875, -18.283203125, -17.4619140625, -16.640625, -15.8193359375, -14.998046875, -14.1767578125, -13.35546875, -12.5341796875, -11.712890625, -10.8916015625, -10.0703125, -9.2490234375, -8.427734375, -7.6064453125, -6.78515625, -5.9638671875, -5.142578125, -4.3212890625, -3.5, -2.6787109375, -1.857421875, -1.0361328125, -0.21484375, 0.6064453125, 1.427734375, 2.2490234375, 3.0703125, 3.8916015625, 4.712890625, 5.5341796875, 6.35546875, 7.1767578125, 7.998046875, 8.8193359375, 9.640625, 10.4619140625, 11.283203125, 12.1044921875, 12.92578125, 13.7470703125, 14.568359375, 15.3896484375, 16.2109375, 17.0322265625, 17.853515625, 18.6748046875, 19.49609375, 20.3173828125, 21.138671875, 21.9599609375, 22.78125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 8.0, 3.0, 7.0, 15.0, 19.0, 18.0, 24.0, 30.0, 43.0, 46.0, 69.0, 89.0, 110.0, 173.0, 271.0, 401.0, 696.0, 1317.0, 2404.0, 4990.0, 11174.0, 40646.0, 3911420.0, 193224.0, 15440.0, 5751.0, 2633.0, 1346.0, 698.0, 382.0, 254.0, 151.0, 99.0, 85.0, 66.0, 29.0, 36.0, 26.0, 24.0, 16.0, 16.0, 8.0, 7.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 2.0], "bins": [-166.875, -162.3232421875, -157.771484375, -153.2197265625, -148.66796875, -144.1162109375, -139.564453125, -135.0126953125, -130.4609375, -125.9091796875, -121.357421875, -116.8056640625, -112.25390625, -107.7021484375, -103.150390625, -98.5986328125, -94.046875, -89.4951171875, -84.943359375, -80.3916015625, -75.83984375, -71.2880859375, -66.736328125, -62.1845703125, -57.6328125, -53.0810546875, -48.529296875, -43.9775390625, -39.42578125, -34.8740234375, -30.322265625, -25.7705078125, -21.21875, -16.6669921875, -12.115234375, -7.5634765625, -3.01171875, 1.5400390625, 6.091796875, 10.6435546875, 15.1953125, 19.7470703125, 24.298828125, 28.8505859375, 33.40234375, 37.9541015625, 42.505859375, 47.0576171875, 51.609375, 56.1611328125, 60.712890625, 65.2646484375, 69.81640625, 74.3681640625, 78.919921875, 83.4716796875, 88.0234375, 92.5751953125, 97.126953125, 101.6787109375, 106.23046875, 110.7822265625, 115.333984375, 119.8857421875, 124.4375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 7.0, 15.0, 11.0, 22.0, 25.0, 35.0, 43.0, 51.0, 122.0, 478.0, 1609.0, 1055.0, 277.0, 92.0, 50.0, 33.0, 37.0, 26.0, 16.0, 19.0, 11.0, 8.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0], "bins": [-142.375, -138.794921875, -135.21484375, -131.634765625, -128.0546875, -124.474609375, -120.89453125, -117.314453125, -113.734375, -110.154296875, -106.57421875, -102.994140625, -99.4140625, -95.833984375, -92.25390625, -88.673828125, -85.09375, -81.513671875, -77.93359375, -74.353515625, -70.7734375, -67.193359375, -63.61328125, -60.033203125, -56.453125, -52.873046875, -49.29296875, -45.712890625, -42.1328125, -38.552734375, -34.97265625, -31.392578125, -27.8125, -24.232421875, -20.65234375, -17.072265625, -13.4921875, -9.912109375, -6.33203125, -2.751953125, 0.828125, 4.408203125, 7.98828125, 11.568359375, 15.1484375, 18.728515625, 22.30859375, 25.888671875, 29.46875, 33.048828125, 36.62890625, 40.208984375, 43.7890625, 47.369140625, 50.94921875, 54.529296875, 58.109375, 61.689453125, 65.26953125, 68.849609375, 72.4296875, 76.009765625, 79.58984375, 83.169921875, 86.75]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 1.0, 11.0, 7.0, 20.0, 20.0, 26.0, 35.0, 38.0, 62.0, 125.0, 182.0, 303.0, 432.0, 803.0, 1457.0, 2810.0, 6005.0, 14534.0, 40965.0, 225194.0, 3713759.0, 132644.0, 32270.0, 11858.0, 5093.0, 2512.0, 1274.0, 705.0, 395.0, 264.0, 158.0, 96.0, 80.0, 43.0, 37.0, 21.0, 12.0, 12.0, 6.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.75, -122.91015625, -118.0703125, -113.23046875, -108.390625, -103.55078125, -98.7109375, -93.87109375, -89.03125, -84.19140625, -79.3515625, -74.51171875, -69.671875, -64.83203125, -59.9921875, -55.15234375, -50.3125, -45.47265625, -40.6328125, -35.79296875, -30.953125, -26.11328125, -21.2734375, -16.43359375, -11.59375, -6.75390625, -1.9140625, 2.92578125, 7.765625, 12.60546875, 17.4453125, 22.28515625, 27.125, 31.96484375, 36.8046875, 41.64453125, 46.484375, 51.32421875, 56.1640625, 61.00390625, 65.84375, 70.68359375, 75.5234375, 80.36328125, 85.203125, 90.04296875, 94.8828125, 99.72265625, 104.5625, 109.40234375, 114.2421875, 119.08203125, 123.921875, 128.76171875, 133.6015625, 138.44140625, 143.28125, 148.12109375, 152.9609375, 157.80078125, 162.640625, 167.48046875, 172.3203125, 177.16015625, 182.0]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 18.0, 58.0, 284.0, 502.0, 106.0, 26.0, 9.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-465.0841979980469, -432.31146240234375, -399.53875732421875, -366.7660217285156, -333.9932861328125, -301.2205505371094, -268.44781494140625, -235.67510986328125, -202.90237426757812, -170.129638671875, -137.35691833496094, -104.58419036865234, -71.81146240234375, -39.038726806640625, -6.2660064697265625, 26.5067138671875, 59.279449462890625, 92.05217742919922, 124.82490539550781, 157.59762573242188, 190.370361328125, 223.14309692382812, 255.9158172607422, 288.68853759765625, 321.4612731933594, 354.2340087890625, 387.0067138671875, 419.7794494628906, 452.55218505859375, 485.3249206542969, 518.09765625, 550.870361328125, 583.6431884765625, 616.4158935546875, 649.1886596679688, 681.9613647460938, 714.734130859375, 747.5068359375, 780.279541015625, 813.05224609375, 845.8250122070312, 878.5977172851562, 911.3704833984375, 944.1431884765625, 976.9158935546875, 1009.6886596679688, 1042.46142578125, 1075.234130859375, 1108.0068359375, 1140.779541015625, 1173.55224609375, 1206.3250732421875, 1239.0977783203125, 1271.8704833984375, 1304.6431884765625, 1337.4158935546875, 1370.188720703125, 1402.96142578125, 1435.734130859375, 1468.5069580078125, 1501.2796630859375, 1534.0523681640625, 1566.8250732421875, 1599.5977783203125, 1632.3704833984375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 10.0, 3.0, 7.0, 8.0, 8.0, 19.0, 16.0, 13.0, 24.0, 28.0, 28.0, 32.0, 22.0, 48.0, 43.0, 23.0, 33.0, 36.0, 30.0, 42.0, 44.0, 40.0, 36.0, 32.0, 32.0, 30.0, 39.0, 30.0, 23.0, 39.0, 31.0, 27.0, 24.0, 11.0, 15.0, 16.0, 13.0, 7.0, 6.0, 11.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-196.9012908935547, -190.0442657470703, -183.18724060058594, -176.33021545410156, -169.47317504882812, -162.61614990234375, -155.75912475585938, -148.902099609375, -142.04507446289062, -135.18804931640625, -128.33102416992188, -121.47399139404297, -114.6169662475586, -107.75994110107422, -100.90290832519531, -94.04588317871094, -87.18885803222656, -80.33183288574219, -73.47480773925781, -66.6177749633789, -59.76074981689453, -52.903724670410156, -46.046695709228516, -39.189666748046875, -32.3326416015625, -25.475614547729492, -18.618587493896484, -11.761560440063477, -4.904533386230469, 1.9524917602539062, 8.809520721435547, 15.666549682617188, 22.5235595703125, 29.380586624145508, 36.237613677978516, 43.094642639160156, 49.95166778564453, 56.808692932128906, 63.66572189331055, 70.52275085449219, 77.37977600097656, 84.23680114746094, 91.09382629394531, 97.95085906982422, 104.8078842163086, 111.66490936279297, 118.52194213867188, 125.37896728515625, 132.23599243164062, 139.093017578125, 145.95004272460938, 152.80706787109375, 159.66409301757812, 166.5211181640625, 173.37815856933594, 180.2351837158203, 187.0922088623047, 193.94923400878906, 200.80625915527344, 207.6632843017578, 214.52032470703125, 221.37734985351562, 228.234375, 235.09140014648438, 241.94842529296875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 3.0, 11.0, 9.0, 7.0, 11.0, 15.0, 10.0, 12.0, 14.0, 26.0, 23.0, 23.0, 29.0, 34.0, 54.0, 50.0, 61.0, 55.0, 61.0, 56.0, 52.0, 71.0, 54.0, 41.0, 44.0, 17.0, 25.0, 25.0, 18.0, 14.0, 16.0, 11.0, 7.0, 6.0, 5.0, 6.0, 6.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-30.0, -29.124755859375, -28.24951171875, -27.374267578125, -26.4990234375, -25.623779296875, -24.74853515625, -23.873291015625, -22.998046875, -22.122802734375, -21.24755859375, -20.372314453125, -19.4970703125, -18.621826171875, -17.74658203125, -16.871337890625, -15.99609375, -15.120849609375, -14.24560546875, -13.370361328125, -12.4951171875, -11.619873046875, -10.74462890625, -9.869384765625, -8.994140625, -8.118896484375, -7.24365234375, -6.368408203125, -5.4931640625, -4.617919921875, -3.74267578125, -2.867431640625, -1.9921875, -1.116943359375, -0.24169921875, 0.633544921875, 1.5087890625, 2.384033203125, 3.25927734375, 4.134521484375, 5.009765625, 5.885009765625, 6.76025390625, 7.635498046875, 8.5107421875, 9.385986328125, 10.26123046875, 11.136474609375, 12.01171875, 12.886962890625, 13.76220703125, 14.637451171875, 15.5126953125, 16.387939453125, 17.26318359375, 18.138427734375, 19.013671875, 19.888916015625, 20.76416015625, 21.639404296875, 22.5146484375, 23.389892578125, 24.26513671875, 25.140380859375, 26.015625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 5.0, 2.0, 1.0, 9.0, 6.0, 13.0, 19.0, 28.0, 44.0, 41.0, 63.0, 84.0, 131.0, 178.0, 250.0, 367.0, 485.0, 744.0, 1069.0, 1509.0, 2263.0, 3424.0, 5175.0, 8220.0, 13116.0, 21701.0, 38733.0, 77037.0, 191934.0, 406925.0, 133794.0, 59390.0, 31552.0, 18140.0, 11055.0, 7093.0, 4530.0, 2993.0, 2026.0, 1348.0, 939.0, 631.0, 426.0, 304.0, 216.0, 169.0, 115.0, 80.0, 53.0, 43.0, 27.0, 18.0, 7.0, 15.0, 9.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0], "bins": [-1.0625, -1.029632568359375, -0.99676513671875, -0.963897705078125, -0.9310302734375, -0.898162841796875, -0.86529541015625, -0.832427978515625, -0.799560546875, -0.766693115234375, -0.73382568359375, -0.700958251953125, -0.6680908203125, -0.635223388671875, -0.60235595703125, -0.569488525390625, -0.53662109375, -0.503753662109375, -0.47088623046875, -0.438018798828125, -0.4051513671875, -0.372283935546875, -0.33941650390625, -0.306549072265625, -0.273681640625, -0.240814208984375, -0.20794677734375, -0.175079345703125, -0.1422119140625, -0.109344482421875, -0.07647705078125, -0.043609619140625, -0.0107421875, 0.022125244140625, 0.05499267578125, 0.087860107421875, 0.1207275390625, 0.153594970703125, 0.18646240234375, 0.219329833984375, 0.252197265625, 0.285064697265625, 0.31793212890625, 0.350799560546875, 0.3836669921875, 0.416534423828125, 0.44940185546875, 0.482269287109375, 0.51513671875, 0.548004150390625, 0.58087158203125, 0.613739013671875, 0.6466064453125, 0.679473876953125, 0.71234130859375, 0.745208740234375, 0.778076171875, 0.810943603515625, 0.84381103515625, 0.876678466796875, 0.9095458984375, 0.942413330078125, 0.97528076171875, 1.008148193359375, 1.041015625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 6.0, 11.0, 10.0, 18.0, 15.0, 25.0, 16.0, 21.0, 27.0, 29.0, 34.0, 37.0, 39.0, 36.0, 42.0, 46.0, 34.0, 1079.0, 52.0, 31.0, 46.0, 53.0, 46.0, 33.0, 47.0, 35.0, 23.0, 32.0, 10.0, 20.0, 13.0, 10.0, 8.0, 13.0, 8.0, 4.0, 1.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-17.5625, -17.08154296875, -16.6005859375, -16.11962890625, -15.638671875, -15.15771484375, -14.6767578125, -14.19580078125, -13.71484375, -13.23388671875, -12.7529296875, -12.27197265625, -11.791015625, -11.31005859375, -10.8291015625, -10.34814453125, -9.8671875, -9.38623046875, -8.9052734375, -8.42431640625, -7.943359375, -7.46240234375, -6.9814453125, -6.50048828125, -6.01953125, -5.53857421875, -5.0576171875, -4.57666015625, -4.095703125, -3.61474609375, -3.1337890625, -2.65283203125, -2.171875, -1.69091796875, -1.2099609375, -0.72900390625, -0.248046875, 0.23291015625, 0.7138671875, 1.19482421875, 1.67578125, 2.15673828125, 2.6376953125, 3.11865234375, 3.599609375, 4.08056640625, 4.5615234375, 5.04248046875, 5.5234375, 6.00439453125, 6.4853515625, 6.96630859375, 7.447265625, 7.92822265625, 8.4091796875, 8.89013671875, 9.37109375, 9.85205078125, 10.3330078125, 10.81396484375, 11.294921875, 11.77587890625, 12.2568359375, 12.73779296875, 13.21875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 9.0, 9.0, 15.0, 33.0, 45.0, 54.0, 75.0, 131.0, 201.0, 297.0, 489.0, 761.0, 1218.0, 1937.0, 3077.0, 5040.0, 8036.0, 13234.0, 22463.0, 39488.0, 71083.0, 137288.0, 1409632.0, 178459.0, 88157.0, 47581.0, 27102.0, 16005.0, 9738.0, 5848.0, 3488.0, 2192.0, 1413.0, 890.0, 601.0, 344.0, 224.0, 178.0, 100.0, 69.0, 42.0, 35.0, 21.0, 10.0, 8.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.70458984375, -0.682342529296875, -0.66009521484375, -0.637847900390625, -0.6156005859375, -0.593353271484375, -0.57110595703125, -0.548858642578125, -0.526611328125, -0.504364013671875, -0.48211669921875, -0.459869384765625, -0.4376220703125, -0.415374755859375, -0.39312744140625, -0.370880126953125, -0.3486328125, -0.326385498046875, -0.30413818359375, -0.281890869140625, -0.2596435546875, -0.237396240234375, -0.21514892578125, -0.192901611328125, -0.170654296875, -0.148406982421875, -0.12615966796875, -0.103912353515625, -0.0816650390625, -0.059417724609375, -0.03717041015625, -0.014923095703125, 0.00732421875, 0.029571533203125, 0.05181884765625, 0.074066162109375, 0.0963134765625, 0.118560791015625, 0.14080810546875, 0.163055419921875, 0.185302734375, 0.207550048828125, 0.22979736328125, 0.252044677734375, 0.2742919921875, 0.296539306640625, 0.31878662109375, 0.341033935546875, 0.36328125, 0.385528564453125, 0.40777587890625, 0.430023193359375, 0.4522705078125, 0.474517822265625, 0.49676513671875, 0.519012451171875, 0.541259765625, 0.563507080078125, 0.58575439453125, 0.608001708984375, 0.6302490234375, 0.652496337890625, 0.67474365234375, 0.696990966796875, 0.71923828125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 5.0, 11.0, 10.0, 15.0, 17.0, 15.0, 25.0, 24.0, 28.0, 41.0, 38.0, 53.0, 61.0, 74.0, 122.0, 67.0, 57.0, 60.0, 34.0, 41.0, 34.0, 28.0, 24.0, 23.0, 11.0, 17.0, 14.0, 9.0, 7.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.23464584350586e-05, -6.041862070560455e-05, -5.849078297615051e-05, -5.656294524669647e-05, -5.463510751724243e-05, -5.270726978778839e-05, -5.077943205833435e-05, -4.885159432888031e-05, -4.692375659942627e-05, -4.499591886997223e-05, -4.306808114051819e-05, -4.114024341106415e-05, -3.921240568161011e-05, -3.728456795215607e-05, -3.5356730222702026e-05, -3.3428892493247986e-05, -3.1501054763793945e-05, -2.9573217034339905e-05, -2.7645379304885864e-05, -2.5717541575431824e-05, -2.3789703845977783e-05, -2.1861866116523743e-05, -1.9934028387069702e-05, -1.800619065761566e-05, -1.607835292816162e-05, -1.415051519870758e-05, -1.222267746925354e-05, -1.02948397397995e-05, -8.367002010345459e-06, -6.4391642808914185e-06, -4.511326551437378e-06, -2.5834888219833374e-06, -6.556510925292969e-07, 1.2721866369247437e-06, 3.200024366378784e-06, 5.127862095832825e-06, 7.055699825286865e-06, 8.983537554740906e-06, 1.0911375284194946e-05, 1.2839213013648987e-05, 1.4767050743103027e-05, 1.6694888472557068e-05, 1.862272620201111e-05, 2.055056393146515e-05, 2.247840166091919e-05, 2.440623939037323e-05, 2.633407711982727e-05, 2.826191484928131e-05, 3.018975257873535e-05, 3.211759030818939e-05, 3.404542803764343e-05, 3.597326576709747e-05, 3.7901103496551514e-05, 3.9828941226005554e-05, 4.1756778955459595e-05, 4.3684616684913635e-05, 4.5612454414367676e-05, 4.7540292143821716e-05, 4.946812987327576e-05, 5.13959676027298e-05, 5.332380533218384e-05, 5.525164306163788e-05, 5.717948079109192e-05, 5.910731852054596e-05, 6.103515625e-05]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 2.0, 4.0, 8.0, 6.0, 9.0, 14.0, 13.0, 20.0, 25.0, 30.0, 40.0, 47.0, 59.0, 62.0, 88.0, 100.0, 110.0, 159.0, 284.0, 1162.0, 51577.0, 984820.0, 8411.0, 543.0, 205.0, 136.0, 113.0, 93.0, 77.0, 68.0, 54.0, 34.0, 49.0, 30.0, 26.0, 19.0, 13.0, 12.0, 8.0, 5.0, 4.0, 2.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.001018524169921875, -0.0009869933128356934, -0.0009554624557495117, -0.0009239315986633301, -0.0008924007415771484, -0.0008608698844909668, -0.0008293390274047852, -0.0007978081703186035, -0.0007662773132324219, -0.0007347464561462402, -0.0007032155990600586, -0.000671684741973877, -0.0006401538848876953, -0.0006086230278015137, -0.000577092170715332, -0.0005455613136291504, -0.0005140304565429688, -0.0004824995994567871, -0.00045096874237060547, -0.00041943788528442383, -0.0003879070281982422, -0.00035637617111206055, -0.0003248453140258789, -0.00029331445693969727, -0.0002617835998535156, -0.00023025274276733398, -0.00019872188568115234, -0.0001671910285949707, -0.00013566017150878906, -0.00010412931442260742, -7.259845733642578e-05, -4.106760025024414e-05, -9.5367431640625e-06, 2.199411392211914e-05, 5.352497100830078e-05, 8.505582809448242e-05, 0.00011658668518066406, 0.0001481175422668457, 0.00017964839935302734, 0.00021117925643920898, 0.00024271011352539062, 0.00027424097061157227, 0.0003057718276977539, 0.00033730268478393555, 0.0003688335418701172, 0.00040036439895629883, 0.00043189525604248047, 0.0004634261131286621, 0.0004949569702148438, 0.0005264878273010254, 0.000558018684387207, 0.0005895495414733887, 0.0006210803985595703, 0.000652611255645752, 0.0006841421127319336, 0.0007156729698181152, 0.0007472038269042969, 0.0007787346839904785, 0.0008102655410766602, 0.0008417963981628418, 0.0008733272552490234, 0.0009048581123352051, 0.0009363889694213867, 0.0009679198265075684, 0.00099945068359375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 6.0, 4.0, 31.0, 58.0, 107.0, 417.0, 248.0, 81.0, 32.0, 15.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.124879574694205e-05, -1.852347304520663e-05, -1.5798148524481803e-05, -1.3072825822746381e-05, -1.0347502211516257e-05, -7.622178600286134e-06, -4.8968558985507116e-06, -2.171531377825886e-06, 5.53791323909536e-07, 3.2791147077659843e-06, 6.004438091622433e-06, 8.729761248105206e-06, 1.145508485933533e-05, 1.4180408470565453e-05, 1.6905731172300875e-05, 1.96310556930257e-05, 2.2356378394761123e-05, 2.5081701096496545e-05, 2.780702561722137e-05, 3.053234831895679e-05, 3.3257671020692214e-05, 3.5982993722427636e-05, 3.8708320062141865e-05, 4.143364276387729e-05, 4.415896546561271e-05, 4.688428816734813e-05, 4.9609610869083554e-05, 5.233493720879778e-05, 5.5060259910533205e-05, 5.778558261226863e-05, 6.051090531400405e-05, 6.323622801573947e-05, 6.59615543554537e-05, 6.868688069516793e-05, 7.141219975892454e-05, 7.413752609863877e-05, 7.686284516239539e-05, 7.958817150210962e-05, 8.231349056586623e-05, 8.503881690558046e-05, 8.776414324529469e-05, 9.048946958500892e-05, 9.321478864876553e-05, 9.594011498847976e-05, 9.866543405223638e-05, 0.00010139076039195061, 0.00010411608673166484, 0.00010684140579542145, 0.00010956672485917807, 0.0001122920511988923, 0.00011501737026264891, 0.00011774269660236314, 0.00012046801566611975, 0.00012319334200583398, 0.0001259186683455482, 0.00012864399468526244, 0.00013136932102497667, 0.0001340946473646909, 0.00013681997370440513, 0.00013954528549220413, 0.00014227061183191836, 0.0001449959381716326, 0.00014772126451134682, 0.00015044659085106105, 0.00015317190263886005]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 3.0, 8.0, 7.0, 14.0, 9.0, 14.0, 17.0, 25.0, 17.0, 25.0, 27.0, 23.0, 32.0, 32.0, 38.0, 30.0, 40.0, 43.0, 47.0, 37.0, 41.0, 38.0, 30.0, 43.0, 42.0, 25.0, 33.0, 42.0, 31.0, 34.0, 33.0, 20.0, 20.0, 15.0, 12.0, 10.0, 11.0, 4.0, 7.0, 5.0, 6.0, 1.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.24249267578125e-05, -3.145076334476471e-05, -3.047659993171692e-05, -2.950243651866913e-05, -2.8528273105621338e-05, -2.7554109692573547e-05, -2.6579946279525757e-05, -2.5605782866477966e-05, -2.4631619453430176e-05, -2.3657456040382385e-05, -2.2683292627334595e-05, -2.1709129214286804e-05, -2.0734965801239014e-05, -1.9760802388191223e-05, -1.8786638975143433e-05, -1.7812475562095642e-05, -1.683831214904785e-05, -1.586414873600006e-05, -1.488998532295227e-05, -1.391582190990448e-05, -1.294165849685669e-05, -1.1967495083808899e-05, -1.0993331670761108e-05, -1.0019168257713318e-05, -9.045004844665527e-06, -8.070841431617737e-06, -7.096678018569946e-06, -6.122514605522156e-06, -5.148351192474365e-06, -4.174187779426575e-06, -3.200024366378784e-06, -2.2258609533309937e-06, -1.2516975402832031e-06, -2.775341272354126e-07, 6.966292858123779e-07, 1.6707926988601685e-06, 2.644956111907959e-06, 3.6191195249557495e-06, 4.59328293800354e-06, 5.5674463510513306e-06, 6.541609764099121e-06, 7.515773177146912e-06, 8.489936590194702e-06, 9.464100003242493e-06, 1.0438263416290283e-05, 1.1412426829338074e-05, 1.2386590242385864e-05, 1.3360753655433655e-05, 1.4334917068481445e-05, 1.5309080481529236e-05, 1.6283243894577026e-05, 1.7257407307624817e-05, 1.8231570720672607e-05, 1.9205734133720398e-05, 2.017989754676819e-05, 2.115406095981598e-05, 2.212822437286377e-05, 2.310238778591156e-05, 2.407655119895935e-05, 2.505071461200714e-05, 2.602487802505493e-05, 2.6999041438102722e-05, 2.7973204851150513e-05, 2.8947368264198303e-05, 2.9921531677246094e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 3.0, 11.0, 9.0, 7.0, 11.0, 15.0, 10.0, 12.0, 14.0, 26.0, 23.0, 23.0, 29.0, 34.0, 54.0, 50.0, 61.0, 55.0, 61.0, 56.0, 52.0, 71.0, 54.0, 41.0, 44.0, 17.0, 25.0, 25.0, 18.0, 14.0, 16.0, 11.0, 7.0, 6.0, 5.0, 6.0, 6.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-30.0, -29.124755859375, -28.24951171875, -27.374267578125, -26.4990234375, -25.623779296875, -24.74853515625, -23.873291015625, -22.998046875, -22.122802734375, -21.24755859375, -20.372314453125, -19.4970703125, -18.621826171875, -17.74658203125, -16.871337890625, -15.99609375, -15.120849609375, -14.24560546875, -13.370361328125, -12.4951171875, -11.619873046875, -10.74462890625, -9.869384765625, -8.994140625, -8.118896484375, -7.24365234375, -6.368408203125, -5.4931640625, -4.617919921875, -3.74267578125, -2.867431640625, -1.9921875, -1.116943359375, -0.24169921875, 0.633544921875, 1.5087890625, 2.384033203125, 3.25927734375, 4.134521484375, 5.009765625, 5.885009765625, 6.76025390625, 7.635498046875, 8.5107421875, 9.385986328125, 10.26123046875, 11.136474609375, 12.01171875, 12.886962890625, 13.76220703125, 14.637451171875, 15.5126953125, 16.387939453125, 17.26318359375, 18.138427734375, 19.013671875, 19.888916015625, 20.76416015625, 21.639404296875, 22.5146484375, 23.389892578125, 24.26513671875, 25.140380859375, 26.015625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 6.0, 8.0, 7.0, 12.0, 17.0, 22.0, 20.0, 31.0, 46.0, 53.0, 64.0, 83.0, 104.0, 132.0, 193.0, 291.0, 529.0, 793.0, 1431.0, 2903.0, 6420.0, 15968.0, 47355.0, 215330.0, 598497.0, 107270.0, 29836.0, 10922.0, 4807.0, 2326.0, 1096.0, 633.0, 397.0, 259.0, 183.0, 125.0, 95.0, 74.0, 51.0, 38.0, 34.0, 21.0, 23.0, 10.0, 7.0, 8.0, 5.0, 5.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0], "bins": [-26.8125, -26.03076171875, -25.2490234375, -24.46728515625, -23.685546875, -22.90380859375, -22.1220703125, -21.34033203125, -20.55859375, -19.77685546875, -18.9951171875, -18.21337890625, -17.431640625, -16.64990234375, -15.8681640625, -15.08642578125, -14.3046875, -13.52294921875, -12.7412109375, -11.95947265625, -11.177734375, -10.39599609375, -9.6142578125, -8.83251953125, -8.05078125, -7.26904296875, -6.4873046875, -5.70556640625, -4.923828125, -4.14208984375, -3.3603515625, -2.57861328125, -1.796875, -1.01513671875, -0.2333984375, 0.54833984375, 1.330078125, 2.11181640625, 2.8935546875, 3.67529296875, 4.45703125, 5.23876953125, 6.0205078125, 6.80224609375, 7.583984375, 8.36572265625, 9.1474609375, 9.92919921875, 10.7109375, 11.49267578125, 12.2744140625, 13.05615234375, 13.837890625, 14.61962890625, 15.4013671875, 16.18310546875, 16.96484375, 17.74658203125, 18.5283203125, 19.31005859375, 20.091796875, 20.87353515625, 21.6552734375, 22.43701171875, 23.21875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 9.0, 4.0, 5.0, 12.0, 8.0, 9.0, 15.0, 21.0, 17.0, 16.0, 25.0, 22.0, 31.0, 41.0, 36.0, 34.0, 38.0, 33.0, 40.0, 55.0, 257.0, 1844.0, 57.0, 51.0, 34.0, 43.0, 34.0, 35.0, 36.0, 23.0, 27.0, 19.0, 15.0, 14.0, 21.0, 11.0, 6.0, 13.0, 11.0, 3.0, 7.0, 7.0, 3.0, 7.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.5625, -81.75, -78.9375, -76.125, -73.3125, -70.5, -67.6875, -64.875, -62.0625, -59.25, -56.4375, -53.625, -50.8125, -48.0, -45.1875, -42.375, -39.5625, -36.75, -33.9375, -31.125, -28.3125, -25.5, -22.6875, -19.875, -17.0625, -14.25, -11.4375, -8.625, -5.8125, -3.0, -0.1875, 2.625, 5.4375, 8.25, 11.0625, 13.875, 16.6875, 19.5, 22.3125, 25.125, 27.9375, 30.75, 33.5625, 36.375, 39.1875, 42.0, 44.8125, 47.625, 50.4375, 53.25, 56.0625, 58.875, 61.6875, 64.5, 67.3125, 70.125, 72.9375, 75.75, 78.5625, 81.375, 84.1875, 87.0, 89.8125, 92.625, 95.4375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 7.0, 6.0, 6.0, 8.0, 14.0, 6.0, 12.0, 22.0, 15.0, 14.0, 22.0, 38.0, 29.0, 61.0, 62.0, 98.0, 154.0, 259.0, 596.0, 1955.0, 3068127.0, 71898.0, 1068.0, 448.0, 224.0, 130.0, 88.0, 58.0, 56.0, 46.0, 27.0, 27.0, 14.0, 23.0, 19.0, 13.0, 7.0, 10.0, 10.0, 6.0, 3.0, 12.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-217.375, -210.947265625, -204.51953125, -198.091796875, -191.6640625, -185.236328125, -178.80859375, -172.380859375, -165.953125, -159.525390625, -153.09765625, -146.669921875, -140.2421875, -133.814453125, -127.38671875, -120.958984375, -114.53125, -108.103515625, -101.67578125, -95.248046875, -88.8203125, -82.392578125, -75.96484375, -69.537109375, -63.109375, -56.681640625, -50.25390625, -43.826171875, -37.3984375, -30.970703125, -24.54296875, -18.115234375, -11.6875, -5.259765625, 1.16796875, 7.595703125, 14.0234375, 20.451171875, 26.87890625, 33.306640625, 39.734375, 46.162109375, 52.58984375, 59.017578125, 65.4453125, 71.873046875, 78.30078125, 84.728515625, 91.15625, 97.583984375, 104.01171875, 110.439453125, 116.8671875, 123.294921875, 129.72265625, 136.150390625, 142.578125, 149.005859375, 155.43359375, 161.861328125, 168.2890625, 174.716796875, 181.14453125, 187.572265625, 194.0]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 718.0, 289.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.73577880859375, -59.19568634033203, -38.65559387207031, -18.115501403808594, 2.424591064453125, 22.964683532714844, 43.50477600097656, 64.04486083984375, 84.5849609375, 105.12505340576172, 125.66514587402344, 146.20523071289062, 166.74533081054688, 187.28543090820312, 207.8255157470703, 228.3656005859375, 248.90570068359375, 269.44580078125, 289.98590087890625, 310.5259704589844, 331.0660705566406, 351.6061706542969, 372.146240234375, 392.68634033203125, 413.2264404296875, 433.76654052734375, 454.306640625, 474.8467102050781, 495.3868103027344, 515.9268798828125, 536.4669799804688, 557.007080078125, 577.5472412109375, 598.0873413085938, 618.62744140625, 639.1675415039062, 659.7076416015625, 680.2476806640625, 700.7877807617188, 721.327880859375, 741.8679809570312, 762.4080810546875, 782.9481811523438, 803.48828125, 824.0283203125, 844.5684204101562, 865.1085205078125, 885.6486206054688, 906.188720703125, 926.7288208007812, 947.2689208984375, 967.8090209960938, 988.34912109375, 1008.88916015625, 1029.4293212890625, 1049.9693603515625, 1070.509521484375, 1091.049560546875, 1111.5897216796875, 1132.1297607421875, 1152.669921875, 1173.2099609375, 1193.7501220703125, 1214.2901611328125, 1234.8302001953125]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 8.0, 14.0, 7.0, 13.0, 19.0, 21.0, 20.0, 21.0, 24.0, 23.0, 35.0, 36.0, 32.0, 33.0, 32.0, 35.0, 30.0, 55.0, 40.0, 34.0, 38.0, 37.0, 43.0, 27.0, 27.0, 37.0, 31.0, 24.0, 19.0, 23.0, 27.0, 18.0, 20.0, 14.0, 11.0, 10.0, 7.0, 11.0, 6.0, 5.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-263.47332763671875, -255.39288330078125, -247.3124237060547, -239.2319793701172, -231.15151977539062, -223.07107543945312, -214.99063110351562, -206.91017150878906, -198.8297119140625, -190.749267578125, -182.66880798339844, -174.58836364746094, -166.50790405273438, -158.42745971679688, -150.34701538085938, -142.2665557861328, -134.1861114501953, -126.10565948486328, -118.02520751953125, -109.94476318359375, -101.86430358886719, -93.78385925292969, -85.70340728759766, -77.62295532226562, -69.5425033569336, -61.46205139160156, -53.38159942626953, -45.301151275634766, -37.220699310302734, -29.140247344970703, -21.059799194335938, -12.979347229003906, -4.8988800048828125, 3.1815710067749023, 11.262022018432617, 19.342472076416016, 27.422924041748047, 35.50337600708008, 43.583824157714844, 51.664276123046875, 59.744728088378906, 67.82518005371094, 75.90563201904297, 83.986083984375, 92.0665283203125, 100.14698791503906, 108.22743225097656, 116.3078842163086, 124.38833618164062, 132.46878051757812, 140.5492401123047, 148.6296844482422, 156.71014404296875, 164.79058837890625, 172.87103271484375, 180.9514923095703, 189.03195190429688, 197.11239624023438, 205.19285583496094, 213.27330017089844, 221.353759765625, 229.4342041015625, 237.5146484375, 245.59510803222656, 253.67555236816406]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 6.0, 12.0, 7.0, 10.0, 10.0, 11.0, 14.0, 13.0, 22.0, 19.0, 24.0, 27.0, 33.0, 40.0, 51.0, 55.0, 62.0, 64.0, 52.0, 50.0, 69.0, 57.0, 56.0, 34.0, 34.0, 24.0, 23.0, 22.0, 12.0, 19.0, 13.0, 10.0, 5.0, 8.0, 7.0, 1.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-31.09375, -30.201416015625, -29.30908203125, -28.416748046875, -27.5244140625, -26.632080078125, -25.73974609375, -24.847412109375, -23.955078125, -23.062744140625, -22.17041015625, -21.278076171875, -20.3857421875, -19.493408203125, -18.60107421875, -17.708740234375, -16.81640625, -15.924072265625, -15.03173828125, -14.139404296875, -13.2470703125, -12.354736328125, -11.46240234375, -10.570068359375, -9.677734375, -8.785400390625, -7.89306640625, -7.000732421875, -6.1083984375, -5.216064453125, -4.32373046875, -3.431396484375, -2.5390625, -1.646728515625, -0.75439453125, 0.137939453125, 1.0302734375, 1.922607421875, 2.81494140625, 3.707275390625, 4.599609375, 5.491943359375, 6.38427734375, 7.276611328125, 8.1689453125, 9.061279296875, 9.95361328125, 10.845947265625, 11.73828125, 12.630615234375, 13.52294921875, 14.415283203125, 15.3076171875, 16.199951171875, 17.09228515625, 17.984619140625, 18.876953125, 19.769287109375, 20.66162109375, 21.553955078125, 22.4462890625, 23.338623046875, 24.23095703125, 25.123291015625, 26.015625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 4.0, 8.0, 12.0, 11.0, 9.0, 10.0, 15.0, 14.0, 27.0, 35.0, 51.0, 86.0, 131.0, 260.0, 552.0, 1324.0, 3456.0, 12810.0, 3423262.0, 737802.0, 9984.0, 2566.0, 941.0, 366.0, 200.0, 107.0, 61.0, 46.0, 28.0, 23.0, 20.0, 14.0, 7.0, 8.0, 6.0, 9.0, 6.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-211.625, -205.38671875, -199.1484375, -192.91015625, -186.671875, -180.43359375, -174.1953125, -167.95703125, -161.71875, -155.48046875, -149.2421875, -143.00390625, -136.765625, -130.52734375, -124.2890625, -118.05078125, -111.8125, -105.57421875, -99.3359375, -93.09765625, -86.859375, -80.62109375, -74.3828125, -68.14453125, -61.90625, -55.66796875, -49.4296875, -43.19140625, -36.953125, -30.71484375, -24.4765625, -18.23828125, -12.0, -5.76171875, 0.4765625, 6.71484375, 12.953125, 19.19140625, 25.4296875, 31.66796875, 37.90625, 44.14453125, 50.3828125, 56.62109375, 62.859375, 69.09765625, 75.3359375, 81.57421875, 87.8125, 94.05078125, 100.2890625, 106.52734375, 112.765625, 119.00390625, 125.2421875, 131.48046875, 137.71875, 143.95703125, 150.1953125, 156.43359375, 162.671875, 168.91015625, 175.1484375, 181.38671875, 187.625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 9.0, 13.0, 12.0, 18.0, 22.0, 22.0, 34.0, 53.0, 104.0, 305.0, 803.0, 1490.0, 664.0, 225.0, 76.0, 42.0, 28.0, 24.0, 17.0, 14.0, 12.0, 7.0, 3.0, 13.0, 1.0, 8.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-77.5, -74.861328125, -72.22265625, -69.583984375, -66.9453125, -64.306640625, -61.66796875, -59.029296875, -56.390625, -53.751953125, -51.11328125, -48.474609375, -45.8359375, -43.197265625, -40.55859375, -37.919921875, -35.28125, -32.642578125, -30.00390625, -27.365234375, -24.7265625, -22.087890625, -19.44921875, -16.810546875, -14.171875, -11.533203125, -8.89453125, -6.255859375, -3.6171875, -0.978515625, 1.66015625, 4.298828125, 6.9375, 9.576171875, 12.21484375, 14.853515625, 17.4921875, 20.130859375, 22.76953125, 25.408203125, 28.046875, 30.685546875, 33.32421875, 35.962890625, 38.6015625, 41.240234375, 43.87890625, 46.517578125, 49.15625, 51.794921875, 54.43359375, 57.072265625, 59.7109375, 62.349609375, 64.98828125, 67.626953125, 70.265625, 72.904296875, 75.54296875, 78.181640625, 80.8203125, 83.458984375, 86.09765625, 88.736328125, 91.375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 6.0, 1.0, 0.0, 6.0, 6.0, 8.0, 9.0, 15.0, 17.0, 23.0, 29.0, 45.0, 74.0, 86.0, 114.0, 152.0, 185.0, 300.0, 409.0, 536.0, 741.0, 1162.0, 1733.0, 2416.0, 3587.0, 5735.0, 9438.0, 17440.0, 37212.0, 140779.0, 3297075.0, 554559.0, 62193.0, 23970.0, 12652.0, 7451.0, 4493.0, 2964.0, 2005.0, 1392.0, 928.0, 643.0, 487.0, 346.0, 238.0, 153.0, 124.0, 104.0, 69.0, 58.0, 41.0, 24.0, 17.0, 14.0, 13.0, 8.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-96.1875, -93.1572265625, -90.126953125, -87.0966796875, -84.06640625, -81.0361328125, -78.005859375, -74.9755859375, -71.9453125, -68.9150390625, -65.884765625, -62.8544921875, -59.82421875, -56.7939453125, -53.763671875, -50.7333984375, -47.703125, -44.6728515625, -41.642578125, -38.6123046875, -35.58203125, -32.5517578125, -29.521484375, -26.4912109375, -23.4609375, -20.4306640625, -17.400390625, -14.3701171875, -11.33984375, -8.3095703125, -5.279296875, -2.2490234375, 0.78125, 3.8115234375, 6.841796875, 9.8720703125, 12.90234375, 15.9326171875, 18.962890625, 21.9931640625, 25.0234375, 28.0537109375, 31.083984375, 34.1142578125, 37.14453125, 40.1748046875, 43.205078125, 46.2353515625, 49.265625, 52.2958984375, 55.326171875, 58.3564453125, 61.38671875, 64.4169921875, 67.447265625, 70.4775390625, 73.5078125, 76.5380859375, 79.568359375, 82.5986328125, 85.62890625, 88.6591796875, 91.689453125, 94.7197265625, 97.75]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 7.0, 13.0, 21.0, 29.0, 42.0, 54.0, 102.0, 202.0, 217.0, 112.0, 65.0, 38.0, 37.0, 17.0, 12.0, 13.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-425.1797790527344, -413.6929016113281, -402.2060241699219, -390.7191467285156, -379.2322692871094, -367.7453918457031, -356.258544921875, -344.77166748046875, -333.2847900390625, -321.79791259765625, -310.31103515625, -298.82415771484375, -287.3372802734375, -275.85040283203125, -264.363525390625, -252.8766632080078, -241.3897705078125, -229.90289306640625, -218.416015625, -206.92913818359375, -195.4422607421875, -183.95538330078125, -172.46852111816406, -160.9816436767578, -149.49476623535156, -138.0078887939453, -126.52101135253906, -115.03414154052734, -103.5472640991211, -92.06038665771484, -80.57351684570312, -69.08663940429688, -57.5997314453125, -46.11285400390625, -34.625980377197266, -23.13910675048828, -11.652229309082031, -0.16535186767578125, 11.321517944335938, 22.808395385742188, 34.29527282714844, 45.78215026855469, 57.26902389526367, 68.75589752197266, 80.2427749633789, 91.72965240478516, 103.21652221679688, 114.70339965820312, 126.19027709960938, 137.67715454101562, 149.16403198242188, 160.65090942382812, 172.13778686523438, 183.62466430664062, 195.1115264892578, 206.59840393066406, 218.0852813720703, 229.57215881347656, 241.0590362548828, 252.5458984375, 264.03277587890625, 275.5196533203125, 287.00653076171875, 298.493408203125, 309.98028564453125]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 5.0, 4.0, 8.0, 12.0, 15.0, 16.0, 13.0, 30.0, 28.0, 29.0, 30.0, 29.0, 40.0, 39.0, 29.0, 39.0, 51.0, 45.0, 54.0, 40.0, 47.0, 42.0, 37.0, 37.0, 37.0, 40.0, 30.0, 29.0, 25.0, 28.0, 16.0, 10.0, 12.0, 12.0, 10.0, 9.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.86265563964844, -204.887451171875, -197.9122314453125, -190.93701171875, -183.96180725097656, -176.98660278320312, -170.01138305664062, -163.03616333007812, -156.0609588623047, -149.08575439453125, -142.11053466796875, -135.13531494140625, -128.1601104736328, -121.18489837646484, -114.20968627929688, -107.2344741821289, -100.25926208496094, -93.28404998779297, -86.308837890625, -79.33362579345703, -72.35841369628906, -65.3832015991211, -58.407989501953125, -51.432777404785156, -44.45756530761719, -37.48235321044922, -30.50714111328125, -23.53192901611328, -16.556716918945312, -9.581504821777344, -2.606292724609375, 4.368919372558594, 11.344131469726562, 18.31934356689453, 25.2945556640625, 32.26976776123047, 39.24497985839844, 46.220191955566406, 53.195404052734375, 60.170616149902344, 67.14582824707031, 74.12104034423828, 81.09625244140625, 88.07146453857422, 95.04667663574219, 102.02188873291016, 108.99710083007812, 115.9723129272461, 122.94752502441406, 129.9227294921875, 136.89794921875, 143.8731689453125, 150.84837341308594, 157.82357788085938, 164.79879760742188, 171.77401733398438, 178.7492218017578, 185.72442626953125, 192.69964599609375, 199.67486572265625, 206.6500701904297, 213.62527465820312, 220.60049438476562, 227.57571411132812, 234.55091857910156]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 4.0, 7.0, 5.0, 5.0, 11.0, 12.0, 8.0, 10.0, 8.0, 18.0, 19.0, 21.0, 33.0, 35.0, 21.0, 32.0, 48.0, 53.0, 48.0, 44.0, 59.0, 45.0, 54.0, 47.0, 51.0, 49.0, 38.0, 29.0, 29.0, 24.0, 17.0, 20.0, 13.0, 20.0, 10.0, 12.0, 6.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-29.0625, -28.19384765625, -27.3251953125, -26.45654296875, -25.587890625, -24.71923828125, -23.8505859375, -22.98193359375, -22.11328125, -21.24462890625, -20.3759765625, -19.50732421875, -18.638671875, -17.77001953125, -16.9013671875, -16.03271484375, -15.1640625, -14.29541015625, -13.4267578125, -12.55810546875, -11.689453125, -10.82080078125, -9.9521484375, -9.08349609375, -8.21484375, -7.34619140625, -6.4775390625, -5.60888671875, -4.740234375, -3.87158203125, -3.0029296875, -2.13427734375, -1.265625, -0.39697265625, 0.4716796875, 1.34033203125, 2.208984375, 3.07763671875, 3.9462890625, 4.81494140625, 5.68359375, 6.55224609375, 7.4208984375, 8.28955078125, 9.158203125, 10.02685546875, 10.8955078125, 11.76416015625, 12.6328125, 13.50146484375, 14.3701171875, 15.23876953125, 16.107421875, 16.97607421875, 17.8447265625, 18.71337890625, 19.58203125, 20.45068359375, 21.3193359375, 22.18798828125, 23.056640625, 23.92529296875, 24.7939453125, 25.66259765625, 26.53125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 8.0, 8.0, 26.0, 32.0, 40.0, 68.0, 96.0, 118.0, 169.0, 213.0, 270.0, 450.0, 608.0, 900.0, 1141.0, 1690.0, 2414.0, 3446.0, 4815.0, 7474.0, 11149.0, 17394.0, 27925.0, 47708.0, 90412.0, 210802.0, 341008.0, 121503.0, 60715.0, 34512.0, 20754.0, 13105.0, 8610.0, 5856.0, 3912.0, 2619.0, 1891.0, 1372.0, 937.0, 657.0, 501.0, 367.0, 267.0, 169.0, 118.0, 97.0, 59.0, 47.0, 35.0, 22.0, 21.0, 10.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.0537109375, -1.0209808349609375, -0.988250732421875, -0.9555206298828125, -0.92279052734375, -0.8900604248046875, -0.857330322265625, -0.8246002197265625, -0.7918701171875, -0.7591400146484375, -0.726409912109375, -0.6936798095703125, -0.66094970703125, -0.6282196044921875, -0.595489501953125, -0.5627593994140625, -0.530029296875, -0.4972991943359375, -0.464569091796875, -0.4318389892578125, -0.39910888671875, -0.3663787841796875, -0.333648681640625, -0.3009185791015625, -0.2681884765625, -0.2354583740234375, -0.202728271484375, -0.1699981689453125, -0.13726806640625, -0.1045379638671875, -0.071807861328125, -0.0390777587890625, -0.00634765625, 0.0263824462890625, 0.059112548828125, 0.0918426513671875, 0.12457275390625, 0.1573028564453125, 0.190032958984375, 0.2227630615234375, 0.2554931640625, 0.2882232666015625, 0.320953369140625, 0.3536834716796875, 0.38641357421875, 0.4191436767578125, 0.451873779296875, 0.4846038818359375, 0.517333984375, 0.5500640869140625, 0.582794189453125, 0.6155242919921875, 0.64825439453125, 0.6809844970703125, 0.713714599609375, 0.7464447021484375, 0.7791748046875, 0.8119049072265625, 0.844635009765625, 0.8773651123046875, 0.91009521484375, 0.9428253173828125, 0.975555419921875, 1.0082855224609375, 1.041015625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 3.0, 4.0, 5.0, 3.0, 17.0, 7.0, 12.0, 11.0, 11.0, 22.0, 11.0, 25.0, 32.0, 31.0, 27.0, 26.0, 37.0, 33.0, 41.0, 29.0, 37.0, 40.0, 43.0, 1057.0, 38.0, 45.0, 29.0, 29.0, 31.0, 26.0, 29.0, 32.0, 24.0, 21.0, 22.0, 13.0, 23.0, 11.0, 16.0, 13.0, 10.0, 14.0, 6.0, 4.0, 7.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.2109375, -14.75048828125, -14.2900390625, -13.82958984375, -13.369140625, -12.90869140625, -12.4482421875, -11.98779296875, -11.52734375, -11.06689453125, -10.6064453125, -10.14599609375, -9.685546875, -9.22509765625, -8.7646484375, -8.30419921875, -7.84375, -7.38330078125, -6.9228515625, -6.46240234375, -6.001953125, -5.54150390625, -5.0810546875, -4.62060546875, -4.16015625, -3.69970703125, -3.2392578125, -2.77880859375, -2.318359375, -1.85791015625, -1.3974609375, -0.93701171875, -0.4765625, -0.01611328125, 0.4443359375, 0.90478515625, 1.365234375, 1.82568359375, 2.2861328125, 2.74658203125, 3.20703125, 3.66748046875, 4.1279296875, 4.58837890625, 5.048828125, 5.50927734375, 5.9697265625, 6.43017578125, 6.890625, 7.35107421875, 7.8115234375, 8.27197265625, 8.732421875, 9.19287109375, 9.6533203125, 10.11376953125, 10.57421875, 11.03466796875, 11.4951171875, 11.95556640625, 12.416015625, 12.87646484375, 13.3369140625, 13.79736328125, 14.2578125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 3.0, 5.0, 12.0, 18.0, 29.0, 38.0, 52.0, 76.0, 104.0, 129.0, 208.0, 287.0, 377.0, 524.0, 770.0, 1067.0, 1569.0, 2244.0, 3148.0, 4552.0, 6679.0, 9515.0, 13876.0, 20287.0, 30397.0, 46526.0, 71992.0, 124037.0, 1343812.0, 162657.0, 86860.0, 54140.0, 35834.0, 23834.0, 15768.0, 10808.0, 7392.0, 5234.0, 3618.0, 2552.0, 1797.0, 1270.0, 901.0, 662.0, 424.0, 299.0, 235.0, 137.0, 116.0, 84.0, 49.0, 37.0, 36.0, 17.0, 20.0, 11.0, 3.0, 2.0, 2.0, 3.0, 5.0], "bins": [-0.6103515625, -0.5910873413085938, -0.5718231201171875, -0.5525588989257812, -0.533294677734375, -0.5140304565429688, -0.4947662353515625, -0.47550201416015625, -0.45623779296875, -0.43697357177734375, -0.4177093505859375, -0.39844512939453125, -0.379180908203125, -0.35991668701171875, -0.3406524658203125, -0.32138824462890625, -0.3021240234375, -0.28285980224609375, -0.2635955810546875, -0.24433135986328125, -0.225067138671875, -0.20580291748046875, -0.1865386962890625, -0.16727447509765625, -0.14801025390625, -0.12874603271484375, -0.1094818115234375, -0.09021759033203125, -0.070953369140625, -0.05168914794921875, -0.0324249267578125, -0.01316070556640625, 0.006103515625, 0.02536773681640625, 0.0446319580078125, 0.06389617919921875, 0.083160400390625, 0.10242462158203125, 0.1216888427734375, 0.14095306396484375, 0.16021728515625, 0.17948150634765625, 0.1987457275390625, 0.21800994873046875, 0.237274169921875, 0.25653839111328125, 0.2758026123046875, 0.29506683349609375, 0.3143310546875, 0.33359527587890625, 0.3528594970703125, 0.37212371826171875, 0.391387939453125, 0.41065216064453125, 0.4299163818359375, 0.44918060302734375, 0.46844482421875, 0.48770904541015625, 0.5069732666015625, 0.5262374877929688, 0.545501708984375, 0.5647659301757812, 0.5840301513671875, 0.6032943725585938, 0.62255859375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 10.0, 6.0, 5.0, 9.0, 12.0, 13.0, 19.0, 21.0, 24.0, 19.0, 23.0, 41.0, 28.0, 50.0, 50.0, 53.0, 97.0, 95.0, 56.0, 58.0, 28.0, 38.0, 35.0, 23.0, 25.0, 27.0, 14.0, 19.0, 12.0, 15.0, 7.0, 10.0, 8.0, 8.0, 5.0, 7.0, 6.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.413459777832031e-05, -6.236415356397629e-05, -6.059370934963226e-05, -5.882326513528824e-05, -5.7052820920944214e-05, -5.528237670660019e-05, -5.3511932492256165e-05, -5.174148827791214e-05, -4.9971044063568115e-05, -4.820059984922409e-05, -4.6430155634880066e-05, -4.465971142053604e-05, -4.2889267206192017e-05, -4.111882299184799e-05, -3.934837877750397e-05, -3.757793456315994e-05, -3.580749034881592e-05, -3.403704613447189e-05, -3.226660192012787e-05, -3.0496157705783844e-05, -2.872571349143982e-05, -2.6955269277095795e-05, -2.518482506275177e-05, -2.3414380848407745e-05, -2.164393663406372e-05, -1.9873492419719696e-05, -1.810304820537567e-05, -1.6332603991031647e-05, -1.4562159776687622e-05, -1.2791715562343597e-05, -1.1021271347999573e-05, -9.250827133655548e-06, -7.4803829193115234e-06, -5.709938704967499e-06, -3.939494490623474e-06, -2.1690502762794495e-06, -3.986060619354248e-07, 1.3718381524085999e-06, 3.1422823667526245e-06, 4.912726581096649e-06, 6.683170795440674e-06, 8.453615009784698e-06, 1.0224059224128723e-05, 1.1994503438472748e-05, 1.3764947652816772e-05, 1.5535391867160797e-05, 1.7305836081504822e-05, 1.9076280295848846e-05, 2.084672451019287e-05, 2.2617168724536896e-05, 2.438761293888092e-05, 2.6158057153224945e-05, 2.792850136756897e-05, 2.9698945581912994e-05, 3.146938979625702e-05, 3.3239834010601044e-05, 3.501027822494507e-05, 3.678072243928909e-05, 3.855116665363312e-05, 4.032161086797714e-05, 4.209205508232117e-05, 4.386249929666519e-05, 4.5632943511009216e-05, 4.740338772535324e-05, 4.9173831939697266e-05]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 10.0, 7.0, 9.0, 5.0, 12.0, 15.0, 21.0, 31.0, 31.0, 36.0, 43.0, 44.0, 56.0, 84.0, 101.0, 109.0, 167.0, 232.0, 871.0, 13233.0, 923992.0, 105140.0, 3017.0, 389.0, 187.0, 126.0, 107.0, 83.0, 63.0, 58.0, 48.0, 37.0, 33.0, 35.0, 25.0, 25.0, 24.0, 14.0, 10.0, 9.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009188652038574219, -0.0008889958262443542, -0.0008591264486312866, -0.000829257071018219, -0.0007993876934051514, -0.0007695183157920837, -0.0007396489381790161, -0.0007097795605659485, -0.0006799101829528809, -0.0006500408053398132, -0.0006201714277267456, -0.000590302050113678, -0.0005604326725006104, -0.0005305632948875427, -0.0005006939172744751, -0.00047082453966140747, -0.00044095516204833984, -0.0004110857844352722, -0.0003812164068222046, -0.00035134702920913696, -0.00032147765159606934, -0.0002916082739830017, -0.0002617388963699341, -0.00023186951875686646, -0.00020200014114379883, -0.0001721307635307312, -0.00014226138591766357, -0.00011239200830459595, -8.252263069152832e-05, -5.265325307846069e-05, -2.2783875465393066e-05, 7.0855021476745605e-06, 3.695487976074219e-05, 6.682425737380981e-05, 9.669363498687744e-05, 0.00012656301259994507, 0.0001564323902130127, 0.00018630176782608032, 0.00021617114543914795, 0.0002460405230522156, 0.0002759099006652832, 0.00030577927827835083, 0.00033564865589141846, 0.0003655180335044861, 0.0003953874111175537, 0.00042525678873062134, 0.00045512616634368896, 0.0004849955439567566, 0.0005148649215698242, 0.0005447342991828918, 0.0005746036767959595, 0.0006044730544090271, 0.0006343424320220947, 0.0006642118096351624, 0.00069408118724823, 0.0007239505648612976, 0.0007538199424743652, 0.0007836893200874329, 0.0008135586977005005, 0.0008434280753135681, 0.0008732974529266357, 0.0009031668305397034, 0.000933036208152771, 0.0009629055857658386, 0.0009927749633789062]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 12.0, 20.0, 90.0, 595.0, 242.0, 42.0, 11.0, 4.0, 1.0], "bins": [-0.0003470896335784346, -0.00034118382609449327, -0.0003352779895067215, -0.0003293721820227802, -0.0003234663454350084, -0.0003175605379510671, -0.0003116547013632953, -0.000305748893879354, -0.0002998430572915822, -0.0002939372498076409, -0.00028803141321986914, -0.0002821256057359278, -0.00027621976914815605, -0.00027031396166421473, -0.00026440812507644296, -0.00025850231759250164, -0.0002525965101085603, -0.000246690702624619, -0.00024078486603684723, -0.0002348790440009907, -0.00022897322196513414, -0.00022306741448119283, -0.00021716157789342105, -0.00021125577040947974, -0.00020534993382170796, -0.00019944411178585142, -0.00019353828974999487, -0.00018763246771413833, -0.00018172664567828178, -0.00017582083819434047, -0.0001699150016065687, -0.00016400919412262738, -0.00015810337208677083, -0.0001521975500509143, -0.00014629172801505774, -0.0001403859059792012, -0.00013448008394334465, -0.0001285742619074881, -0.0001226684544235468, -0.00011676263238769025, -0.0001108568103518337, -0.00010495098831597716, -9.904516628012061e-05, -9.313934424426407e-05, -8.723352948436514e-05, -8.132770744850859e-05, -7.542188541265205e-05, -6.951607065275311e-05, -6.361024134093896e-05, -5.770441930508241e-05, -5.179860090720467e-05, -4.589277887134813e-05, -3.998696047347039e-05, -3.4081138437613845e-05, -2.81753164017573e-05, -2.2269498003879562e-05, -1.6363675968023017e-05, -1.0457855751155876e-05, -4.5520346247940324e-06, 1.3537865015678108e-06, 7.259606718434952e-06, 1.3165426935302094e-05, 1.907124897115864e-05, 2.4977067369036376e-05, 3.088288940489292e-05]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 3.0, 3.0, 11.0, 5.0, 14.0, 19.0, 14.0, 11.0, 14.0, 19.0, 18.0, 23.0, 27.0, 45.0, 28.0, 42.0, 33.0, 34.0, 39.0, 42.0, 35.0, 34.0, 50.0, 39.0, 46.0, 37.0, 40.0, 40.0, 24.0, 21.0, 28.0, 24.0, 19.0, 15.0, 19.0, 14.0, 12.0, 9.0, 8.0, 9.0, 7.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7298927307128906e-05, -2.636108547449112e-05, -2.5423243641853333e-05, -2.4485401809215546e-05, -2.354755997657776e-05, -2.2609718143939972e-05, -2.1671876311302185e-05, -2.0734034478664398e-05, -1.979619264602661e-05, -1.8858350813388824e-05, -1.7920508980751038e-05, -1.698266714811325e-05, -1.6044825315475464e-05, -1.5106983482837677e-05, -1.416914165019989e-05, -1.3231299817562103e-05, -1.2293457984924316e-05, -1.135561615228653e-05, -1.0417774319648743e-05, -9.479932487010956e-06, -8.542090654373169e-06, -7.604248821735382e-06, -6.666406989097595e-06, -5.728565156459808e-06, -4.7907233238220215e-06, -3.852881491184235e-06, -2.9150396585464478e-06, -1.977197825908661e-06, -1.039355993270874e-06, -1.0151416063308716e-07, 8.363276720046997e-07, 1.7741695046424866e-06, 2.7120113372802734e-06, 3.6498531699180603e-06, 4.587695002555847e-06, 5.525536835193634e-06, 6.463378667831421e-06, 7.401220500469208e-06, 8.339062333106995e-06, 9.276904165744781e-06, 1.0214745998382568e-05, 1.1152587831020355e-05, 1.2090429663658142e-05, 1.3028271496295929e-05, 1.3966113328933716e-05, 1.4903955161571503e-05, 1.584179699420929e-05, 1.6779638826847076e-05, 1.7717480659484863e-05, 1.865532249212265e-05, 1.9593164324760437e-05, 2.0531006157398224e-05, 2.146884799003601e-05, 2.2406689822673798e-05, 2.3344531655311584e-05, 2.428237348794937e-05, 2.5220215320587158e-05, 2.6158057153224945e-05, 2.7095898985862732e-05, 2.803374081850052e-05, 2.8971582651138306e-05, 2.9909424483776093e-05, 3.084726631641388e-05, 3.1785108149051666e-05, 3.272294998168945e-05]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 4.0, 7.0, 5.0, 5.0, 11.0, 12.0, 8.0, 10.0, 8.0, 18.0, 19.0, 21.0, 33.0, 35.0, 21.0, 32.0, 48.0, 53.0, 48.0, 44.0, 59.0, 45.0, 54.0, 47.0, 51.0, 49.0, 38.0, 29.0, 29.0, 24.0, 17.0, 20.0, 13.0, 20.0, 10.0, 12.0, 6.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-29.0625, -28.19384765625, -27.3251953125, -26.45654296875, -25.587890625, -24.71923828125, -23.8505859375, -22.98193359375, -22.11328125, -21.24462890625, -20.3759765625, -19.50732421875, -18.638671875, -17.77001953125, -16.9013671875, -16.03271484375, -15.1640625, -14.29541015625, -13.4267578125, -12.55810546875, -11.689453125, -10.82080078125, -9.9521484375, -9.08349609375, -8.21484375, -7.34619140625, -6.4775390625, -5.60888671875, -4.740234375, -3.87158203125, -3.0029296875, -2.13427734375, -1.265625, -0.39697265625, 0.4716796875, 1.34033203125, 2.208984375, 3.07763671875, 3.9462890625, 4.81494140625, 5.68359375, 6.55224609375, 7.4208984375, 8.28955078125, 9.158203125, 10.02685546875, 10.8955078125, 11.76416015625, 12.6328125, 13.50146484375, 14.3701171875, 15.23876953125, 16.107421875, 16.97607421875, 17.8447265625, 18.71337890625, 19.58203125, 20.45068359375, 21.3193359375, 22.18798828125, 23.056640625, 23.92529296875, 24.7939453125, 25.66259765625, 26.53125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 4.0, 13.0, 13.0, 27.0, 29.0, 41.0, 59.0, 82.0, 95.0, 149.0, 208.0, 330.0, 543.0, 935.0, 1839.0, 4004.0, 11008.0, 37227.0, 212767.0, 657467.0, 87768.0, 20794.0, 6886.0, 2867.0, 1305.0, 699.0, 428.0, 317.0, 197.0, 128.0, 82.0, 62.0, 52.0, 30.0, 27.0, 14.0, 8.0, 12.0, 7.0, 6.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.953125, -25.095947265625, -24.23876953125, -23.381591796875, -22.5244140625, -21.667236328125, -20.81005859375, -19.952880859375, -19.095703125, -18.238525390625, -17.38134765625, -16.524169921875, -15.6669921875, -14.809814453125, -13.95263671875, -13.095458984375, -12.23828125, -11.381103515625, -10.52392578125, -9.666748046875, -8.8095703125, -7.952392578125, -7.09521484375, -6.238037109375, -5.380859375, -4.523681640625, -3.66650390625, -2.809326171875, -1.9521484375, -1.094970703125, -0.23779296875, 0.619384765625, 1.4765625, 2.333740234375, 3.19091796875, 4.048095703125, 4.9052734375, 5.762451171875, 6.61962890625, 7.476806640625, 8.333984375, 9.191162109375, 10.04833984375, 10.905517578125, 11.7626953125, 12.619873046875, 13.47705078125, 14.334228515625, 15.19140625, 16.048583984375, 16.90576171875, 17.762939453125, 18.6201171875, 19.477294921875, 20.33447265625, 21.191650390625, 22.048828125, 22.906005859375, 23.76318359375, 24.620361328125, 25.4775390625, 26.334716796875, 27.19189453125, 28.049072265625, 28.90625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 3.0, 7.0, 6.0, 11.0, 6.0, 10.0, 13.0, 22.0, 18.0, 23.0, 30.0, 20.0, 44.0, 24.0, 39.0, 49.0, 57.0, 42.0, 59.0, 105.0, 1910.0, 110.0, 52.0, 38.0, 43.0, 34.0, 36.0, 34.0, 36.0, 24.0, 26.0, 15.0, 20.0, 24.0, 9.0, 8.0, 7.0, 8.0, 6.0, 5.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.125, -101.986328125, -98.84765625, -95.708984375, -92.5703125, -89.431640625, -86.29296875, -83.154296875, -80.015625, -76.876953125, -73.73828125, -70.599609375, -67.4609375, -64.322265625, -61.18359375, -58.044921875, -54.90625, -51.767578125, -48.62890625, -45.490234375, -42.3515625, -39.212890625, -36.07421875, -32.935546875, -29.796875, -26.658203125, -23.51953125, -20.380859375, -17.2421875, -14.103515625, -10.96484375, -7.826171875, -4.6875, -1.548828125, 1.58984375, 4.728515625, 7.8671875, 11.005859375, 14.14453125, 17.283203125, 20.421875, 23.560546875, 26.69921875, 29.837890625, 32.9765625, 36.115234375, 39.25390625, 42.392578125, 45.53125, 48.669921875, 51.80859375, 54.947265625, 58.0859375, 61.224609375, 64.36328125, 67.501953125, 70.640625, 73.779296875, 76.91796875, 80.056640625, 83.1953125, 86.333984375, 89.47265625, 92.611328125, 95.75]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 11.0, 6.0, 10.0, 20.0, 21.0, 17.0, 24.0, 28.0, 44.0, 60.0, 78.0, 135.0, 253.0, 562.0, 1785.0, 13671.0, 3068146.0, 55654.0, 3322.0, 863.0, 368.0, 177.0, 112.0, 64.0, 50.0, 38.0, 34.0, 24.0, 23.0, 20.0, 13.0, 6.0, 9.0, 11.0, 5.0, 9.0, 3.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-166.375, -160.953125, -155.53125, -150.109375, -144.6875, -139.265625, -133.84375, -128.421875, -123.0, -117.578125, -112.15625, -106.734375, -101.3125, -95.890625, -90.46875, -85.046875, -79.625, -74.203125, -68.78125, -63.359375, -57.9375, -52.515625, -47.09375, -41.671875, -36.25, -30.828125, -25.40625, -19.984375, -14.5625, -9.140625, -3.71875, 1.703125, 7.125, 12.546875, 17.96875, 23.390625, 28.8125, 34.234375, 39.65625, 45.078125, 50.5, 55.921875, 61.34375, 66.765625, 72.1875, 77.609375, 83.03125, 88.453125, 93.875, 99.296875, 104.71875, 110.140625, 115.5625, 120.984375, 126.40625, 131.828125, 137.25, 142.671875, 148.09375, 153.515625, 158.9375, 164.359375, 169.78125, 175.203125, 180.625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 7.0, 324.0, 673.0, 13.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.2940444946289, -65.51303100585938, -34.732017517089844, -3.9510040283203125, 26.83000946044922, 57.61101531982422, 88.39203643798828, 119.17305755615234, 149.95407104492188, 180.73507690429688, 211.51609802246094, 242.297119140625, 273.078125, 303.859130859375, 334.64013671875, 365.4211730957031, 396.2021789550781, 426.9831848144531, 457.76422119140625, 488.54522705078125, 519.3262329101562, 550.1072387695312, 580.8882446289062, 611.6693115234375, 642.4502563476562, 673.2312622070312, 704.0122680664062, 734.7932739257812, 765.5743408203125, 796.3553466796875, 827.1363525390625, 857.9173583984375, 888.6983642578125, 919.4793701171875, 950.2603759765625, 981.0413818359375, 1011.8223876953125, 1042.6033935546875, 1073.3843994140625, 1104.16552734375, 1134.946533203125, 1165.7275390625, 1196.508544921875, 1227.28955078125, 1258.070556640625, 1288.8515625, 1319.632568359375, 1350.41357421875, 1381.194580078125, 1411.9755859375, 1442.756591796875, 1473.53759765625, 1504.318603515625, 1535.099609375, 1565.880615234375, 1596.66162109375, 1627.442626953125, 1658.2236328125, 1689.004638671875, 1719.78564453125, 1750.566650390625, 1781.34765625, 1812.128662109375, 1842.90966796875, 1873.6907958984375]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 8.0, 6.0, 11.0, 21.0, 20.0, 19.0, 23.0, 12.0, 20.0, 20.0, 23.0, 22.0, 29.0, 48.0, 37.0, 34.0, 39.0, 45.0, 58.0, 33.0, 48.0, 29.0, 31.0, 34.0, 31.0, 40.0, 36.0, 29.0, 24.0, 24.0, 20.0, 16.0, 11.0, 16.0, 19.0, 18.0, 12.0, 2.0, 8.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-325.37841796875, -315.216064453125, -305.0536804199219, -294.8913269042969, -284.7289733886719, -274.56658935546875, -264.40423583984375, -254.24188232421875, -244.0795135498047, -233.91714477539062, -223.75479125976562, -213.59242248535156, -203.4300537109375, -193.2677001953125, -183.10533142089844, -172.94296264648438, -162.78060913085938, -152.6182403564453, -142.4558868408203, -132.29351806640625, -122.13115692138672, -111.96879577636719, -101.80642700195312, -91.6440658569336, -81.48170471191406, -71.31934356689453, -61.156978607177734, -50.99461364746094, -40.832252502441406, -30.669891357421875, -20.507526397705078, -10.345161437988281, -0.182830810546875, 9.979532241821289, 20.141895294189453, 30.304258346557617, 40.46662139892578, 50.62898254394531, 60.79134750366211, 70.9537124633789, 81.11607360839844, 91.27843475341797, 101.4407958984375, 111.60316467285156, 121.7655258178711, 131.92788696289062, 142.0902557373047, 152.25262451171875, 162.41497802734375, 172.5773468017578, 182.7397003173828, 192.90206909179688, 203.06442260742188, 213.22679138183594, 223.38916015625, 233.551513671875, 243.71388244628906, 253.87625122070312, 264.0386047363281, 274.2009582519531, 284.36334228515625, 294.52569580078125, 304.68804931640625, 314.8504333496094, 325.0127868652344]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 8.0, 7.0, 2.0, 6.0, 9.0, 12.0, 7.0, 7.0, 11.0, 11.0, 22.0, 21.0, 36.0, 22.0, 25.0, 38.0, 41.0, 53.0, 38.0, 46.0, 56.0, 44.0, 57.0, 50.0, 52.0, 42.0, 52.0, 30.0, 22.0, 26.0, 29.0, 18.0, 9.0, 19.0, 15.0, 9.0, 12.0, 4.0, 10.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-29.765625, -28.88720703125, -28.0087890625, -27.13037109375, -26.251953125, -25.37353515625, -24.4951171875, -23.61669921875, -22.73828125, -21.85986328125, -20.9814453125, -20.10302734375, -19.224609375, -18.34619140625, -17.4677734375, -16.58935546875, -15.7109375, -14.83251953125, -13.9541015625, -13.07568359375, -12.197265625, -11.31884765625, -10.4404296875, -9.56201171875, -8.68359375, -7.80517578125, -6.9267578125, -6.04833984375, -5.169921875, -4.29150390625, -3.4130859375, -2.53466796875, -1.65625, -0.77783203125, 0.1005859375, 0.97900390625, 1.857421875, 2.73583984375, 3.6142578125, 4.49267578125, 5.37109375, 6.24951171875, 7.1279296875, 8.00634765625, 8.884765625, 9.76318359375, 10.6416015625, 11.52001953125, 12.3984375, 13.27685546875, 14.1552734375, 15.03369140625, 15.912109375, 16.79052734375, 17.6689453125, 18.54736328125, 19.42578125, 20.30419921875, 21.1826171875, 22.06103515625, 22.939453125, 23.81787109375, 24.6962890625, 25.57470703125, 26.453125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 7.0, 9.0, 4.0, 3.0, 9.0, 8.0, 12.0, 11.0, 11.0, 14.0, 28.0, 54.0, 94.0, 154.0, 272.0, 469.0, 802.0, 1551.0, 3591.0, 9842.0, 323088.0, 3826396.0, 18821.0, 4943.0, 1986.0, 963.0, 475.0, 233.0, 137.0, 85.0, 57.0, 34.0, 23.0, 30.0, 12.0, 13.0, 7.0, 7.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-179.125, -173.88671875, -168.6484375, -163.41015625, -158.171875, -152.93359375, -147.6953125, -142.45703125, -137.21875, -131.98046875, -126.7421875, -121.50390625, -116.265625, -111.02734375, -105.7890625, -100.55078125, -95.3125, -90.07421875, -84.8359375, -79.59765625, -74.359375, -69.12109375, -63.8828125, -58.64453125, -53.40625, -48.16796875, -42.9296875, -37.69140625, -32.453125, -27.21484375, -21.9765625, -16.73828125, -11.5, -6.26171875, -1.0234375, 4.21484375, 9.453125, 14.69140625, 19.9296875, 25.16796875, 30.40625, 35.64453125, 40.8828125, 46.12109375, 51.359375, 56.59765625, 61.8359375, 67.07421875, 72.3125, 77.55078125, 82.7890625, 88.02734375, 93.265625, 98.50390625, 103.7421875, 108.98046875, 114.21875, 119.45703125, 124.6953125, 129.93359375, 135.171875, 140.41015625, 145.6484375, 150.88671875, 156.125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 6.0, 6.0, 9.0, 10.0, 10.0, 15.0, 26.0, 25.0, 43.0, 83.0, 244.0, 927.0, 1775.0, 558.0, 160.0, 55.0, 29.0, 32.0, 16.0, 12.0, 5.0, 3.0, 11.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-149.875, -146.4892578125, -143.103515625, -139.7177734375, -136.33203125, -132.9462890625, -129.560546875, -126.1748046875, -122.7890625, -119.4033203125, -116.017578125, -112.6318359375, -109.24609375, -105.8603515625, -102.474609375, -99.0888671875, -95.703125, -92.3173828125, -88.931640625, -85.5458984375, -82.16015625, -78.7744140625, -75.388671875, -72.0029296875, -68.6171875, -65.2314453125, -61.845703125, -58.4599609375, -55.07421875, -51.6884765625, -48.302734375, -44.9169921875, -41.53125, -38.1455078125, -34.759765625, -31.3740234375, -27.98828125, -24.6025390625, -21.216796875, -17.8310546875, -14.4453125, -11.0595703125, -7.673828125, -4.2880859375, -0.90234375, 2.4833984375, 5.869140625, 9.2548828125, 12.640625, 16.0263671875, 19.412109375, 22.7978515625, 26.18359375, 29.5693359375, 32.955078125, 36.3408203125, 39.7265625, 43.1123046875, 46.498046875, 49.8837890625, 53.26953125, 56.6552734375, 60.041015625, 63.4267578125, 66.8125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 9.0, 8.0, 12.0, 13.0, 15.0, 49.0, 77.0, 107.0, 191.0, 331.0, 675.0, 1430.0, 3269.0, 8129.0, 27118.0, 300504.0, 3772522.0, 57065.0, 13871.0, 4810.0, 2004.0, 980.0, 483.0, 233.0, 131.0, 82.0, 42.0, 37.0, 29.0, 15.0, 9.0, 8.0, 6.0, 3.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.75, -152.19921875, -145.6484375, -139.09765625, -132.546875, -125.99609375, -119.4453125, -112.89453125, -106.34375, -99.79296875, -93.2421875, -86.69140625, -80.140625, -73.58984375, -67.0390625, -60.48828125, -53.9375, -47.38671875, -40.8359375, -34.28515625, -27.734375, -21.18359375, -14.6328125, -8.08203125, -1.53125, 5.01953125, 11.5703125, 18.12109375, 24.671875, 31.22265625, 37.7734375, 44.32421875, 50.875, 57.42578125, 63.9765625, 70.52734375, 77.078125, 83.62890625, 90.1796875, 96.73046875, 103.28125, 109.83203125, 116.3828125, 122.93359375, 129.484375, 136.03515625, 142.5859375, 149.13671875, 155.6875, 162.23828125, 168.7890625, 175.33984375, 181.890625, 188.44140625, 194.9921875, 201.54296875, 208.09375, 214.64453125, 221.1953125, 227.74609375, 234.296875, 240.84765625, 247.3984375, 253.94921875, 260.5]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 4.0, 6.0, 9.0, 16.0, 24.0, 27.0, 46.0, 54.0, 76.0, 160.0, 198.0, 139.0, 72.0, 49.0, 36.0, 28.0, 13.0, 10.0, 7.0, 3.0, 6.0, 1.0, 6.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-421.85284423828125, -411.6576843261719, -401.4625244140625, -391.267333984375, -381.0721740722656, -370.87701416015625, -360.6818542480469, -350.4866943359375, -340.29150390625, -330.0963439941406, -319.90118408203125, -309.70599365234375, -299.5108337402344, -289.315673828125, -279.1205139160156, -268.92535400390625, -258.7301940917969, -248.5350341796875, -238.33985900878906, -228.1446990966797, -217.94952392578125, -207.75436401367188, -197.5592041015625, -187.36404418945312, -177.1688690185547, -166.9737091064453, -156.77853393554688, -146.5833740234375, -136.38821411132812, -126.19303894042969, -115.99787902832031, -105.8027114868164, -95.6075439453125, -85.4123764038086, -75.21720886230469, -65.02204895019531, -54.826881408691406, -44.6317138671875, -34.43655014038086, -24.24138641357422, -14.046218872070312, -3.851053237915039, 6.344112396240234, 16.539278030395508, 26.73444366455078, 36.92961120605469, 47.12477493286133, 57.31993865966797, 67.51510620117188, 77.71027374267578, 87.90544128417969, 98.10060119628906, 108.29576873779297, 118.49093627929688, 128.68609619140625, 138.88125610351562, 149.07643127441406, 159.27159118652344, 169.46676635742188, 179.66192626953125, 189.85708618164062, 200.05226135253906, 210.24742126464844, 220.44259643554688, 230.63775634765625]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 6.0, 5.0, 9.0, 10.0, 9.0, 11.0, 13.0, 13.0, 25.0, 31.0, 27.0, 24.0, 31.0, 35.0, 26.0, 34.0, 45.0, 32.0, 50.0, 34.0, 50.0, 53.0, 44.0, 35.0, 50.0, 30.0, 35.0, 30.0, 22.0, 27.0, 26.0, 26.0, 13.0, 23.0, 14.0, 16.0, 10.0, 4.0, 11.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.03485107421875, -165.90151977539062, -159.76817321777344, -153.63482666015625, -147.50149536132812, -141.3681640625, -135.2348175048828, -129.10147094726562, -122.9681396484375, -116.83480072021484, -110.70146179199219, -104.56812286376953, -98.43478393554688, -92.30144500732422, -86.16810607910156, -80.0347671508789, -73.90142822265625, -67.7680892944336, -61.63475036621094, -55.50141143798828, -49.368072509765625, -43.23473358154297, -37.10139465332031, -30.968055725097656, -24.834716796875, -18.701377868652344, -12.568038940429688, -6.434700012207031, -0.301361083984375, 5.831977844238281, 11.965316772460938, 18.098655700683594, 24.23199462890625, 30.365333557128906, 36.49867248535156, 42.63201141357422, 48.765350341796875, 54.89868927001953, 61.03202819824219, 67.16536712646484, 73.2987060546875, 79.43204498291016, 85.56538391113281, 91.69872283935547, 97.83206176757812, 103.96540069580078, 110.09873962402344, 116.2320785522461, 122.36541748046875, 128.49874877929688, 134.63209533691406, 140.76544189453125, 146.89877319335938, 153.0321044921875, 159.1654510498047, 165.29879760742188, 171.43212890625, 177.56546020507812, 183.6988067626953, 189.8321533203125, 195.96548461914062, 202.09881591796875, 208.23216247558594, 214.36550903320312, 220.49884033203125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 7.0, 2.0, 5.0, 5.0, 8.0, 6.0, 8.0, 9.0, 12.0, 15.0, 14.0, 19.0, 21.0, 25.0, 21.0, 27.0, 36.0, 37.0, 32.0, 46.0, 50.0, 48.0, 43.0, 42.0, 47.0, 70.0, 40.0, 30.0, 43.0, 36.0, 26.0, 25.0, 20.0, 21.0, 14.0, 15.0, 10.0, 22.0, 12.0, 5.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-28.0625, -27.175048828125, -26.28759765625, -25.400146484375, -24.5126953125, -23.625244140625, -22.73779296875, -21.850341796875, -20.962890625, -20.075439453125, -19.18798828125, -18.300537109375, -17.4130859375, -16.525634765625, -15.63818359375, -14.750732421875, -13.86328125, -12.975830078125, -12.08837890625, -11.200927734375, -10.3134765625, -9.426025390625, -8.53857421875, -7.651123046875, -6.763671875, -5.876220703125, -4.98876953125, -4.101318359375, -3.2138671875, -2.326416015625, -1.43896484375, -0.551513671875, 0.3359375, 1.223388671875, 2.11083984375, 2.998291015625, 3.8857421875, 4.773193359375, 5.66064453125, 6.548095703125, 7.435546875, 8.322998046875, 9.21044921875, 10.097900390625, 10.9853515625, 11.872802734375, 12.76025390625, 13.647705078125, 14.53515625, 15.422607421875, 16.31005859375, 17.197509765625, 18.0849609375, 18.972412109375, 19.85986328125, 20.747314453125, 21.634765625, 22.522216796875, 23.40966796875, 24.297119140625, 25.1845703125, 26.072021484375, 26.95947265625, 27.846923828125, 28.734375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 13.0, 20.0, 30.0, 51.0, 76.0, 109.0, 197.0, 213.0, 400.0, 544.0, 740.0, 1108.0, 1710.0, 2458.0, 3958.0, 6025.0, 9450.0, 14731.0, 24148.0, 41030.0, 75450.0, 173667.0, 394028.0, 138316.0, 64901.0, 35645.0, 21685.0, 13336.0, 8448.0, 5372.0, 3591.0, 2391.0, 1660.0, 992.0, 657.0, 479.0, 285.0, 197.0, 135.0, 98.0, 76.0, 35.0, 25.0, 27.0, 15.0, 14.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.2783203125, -1.2388458251953125, -1.199371337890625, -1.1598968505859375, -1.12042236328125, -1.0809478759765625, -1.041473388671875, -1.0019989013671875, -0.9625244140625, -0.9230499267578125, -0.883575439453125, -0.8441009521484375, -0.80462646484375, -0.7651519775390625, -0.725677490234375, -0.6862030029296875, -0.646728515625, -0.6072540283203125, -0.567779541015625, -0.5283050537109375, -0.48883056640625, -0.4493560791015625, -0.409881591796875, -0.3704071044921875, -0.3309326171875, -0.2914581298828125, -0.251983642578125, -0.2125091552734375, -0.17303466796875, -0.1335601806640625, -0.094085693359375, -0.0546112060546875, -0.01513671875, 0.0243377685546875, 0.063812255859375, 0.1032867431640625, 0.14276123046875, 0.1822357177734375, 0.221710205078125, 0.2611846923828125, 0.3006591796875, 0.3401336669921875, 0.379608154296875, 0.4190826416015625, 0.45855712890625, 0.4980316162109375, 0.537506103515625, 0.5769805908203125, 0.616455078125, 0.6559295654296875, 0.695404052734375, 0.7348785400390625, 0.77435302734375, 0.8138275146484375, 0.853302001953125, 0.8927764892578125, 0.9322509765625, 0.9717254638671875, 1.011199951171875, 1.0506744384765625, 1.09014892578125, 1.1296234130859375, 1.169097900390625, 1.2085723876953125, 1.248046875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 6.0, 9.0, 7.0, 10.0, 18.0, 13.0, 22.0, 24.0, 18.0, 16.0, 28.0, 22.0, 15.0, 35.0, 34.0, 32.0, 37.0, 41.0, 34.0, 43.0, 1061.0, 41.0, 42.0, 34.0, 37.0, 35.0, 39.0, 40.0, 27.0, 33.0, 21.0, 20.0, 16.0, 20.0, 9.0, 14.0, 9.0, 7.0, 11.0, 6.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.4453125, -14.9337158203125, -14.422119140625, -13.9105224609375, -13.39892578125, -12.8873291015625, -12.375732421875, -11.8641357421875, -11.3525390625, -10.8409423828125, -10.329345703125, -9.8177490234375, -9.30615234375, -8.7945556640625, -8.282958984375, -7.7713623046875, -7.259765625, -6.7481689453125, -6.236572265625, -5.7249755859375, -5.21337890625, -4.7017822265625, -4.190185546875, -3.6785888671875, -3.1669921875, -2.6553955078125, -2.143798828125, -1.6322021484375, -1.12060546875, -0.6090087890625, -0.097412109375, 0.4141845703125, 0.92578125, 1.4373779296875, 1.948974609375, 2.4605712890625, 2.97216796875, 3.4837646484375, 3.995361328125, 4.5069580078125, 5.0185546875, 5.5301513671875, 6.041748046875, 6.5533447265625, 7.06494140625, 7.5765380859375, 8.088134765625, 8.5997314453125, 9.111328125, 9.6229248046875, 10.134521484375, 10.6461181640625, 11.15771484375, 11.6693115234375, 12.180908203125, 12.6925048828125, 13.2041015625, 13.7156982421875, 14.227294921875, 14.7388916015625, 15.25048828125, 15.7620849609375, 16.273681640625, 16.7852783203125, 17.296875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 7.0, 8.0, 15.0, 15.0, 30.0, 35.0, 44.0, 62.0, 97.0, 144.0, 179.0, 277.0, 388.0, 546.0, 766.0, 1070.0, 1571.0, 2128.0, 3156.0, 4610.0, 6645.0, 9815.0, 14421.0, 21705.0, 33534.0, 52836.0, 86389.0, 167280.0, 1357121.0, 127660.0, 72361.0, 44056.0, 28659.0, 18860.0, 12862.0, 8544.0, 5820.0, 4104.0, 2722.0, 1979.0, 1422.0, 958.0, 643.0, 474.0, 312.0, 221.0, 165.0, 125.0, 89.0, 68.0, 37.0, 33.0, 27.0, 19.0, 10.0, 7.0, 4.0, 5.0, 2.0, 2.0], "bins": [-0.7080078125, -0.6861038208007812, -0.6641998291015625, -0.6422958374023438, -0.620391845703125, -0.5984878540039062, -0.5765838623046875, -0.5546798706054688, -0.53277587890625, -0.5108718872070312, -0.4889678955078125, -0.46706390380859375, -0.445159912109375, -0.42325592041015625, -0.4013519287109375, -0.37944793701171875, -0.3575439453125, -0.33563995361328125, -0.3137359619140625, -0.29183197021484375, -0.269927978515625, -0.24802398681640625, -0.2261199951171875, -0.20421600341796875, -0.18231201171875, -0.16040802001953125, -0.1385040283203125, -0.11660003662109375, -0.094696044921875, -0.07279205322265625, -0.0508880615234375, -0.02898406982421875, -0.007080078125, 0.01482391357421875, 0.0367279052734375, 0.05863189697265625, 0.080535888671875, 0.10243988037109375, 0.1243438720703125, 0.14624786376953125, 0.16815185546875, 0.19005584716796875, 0.2119598388671875, 0.23386383056640625, 0.255767822265625, 0.27767181396484375, 0.2995758056640625, 0.32147979736328125, 0.3433837890625, 0.36528778076171875, 0.3871917724609375, 0.40909576416015625, 0.430999755859375, 0.45290374755859375, 0.4748077392578125, 0.49671173095703125, 0.51861572265625, 0.5405197143554688, 0.5624237060546875, 0.5843276977539062, 0.606231689453125, 0.6281356811523438, 0.6500396728515625, 0.6719436645507812, 0.69384765625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 8.0, 6.0, 12.0, 13.0, 18.0, 13.0, 20.0, 31.0, 32.0, 41.0, 47.0, 59.0, 88.0, 86.0, 103.0, 77.0, 55.0, 48.0, 43.0, 40.0, 24.0, 19.0, 26.0, 22.0, 13.0, 12.0, 6.0, 7.0, 4.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.788969039916992e-05, -6.585568189620972e-05, -6.382167339324951e-05, -6.17876648902893e-05, -5.97536563873291e-05, -5.7719647884368896e-05, -5.568563938140869e-05, -5.3651630878448486e-05, -5.161762237548828e-05, -4.9583613872528076e-05, -4.754960536956787e-05, -4.5515596866607666e-05, -4.348158836364746e-05, -4.1447579860687256e-05, -3.941357135772705e-05, -3.7379562854766846e-05, -3.534555435180664e-05, -3.3311545848846436e-05, -3.127753734588623e-05, -2.9243528842926025e-05, -2.720952033996582e-05, -2.5175511837005615e-05, -2.314150333404541e-05, -2.1107494831085205e-05, -1.9073486328125e-05, -1.7039477825164795e-05, -1.500546932220459e-05, -1.2971460819244385e-05, -1.093745231628418e-05, -8.903443813323975e-06, -6.8694353103637695e-06, -4.8354268074035645e-06, -2.8014183044433594e-06, -7.674098014831543e-07, 1.2665987014770508e-06, 3.300607204437256e-06, 5.334615707397461e-06, 7.368624210357666e-06, 9.402632713317871e-06, 1.1436641216278076e-05, 1.3470649719238281e-05, 1.5504658222198486e-05, 1.753866672515869e-05, 1.9572675228118896e-05, 2.16066837310791e-05, 2.3640692234039307e-05, 2.5674700736999512e-05, 2.7708709239959717e-05, 2.9742717742919922e-05, 3.177672624588013e-05, 3.381073474884033e-05, 3.584474325180054e-05, 3.787875175476074e-05, 3.991276025772095e-05, 4.194676876068115e-05, 4.398077726364136e-05, 4.601478576660156e-05, 4.804879426956177e-05, 5.008280277252197e-05, 5.211681127548218e-05, 5.415081977844238e-05, 5.618482828140259e-05, 5.821883678436279e-05, 6.0252845287323e-05, 6.22868537902832e-05]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 13.0, 6.0, 4.0, 20.0, 12.0, 24.0, 32.0, 44.0, 64.0, 61.0, 84.0, 121.0, 203.0, 377.0, 1688.0, 22540.0, 956718.0, 62199.0, 3061.0, 523.0, 216.0, 137.0, 104.0, 86.0, 50.0, 29.0, 43.0, 18.0, 21.0, 11.0, 14.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009441375732421875, -0.0009133219718933105, -0.0008825063705444336, -0.0008516907691955566, -0.0008208751678466797, -0.0007900595664978027, -0.0007592439651489258, -0.0007284283638000488, -0.0006976127624511719, -0.0006667971611022949, -0.000635981559753418, -0.000605165958404541, -0.0005743503570556641, -0.0005435347557067871, -0.0005127191543579102, -0.0004819035530090332, -0.00045108795166015625, -0.0004202723503112793, -0.00038945674896240234, -0.0003586411476135254, -0.00032782554626464844, -0.0002970099449157715, -0.00026619434356689453, -0.00023537874221801758, -0.00020456314086914062, -0.00017374753952026367, -0.00014293193817138672, -0.00011211633682250977, -8.130073547363281e-05, -5.048513412475586e-05, -1.9669532775878906e-05, 1.1146068572998047e-05, 4.1961669921875e-05, 7.277727127075195e-05, 0.0001035928726196289, 0.00013440847396850586, 0.0001652240753173828, 0.00019603967666625977, 0.00022685527801513672, 0.00025767087936401367, 0.0002884864807128906, 0.0003193020820617676, 0.00035011768341064453, 0.0003809332847595215, 0.00041174888610839844, 0.0004425644874572754, 0.00047338008880615234, 0.0005041956901550293, 0.0005350112915039062, 0.0005658268928527832, 0.0005966424942016602, 0.0006274580955505371, 0.0006582736968994141, 0.000689089298248291, 0.000719904899597168, 0.0007507205009460449, 0.0007815361022949219, 0.0008123517036437988, 0.0008431673049926758, 0.0008739829063415527, 0.0009047985076904297, 0.0009356141090393066, 0.0009664297103881836, 0.0009972453117370605, 0.0010280609130859375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 12.0, 23.0, 40.0, 60.0, 131.0, 342.0, 195.0, 81.0, 54.0, 29.0, 17.0, 14.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.198625513003208e-05, -4.95935782964807e-05, -4.7200897824950516e-05, -4.480822099139914e-05, -4.2415540519868955e-05, -4.002286368631758e-05, -3.7630183214787394e-05, -3.523750638123602e-05, -3.284482954768464e-05, -3.045215089514386e-05, -2.805947224260308e-05, -2.56667954090517e-05, -2.3274114937521517e-05, -2.088143810397014e-05, -1.848875945142936e-05, -1.609608079888858e-05, -1.3703400327358395e-05, -1.1310721674817614e-05, -8.918043022276834e-06, -6.525365279230755e-06, -4.132686626689974e-06, -1.7400079741491936e-06, 6.526697688968852e-07, 3.045348421437666e-06, 5.4380270739784464e-06, 7.830705726519227e-06, 1.0223384379060008e-05, 1.2616062122106086e-05, 1.5008740774646867e-05, 1.740142033668235e-05, 1.9794097170233727e-05, 2.2186775822774507e-05, 2.457945083733648e-05, 2.697212948987726e-05, 2.9364808142418042e-05, 3.175748497596942e-05, 3.41501654474996e-05, 3.654284228105098e-05, 3.893551911460236e-05, 4.132819958613254e-05, 4.3720880057662725e-05, 4.61135568912141e-05, 4.850623736274429e-05, 5.0898914196295664e-05, 5.329159466782585e-05, 5.5684271501377225e-05, 5.80769483349286e-05, 6.0469628806458786e-05, 6.286230927798897e-05, 6.525498611154035e-05, 6.764766294509172e-05, 7.004034705460072e-05, 7.243302388815209e-05, 7.482570072170347e-05, 7.721837755525485e-05, 7.961105438880622e-05, 8.20037312223576e-05, 8.439640805590898e-05, 8.678908488946036e-05, 8.918176899896935e-05, 9.157444583252072e-05, 9.39671226660721e-05, 9.635979949962348e-05, 9.875248360913247e-05, 0.00010114516044268385]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 1.0, 6.0, 1.0, 7.0, 6.0, 5.0, 9.0, 6.0, 14.0, 12.0, 16.0, 25.0, 21.0, 25.0, 24.0, 22.0, 37.0, 40.0, 38.0, 47.0, 38.0, 39.0, 39.0, 39.0, 41.0, 36.0, 42.0, 39.0, 37.0, 26.0, 37.0, 30.0, 23.0, 23.0, 32.0, 26.0, 22.0, 15.0, 11.0, 8.0, 11.0, 6.0, 9.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.9087066650390625e-05, -2.820882946252823e-05, -2.7330592274665833e-05, -2.6452355086803436e-05, -2.557411789894104e-05, -2.4695880711078644e-05, -2.3817643523216248e-05, -2.293940633535385e-05, -2.2061169147491455e-05, -2.118293195962906e-05, -2.0304694771766663e-05, -1.9426457583904266e-05, -1.854822039604187e-05, -1.7669983208179474e-05, -1.6791746020317078e-05, -1.591350883245468e-05, -1.5035271644592285e-05, -1.4157034456729889e-05, -1.3278797268867493e-05, -1.2400560081005096e-05, -1.15223228931427e-05, -1.0644085705280304e-05, -9.765848517417908e-06, -8.887611329555511e-06, -8.009374141693115e-06, -7.131136953830719e-06, -6.252899765968323e-06, -5.3746625781059265e-06, -4.49642539024353e-06, -3.618188202381134e-06, -2.739951014518738e-06, -1.8617138266563416e-06, -9.834766387939453e-07, -1.0523945093154907e-07, 7.729977369308472e-07, 1.6512349247932434e-06, 2.5294721126556396e-06, 3.407709300518036e-06, 4.285946488380432e-06, 5.164183676242828e-06, 6.042420864105225e-06, 6.920658051967621e-06, 7.798895239830017e-06, 8.677132427692413e-06, 9.55536961555481e-06, 1.0433606803417206e-05, 1.1311843991279602e-05, 1.2190081179141998e-05, 1.3068318367004395e-05, 1.394655555486679e-05, 1.4824792742729187e-05, 1.5703029930591583e-05, 1.658126711845398e-05, 1.7459504306316376e-05, 1.8337741494178772e-05, 1.9215978682041168e-05, 2.0094215869903564e-05, 2.097245305776596e-05, 2.1850690245628357e-05, 2.2728927433490753e-05, 2.360716462135315e-05, 2.4485401809215546e-05, 2.5363638997077942e-05, 2.6241876184940338e-05, 2.7120113372802734e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 7.0, 2.0, 5.0, 5.0, 8.0, 6.0, 8.0, 9.0, 12.0, 15.0, 14.0, 19.0, 21.0, 25.0, 21.0, 27.0, 36.0, 37.0, 32.0, 46.0, 50.0, 48.0, 43.0, 42.0, 47.0, 70.0, 40.0, 30.0, 43.0, 36.0, 26.0, 25.0, 20.0, 21.0, 14.0, 15.0, 10.0, 22.0, 12.0, 5.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-28.0625, -27.175048828125, -26.28759765625, -25.400146484375, -24.5126953125, -23.625244140625, -22.73779296875, -21.850341796875, -20.962890625, -20.075439453125, -19.18798828125, -18.300537109375, -17.4130859375, -16.525634765625, -15.63818359375, -14.750732421875, -13.86328125, -12.975830078125, -12.08837890625, -11.200927734375, -10.3134765625, -9.426025390625, -8.53857421875, -7.651123046875, -6.763671875, -5.876220703125, -4.98876953125, -4.101318359375, -3.2138671875, -2.326416015625, -1.43896484375, -0.551513671875, 0.3359375, 1.223388671875, 2.11083984375, 2.998291015625, 3.8857421875, 4.773193359375, 5.66064453125, 6.548095703125, 7.435546875, 8.322998046875, 9.21044921875, 10.097900390625, 10.9853515625, 11.872802734375, 12.76025390625, 13.647705078125, 14.53515625, 15.422607421875, 16.31005859375, 17.197509765625, 18.0849609375, 18.972412109375, 19.85986328125, 20.747314453125, 21.634765625, 22.522216796875, 23.40966796875, 24.297119140625, 25.1845703125, 26.072021484375, 26.95947265625, 27.846923828125, 28.734375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 2.0, 9.0, 5.0, 8.0, 14.0, 10.0, 23.0, 37.0, 33.0, 53.0, 59.0, 76.0, 119.0, 171.0, 206.0, 327.0, 539.0, 820.0, 1371.0, 2531.0, 4958.0, 10593.0, 24702.0, 69137.0, 295966.0, 479075.0, 98380.0, 32107.0, 13325.0, 6165.0, 3160.0, 1712.0, 949.0, 630.0, 358.0, 249.0, 189.0, 135.0, 106.0, 57.0, 52.0, 38.0, 21.0, 20.0, 10.0, 18.0, 10.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-15.640625, -15.154052734375, -14.66748046875, -14.180908203125, -13.6943359375, -13.207763671875, -12.72119140625, -12.234619140625, -11.748046875, -11.261474609375, -10.77490234375, -10.288330078125, -9.8017578125, -9.315185546875, -8.82861328125, -8.342041015625, -7.85546875, -7.368896484375, -6.88232421875, -6.395751953125, -5.9091796875, -5.422607421875, -4.93603515625, -4.449462890625, -3.962890625, -3.476318359375, -2.98974609375, -2.503173828125, -2.0166015625, -1.530029296875, -1.04345703125, -0.556884765625, -0.0703125, 0.416259765625, 0.90283203125, 1.389404296875, 1.8759765625, 2.362548828125, 2.84912109375, 3.335693359375, 3.822265625, 4.308837890625, 4.79541015625, 5.281982421875, 5.7685546875, 6.255126953125, 6.74169921875, 7.228271484375, 7.71484375, 8.201416015625, 8.68798828125, 9.174560546875, 9.6611328125, 10.147705078125, 10.63427734375, 11.120849609375, 11.607421875, 12.093994140625, 12.58056640625, 13.067138671875, 13.5537109375, 14.040283203125, 14.52685546875, 15.013427734375, 15.5]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 7.0, 6.0, 7.0, 11.0, 8.0, 10.0, 20.0, 29.0, 21.0, 21.0, 37.0, 37.0, 35.0, 33.0, 48.0, 54.0, 45.0, 83.0, 1981.0, 91.0, 58.0, 65.0, 43.0, 37.0, 52.0, 28.0, 25.0, 25.0, 25.0, 22.0, 22.0, 18.0, 12.0, 12.0, 12.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.5625, -99.9248046875, -96.287109375, -92.6494140625, -89.01171875, -85.3740234375, -81.736328125, -78.0986328125, -74.4609375, -70.8232421875, -67.185546875, -63.5478515625, -59.91015625, -56.2724609375, -52.634765625, -48.9970703125, -45.359375, -41.7216796875, -38.083984375, -34.4462890625, -30.80859375, -27.1708984375, -23.533203125, -19.8955078125, -16.2578125, -12.6201171875, -8.982421875, -5.3447265625, -1.70703125, 1.9306640625, 5.568359375, 9.2060546875, 12.84375, 16.4814453125, 20.119140625, 23.7568359375, 27.39453125, 31.0322265625, 34.669921875, 38.3076171875, 41.9453125, 45.5830078125, 49.220703125, 52.8583984375, 56.49609375, 60.1337890625, 63.771484375, 67.4091796875, 71.046875, 74.6845703125, 78.322265625, 81.9599609375, 85.59765625, 89.2353515625, 92.873046875, 96.5107421875, 100.1484375, 103.7861328125, 107.423828125, 111.0615234375, 114.69921875, 118.3369140625, 121.974609375, 125.6123046875, 129.25]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 11.0, 11.0, 14.0, 18.0, 21.0, 23.0, 28.0, 37.0, 31.0, 56.0, 113.0, 157.0, 244.0, 442.0, 1193.0, 9487.0, 3113266.0, 17917.0, 1312.0, 521.0, 264.0, 159.0, 91.0, 79.0, 48.0, 25.0, 26.0, 31.0, 22.0, 9.0, 9.0, 10.0, 9.0, 6.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-196.125, -190.611328125, -185.09765625, -179.583984375, -174.0703125, -168.556640625, -163.04296875, -157.529296875, -152.015625, -146.501953125, -140.98828125, -135.474609375, -129.9609375, -124.447265625, -118.93359375, -113.419921875, -107.90625, -102.392578125, -96.87890625, -91.365234375, -85.8515625, -80.337890625, -74.82421875, -69.310546875, -63.796875, -58.283203125, -52.76953125, -47.255859375, -41.7421875, -36.228515625, -30.71484375, -25.201171875, -19.6875, -14.173828125, -8.66015625, -3.146484375, 2.3671875, 7.880859375, 13.39453125, 18.908203125, 24.421875, 29.935546875, 35.44921875, 40.962890625, 46.4765625, 51.990234375, 57.50390625, 63.017578125, 68.53125, 74.044921875, 79.55859375, 85.072265625, 90.5859375, 96.099609375, 101.61328125, 107.126953125, 112.640625, 118.154296875, 123.66796875, 129.181640625, 134.6953125, 140.208984375, 145.72265625, 151.236328125, 156.75]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 267.0, 749.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.88456726074219, -79.25813293457031, -41.631690979003906, -4.0052490234375, 33.621185302734375, 71.24761962890625, 108.87406921386719, 146.50050354003906, 184.12693786621094, 221.7533721923828, 259.37982177734375, 297.0062561035156, 334.6326904296875, 372.2591247558594, 409.88555908203125, 447.51202392578125, 485.138427734375, 522.764892578125, 560.3912963867188, 598.0177612304688, 635.6441650390625, 673.2706298828125, 710.8970947265625, 748.5234985351562, 786.1499633789062, 823.7764282226562, 861.40283203125, 899.029296875, 936.6557006835938, 974.2821655273438, 1011.9085693359375, 1049.5350341796875, 1087.1614990234375, 1124.7879638671875, 1162.4144287109375, 1200.040771484375, 1237.667236328125, 1275.293701171875, 1312.920166015625, 1350.546630859375, 1388.1729736328125, 1425.7994384765625, 1463.4259033203125, 1501.05224609375, 1538.6787109375, 1576.30517578125, 1613.931640625, 1651.55810546875, 1689.1845703125, 1726.81103515625, 1764.4375, 1802.0638427734375, 1839.6903076171875, 1877.3167724609375, 1914.9432373046875, 1952.569580078125, 1990.196044921875, 2027.822509765625, 2065.448974609375, 2103.075439453125, 2140.701904296875, 2178.328125, 2215.95458984375, 2253.5810546875, 2291.20751953125]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 7.0, 9.0, 7.0, 15.0, 17.0, 12.0, 18.0, 18.0, 27.0, 32.0, 33.0, 37.0, 47.0, 36.0, 41.0, 41.0, 38.0, 42.0, 41.0, 49.0, 52.0, 39.0, 49.0, 40.0, 38.0, 23.0, 27.0, 27.0, 29.0, 24.0, 15.0, 12.0, 6.0, 16.0, 7.0, 9.0, 5.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-378.63482666015625, -367.45819091796875, -356.2815246582031, -345.1048889160156, -333.9282531738281, -322.7515869140625, -311.574951171875, -300.3983154296875, -289.2216796875, -278.0450439453125, -266.8683776855469, -255.69174194335938, -244.51510620117188, -233.3384552001953, -222.16180419921875, -210.98516845703125, -199.80850219726562, -188.63185119628906, -177.45521545410156, -166.278564453125, -155.1019287109375, -143.92527770996094, -132.74862670898438, -121.57198333740234, -110.39533996582031, -99.21869659423828, -88.04205322265625, -76.86540222167969, -65.68875885009766, -54.512115478515625, -43.33546447753906, -32.15882110595703, -20.982147216796875, -9.805501937866211, 1.3711433410644531, 12.54779052734375, 23.72443389892578, 34.90107727050781, 46.077728271484375, 57.254371643066406, 68.43101501464844, 79.60765838623047, 90.7843017578125, 101.96095275878906, 113.1375961303711, 124.31423950195312, 135.4908905029297, 146.66754150390625, 157.84417724609375, 169.0208282470703, 180.1974639892578, 191.37411499023438, 202.55075073242188, 213.72740173339844, 224.904052734375, 236.0806884765625, 247.25733947753906, 258.4339904785156, 269.6106262207031, 280.78729248046875, 291.96392822265625, 303.14056396484375, 314.31719970703125, 325.4938659667969, 336.6705017089844]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 6.0, 4.0, 5.0, 4.0, 6.0, 8.0, 7.0, 7.0, 13.0, 18.0, 9.0, 17.0, 27.0, 24.0, 24.0, 18.0, 36.0, 36.0, 35.0, 48.0, 44.0, 54.0, 45.0, 34.0, 43.0, 64.0, 52.0, 33.0, 40.0, 39.0, 23.0, 29.0, 18.0, 18.0, 19.0, 14.0, 14.0, 13.0, 19.0, 4.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-28.390625, -27.498046875, -26.60546875, -25.712890625, -24.8203125, -23.927734375, -23.03515625, -22.142578125, -21.25, -20.357421875, -19.46484375, -18.572265625, -17.6796875, -16.787109375, -15.89453125, -15.001953125, -14.109375, -13.216796875, -12.32421875, -11.431640625, -10.5390625, -9.646484375, -8.75390625, -7.861328125, -6.96875, -6.076171875, -5.18359375, -4.291015625, -3.3984375, -2.505859375, -1.61328125, -0.720703125, 0.171875, 1.064453125, 1.95703125, 2.849609375, 3.7421875, 4.634765625, 5.52734375, 6.419921875, 7.3125, 8.205078125, 9.09765625, 9.990234375, 10.8828125, 11.775390625, 12.66796875, 13.560546875, 14.453125, 15.345703125, 16.23828125, 17.130859375, 18.0234375, 18.916015625, 19.80859375, 20.701171875, 21.59375, 22.486328125, 23.37890625, 24.271484375, 25.1640625, 26.056640625, 26.94921875, 27.841796875, 28.734375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 5.0, 5.0, 16.0, 19.0, 19.0, 23.0, 29.0, 58.0, 61.0, 81.0, 110.0, 144.0, 201.0, 227.0, 371.0, 454.0, 679.0, 912.0, 1266.0, 1772.0, 2546.0, 3801.0, 6014.0, 10273.0, 36984.0, 513258.0, 3348034.0, 218541.0, 23753.0, 8804.0, 5140.0, 3390.0, 2181.0, 1500.0, 1018.0, 693.0, 499.0, 349.0, 279.0, 216.0, 135.0, 117.0, 73.0, 50.0, 47.0, 32.0, 26.0, 14.0, 20.0, 10.0, 10.0, 7.0, 8.0, 3.0, 2.0, 7.0, 4.0, 3.0, 0.0, 1.0], "bins": [-62.9375, -60.86328125, -58.7890625, -56.71484375, -54.640625, -52.56640625, -50.4921875, -48.41796875, -46.34375, -44.26953125, -42.1953125, -40.12109375, -38.046875, -35.97265625, -33.8984375, -31.82421875, -29.75, -27.67578125, -25.6015625, -23.52734375, -21.453125, -19.37890625, -17.3046875, -15.23046875, -13.15625, -11.08203125, -9.0078125, -6.93359375, -4.859375, -2.78515625, -0.7109375, 1.36328125, 3.4375, 5.51171875, 7.5859375, 9.66015625, 11.734375, 13.80859375, 15.8828125, 17.95703125, 20.03125, 22.10546875, 24.1796875, 26.25390625, 28.328125, 30.40234375, 32.4765625, 34.55078125, 36.625, 38.69921875, 40.7734375, 42.84765625, 44.921875, 46.99609375, 49.0703125, 51.14453125, 53.21875, 55.29296875, 57.3671875, 59.44140625, 61.515625, 63.58984375, 65.6640625, 67.73828125, 69.8125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 5.0, 4.0, 5.0, 10.0, 11.0, 17.0, 12.0, 22.0, 31.0, 40.0, 77.0, 227.0, 737.0, 1651.0, 772.0, 207.0, 78.0, 42.0, 27.0, 11.0, 12.0, 9.0, 13.0, 7.0, 9.0, 7.0, 4.0, 2.0, 1.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.375, -111.2412109375, -108.107421875, -104.9736328125, -101.83984375, -98.7060546875, -95.572265625, -92.4384765625, -89.3046875, -86.1708984375, -83.037109375, -79.9033203125, -76.76953125, -73.6357421875, -70.501953125, -67.3681640625, -64.234375, -61.1005859375, -57.966796875, -54.8330078125, -51.69921875, -48.5654296875, -45.431640625, -42.2978515625, -39.1640625, -36.0302734375, -32.896484375, -29.7626953125, -26.62890625, -23.4951171875, -20.361328125, -17.2275390625, -14.09375, -10.9599609375, -7.826171875, -4.6923828125, -1.55859375, 1.5751953125, 4.708984375, 7.8427734375, 10.9765625, 14.1103515625, 17.244140625, 20.3779296875, 23.51171875, 26.6455078125, 29.779296875, 32.9130859375, 36.046875, 39.1806640625, 42.314453125, 45.4482421875, 48.58203125, 51.7158203125, 54.849609375, 57.9833984375, 61.1171875, 64.2509765625, 67.384765625, 70.5185546875, 73.65234375, 76.7861328125, 79.919921875, 83.0537109375, 86.1875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 1.0, 4.0, 8.0, 7.0, 14.0, 13.0, 19.0, 28.0, 57.0, 66.0, 85.0, 116.0, 210.0, 318.0, 479.0, 740.0, 1116.0, 1710.0, 2698.0, 4330.0, 7267.0, 13141.0, 27867.0, 97445.0, 3269291.0, 664405.0, 55003.0, 20887.0, 10731.0, 6088.0, 3642.0, 2311.0, 1420.0, 916.0, 608.0, 401.0, 281.0, 183.0, 128.0, 88.0, 58.0, 32.0, 20.0, 20.0, 14.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-108.75, -104.9765625, -101.203125, -97.4296875, -93.65625, -89.8828125, -86.109375, -82.3359375, -78.5625, -74.7890625, -71.015625, -67.2421875, -63.46875, -59.6953125, -55.921875, -52.1484375, -48.375, -44.6015625, -40.828125, -37.0546875, -33.28125, -29.5078125, -25.734375, -21.9609375, -18.1875, -14.4140625, -10.640625, -6.8671875, -3.09375, 0.6796875, 4.453125, 8.2265625, 12.0, 15.7734375, 19.546875, 23.3203125, 27.09375, 30.8671875, 34.640625, 38.4140625, 42.1875, 45.9609375, 49.734375, 53.5078125, 57.28125, 61.0546875, 64.828125, 68.6015625, 72.375, 76.1484375, 79.921875, 83.6953125, 87.46875, 91.2421875, 95.015625, 98.7890625, 102.5625, 106.3359375, 110.109375, 113.8828125, 117.65625, 121.4296875, 125.203125, 128.9765625, 132.75]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 3.0, 1.0, 4.0, 8.0, 12.0, 18.0, 13.0, 24.0, 26.0, 44.0, 73.0, 129.0, 183.0, 155.0, 92.0, 63.0, 32.0, 31.0, 23.0, 18.0, 16.0, 15.0, 10.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.86236572265625, -259.8997802734375, -248.93719482421875, -237.97459411621094, -227.0120086669922, -216.04942321777344, -205.08682250976562, -194.12423706054688, -183.16165161132812, -172.19906616210938, -161.23648071289062, -150.2738800048828, -139.31129455566406, -128.3487091064453, -117.38611602783203, -106.42352294921875, -95.4609375, -84.49835205078125, -73.53575897216797, -62.57316970825195, -51.61058044433594, -40.64799118041992, -29.685401916503906, -18.722808837890625, -7.760223388671875, 3.2023658752441406, 14.164955139160156, 25.127544403076172, 36.09013366699219, 47.0527229309082, 58.01531219482422, 68.9779052734375, 79.94046020507812, 90.90304565429688, 101.86563873291016, 112.82823181152344, 123.79081726074219, 134.75340270996094, 145.71600341796875, 156.6785888671875, 167.64117431640625, 178.603759765625, 189.56634521484375, 200.52894592285156, 211.4915313720703, 222.45411682128906, 233.41671752929688, 244.37930297851562, 255.34188842773438, 266.3044738769531, 277.2670593261719, 288.2296447753906, 299.1922607421875, 310.15484619140625, 321.117431640625, 332.08001708984375, 343.0426025390625, 354.00518798828125, 364.9677734375, 375.93035888671875, 386.8929443359375, 397.8555603027344, 408.8181457519531, 419.7807312011719, 430.7433166503906]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 7.0, 10.0, 6.0, 11.0, 5.0, 12.0, 18.0, 10.0, 9.0, 18.0, 18.0, 23.0, 26.0, 18.0, 38.0, 27.0, 29.0, 44.0, 44.0, 32.0, 32.0, 28.0, 43.0, 30.0, 38.0, 32.0, 41.0, 30.0, 22.0, 35.0, 29.0, 33.0, 29.0, 25.0, 14.0, 27.0, 21.0, 17.0, 10.0, 9.0, 7.0, 10.0, 7.0, 9.0, 6.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-188.9227752685547, -183.27813720703125, -177.63348388671875, -171.98883056640625, -166.3441925048828, -160.69955444335938, -155.05490112304688, -149.41024780273438, -143.76560974121094, -138.1209716796875, -132.476318359375, -126.83167266845703, -121.18702697753906, -115.5423812866211, -109.89773559570312, -104.25308990478516, -98.60844421386719, -92.96379852294922, -87.31915283203125, -81.67450714111328, -76.02986145019531, -70.38521575927734, -64.74057006835938, -59.095924377441406, -53.45127868652344, -47.80663299560547, -42.1619873046875, -36.51734161376953, -30.872695922851562, -25.228050231933594, -19.583404541015625, -13.938758850097656, -8.29412841796875, -2.6494827270507812, 2.9951629638671875, 8.639808654785156, 14.284454345703125, 19.929100036621094, 25.573745727539062, 31.21839141845703, 36.863037109375, 42.50768280029297, 48.15232849121094, 53.796974182128906, 59.441619873046875, 65.08626556396484, 70.73091125488281, 76.37555694580078, 82.02020263671875, 87.66484832763672, 93.30949401855469, 98.95413970947266, 104.59878540039062, 110.2434310913086, 115.88807678222656, 121.53272247314453, 127.1773681640625, 132.822021484375, 138.46665954589844, 144.11129760742188, 149.75595092773438, 155.40060424804688, 161.0452423095703, 166.68988037109375, 172.33453369140625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 7.0, 8.0, 2.0, 6.0, 8.0, 8.0, 7.0, 17.0, 16.0, 17.0, 17.0, 17.0, 37.0, 28.0, 26.0, 32.0, 45.0, 48.0, 31.0, 49.0, 53.0, 46.0, 56.0, 40.0, 43.0, 31.0, 39.0, 39.0, 37.0, 25.0, 20.0, 19.0, 21.0, 15.0, 10.0, 16.0, 9.0, 12.0, 10.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.8125, -28.884033203125, -27.95556640625, -27.027099609375, -26.0986328125, -25.170166015625, -24.24169921875, -23.313232421875, -22.384765625, -21.456298828125, -20.52783203125, -19.599365234375, -18.6708984375, -17.742431640625, -16.81396484375, -15.885498046875, -14.95703125, -14.028564453125, -13.10009765625, -12.171630859375, -11.2431640625, -10.314697265625, -9.38623046875, -8.457763671875, -7.529296875, -6.600830078125, -5.67236328125, -4.743896484375, -3.8154296875, -2.886962890625, -1.95849609375, -1.030029296875, -0.1015625, 0.826904296875, 1.75537109375, 2.683837890625, 3.6123046875, 4.540771484375, 5.46923828125, 6.397705078125, 7.326171875, 8.254638671875, 9.18310546875, 10.111572265625, 11.0400390625, 11.968505859375, 12.89697265625, 13.825439453125, 14.75390625, 15.682373046875, 16.61083984375, 17.539306640625, 18.4677734375, 19.396240234375, 20.32470703125, 21.253173828125, 22.181640625, 23.110107421875, 24.03857421875, 24.967041015625, 25.8955078125, 26.823974609375, 27.75244140625, 28.680908203125, 29.609375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 9.0, 8.0, 11.0, 15.0, 26.0, 28.0, 68.0, 82.0, 117.0, 141.0, 217.0, 293.0, 435.0, 638.0, 917.0, 1279.0, 1933.0, 2687.0, 3753.0, 5241.0, 7696.0, 10953.0, 16064.0, 24807.0, 38175.0, 61607.0, 108594.0, 293793.0, 212464.0, 95006.0, 55759.0, 34738.0, 22025.0, 15184.0, 10272.0, 7021.0, 4847.0, 3496.0, 2394.0, 1673.0, 1214.0, 873.0, 582.0, 434.0, 302.0, 225.0, 129.0, 113.0, 62.0, 54.0, 36.0, 17.0, 22.0, 12.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0], "bins": [-1.0283203125, -0.9960784912109375, -0.963836669921875, -0.9315948486328125, -0.89935302734375, -0.8671112060546875, -0.834869384765625, -0.8026275634765625, -0.7703857421875, -0.7381439208984375, -0.705902099609375, -0.6736602783203125, -0.64141845703125, -0.6091766357421875, -0.576934814453125, -0.5446929931640625, -0.512451171875, -0.4802093505859375, -0.447967529296875, -0.4157257080078125, -0.38348388671875, -0.3512420654296875, -0.319000244140625, -0.2867584228515625, -0.2545166015625, -0.2222747802734375, -0.190032958984375, -0.1577911376953125, -0.12554931640625, -0.0933074951171875, -0.061065673828125, -0.0288238525390625, 0.00341796875, 0.0356597900390625, 0.067901611328125, 0.1001434326171875, 0.13238525390625, 0.1646270751953125, 0.196868896484375, 0.2291107177734375, 0.2613525390625, 0.2935943603515625, 0.325836181640625, 0.3580780029296875, 0.39031982421875, 0.4225616455078125, 0.454803466796875, 0.4870452880859375, 0.519287109375, 0.5515289306640625, 0.583770751953125, 0.6160125732421875, 0.64825439453125, 0.6804962158203125, 0.712738037109375, 0.7449798583984375, 0.7772216796875, 0.8094635009765625, 0.841705322265625, 0.8739471435546875, 0.90618896484375, 0.9384307861328125, 0.970672607421875, 1.0029144287109375, 1.03515625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 6.0, 11.0, 16.0, 12.0, 14.0, 13.0, 11.0, 20.0, 19.0, 23.0, 25.0, 17.0, 18.0, 21.0, 31.0, 35.0, 41.0, 31.0, 37.0, 1064.0, 34.0, 35.0, 39.0, 47.0, 37.0, 28.0, 31.0, 44.0, 30.0, 34.0, 21.0, 24.0, 26.0, 24.0, 12.0, 15.0, 16.0, 8.0, 5.0, 12.0, 10.0, 2.0, 6.0, 5.0, 0.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.671875, -15.149169921875, -14.62646484375, -14.103759765625, -13.5810546875, -13.058349609375, -12.53564453125, -12.012939453125, -11.490234375, -10.967529296875, -10.44482421875, -9.922119140625, -9.3994140625, -8.876708984375, -8.35400390625, -7.831298828125, -7.30859375, -6.785888671875, -6.26318359375, -5.740478515625, -5.2177734375, -4.695068359375, -4.17236328125, -3.649658203125, -3.126953125, -2.604248046875, -2.08154296875, -1.558837890625, -1.0361328125, -0.513427734375, 0.00927734375, 0.531982421875, 1.0546875, 1.577392578125, 2.10009765625, 2.622802734375, 3.1455078125, 3.668212890625, 4.19091796875, 4.713623046875, 5.236328125, 5.759033203125, 6.28173828125, 6.804443359375, 7.3271484375, 7.849853515625, 8.37255859375, 8.895263671875, 9.41796875, 9.940673828125, 10.46337890625, 10.986083984375, 11.5087890625, 12.031494140625, 12.55419921875, 13.076904296875, 13.599609375, 14.122314453125, 14.64501953125, 15.167724609375, 15.6904296875, 16.213134765625, 16.73583984375, 17.258544921875, 17.78125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 9.0, 10.0, 13.0, 20.0, 24.0, 41.0, 61.0, 78.0, 129.0, 164.0, 252.0, 368.0, 506.0, 747.0, 1065.0, 1560.0, 2296.0, 3373.0, 4839.0, 7073.0, 10539.0, 15446.0, 23100.0, 34857.0, 53320.0, 86352.0, 162372.0, 1349895.0, 127704.0, 72643.0, 45334.0, 30121.0, 20018.0, 13436.0, 9229.0, 6375.0, 4334.0, 2961.0, 1954.0, 1417.0, 971.0, 669.0, 440.0, 335.0, 206.0, 158.0, 86.0, 77.0, 67.0, 32.0, 19.0, 17.0, 16.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.72802734375, -0.7055130004882812, -0.6829986572265625, -0.6604843139648438, -0.637969970703125, -0.6154556274414062, -0.5929412841796875, -0.5704269409179688, -0.54791259765625, -0.5253982543945312, -0.5028839111328125, -0.48036956787109375, -0.457855224609375, -0.43534088134765625, -0.4128265380859375, -0.39031219482421875, -0.3677978515625, -0.34528350830078125, -0.3227691650390625, -0.30025482177734375, -0.277740478515625, -0.25522613525390625, -0.2327117919921875, -0.21019744873046875, -0.18768310546875, -0.16516876220703125, -0.1426544189453125, -0.12014007568359375, -0.097625732421875, -0.07511138916015625, -0.0525970458984375, -0.03008270263671875, -0.007568359375, 0.01494598388671875, 0.0374603271484375, 0.05997467041015625, 0.082489013671875, 0.10500335693359375, 0.1275177001953125, 0.15003204345703125, 0.17254638671875, 0.19506072998046875, 0.2175750732421875, 0.24008941650390625, 0.262603759765625, 0.28511810302734375, 0.3076324462890625, 0.33014678955078125, 0.3526611328125, 0.37517547607421875, 0.3976898193359375, 0.42020416259765625, 0.442718505859375, 0.46523284912109375, 0.4877471923828125, 0.5102615356445312, 0.53277587890625, 0.5552902221679688, 0.5778045654296875, 0.6003189086914062, 0.622833251953125, 0.6453475952148438, 0.6678619384765625, 0.6903762817382812, 0.712890625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 4.0, 9.0, 6.0, 4.0, 8.0, 8.0, 10.0, 28.0, 40.0, 47.0, 84.0, 162.0, 234.0, 112.0, 75.0, 35.0, 30.0, 18.0, 19.0, 12.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.721517562866211e-05, -9.42060723900795e-05, -9.119696915149689e-05, -8.818786591291428e-05, -8.517876267433167e-05, -8.216965943574905e-05, -7.916055619716644e-05, -7.615145295858383e-05, -7.314234972000122e-05, -7.013324648141861e-05, -6.7124143242836e-05, -6.411504000425339e-05, -6.110593676567078e-05, -5.8096833527088165e-05, -5.5087730288505554e-05, -5.207862704992294e-05, -4.906952381134033e-05, -4.606042057275772e-05, -4.305131733417511e-05, -4.00422140955925e-05, -3.703311085700989e-05, -3.4024007618427277e-05, -3.1014904379844666e-05, -2.8005801141262054e-05, -2.4996697902679443e-05, -2.1987594664096832e-05, -1.897849142551422e-05, -1.596938818693161e-05, -1.2960284948348999e-05, -9.951181709766388e-06, -6.942078471183777e-06, -3.932975232601166e-06, -9.238719940185547e-07, 2.0852312445640564e-06, 5.0943344831466675e-06, 8.103437721729279e-06, 1.111254096031189e-05, 1.41216441988945e-05, 1.7130747437477112e-05, 2.0139850676059723e-05, 2.3148953914642334e-05, 2.6158057153224945e-05, 2.9167160391807556e-05, 3.217626363039017e-05, 3.518536686897278e-05, 3.819447010755539e-05, 4.1203573346138e-05, 4.421267658472061e-05, 4.722177982330322e-05, 5.0230883061885834e-05, 5.3239986300468445e-05, 5.6249089539051056e-05, 5.925819277763367e-05, 6.226729601621628e-05, 6.527639925479889e-05, 6.82855024933815e-05, 7.129460573196411e-05, 7.430370897054672e-05, 7.731281220912933e-05, 8.032191544771194e-05, 8.333101868629456e-05, 8.634012192487717e-05, 8.934922516345978e-05, 9.235832840204239e-05, 9.5367431640625e-05]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 4.0, 7.0, 15.0, 18.0, 27.0, 26.0, 51.0, 52.0, 89.0, 240.0, 1020.0, 10788.0, 994002.0, 39261.0, 2196.0, 367.0, 145.0, 80.0, 42.0, 25.0, 17.0, 14.0, 15.0, 10.0, 8.0, 2.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014514923095703125, -0.0014056861400604248, -0.0013598799705505371, -0.0013140738010406494, -0.0012682676315307617, -0.001222461462020874, -0.0011766552925109863, -0.0011308491230010986, -0.001085042953491211, -0.0010392367839813232, -0.0009934306144714355, -0.0009476244449615479, -0.0009018182754516602, -0.0008560121059417725, -0.0008102059364318848, -0.0007643997669219971, -0.0007185935974121094, -0.0006727874279022217, -0.000626981258392334, -0.0005811750888824463, -0.0005353689193725586, -0.0004895627498626709, -0.0004437565803527832, -0.0003979504108428955, -0.0003521442413330078, -0.0003063380718231201, -0.0002605319023132324, -0.00021472573280334473, -0.00016891956329345703, -0.00012311339378356934, -7.730722427368164e-05, -3.1501054763793945e-05, 1.430511474609375e-05, 6.0111284255981445e-05, 0.00010591745376586914, 0.00015172362327575684, 0.00019752979278564453, 0.00024333596229553223, 0.0002891421318054199, 0.0003349483013153076, 0.0003807544708251953, 0.000426560640335083, 0.0004723668098449707, 0.0005181729793548584, 0.0005639791488647461, 0.0006097853183746338, 0.0006555914878845215, 0.0007013976573944092, 0.0007472038269042969, 0.0007930099964141846, 0.0008388161659240723, 0.00088462233543396, 0.0009304285049438477, 0.0009762346744537354, 0.001022040843963623, 0.0010678470134735107, 0.0011136531829833984, 0.0011594593524932861, 0.0012052655220031738, 0.0012510716915130615, 0.0012968778610229492, 0.001342684030532837, 0.0013884902000427246, 0.0014342963695526123, 0.0014801025390625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 21.0, 29.0, 97.0, 190.0, 379.0, 151.0, 60.0, 31.0, 23.0, 10.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.83355935709551e-05, -7.511926378356293e-05, -7.190294127212837e-05, -6.86866114847362e-05, -6.547028169734403e-05, -6.225395190995187e-05, -5.903762939851731e-05, -5.582129961112514e-05, -5.260496982373297e-05, -4.938864367431961e-05, -4.617231388692744e-05, -4.295598773751408e-05, -3.973965795012191e-05, -3.652333180070855e-05, -3.3307005651295185e-05, -3.0090675863903016e-05, -2.6874349714489654e-05, -2.3658021746086888e-05, -2.0441693777684122e-05, -1.722536762827076e-05, -1.4009038750373293e-05, -1.0792711691465229e-05, -7.576383723062463e-06, -4.360055754659697e-06, -1.1437277862569317e-06, 2.0725999547721585e-06, 5.288927695801249e-06, 8.505255209456664e-06, 1.172158317785943e-05, 1.4937910236767493e-05, 1.815423820517026e-05, 2.1370566173573025e-05, 2.458689414197579e-05, 2.7803222110378556e-05, 3.101955007878132e-05, 3.4235876228194684e-05, 3.745220601558685e-05, 4.0668532165000215e-05, 4.388485831441358e-05, 4.7101188101805747e-05, 5.0317517889197916e-05, 5.353384403861128e-05, 5.675017382600345e-05, 5.996649997541681e-05, 6.318282976280898e-05, 6.639915227424353e-05, 6.96154820616357e-05, 7.283181184902787e-05, 7.604813436046243e-05, 7.92644641478546e-05, 8.248078665928915e-05, 8.569711644668132e-05, 8.891344623407349e-05, 9.212977602146566e-05, 9.534609853290021e-05, 9.856242832029238e-05, 0.00010177875810768455, 0.00010499508789507672, 0.00010821141040651128, 0.00011142774019390345, 0.00011464406998129562, 0.00011786039976868778, 0.00012107672228012234, 0.00012429305934347212, 0.00012750938185490668]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 6.0, 4.0, 9.0, 9.0, 12.0, 15.0, 14.0, 18.0, 15.0, 27.0, 32.0, 29.0, 41.0, 25.0, 43.0, 38.0, 36.0, 35.0, 46.0, 50.0, 44.0, 39.0, 40.0, 30.0, 34.0, 40.0, 40.0, 25.0, 31.0, 29.0, 23.0, 28.0, 14.0, 20.0, 15.0, 9.0, 9.0, 8.0, 3.0, 6.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9802322387695312e-05, -2.8777867555618286e-05, -2.775341272354126e-05, -2.6728957891464233e-05, -2.5704503059387207e-05, -2.468004822731018e-05, -2.3655593395233154e-05, -2.2631138563156128e-05, -2.16066837310791e-05, -2.0582228899002075e-05, -1.955777406692505e-05, -1.8533319234848022e-05, -1.7508864402770996e-05, -1.648440957069397e-05, -1.5459954738616943e-05, -1.4435499906539917e-05, -1.341104507446289e-05, -1.2386590242385864e-05, -1.1362135410308838e-05, -1.0337680578231812e-05, -9.313225746154785e-06, -8.288770914077759e-06, -7.264316082000732e-06, -6.239861249923706e-06, -5.21540641784668e-06, -4.190951585769653e-06, -3.166496753692627e-06, -2.1420419216156006e-06, -1.1175870895385742e-06, -9.313225746154785e-08, 9.313225746154785e-07, 1.955777406692505e-06, 2.9802322387695312e-06, 4.004687070846558e-06, 5.029141902923584e-06, 6.05359673500061e-06, 7.078051567077637e-06, 8.102506399154663e-06, 9.12696123123169e-06, 1.0151416063308716e-05, 1.1175870895385742e-05, 1.2200325727462769e-05, 1.3224780559539795e-05, 1.4249235391616821e-05, 1.5273690223693848e-05, 1.6298145055770874e-05, 1.73225998878479e-05, 1.8347054719924927e-05, 1.9371509552001953e-05, 2.039596438407898e-05, 2.1420419216156006e-05, 2.2444874048233032e-05, 2.346932888031006e-05, 2.4493783712387085e-05, 2.551823854446411e-05, 2.6542693376541138e-05, 2.7567148208618164e-05, 2.859160304069519e-05, 2.9616057872772217e-05, 3.064051270484924e-05, 3.166496753692627e-05, 3.2689422369003296e-05, 3.371387720108032e-05, 3.473833203315735e-05, 3.5762786865234375e-05]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 7.0, 8.0, 2.0, 6.0, 8.0, 8.0, 7.0, 17.0, 16.0, 17.0, 17.0, 17.0, 37.0, 28.0, 26.0, 32.0, 45.0, 48.0, 31.0, 49.0, 53.0, 46.0, 56.0, 40.0, 43.0, 31.0, 39.0, 39.0, 37.0, 25.0, 20.0, 19.0, 21.0, 15.0, 10.0, 16.0, 9.0, 12.0, 10.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.8125, -28.884033203125, -27.95556640625, -27.027099609375, -26.0986328125, -25.170166015625, -24.24169921875, -23.313232421875, -22.384765625, -21.456298828125, -20.52783203125, -19.599365234375, -18.6708984375, -17.742431640625, -16.81396484375, -15.885498046875, -14.95703125, -14.028564453125, -13.10009765625, -12.171630859375, -11.2431640625, -10.314697265625, -9.38623046875, -8.457763671875, -7.529296875, -6.600830078125, -5.67236328125, -4.743896484375, -3.8154296875, -2.886962890625, -1.95849609375, -1.030029296875, -0.1015625, 0.826904296875, 1.75537109375, 2.683837890625, 3.6123046875, 4.540771484375, 5.46923828125, 6.397705078125, 7.326171875, 8.254638671875, 9.18310546875, 10.111572265625, 11.0400390625, 11.968505859375, 12.89697265625, 13.825439453125, 14.75390625, 15.682373046875, 16.61083984375, 17.539306640625, 18.4677734375, 19.396240234375, 20.32470703125, 21.253173828125, 22.181640625, 23.110107421875, 24.03857421875, 24.967041015625, 25.8955078125, 26.823974609375, 27.75244140625, 28.680908203125, 29.609375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 8.0, 5.0, 7.0, 5.0, 6.0, 13.0, 4.0, 24.0, 26.0, 54.0, 48.0, 72.0, 150.0, 209.0, 320.0, 601.0, 1219.0, 2893.0, 7169.0, 19518.0, 61442.0, 233590.0, 521074.0, 138318.0, 39132.0, 13295.0, 4998.0, 2088.0, 997.0, 490.0, 246.0, 153.0, 112.0, 82.0, 53.0, 22.0, 28.0, 19.0, 16.0, 11.0, 10.0, 8.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.484375, -14.0361328125, -13.587890625, -13.1396484375, -12.69140625, -12.2431640625, -11.794921875, -11.3466796875, -10.8984375, -10.4501953125, -10.001953125, -9.5537109375, -9.10546875, -8.6572265625, -8.208984375, -7.7607421875, -7.3125, -6.8642578125, -6.416015625, -5.9677734375, -5.51953125, -5.0712890625, -4.623046875, -4.1748046875, -3.7265625, -3.2783203125, -2.830078125, -2.3818359375, -1.93359375, -1.4853515625, -1.037109375, -0.5888671875, -0.140625, 0.3076171875, 0.755859375, 1.2041015625, 1.65234375, 2.1005859375, 2.548828125, 2.9970703125, 3.4453125, 3.8935546875, 4.341796875, 4.7900390625, 5.23828125, 5.6865234375, 6.134765625, 6.5830078125, 7.03125, 7.4794921875, 7.927734375, 8.3759765625, 8.82421875, 9.2724609375, 9.720703125, 10.1689453125, 10.6171875, 11.0654296875, 11.513671875, 11.9619140625, 12.41015625, 12.8583984375, 13.306640625, 13.7548828125, 14.203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 1.0, 6.0, 7.0, 2.0, 12.0, 7.0, 17.0, 11.0, 21.0, 12.0, 21.0, 28.0, 25.0, 34.0, 26.0, 32.0, 23.0, 31.0, 34.0, 35.0, 36.0, 45.0, 1838.0, 268.0, 46.0, 41.0, 40.0, 31.0, 30.0, 24.0, 23.0, 33.0, 37.0, 21.0, 21.0, 16.0, 21.0, 17.0, 14.0, 10.0, 11.0, 9.0, 6.0, 4.0, 4.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-96.1875, -93.263671875, -90.33984375, -87.416015625, -84.4921875, -81.568359375, -78.64453125, -75.720703125, -72.796875, -69.873046875, -66.94921875, -64.025390625, -61.1015625, -58.177734375, -55.25390625, -52.330078125, -49.40625, -46.482421875, -43.55859375, -40.634765625, -37.7109375, -34.787109375, -31.86328125, -28.939453125, -26.015625, -23.091796875, -20.16796875, -17.244140625, -14.3203125, -11.396484375, -8.47265625, -5.548828125, -2.625, 0.298828125, 3.22265625, 6.146484375, 9.0703125, 11.994140625, 14.91796875, 17.841796875, 20.765625, 23.689453125, 26.61328125, 29.537109375, 32.4609375, 35.384765625, 38.30859375, 41.232421875, 44.15625, 47.080078125, 50.00390625, 52.927734375, 55.8515625, 58.775390625, 61.69921875, 64.623046875, 67.546875, 70.470703125, 73.39453125, 76.318359375, 79.2421875, 82.166015625, 85.08984375, 88.013671875, 90.9375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 9.0, 7.0, 9.0, 11.0, 14.0, 18.0, 24.0, 17.0, 31.0, 33.0, 55.0, 63.0, 71.0, 104.0, 156.0, 220.0, 350.0, 539.0, 1268.0, 236537.0, 2902640.0, 1612.0, 622.0, 343.0, 244.0, 173.0, 113.0, 85.0, 60.0, 51.0, 37.0, 37.0, 26.0, 11.0, 26.0, 11.0, 14.0, 10.0, 12.0, 3.0, 5.0, 7.0, 1.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-142.5, -137.916015625, -133.33203125, -128.748046875, -124.1640625, -119.580078125, -114.99609375, -110.412109375, -105.828125, -101.244140625, -96.66015625, -92.076171875, -87.4921875, -82.908203125, -78.32421875, -73.740234375, -69.15625, -64.572265625, -59.98828125, -55.404296875, -50.8203125, -46.236328125, -41.65234375, -37.068359375, -32.484375, -27.900390625, -23.31640625, -18.732421875, -14.1484375, -9.564453125, -4.98046875, -0.396484375, 4.1875, 8.771484375, 13.35546875, 17.939453125, 22.5234375, 27.107421875, 31.69140625, 36.275390625, 40.859375, 45.443359375, 50.02734375, 54.611328125, 59.1953125, 63.779296875, 68.36328125, 72.947265625, 77.53125, 82.115234375, 86.69921875, 91.283203125, 95.8671875, 100.451171875, 105.03515625, 109.619140625, 114.203125, 118.787109375, 123.37109375, 127.955078125, 132.5390625, 137.123046875, 141.70703125, 146.291015625, 150.875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [76.0, 942.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.193641662597656, -7.141706466674805, 18.910228729248047, 44.96216583251953, 71.01409912109375, 97.06603240966797, 123.11797332763672, 149.16989135742188, 175.22183227539062, 201.27377319335938, 227.32569885253906, 253.3776397705078, 279.4295654296875, 305.48150634765625, 331.533447265625, 357.58538818359375, 383.6373291015625, 409.68927001953125, 435.7412109375, 461.79315185546875, 487.8450622558594, 513.89697265625, 539.948974609375, 566.0008544921875, 592.0527954101562, 618.104736328125, 644.1566772460938, 670.2086181640625, 696.2605590820312, 722.3125, 748.3643798828125, 774.4163208007812, 800.4683227539062, 826.520263671875, 852.5722045898438, 878.6241455078125, 904.6760864257812, 930.72802734375, 956.7799072265625, 982.8318481445312, 1008.8837890625, 1034.9356689453125, 1060.9876708984375, 1087.03955078125, 1113.091552734375, 1139.1434326171875, 1165.1954345703125, 1191.247314453125, 1217.29931640625, 1243.3511962890625, 1269.4031982421875, 1295.455078125, 1321.507080078125, 1347.5589599609375, 1373.6109619140625, 1399.662841796875, 1425.7147216796875, 1451.7666015625, 1477.818603515625, 1503.8704833984375, 1529.9224853515625, 1555.974365234375, 1582.0263671875, 1608.0782470703125, 1634.1302490234375]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 5.0, 2.0, 4.0, 8.0, 18.0, 12.0, 17.0, 19.0, 27.0, 15.0, 26.0, 22.0, 32.0, 38.0, 40.0, 49.0, 42.0, 43.0, 52.0, 51.0, 49.0, 43.0, 44.0, 42.0, 41.0, 33.0, 28.0, 34.0, 30.0, 27.0, 21.0, 16.0, 13.0, 15.0, 12.0, 4.0, 6.0, 3.0, 1.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-358.9853820800781, -348.2940673828125, -337.6027526855469, -326.91143798828125, -316.22015380859375, -305.5288391113281, -294.8375244140625, -284.1462097167969, -273.45489501953125, -262.7635803222656, -252.072265625, -241.38096618652344, -230.6896514892578, -219.9983367919922, -209.30703735351562, -198.61572265625, -187.92440795898438, -177.23309326171875, -166.54177856445312, -155.85047912597656, -145.15916442871094, -134.4678497314453, -123.77654266357422, -113.08523559570312, -102.3939208984375, -91.70260620117188, -81.01129913330078, -70.31999206542969, -59.62867736816406, -48.9373664855957, -38.246055603027344, -27.55474853515625, -16.8634033203125, -6.172092437744141, 4.519218444824219, 15.210529327392578, 25.901840209960938, 36.5931510925293, 47.284461975097656, 57.97576904296875, 68.66708374023438, 79.3583984375, 90.0497055053711, 100.74101257324219, 111.43232727050781, 122.12364196777344, 132.81494140625, 143.50625610351562, 154.19757080078125, 164.88888549804688, 175.5802001953125, 186.27149963378906, 196.9628143310547, 207.6541290283203, 218.34542846679688, 229.0367431640625, 239.72805786132812, 250.41937255859375, 261.1106872558594, 271.802001953125, 282.4932861328125, 293.1846008300781, 303.87591552734375, 314.5672302246094, 325.258544921875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 8.0, 6.0, 6.0, 3.0, 8.0, 9.0, 7.0, 9.0, 24.0, 17.0, 15.0, 22.0, 25.0, 29.0, 27.0, 37.0, 30.0, 47.0, 47.0, 41.0, 56.0, 48.0, 48.0, 43.0, 37.0, 41.0, 36.0, 39.0, 36.0, 28.0, 24.0, 19.0, 21.0, 14.0, 10.0, 20.0, 8.0, 12.0, 10.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.234375, -29.301025390625, -28.36767578125, -27.434326171875, -26.5009765625, -25.567626953125, -24.63427734375, -23.700927734375, -22.767578125, -21.834228515625, -20.90087890625, -19.967529296875, -19.0341796875, -18.100830078125, -17.16748046875, -16.234130859375, -15.30078125, -14.367431640625, -13.43408203125, -12.500732421875, -11.5673828125, -10.634033203125, -9.70068359375, -8.767333984375, -7.833984375, -6.900634765625, -5.96728515625, -5.033935546875, -4.1005859375, -3.167236328125, -2.23388671875, -1.300537109375, -0.3671875, 0.566162109375, 1.49951171875, 2.432861328125, 3.3662109375, 4.299560546875, 5.23291015625, 6.166259765625, 7.099609375, 8.032958984375, 8.96630859375, 9.899658203125, 10.8330078125, 11.766357421875, 12.69970703125, 13.633056640625, 14.56640625, 15.499755859375, 16.43310546875, 17.366455078125, 18.2998046875, 19.233154296875, 20.16650390625, 21.099853515625, 22.033203125, 22.966552734375, 23.89990234375, 24.833251953125, 25.7666015625, 26.699951171875, 27.63330078125, 28.566650390625, 29.5]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 9.0, 28.0, 19.0, 15.0, 39.0, 46.0, 47.0, 120.0, 136.0, 208.0, 254.0, 366.0, 562.0, 749.0, 1145.0, 1589.0, 2461.0, 3772.0, 6385.0, 11756.0, 47462.0, 1301391.0, 2692568.0, 89722.0, 14079.0, 7329.0, 4138.0, 2616.0, 1663.0, 1159.0, 738.0, 518.0, 347.0, 231.0, 195.0, 117.0, 73.0, 56.0, 45.0, 23.0, 37.0, 23.0, 11.0, 9.0, 7.0, 2.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-86.5, -83.8857421875, -81.271484375, -78.6572265625, -76.04296875, -73.4287109375, -70.814453125, -68.2001953125, -65.5859375, -62.9716796875, -60.357421875, -57.7431640625, -55.12890625, -52.5146484375, -49.900390625, -47.2861328125, -44.671875, -42.0576171875, -39.443359375, -36.8291015625, -34.21484375, -31.6005859375, -28.986328125, -26.3720703125, -23.7578125, -21.1435546875, -18.529296875, -15.9150390625, -13.30078125, -10.6865234375, -8.072265625, -5.4580078125, -2.84375, -0.2294921875, 2.384765625, 4.9990234375, 7.61328125, 10.2275390625, 12.841796875, 15.4560546875, 18.0703125, 20.6845703125, 23.298828125, 25.9130859375, 28.52734375, 31.1416015625, 33.755859375, 36.3701171875, 38.984375, 41.5986328125, 44.212890625, 46.8271484375, 49.44140625, 52.0556640625, 54.669921875, 57.2841796875, 59.8984375, 62.5126953125, 65.126953125, 67.7412109375, 70.35546875, 72.9697265625, 75.583984375, 78.1982421875, 80.8125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 8.0, 5.0, 4.0, 5.0, 7.0, 2.0, 13.0, 11.0, 11.0, 21.0, 23.0, 31.0, 48.0, 104.0, 271.0, 765.0, 1419.0, 716.0, 277.0, 104.0, 54.0, 36.0, 14.0, 17.0, 21.0, 12.0, 12.0, 6.0, 11.0, 7.0, 6.0, 2.0, 4.0, 4.0, 4.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-73.375, -70.703125, -68.03125, -65.359375, -62.6875, -60.015625, -57.34375, -54.671875, -52.0, -49.328125, -46.65625, -43.984375, -41.3125, -38.640625, -35.96875, -33.296875, -30.625, -27.953125, -25.28125, -22.609375, -19.9375, -17.265625, -14.59375, -11.921875, -9.25, -6.578125, -3.90625, -1.234375, 1.4375, 4.109375, 6.78125, 9.453125, 12.125, 14.796875, 17.46875, 20.140625, 22.8125, 25.484375, 28.15625, 30.828125, 33.5, 36.171875, 38.84375, 41.515625, 44.1875, 46.859375, 49.53125, 52.203125, 54.875, 57.546875, 60.21875, 62.890625, 65.5625, 68.234375, 70.90625, 73.578125, 76.25, 78.921875, 81.59375, 84.265625, 86.9375, 89.609375, 92.28125, 94.953125, 97.625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 7.0, 10.0, 14.0, 23.0, 22.0, 46.0, 59.0, 79.0, 112.0, 121.0, 197.0, 246.0, 355.0, 534.0, 720.0, 1056.0, 1547.0, 2160.0, 3371.0, 5029.0, 8105.0, 13622.0, 24832.0, 60940.0, 587089.0, 3261498.0, 137941.0, 36598.0, 18092.0, 10334.0, 6497.0, 4177.0, 2674.0, 1883.0, 1251.0, 875.0, 621.0, 389.0, 342.0, 232.0, 164.0, 112.0, 81.0, 56.0, 48.0, 29.0, 19.0, 23.0, 15.0, 17.0, 3.0, 5.0, 2.0, 7.0, 1.0], "bins": [-108.5, -105.33203125, -102.1640625, -98.99609375, -95.828125, -92.66015625, -89.4921875, -86.32421875, -83.15625, -79.98828125, -76.8203125, -73.65234375, -70.484375, -67.31640625, -64.1484375, -60.98046875, -57.8125, -54.64453125, -51.4765625, -48.30859375, -45.140625, -41.97265625, -38.8046875, -35.63671875, -32.46875, -29.30078125, -26.1328125, -22.96484375, -19.796875, -16.62890625, -13.4609375, -10.29296875, -7.125, -3.95703125, -0.7890625, 2.37890625, 5.546875, 8.71484375, 11.8828125, 15.05078125, 18.21875, 21.38671875, 24.5546875, 27.72265625, 30.890625, 34.05859375, 37.2265625, 40.39453125, 43.5625, 46.73046875, 49.8984375, 53.06640625, 56.234375, 59.40234375, 62.5703125, 65.73828125, 68.90625, 72.07421875, 75.2421875, 78.41015625, 81.578125, 84.74609375, 87.9140625, 91.08203125, 94.25]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 12.0, 16.0, 17.0, 19.0, 22.0, 46.0, 45.0, 68.0, 127.0, 158.0, 142.0, 90.0, 54.0, 42.0, 32.0, 25.0, 17.0, 14.0, 12.0, 5.0, 8.0, 7.0, 3.0, 5.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-400.8241271972656, -389.8207702636719, -378.8174133300781, -367.8140563964844, -356.8106689453125, -345.80731201171875, -334.803955078125, -323.80059814453125, -312.7972412109375, -301.79388427734375, -290.79052734375, -279.78717041015625, -268.7838134765625, -257.7804260253906, -246.77706909179688, -235.77371215820312, -224.77035522460938, -213.76699829101562, -202.76364135742188, -191.76026916503906, -180.7569122314453, -169.75355529785156, -158.75018310546875, -147.746826171875, -136.74346923828125, -125.7401123046875, -114.73674774169922, -103.73338317871094, -92.73002624511719, -81.72666931152344, -70.72330474853516, -59.719940185546875, -48.71661376953125, -37.713253021240234, -26.70989227294922, -15.706531524658203, -4.7031707763671875, 6.300189971923828, 17.303550720214844, 28.306915283203125, 39.310272216796875, 50.31363296508789, 61.316993713378906, 72.32035827636719, 83.32371520996094, 94.32707214355469, 105.33043670654297, 116.33380126953125, 127.337158203125, 138.34051513671875, 149.3438720703125, 160.3472442626953, 171.35060119628906, 182.3539581298828, 193.35733032226562, 204.36068725585938, 215.36404418945312, 226.36740112304688, 237.37075805664062, 248.37413024902344, 259.37750244140625, 270.380859375, 281.38421630859375, 292.3875732421875, 303.39093017578125]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 7.0, 6.0, 8.0, 9.0, 14.0, 18.0, 17.0, 11.0, 20.0, 28.0, 23.0, 29.0, 24.0, 38.0, 40.0, 29.0, 31.0, 28.0, 42.0, 33.0, 29.0, 45.0, 35.0, 32.0, 42.0, 39.0, 36.0, 26.0, 39.0, 33.0, 23.0, 21.0, 24.0, 22.0, 19.0, 15.0, 16.0, 9.0, 9.0, 8.0, 3.0, 1.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-207.72976684570312, -201.13792419433594, -194.54608154296875, -187.95423889160156, -181.36239624023438, -174.7705535888672, -168.1787109375, -161.5868682861328, -154.99502563476562, -148.40318298339844, -141.81134033203125, -135.21949768066406, -128.62765502929688, -122.03581237792969, -115.4439697265625, -108.85212707519531, -102.2602767944336, -95.6684341430664, -89.07659149169922, -82.48474884033203, -75.89290618896484, -69.30105590820312, -62.7092170715332, -56.117374420166016, -49.52553176879883, -42.93368911743164, -36.34184646606445, -29.750001907348633, -23.158159255981445, -16.566314697265625, -9.974472045898438, -3.38262939453125, 3.2092132568359375, 9.801055908203125, 16.392898559570312, 22.984743118286133, 29.57658576965332, 36.16843032836914, 42.76027297973633, 49.352115631103516, 55.9439582824707, 62.53580093383789, 69.12764739990234, 75.71949005126953, 82.31133270263672, 88.9031753540039, 95.4950180053711, 102.08686065673828, 108.67870330810547, 115.27054595947266, 121.86238861083984, 128.45423889160156, 135.04608154296875, 141.63792419433594, 148.22976684570312, 154.8216094970703, 161.4134521484375, 168.0052947998047, 174.59713745117188, 181.18898010253906, 187.78082275390625, 194.37266540527344, 200.96450805664062, 207.5563507080078, 214.148193359375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 3.0, 7.0, 6.0, 16.0, 14.0, 11.0, 21.0, 22.0, 18.0, 37.0, 30.0, 31.0, 26.0, 44.0, 33.0, 46.0, 45.0, 55.0, 44.0, 45.0, 56.0, 47.0, 39.0, 27.0, 36.0, 30.0, 24.0, 21.0, 26.0, 20.0, 17.0, 19.0, 14.0, 19.0, 7.0, 6.0, 7.0, 3.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.34375, -31.3427734375, -30.341796875, -29.3408203125, -28.33984375, -27.3388671875, -26.337890625, -25.3369140625, -24.3359375, -23.3349609375, -22.333984375, -21.3330078125, -20.33203125, -19.3310546875, -18.330078125, -17.3291015625, -16.328125, -15.3271484375, -14.326171875, -13.3251953125, -12.32421875, -11.3232421875, -10.322265625, -9.3212890625, -8.3203125, -7.3193359375, -6.318359375, -5.3173828125, -4.31640625, -3.3154296875, -2.314453125, -1.3134765625, -0.3125, 0.6884765625, 1.689453125, 2.6904296875, 3.69140625, 4.6923828125, 5.693359375, 6.6943359375, 7.6953125, 8.6962890625, 9.697265625, 10.6982421875, 11.69921875, 12.7001953125, 13.701171875, 14.7021484375, 15.703125, 16.7041015625, 17.705078125, 18.7060546875, 19.70703125, 20.7080078125, 21.708984375, 22.7099609375, 23.7109375, 24.7119140625, 25.712890625, 26.7138671875, 27.71484375, 28.7158203125, 29.716796875, 30.7177734375, 31.71875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 8.0, 7.0, 11.0, 16.0, 23.0, 33.0, 43.0, 62.0, 104.0, 141.0, 212.0, 308.0, 459.0, 616.0, 931.0, 1400.0, 2054.0, 3134.0, 4696.0, 7305.0, 11316.0, 17631.0, 27969.0, 45875.0, 80778.0, 178821.0, 368343.0, 127352.0, 64303.0, 38112.0, 23528.0, 14804.0, 9639.0, 6245.0, 4065.0, 2661.0, 1844.0, 1176.0, 792.0, 561.0, 366.0, 252.0, 181.0, 121.0, 84.0, 50.0, 42.0, 28.0, 26.0, 15.0, 8.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.30859375, -1.268096923828125, -1.22760009765625, -1.187103271484375, -1.1466064453125, -1.106109619140625, -1.06561279296875, -1.025115966796875, -0.984619140625, -0.944122314453125, -0.90362548828125, -0.863128662109375, -0.8226318359375, -0.782135009765625, -0.74163818359375, -0.701141357421875, -0.66064453125, -0.620147705078125, -0.57965087890625, -0.539154052734375, -0.4986572265625, -0.458160400390625, -0.41766357421875, -0.377166748046875, -0.336669921875, -0.296173095703125, -0.25567626953125, -0.215179443359375, -0.1746826171875, -0.134185791015625, -0.09368896484375, -0.053192138671875, -0.0126953125, 0.027801513671875, 0.06829833984375, 0.108795166015625, 0.1492919921875, 0.189788818359375, 0.23028564453125, 0.270782470703125, 0.311279296875, 0.351776123046875, 0.39227294921875, 0.432769775390625, 0.4732666015625, 0.513763427734375, 0.55426025390625, 0.594757080078125, 0.63525390625, 0.675750732421875, 0.71624755859375, 0.756744384765625, 0.7972412109375, 0.837738037109375, 0.87823486328125, 0.918731689453125, 0.959228515625, 0.999725341796875, 1.04022216796875, 1.080718994140625, 1.1212158203125, 1.161712646484375, 1.20220947265625, 1.242706298828125, 1.283203125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 5.0, 10.0, 10.0, 6.0, 13.0, 14.0, 17.0, 16.0, 20.0, 23.0, 35.0, 31.0, 27.0, 33.0, 39.0, 28.0, 51.0, 36.0, 45.0, 1078.0, 34.0, 36.0, 37.0, 36.0, 47.0, 30.0, 21.0, 37.0, 33.0, 36.0, 30.0, 15.0, 17.0, 16.0, 14.0, 14.0, 10.0, 5.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.265625, -18.656494140625, -18.04736328125, -17.438232421875, -16.8291015625, -16.219970703125, -15.61083984375, -15.001708984375, -14.392578125, -13.783447265625, -13.17431640625, -12.565185546875, -11.9560546875, -11.346923828125, -10.73779296875, -10.128662109375, -9.51953125, -8.910400390625, -8.30126953125, -7.692138671875, -7.0830078125, -6.473876953125, -5.86474609375, -5.255615234375, -4.646484375, -4.037353515625, -3.42822265625, -2.819091796875, -2.2099609375, -1.600830078125, -0.99169921875, -0.382568359375, 0.2265625, 0.835693359375, 1.44482421875, 2.053955078125, 2.6630859375, 3.272216796875, 3.88134765625, 4.490478515625, 5.099609375, 5.708740234375, 6.31787109375, 6.927001953125, 7.5361328125, 8.145263671875, 8.75439453125, 9.363525390625, 9.97265625, 10.581787109375, 11.19091796875, 11.800048828125, 12.4091796875, 13.018310546875, 13.62744140625, 14.236572265625, 14.845703125, 15.454833984375, 16.06396484375, 16.673095703125, 17.2822265625, 17.891357421875, 18.50048828125, 19.109619140625, 19.71875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 9.0, 18.0, 21.0, 22.0, 38.0, 59.0, 69.0, 99.0, 129.0, 226.0, 287.0, 415.0, 637.0, 871.0, 1268.0, 1781.0, 2649.0, 4008.0, 6070.0, 9069.0, 13835.0, 21918.0, 33673.0, 53117.0, 88479.0, 165108.0, 1363647.0, 128420.0, 72911.0, 45197.0, 28448.0, 18455.0, 11882.0, 7921.0, 5292.0, 3551.0, 2336.0, 1593.0, 1039.0, 756.0, 543.0, 368.0, 259.0, 188.0, 132.0, 86.0, 61.0, 52.0, 30.0, 21.0, 20.0, 16.0, 11.0, 4.0, 3.0, 4.0, 3.0, 4.0], "bins": [-0.806640625, -0.7816848754882812, -0.7567291259765625, -0.7317733764648438, -0.706817626953125, -0.6818618774414062, -0.6569061279296875, -0.6319503784179688, -0.60699462890625, -0.5820388793945312, -0.5570831298828125, -0.5321273803710938, -0.507171630859375, -0.48221588134765625, -0.4572601318359375, -0.43230438232421875, -0.4073486328125, -0.38239288330078125, -0.3574371337890625, -0.33248138427734375, -0.307525634765625, -0.28256988525390625, -0.2576141357421875, -0.23265838623046875, -0.20770263671875, -0.18274688720703125, -0.1577911376953125, -0.13283538818359375, -0.107879638671875, -0.08292388916015625, -0.0579681396484375, -0.03301239013671875, -0.008056640625, 0.01689910888671875, 0.0418548583984375, 0.06681060791015625, 0.091766357421875, 0.11672210693359375, 0.1416778564453125, 0.16663360595703125, 0.19158935546875, 0.21654510498046875, 0.2415008544921875, 0.26645660400390625, 0.291412353515625, 0.31636810302734375, 0.3413238525390625, 0.36627960205078125, 0.3912353515625, 0.41619110107421875, 0.4411468505859375, 0.46610260009765625, 0.491058349609375, 0.5160140991210938, 0.5409698486328125, 0.5659255981445312, 0.59088134765625, 0.6158370971679688, 0.6407928466796875, 0.6657485961914062, 0.690704345703125, 0.7156600952148438, 0.7406158447265625, 0.7655715942382812, 0.79052734375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 7.0, 3.0, 5.0, 4.0, 7.0, 10.0, 13.0, 14.0, 20.0, 17.0, 25.0, 22.0, 40.0, 30.0, 51.0, 47.0, 44.0, 76.0, 106.0, 76.0, 55.0, 39.0, 51.0, 39.0, 27.0, 26.0, 25.0, 21.0, 13.0, 24.0, 13.0, 12.0, 7.0, 11.0, 5.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.639957427978516e-05, -6.408244371414185e-05, -6.176531314849854e-05, -5.9448182582855225e-05, -5.7131052017211914e-05, -5.4813921451568604e-05, -5.249679088592529e-05, -5.017966032028198e-05, -4.786252975463867e-05, -4.554539918899536e-05, -4.322826862335205e-05, -4.091113805770874e-05, -3.859400749206543e-05, -3.627687692642212e-05, -3.395974636077881e-05, -3.16426157951355e-05, -2.9325485229492188e-05, -2.7008354663848877e-05, -2.4691224098205566e-05, -2.2374093532562256e-05, -2.0056962966918945e-05, -1.7739832401275635e-05, -1.5422701835632324e-05, -1.3105571269989014e-05, -1.0788440704345703e-05, -8.471310138702393e-06, -6.154179573059082e-06, -3.8370490074157715e-06, -1.519918441772461e-06, 7.972121238708496e-07, 3.11434268951416e-06, 5.431473255157471e-06, 7.748603820800781e-06, 1.0065734386444092e-05, 1.2382864952087402e-05, 1.4699995517730713e-05, 1.7017126083374023e-05, 1.9334256649017334e-05, 2.1651387214660645e-05, 2.3968517780303955e-05, 2.6285648345947266e-05, 2.8602778911590576e-05, 3.091990947723389e-05, 3.32370400428772e-05, 3.555417060852051e-05, 3.787130117416382e-05, 4.018843173980713e-05, 4.250556230545044e-05, 4.482269287109375e-05, 4.713982343673706e-05, 4.945695400238037e-05, 5.177408456802368e-05, 5.409121513366699e-05, 5.64083456993103e-05, 5.872547626495361e-05, 6.104260683059692e-05, 6.335973739624023e-05, 6.567686796188354e-05, 6.799399852752686e-05, 7.031112909317017e-05, 7.262825965881348e-05, 7.494539022445679e-05, 7.72625207901001e-05, 7.957965135574341e-05, 8.189678192138672e-05]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 6.0, 6.0, 9.0, 13.0, 13.0, 18.0, 17.0, 29.0, 40.0, 44.0, 69.0, 102.0, 144.0, 256.0, 680.0, 4878.0, 90499.0, 917280.0, 31007.0, 2309.0, 441.0, 229.0, 117.0, 102.0, 56.0, 45.0, 33.0, 27.0, 21.0, 19.0, 5.0, 9.0, 6.0, 3.0, 3.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0012569427490234375, -0.0012213736772537231, -0.0011858046054840088, -0.0011502355337142944, -0.00111466646194458, -0.0010790973901748657, -0.0010435283184051514, -0.001007959246635437, -0.0009723901748657227, -0.0009368211030960083, -0.0009012520313262939, -0.0008656829595565796, -0.0008301138877868652, -0.0007945448160171509, -0.0007589757442474365, -0.0007234066724777222, -0.0006878376007080078, -0.0006522685289382935, -0.0006166994571685791, -0.0005811303853988647, -0.0005455613136291504, -0.000509992241859436, -0.0004744231700897217, -0.0004388540983200073, -0.00040328502655029297, -0.0003677159547805786, -0.00033214688301086426, -0.0002965778112411499, -0.00026100873947143555, -0.0002254396677017212, -0.00018987059593200684, -0.00015430152416229248, -0.00011873245239257812, -8.316338062286377e-05, -4.7594308853149414e-05, -1.2025237083435059e-05, 2.3543834686279297e-05, 5.911290645599365e-05, 9.468197822570801e-05, 0.00013025104999542236, 0.00016582012176513672, 0.00020138919353485107, 0.00023695826530456543, 0.0002725273370742798, 0.00030809640884399414, 0.0003436654806137085, 0.00037923455238342285, 0.0004148036241531372, 0.00045037269592285156, 0.0004859417676925659, 0.0005215108394622803, 0.0005570799112319946, 0.000592648983001709, 0.0006282180547714233, 0.0006637871265411377, 0.000699356198310852, 0.0007349252700805664, 0.0007704943418502808, 0.0008060634136199951, 0.0008416324853897095, 0.0008772015571594238, 0.0009127706289291382, 0.0009483397006988525, 0.000983908772468567, 0.0010194778442382812]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 16.0, 30.0, 69.0, 179.0, 463.0, 137.0, 52.0, 26.0, 14.0, 12.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002196619170717895, -0.00021538787405006588, -0.00021111383102834225, -0.0002068397734547034, -0.00020256573043297976, -0.00019829168741125613, -0.0001940176443895325, -0.00018974358681589365, -0.00018546954379417002, -0.0001811955007724464, -0.00017692145775072277, -0.0001726474001770839, -0.00016837335715536028, -0.00016409931413363665, -0.00015982527111191303, -0.00015555121353827417, -0.00015127717051655054, -0.0001470031274948269, -0.00014272908447310328, -0.00013845502689946443, -0.0001341809838777408, -0.00012990694085601717, -0.00012563289783429354, -0.0001213588475366123, -0.00011708481179084629, -0.00011281076876912266, -0.00010853671847144142, -0.00010426267544971779, -9.998862515203655e-05, -9.571458213031292e-05, -9.144053910858929e-05, -8.716648881090805e-05, -8.289243851322681e-05, -7.861839549150318e-05, -7.434434519382194e-05, -7.007030217209831e-05, -6.579625187441707e-05, -6.152220885269344e-05, -5.7248162192991003e-05, -5.297411553328857e-05, -4.8700065235607326e-05, -4.442601857590489e-05, -4.0151971916202456e-05, -3.587792889447883e-05, -3.1603878596797585e-05, -2.7329833756084554e-05, -2.3055788915371522e-05, -1.8781742255669087e-05, -1.4507695595966652e-05, -1.0233648936264217e-05, -5.9596031860564835e-06, -1.6855574358487502e-06, 2.588489223853685e-06, 6.86253588355612e-06, 1.1136580724269152e-05, 1.5410627383971587e-05, 1.9684674043674022e-05, 2.3958720703376457e-05, 2.8232767363078892e-05, 3.250681038480252e-05, 3.678086068248376e-05, 4.105490370420739e-05, 4.5328950363909826e-05, 4.960299702361226e-05, 5.3877043683314696e-05]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 8.0, 4.0, 7.0, 6.0, 9.0, 10.0, 9.0, 11.0, 13.0, 17.0, 22.0, 24.0, 23.0, 28.0, 41.0, 30.0, 23.0, 31.0, 49.0, 56.0, 41.0, 42.0, 35.0, 41.0, 42.0, 41.0, 40.0, 33.0, 35.0, 31.0, 28.0, 31.0, 30.0, 15.0, 21.0, 12.0, 13.0, 7.0, 9.0, 4.0, 4.0, 8.0, 3.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6776065826416016e-05, -3.563147038221359e-05, -3.448687493801117e-05, -3.3342279493808746e-05, -3.219768404960632e-05, -3.10530886054039e-05, -2.9908493161201477e-05, -2.8763897716999054e-05, -2.761930227279663e-05, -2.6474706828594208e-05, -2.5330111384391785e-05, -2.418551594018936e-05, -2.304092049598694e-05, -2.1896325051784515e-05, -2.0751729607582092e-05, -1.960713416337967e-05, -1.8462538719177246e-05, -1.7317943274974823e-05, -1.61733478307724e-05, -1.5028752386569977e-05, -1.3884156942367554e-05, -1.273956149816513e-05, -1.1594966053962708e-05, -1.0450370609760284e-05, -9.305775165557861e-06, -8.161179721355438e-06, -7.016584277153015e-06, -5.871988832950592e-06, -4.727393388748169e-06, -3.582797944545746e-06, -2.4382025003433228e-06, -1.2936070561408997e-06, -1.4901161193847656e-07, 9.955838322639465e-07, 2.1401792764663696e-06, 3.2847747206687927e-06, 4.429370164871216e-06, 5.573965609073639e-06, 6.718561053276062e-06, 7.863156497478485e-06, 9.007751941680908e-06, 1.0152347385883331e-05, 1.1296942830085754e-05, 1.2441538274288177e-05, 1.35861337184906e-05, 1.4730729162693024e-05, 1.5875324606895447e-05, 1.701992005109787e-05, 1.8164515495300293e-05, 1.9309110939502716e-05, 2.045370638370514e-05, 2.1598301827907562e-05, 2.2742897272109985e-05, 2.388749271631241e-05, 2.503208816051483e-05, 2.6176683604717255e-05, 2.7321279048919678e-05, 2.84658744931221e-05, 2.9610469937324524e-05, 3.075506538152695e-05, 3.189966082572937e-05, 3.304425626993179e-05, 3.4188851714134216e-05, 3.533344715833664e-05, 3.647804260253906e-05]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 3.0, 7.0, 6.0, 16.0, 14.0, 11.0, 21.0, 22.0, 18.0, 37.0, 30.0, 31.0, 26.0, 44.0, 33.0, 46.0, 45.0, 55.0, 44.0, 45.0, 56.0, 47.0, 39.0, 27.0, 36.0, 30.0, 24.0, 21.0, 26.0, 20.0, 17.0, 19.0, 14.0, 19.0, 7.0, 6.0, 7.0, 3.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.34375, -31.3427734375, -30.341796875, -29.3408203125, -28.33984375, -27.3388671875, -26.337890625, -25.3369140625, -24.3359375, -23.3349609375, -22.333984375, -21.3330078125, -20.33203125, -19.3310546875, -18.330078125, -17.3291015625, -16.328125, -15.3271484375, -14.326171875, -13.3251953125, -12.32421875, -11.3232421875, -10.322265625, -9.3212890625, -8.3203125, -7.3193359375, -6.318359375, -5.3173828125, -4.31640625, -3.3154296875, -2.314453125, -1.3134765625, -0.3125, 0.6884765625, 1.689453125, 2.6904296875, 3.69140625, 4.6923828125, 5.693359375, 6.6943359375, 7.6953125, 8.6962890625, 9.697265625, 10.6982421875, 11.69921875, 12.7001953125, 13.701171875, 14.7021484375, 15.703125, 16.7041015625, 17.705078125, 18.7060546875, 19.70703125, 20.7080078125, 21.708984375, 22.7099609375, 23.7109375, 24.7119140625, 25.712890625, 26.7138671875, 27.71484375, 28.7158203125, 29.716796875, 30.7177734375, 31.71875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 4.0, 11.0, 11.0, 16.0, 21.0, 30.0, 32.0, 58.0, 76.0, 98.0, 144.0, 177.0, 260.0, 393.0, 559.0, 734.0, 1167.0, 1823.0, 2537.0, 4038.0, 6256.0, 10960.0, 55285.0, 887552.0, 47528.0, 10643.0, 6159.0, 3860.0, 2545.0, 1740.0, 1209.0, 795.0, 539.0, 397.0, 232.0, 182.0, 157.0, 85.0, 72.0, 44.0, 34.0, 25.0, 16.0, 11.0, 15.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-68.375, -66.26953125, -64.1640625, -62.05859375, -59.953125, -57.84765625, -55.7421875, -53.63671875, -51.53125, -49.42578125, -47.3203125, -45.21484375, -43.109375, -41.00390625, -38.8984375, -36.79296875, -34.6875, -32.58203125, -30.4765625, -28.37109375, -26.265625, -24.16015625, -22.0546875, -19.94921875, -17.84375, -15.73828125, -13.6328125, -11.52734375, -9.421875, -7.31640625, -5.2109375, -3.10546875, -1.0, 1.10546875, 3.2109375, 5.31640625, 7.421875, 9.52734375, 11.6328125, 13.73828125, 15.84375, 17.94921875, 20.0546875, 22.16015625, 24.265625, 26.37109375, 28.4765625, 30.58203125, 32.6875, 34.79296875, 36.8984375, 39.00390625, 41.109375, 43.21484375, 45.3203125, 47.42578125, 49.53125, 51.63671875, 53.7421875, 55.84765625, 57.953125, 60.05859375, 62.1640625, 64.26953125, 66.375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 11.0, 11.0, 8.0, 8.0, 15.0, 22.0, 28.0, 22.0, 28.0, 27.0, 37.0, 29.0, 37.0, 43.0, 58.0, 68.0, 369.0, 1706.0, 69.0, 51.0, 49.0, 51.0, 49.0, 46.0, 34.0, 30.0, 21.0, 35.0, 16.0, 10.0, 10.0, 12.0, 10.0, 7.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.5, -101.740234375, -97.98046875, -94.220703125, -90.4609375, -86.701171875, -82.94140625, -79.181640625, -75.421875, -71.662109375, -67.90234375, -64.142578125, -60.3828125, -56.623046875, -52.86328125, -49.103515625, -45.34375, -41.583984375, -37.82421875, -34.064453125, -30.3046875, -26.544921875, -22.78515625, -19.025390625, -15.265625, -11.505859375, -7.74609375, -3.986328125, -0.2265625, 3.533203125, 7.29296875, 11.052734375, 14.8125, 18.572265625, 22.33203125, 26.091796875, 29.8515625, 33.611328125, 37.37109375, 41.130859375, 44.890625, 48.650390625, 52.41015625, 56.169921875, 59.9296875, 63.689453125, 67.44921875, 71.208984375, 74.96875, 78.728515625, 82.48828125, 86.248046875, 90.0078125, 93.767578125, 97.52734375, 101.287109375, 105.046875, 108.806640625, 112.56640625, 116.326171875, 120.0859375, 123.845703125, 127.60546875, 131.365234375, 135.125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 3.0, 5.0, 7.0, 16.0, 26.0, 21.0, 30.0, 52.0, 62.0, 119.0, 214.0, 434.0, 909.0, 2096.0, 5813.0, 23368.0, 3028451.0, 67631.0, 10565.0, 3283.0, 1280.0, 604.0, 256.0, 161.0, 92.0, 43.0, 45.0, 27.0, 20.0, 17.0, 14.0, 13.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-261.75, -254.625, -247.5, -240.375, -233.25, -226.125, -219.0, -211.875, -204.75, -197.625, -190.5, -183.375, -176.25, -169.125, -162.0, -154.875, -147.75, -140.625, -133.5, -126.375, -119.25, -112.125, -105.0, -97.875, -90.75, -83.625, -76.5, -69.375, -62.25, -55.125, -48.0, -40.875, -33.75, -26.625, -19.5, -12.375, -5.25, 1.875, 9.0, 16.125, 23.25, 30.375, 37.5, 44.625, 51.75, 58.875, 66.0, 73.125, 80.25, 87.375, 94.5, 101.625, 108.75, 115.875, 123.0, 130.125, 137.25, 144.375, 151.5, 158.625, 165.75, 172.875, 180.0, 187.125, 194.25]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 28.0, 71.0, 176.0, 419.0, 189.0, 67.0, 31.0, 15.0, 4.0, 3.0, 0.0, 1.0], "bins": [-999.427734375, -981.4186401367188, -963.4096069335938, -945.4005126953125, -927.3914794921875, -909.3823852539062, -891.373291015625, -873.3642578125, -855.3551635742188, -837.3460693359375, -819.3370361328125, -801.3279418945312, -783.31884765625, -765.309814453125, -747.3007202148438, -729.2916870117188, -711.2825927734375, -693.2734985351562, -675.2644653320312, -657.25537109375, -639.246337890625, -621.2372436523438, -603.2281494140625, -585.2191162109375, -567.2100219726562, -549.200927734375, -531.19189453125, -513.1828002929688, -495.1737365722656, -477.1646728515625, -459.15557861328125, -441.1465148925781, -423.13751220703125, -405.1284484863281, -387.119384765625, -369.11029052734375, -351.1012268066406, -333.0921630859375, -315.08306884765625, -297.0740051269531, -279.06494140625, -261.0558776855469, -243.0467987060547, -225.0377197265625, -207.02865600585938, -189.01959228515625, -171.01051330566406, -153.00143432617188, -134.99237060546875, -116.9832992553711, -98.97422790527344, -80.96515655517578, -62.956085205078125, -44.94701385498047, -26.937942504882812, -8.928871154785156, 9.0802001953125, 27.089271545410156, 45.09834289550781, 63.10741424560547, 81.11648559570312, 99.12555694580078, 117.13462829589844, 135.14370727539062, 153.15277099609375]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 3.0, 6.0, 6.0, 13.0, 8.0, 9.0, 7.0, 21.0, 19.0, 25.0, 19.0, 20.0, 31.0, 37.0, 40.0, 33.0, 39.0, 46.0, 44.0, 44.0, 38.0, 50.0, 33.0, 52.0, 42.0, 37.0, 48.0, 34.0, 29.0, 22.0, 25.0, 26.0, 23.0, 16.0, 12.0, 7.0, 12.0, 2.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-340.4291687011719, -329.4747009277344, -318.5202331542969, -307.5657653808594, -296.6112976074219, -285.6568298339844, -274.70233154296875, -263.74786376953125, -252.7934112548828, -241.8389434814453, -230.8844757080078, -219.92999267578125, -208.97552490234375, -198.02105712890625, -187.06658935546875, -176.11212158203125, -165.15765380859375, -154.20318603515625, -143.24871826171875, -132.29425048828125, -121.33977508544922, -110.38530731201172, -99.43083190917969, -88.47636413574219, -77.52189636230469, -66.56742858886719, -55.61295700073242, -44.658485412597656, -33.704017639160156, -22.749549865722656, -11.795074462890625, -0.840606689453125, 10.1138916015625, 21.068361282348633, 32.022830963134766, 42.97730255126953, 53.93177032470703, 64.88623809814453, 75.84071350097656, 86.79518127441406, 97.74964904785156, 108.70411682128906, 119.65858459472656, 130.61306762695312, 141.56753540039062, 152.52200317382812, 163.47647094726562, 174.43093872070312, 185.38540649414062, 196.33987426757812, 207.29434204101562, 218.24880981445312, 229.20327758789062, 240.15774536132812, 251.1122283935547, 262.06671142578125, 273.02117919921875, 283.97564697265625, 294.93011474609375, 305.88458251953125, 316.83905029296875, 327.79351806640625, 338.74798583984375, 349.70245361328125, 360.65692138671875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 4.0, 8.0, 7.0, 12.0, 12.0, 16.0, 19.0, 30.0, 27.0, 23.0, 30.0, 38.0, 34.0, 42.0, 38.0, 50.0, 42.0, 52.0, 40.0, 53.0, 49.0, 38.0, 50.0, 34.0, 39.0, 17.0, 23.0, 21.0, 24.0, 20.0, 19.0, 15.0, 22.0, 10.0, 8.0, 5.0, 5.0, 4.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.3125, -34.271484375, -33.23046875, -32.189453125, -31.1484375, -30.107421875, -29.06640625, -28.025390625, -26.984375, -25.943359375, -24.90234375, -23.861328125, -22.8203125, -21.779296875, -20.73828125, -19.697265625, -18.65625, -17.615234375, -16.57421875, -15.533203125, -14.4921875, -13.451171875, -12.41015625, -11.369140625, -10.328125, -9.287109375, -8.24609375, -7.205078125, -6.1640625, -5.123046875, -4.08203125, -3.041015625, -2.0, -0.958984375, 0.08203125, 1.123046875, 2.1640625, 3.205078125, 4.24609375, 5.287109375, 6.328125, 7.369140625, 8.41015625, 9.451171875, 10.4921875, 11.533203125, 12.57421875, 13.615234375, 14.65625, 15.697265625, 16.73828125, 17.779296875, 18.8203125, 19.861328125, 20.90234375, 21.943359375, 22.984375, 24.025390625, 25.06640625, 26.107421875, 27.1484375, 28.189453125, 29.23046875, 30.271484375, 31.3125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 10.0, 13.0, 10.0, 24.0, 23.0, 28.0, 37.0, 51.0, 64.0, 94.0, 142.0, 182.0, 272.0, 321.0, 446.0, 625.0, 969.0, 1393.0, 2062.0, 3301.0, 5230.0, 9683.0, 23608.0, 378711.0, 3491683.0, 230455.0, 21845.0, 8895.0, 4883.0, 2946.0, 1980.0, 1316.0, 861.0, 594.0, 460.0, 307.0, 221.0, 147.0, 107.0, 75.0, 67.0, 44.0, 23.0, 23.0, 17.0, 9.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-93.1875, -90.3994140625, -87.611328125, -84.8232421875, -82.03515625, -79.2470703125, -76.458984375, -73.6708984375, -70.8828125, -68.0947265625, -65.306640625, -62.5185546875, -59.73046875, -56.9423828125, -54.154296875, -51.3662109375, -48.578125, -45.7900390625, -43.001953125, -40.2138671875, -37.42578125, -34.6376953125, -31.849609375, -29.0615234375, -26.2734375, -23.4853515625, -20.697265625, -17.9091796875, -15.12109375, -12.3330078125, -9.544921875, -6.7568359375, -3.96875, -1.1806640625, 1.607421875, 4.3955078125, 7.18359375, 9.9716796875, 12.759765625, 15.5478515625, 18.3359375, 21.1240234375, 23.912109375, 26.7001953125, 29.48828125, 32.2763671875, 35.064453125, 37.8525390625, 40.640625, 43.4287109375, 46.216796875, 49.0048828125, 51.79296875, 54.5810546875, 57.369140625, 60.1572265625, 62.9453125, 65.7333984375, 68.521484375, 71.3095703125, 74.09765625, 76.8857421875, 79.673828125, 82.4619140625, 85.25]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 11.0, 13.0, 10.0, 9.0, 14.0, 13.0, 22.0, 19.0, 30.0, 37.0, 74.0, 188.0, 564.0, 1414.0, 1013.0, 307.0, 121.0, 57.0, 30.0, 28.0, 16.0, 14.0, 20.0, 10.0, 12.0, 6.0, 4.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-90.8125, -87.416015625, -84.01953125, -80.623046875, -77.2265625, -73.830078125, -70.43359375, -67.037109375, -63.640625, -60.244140625, -56.84765625, -53.451171875, -50.0546875, -46.658203125, -43.26171875, -39.865234375, -36.46875, -33.072265625, -29.67578125, -26.279296875, -22.8828125, -19.486328125, -16.08984375, -12.693359375, -9.296875, -5.900390625, -2.50390625, 0.892578125, 4.2890625, 7.685546875, 11.08203125, 14.478515625, 17.875, 21.271484375, 24.66796875, 28.064453125, 31.4609375, 34.857421875, 38.25390625, 41.650390625, 45.046875, 48.443359375, 51.83984375, 55.236328125, 58.6328125, 62.029296875, 65.42578125, 68.822265625, 72.21875, 75.615234375, 79.01171875, 82.408203125, 85.8046875, 89.201171875, 92.59765625, 95.994140625, 99.390625, 102.787109375, 106.18359375, 109.580078125, 112.9765625, 116.373046875, 119.76953125, 123.166015625, 126.5625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 14.0, 8.0, 20.0, 38.0, 31.0, 62.0, 87.0, 121.0, 125.0, 195.0, 331.0, 460.0, 829.0, 1399.0, 2331.0, 3939.0, 7496.0, 14220.0, 29498.0, 88803.0, 2807933.0, 1113668.0, 68605.0, 25639.0, 12539.0, 6622.0, 3784.0, 2072.0, 1170.0, 771.0, 445.0, 324.0, 220.0, 133.0, 102.0, 63.0, 40.0, 34.0, 26.0, 19.0, 11.0, 8.0, 13.0, 9.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-141.875, -137.69140625, -133.5078125, -129.32421875, -125.140625, -120.95703125, -116.7734375, -112.58984375, -108.40625, -104.22265625, -100.0390625, -95.85546875, -91.671875, -87.48828125, -83.3046875, -79.12109375, -74.9375, -70.75390625, -66.5703125, -62.38671875, -58.203125, -54.01953125, -49.8359375, -45.65234375, -41.46875, -37.28515625, -33.1015625, -28.91796875, -24.734375, -20.55078125, -16.3671875, -12.18359375, -8.0, -3.81640625, 0.3671875, 4.55078125, 8.734375, 12.91796875, 17.1015625, 21.28515625, 25.46875, 29.65234375, 33.8359375, 38.01953125, 42.203125, 46.38671875, 50.5703125, 54.75390625, 58.9375, 63.12109375, 67.3046875, 71.48828125, 75.671875, 79.85546875, 84.0390625, 88.22265625, 92.40625, 96.58984375, 100.7734375, 104.95703125, 109.140625, 113.32421875, 117.5078125, 121.69140625, 125.875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 17.0, 18.0, 9.0, 19.0, 34.0, 45.0, 57.0, 80.0, 147.0, 156.0, 137.0, 71.0, 48.0, 39.0, 26.0, 23.0, 17.0, 16.0, 8.0, 6.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-380.4411315917969, -368.7041015625, -356.9670715332031, -345.23004150390625, -333.4930114746094, -321.7559814453125, -310.01898193359375, -298.2819519042969, -286.544921875, -274.8078918457031, -263.07086181640625, -251.33383178710938, -239.59681701660156, -227.8597869873047, -216.1227569580078, -204.3857421875, -192.64869689941406, -180.9116668701172, -169.1746368408203, -157.4376220703125, -145.70059204101562, -133.96356201171875, -122.22653198242188, -110.48950958251953, -98.75247955322266, -87.01544952392578, -75.27842712402344, -63.54139709472656, -51.80437088012695, -40.067344665527344, -28.33031463623047, -16.593292236328125, -4.85626220703125, 6.880764961242676, 18.6177921295166, 30.354820251464844, 42.09184646606445, 53.82887268066406, 65.56590270996094, 77.30292510986328, 89.03995513916016, 100.77698516845703, 112.51400756835938, 124.25103759765625, 135.98806762695312, 147.72509765625, 159.46212768554688, 171.1991424560547, 182.93617248535156, 194.67320251464844, 206.4102325439453, 218.14724731445312, 229.88427734375, 241.62130737304688, 253.35833740234375, 265.0953674316406, 276.8323974609375, 288.5694274902344, 300.30645751953125, 312.0434875488281, 323.780517578125, 335.51751708984375, 347.25457763671875, 358.9915771484375, 370.7286071777344]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 8.0, 7.0, 6.0, 4.0, 7.0, 6.0, 12.0, 14.0, 6.0, 6.0, 17.0, 21.0, 33.0, 18.0, 29.0, 34.0, 30.0, 35.0, 33.0, 44.0, 36.0, 44.0, 39.0, 39.0, 36.0, 25.0, 34.0, 41.0, 40.0, 30.0, 30.0, 20.0, 27.0, 30.0, 29.0, 20.0, 17.0, 12.0, 24.0, 16.0, 12.0, 5.0, 5.0, 4.0, 5.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-212.4288330078125, -205.9185028076172, -199.40818786621094, -192.89785766601562, -186.38754272460938, -179.87721252441406, -173.3668975830078, -166.8565673828125, -160.34625244140625, -153.83592224121094, -147.3256072998047, -140.81527709960938, -134.30496215820312, -127.79463195800781, -121.28431701660156, -114.77398681640625, -108.26366424560547, -101.75334167480469, -95.2430191040039, -88.73269653320312, -82.22237396240234, -75.71205139160156, -69.20172119140625, -62.691402435302734, -56.18107986450195, -49.67075729370117, -43.16043472290039, -36.650108337402344, -30.139787673950195, -23.62946319580078, -17.119140625, -10.608818054199219, -4.0984954833984375, 2.411827564239502, 8.922150611877441, 15.432474136352539, 21.94279670715332, 28.453121185302734, 34.963443756103516, 41.4737663269043, 47.98408889770508, 54.49441146850586, 61.00473403930664, 67.51506042480469, 74.02538299560547, 80.53570556640625, 87.04602813720703, 93.55635070800781, 100.0666732788086, 106.57699584960938, 113.08731842041016, 119.59764099121094, 126.10796356201172, 132.6182861328125, 139.1286163330078, 145.63893127441406, 152.14926147460938, 158.6595916748047, 165.16990661621094, 171.68023681640625, 178.1905517578125, 184.7008819580078, 191.21119689941406, 197.72152709960938, 204.23184204101562]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 6.0, 11.0, 6.0, 11.0, 11.0, 12.0, 18.0, 23.0, 23.0, 29.0, 26.0, 29.0, 47.0, 35.0, 56.0, 46.0, 42.0, 46.0, 38.0, 44.0, 45.0, 50.0, 47.0, 34.0, 38.0, 25.0, 27.0, 20.0, 15.0, 19.0, 22.0, 17.0, 15.0, 13.0, 9.0, 8.0, 14.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.5625, -32.52197265625, -31.4814453125, -30.44091796875, -29.400390625, -28.35986328125, -27.3193359375, -26.27880859375, -25.23828125, -24.19775390625, -23.1572265625, -22.11669921875, -21.076171875, -20.03564453125, -18.9951171875, -17.95458984375, -16.9140625, -15.87353515625, -14.8330078125, -13.79248046875, -12.751953125, -11.71142578125, -10.6708984375, -9.63037109375, -8.58984375, -7.54931640625, -6.5087890625, -5.46826171875, -4.427734375, -3.38720703125, -2.3466796875, -1.30615234375, -0.265625, 0.77490234375, 1.8154296875, 2.85595703125, 3.896484375, 4.93701171875, 5.9775390625, 7.01806640625, 8.05859375, 9.09912109375, 10.1396484375, 11.18017578125, 12.220703125, 13.26123046875, 14.3017578125, 15.34228515625, 16.3828125, 17.42333984375, 18.4638671875, 19.50439453125, 20.544921875, 21.58544921875, 22.6259765625, 23.66650390625, 24.70703125, 25.74755859375, 26.7880859375, 27.82861328125, 28.869140625, 29.90966796875, 30.9501953125, 31.99072265625, 33.03125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 3.0, 9.0, 7.0, 24.0, 31.0, 33.0, 65.0, 82.0, 123.0, 187.0, 312.0, 486.0, 774.0, 1244.0, 2078.0, 3324.0, 5575.0, 9060.0, 14827.0, 25486.0, 45473.0, 87587.0, 201654.0, 374209.0, 129194.0, 62659.0, 33896.0, 19778.0, 11998.0, 7098.0, 4307.0, 2589.0, 1613.0, 998.0, 658.0, 384.0, 264.0, 171.0, 106.0, 62.0, 40.0, 35.0, 16.0, 16.0, 6.0, 2.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.59375, -1.544342041015625, -1.49493408203125, -1.445526123046875, -1.3961181640625, -1.346710205078125, -1.29730224609375, -1.247894287109375, -1.198486328125, -1.149078369140625, -1.09967041015625, -1.050262451171875, -1.0008544921875, -0.951446533203125, -0.90203857421875, -0.852630615234375, -0.80322265625, -0.753814697265625, -0.70440673828125, -0.654998779296875, -0.6055908203125, -0.556182861328125, -0.50677490234375, -0.457366943359375, -0.407958984375, -0.358551025390625, -0.30914306640625, -0.259735107421875, -0.2103271484375, -0.160919189453125, -0.11151123046875, -0.062103271484375, -0.0126953125, 0.036712646484375, 0.08612060546875, 0.135528564453125, 0.1849365234375, 0.234344482421875, 0.28375244140625, 0.333160400390625, 0.382568359375, 0.431976318359375, 0.48138427734375, 0.530792236328125, 0.5802001953125, 0.629608154296875, 0.67901611328125, 0.728424072265625, 0.77783203125, 0.827239990234375, 0.87664794921875, 0.926055908203125, 0.9754638671875, 1.024871826171875, 1.07427978515625, 1.123687744140625, 1.173095703125, 1.222503662109375, 1.27191162109375, 1.321319580078125, 1.3707275390625, 1.420135498046875, 1.46954345703125, 1.518951416015625, 1.568359375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 8.0, 4.0, 4.0, 10.0, 11.0, 8.0, 17.0, 17.0, 21.0, 20.0, 23.0, 26.0, 31.0, 35.0, 26.0, 29.0, 33.0, 34.0, 36.0, 46.0, 38.0, 1071.0, 49.0, 42.0, 36.0, 43.0, 32.0, 42.0, 31.0, 20.0, 27.0, 29.0, 19.0, 15.0, 17.0, 15.0, 15.0, 16.0, 8.0, 8.0, 4.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.453125, -19.815673828125, -19.17822265625, -18.540771484375, -17.9033203125, -17.265869140625, -16.62841796875, -15.990966796875, -15.353515625, -14.716064453125, -14.07861328125, -13.441162109375, -12.8037109375, -12.166259765625, -11.52880859375, -10.891357421875, -10.25390625, -9.616455078125, -8.97900390625, -8.341552734375, -7.7041015625, -7.066650390625, -6.42919921875, -5.791748046875, -5.154296875, -4.516845703125, -3.87939453125, -3.241943359375, -2.6044921875, -1.967041015625, -1.32958984375, -0.692138671875, -0.0546875, 0.582763671875, 1.22021484375, 1.857666015625, 2.4951171875, 3.132568359375, 3.77001953125, 4.407470703125, 5.044921875, 5.682373046875, 6.31982421875, 6.957275390625, 7.5947265625, 8.232177734375, 8.86962890625, 9.507080078125, 10.14453125, 10.781982421875, 11.41943359375, 12.056884765625, 12.6943359375, 13.331787109375, 13.96923828125, 14.606689453125, 15.244140625, 15.881591796875, 16.51904296875, 17.156494140625, 17.7939453125, 18.431396484375, 19.06884765625, 19.706298828125, 20.34375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 0.0, 2.0, 7.0, 8.0, 14.0, 16.0, 18.0, 29.0, 64.0, 80.0, 95.0, 158.0, 246.0, 352.0, 447.0, 735.0, 994.0, 1549.0, 2261.0, 3434.0, 5123.0, 7700.0, 11386.0, 17238.0, 26041.0, 40176.0, 64234.0, 107813.0, 1328818.0, 211430.0, 97753.0, 58760.0, 37388.0, 24443.0, 16047.0, 10533.0, 7097.0, 4743.0, 3214.0, 2214.0, 1412.0, 950.0, 679.0, 436.0, 308.0, 229.0, 140.0, 93.0, 73.0, 66.0, 28.0, 15.0, 17.0, 10.0, 10.0, 7.0, 1.0, 1.0, 2.0, 3.0, 3.0], "bins": [-0.83251953125, -0.8064346313476562, -0.7803497314453125, -0.7542648315429688, -0.728179931640625, -0.7020950317382812, -0.6760101318359375, -0.6499252319335938, -0.62384033203125, -0.5977554321289062, -0.5716705322265625, -0.5455856323242188, -0.519500732421875, -0.49341583251953125, -0.4673309326171875, -0.44124603271484375, -0.4151611328125, -0.38907623291015625, -0.3629913330078125, -0.33690643310546875, -0.310821533203125, -0.28473663330078125, -0.2586517333984375, -0.23256683349609375, -0.20648193359375, -0.18039703369140625, -0.1543121337890625, -0.12822723388671875, -0.102142333984375, -0.07605743408203125, -0.0499725341796875, -0.02388763427734375, 0.002197265625, 0.02828216552734375, 0.0543670654296875, 0.08045196533203125, 0.106536865234375, 0.13262176513671875, 0.1587066650390625, 0.18479156494140625, 0.21087646484375, 0.23696136474609375, 0.2630462646484375, 0.28913116455078125, 0.315216064453125, 0.34130096435546875, 0.3673858642578125, 0.39347076416015625, 0.4195556640625, 0.44564056396484375, 0.4717254638671875, 0.49781036376953125, 0.523895263671875, 0.5499801635742188, 0.5760650634765625, 0.6021499633789062, 0.62823486328125, 0.6543197631835938, 0.6804046630859375, 0.7064895629882812, 0.732574462890625, 0.7586593627929688, 0.7847442626953125, 0.8108291625976562, 0.8369140625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 2.0, 8.0, 10.0, 5.0, 15.0, 13.0, 12.0, 25.0, 23.0, 32.0, 40.0, 48.0, 95.0, 259.0, 121.0, 76.0, 58.0, 36.0, 28.0, 20.0, 24.0, 13.0, 7.0, 6.0, 3.0, 9.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.785724639892578e-05, -8.479133248329163e-05, -8.172541856765747e-05, -7.865950465202332e-05, -7.559359073638916e-05, -7.2527676820755e-05, -6.946176290512085e-05, -6.63958489894867e-05, -6.332993507385254e-05, -6.0264021158218384e-05, -5.719810724258423e-05, -5.413219332695007e-05, -5.106627941131592e-05, -4.800036549568176e-05, -4.493445158004761e-05, -4.186853766441345e-05, -3.88026237487793e-05, -3.573670983314514e-05, -3.2670795917510986e-05, -2.960488200187683e-05, -2.6538968086242676e-05, -2.347305417060852e-05, -2.0407140254974365e-05, -1.734122633934021e-05, -1.4275312423706055e-05, -1.12093985080719e-05, -8.143484592437744e-06, -5.077570676803589e-06, -2.0116567611694336e-06, 1.0542571544647217e-06, 4.120171070098877e-06, 7.186084985733032e-06, 1.0251998901367188e-05, 1.3317912817001343e-05, 1.6383826732635498e-05, 1.9449740648269653e-05, 2.251565456390381e-05, 2.5581568479537964e-05, 2.864748239517212e-05, 3.1713396310806274e-05, 3.477931022644043e-05, 3.7845224142074585e-05, 4.091113805770874e-05, 4.3977051973342896e-05, 4.704296588897705e-05, 5.0108879804611206e-05, 5.317479372024536e-05, 5.6240707635879517e-05, 5.930662155151367e-05, 6.237253546714783e-05, 6.543844938278198e-05, 6.850436329841614e-05, 7.157027721405029e-05, 7.463619112968445e-05, 7.77021050453186e-05, 8.076801896095276e-05, 8.383393287658691e-05, 8.689984679222107e-05, 8.996576070785522e-05, 9.303167462348938e-05, 9.609758853912354e-05, 9.916350245475769e-05, 0.00010222941637039185, 0.000105295330286026, 0.00010836124420166016]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 3.0, 6.0, 16.0, 16.0, 23.0, 35.0, 42.0, 86.0, 169.0, 480.0, 2346.0, 42574.0, 986611.0, 14237.0, 1254.0, 308.0, 110.0, 65.0, 44.0, 24.0, 23.0, 20.0, 10.0, 12.0, 6.0, 9.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016164779663085938, -0.0015707463026046753, -0.0015250146389007568, -0.0014792829751968384, -0.00143355131149292, -0.0013878196477890015, -0.001342087984085083, -0.0012963563203811646, -0.001250624656677246, -0.0012048929929733276, -0.0011591613292694092, -0.0011134296655654907, -0.0010676980018615723, -0.0010219663381576538, -0.0009762346744537354, -0.0009305030107498169, -0.0008847713470458984, -0.00083903968334198, -0.0007933080196380615, -0.0007475763559341431, -0.0007018446922302246, -0.0006561130285263062, -0.0006103813648223877, -0.0005646497011184692, -0.0005189180374145508, -0.0004731863737106323, -0.00042745471000671387, -0.0003817230463027954, -0.00033599138259887695, -0.0002902597188949585, -0.00024452805519104004, -0.00019879639148712158, -0.00015306472778320312, -0.00010733306407928467, -6.160140037536621e-05, -1.5869736671447754e-05, 2.9861927032470703e-05, 7.559359073638916e-05, 0.00012132525444030762, 0.00016705691814422607, 0.00021278858184814453, 0.000258520245552063, 0.00030425190925598145, 0.0003499835729598999, 0.00039571523666381836, 0.0004414469003677368, 0.0004871785640716553, 0.0005329102277755737, 0.0005786418914794922, 0.0006243735551834106, 0.0006701052188873291, 0.0007158368825912476, 0.000761568546295166, 0.0008073002099990845, 0.0008530318737030029, 0.0008987635374069214, 0.0009444952011108398, 0.0009902268648147583, 0.0010359585285186768, 0.0010816901922225952, 0.0011274218559265137, 0.0011731535196304321, 0.0012188851833343506, 0.001264616847038269, 0.0013103485107421875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 11.0, 11.0, 18.0, 42.0, 69.0, 141.0, 322.0, 201.0, 87.0, 47.0, 22.0, 15.0, 5.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.255185533314943e-05, -4.9569531256565824e-05, -4.6587207179982215e-05, -4.3604883103398606e-05, -4.0622559026815e-05, -3.764023495023139e-05, -3.465791087364778e-05, -3.167558679706417e-05, -2.869326272048056e-05, -2.5710938643896952e-05, -2.2728614567313343e-05, -1.9746290490729734e-05, -1.6763966414146125e-05, -1.3781642337562516e-05, -1.0799318260978907e-05, -7.816994184395298e-06, -4.834670107811689e-06, -1.8523460312280804e-06, 1.1299780453555286e-06, 4.112302121939138e-06, 7.0946261985227466e-06, 1.0076950275106356e-05, 1.3059274351689965e-05, 1.6041598428273574e-05, 1.9023922504857183e-05, 2.200624658144079e-05, 2.49885706580244e-05, 2.797089473460801e-05, 3.095321881119162e-05, 3.393554288777523e-05, 3.6917866964358836e-05, 3.9900191040942445e-05, 4.2882515117526054e-05, 4.586483919410966e-05, 4.884716327069327e-05, 5.182948734727688e-05, 5.481181142386049e-05, 5.77941355004441e-05, 6.077645957702771e-05, 6.375878001563251e-05, 6.674110773019493e-05, 6.972343544475734e-05, 7.270575588336214e-05, 7.568807632196695e-05, 7.867040403652936e-05, 8.165273175109178e-05, 8.463505218969658e-05, 8.761737262830138e-05, 9.05997003428638e-05, 9.358202805742621e-05, 9.656434849603102e-05, 9.954666893463582e-05, 0.00010252899664919823, 0.00010551132436376065, 0.00010849364480236545, 0.00011147596524097025, 0.00011445829295553267, 0.00011744062067009509, 0.00012042294110869989, 0.0001234052615473047, 0.0001263875892618671, 0.00012936991697642952, 0.0001323522301390767, 0.00013533455785363913, 0.00013831688556820154]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 6.0, 7.0, 14.0, 9.0, 17.0, 18.0, 21.0, 17.0, 21.0, 18.0, 29.0, 37.0, 26.0, 37.0, 31.0, 39.0, 38.0, 42.0, 31.0, 38.0, 39.0, 50.0, 52.0, 35.0, 36.0, 25.0, 34.0, 30.0, 23.0, 21.0, 35.0, 24.0, 15.0, 15.0, 12.0, 13.0, 6.0, 5.0, 7.0, 4.0, 3.0, 5.0, 6.0, 2.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.254413604736328e-05, -3.14861536026001e-05, -3.0428171157836914e-05, -2.937018871307373e-05, -2.8312206268310547e-05, -2.7254223823547363e-05, -2.619624137878418e-05, -2.5138258934020996e-05, -2.4080276489257812e-05, -2.302229404449463e-05, -2.1964311599731445e-05, -2.0906329154968262e-05, -1.9848346710205078e-05, -1.8790364265441895e-05, -1.773238182067871e-05, -1.6674399375915527e-05, -1.5616416931152344e-05, -1.455843448638916e-05, -1.3500452041625977e-05, -1.2442469596862793e-05, -1.138448715209961e-05, -1.0326504707336426e-05, -9.268522262573242e-06, -8.210539817810059e-06, -7.152557373046875e-06, -6.094574928283691e-06, -5.036592483520508e-06, -3.978610038757324e-06, -2.9206275939941406e-06, -1.862645149230957e-06, -8.046627044677734e-07, 2.5331974029541016e-07, 1.3113021850585938e-06, 2.3692846298217773e-06, 3.427267074584961e-06, 4.4852495193481445e-06, 5.543231964111328e-06, 6.601214408874512e-06, 7.659196853637695e-06, 8.717179298400879e-06, 9.775161743164062e-06, 1.0833144187927246e-05, 1.189112663269043e-05, 1.2949109077453613e-05, 1.4007091522216797e-05, 1.506507396697998e-05, 1.6123056411743164e-05, 1.7181038856506348e-05, 1.823902130126953e-05, 1.9297003746032715e-05, 2.03549861907959e-05, 2.1412968635559082e-05, 2.2470951080322266e-05, 2.352893352508545e-05, 2.4586915969848633e-05, 2.5644898414611816e-05, 2.6702880859375e-05, 2.7760863304138184e-05, 2.8818845748901367e-05, 2.987682819366455e-05, 3.0934810638427734e-05, 3.199279308319092e-05, 3.30507755279541e-05, 3.4108757972717285e-05, 3.516674041748047e-05]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 6.0, 11.0, 6.0, 11.0, 11.0, 12.0, 18.0, 23.0, 23.0, 29.0, 26.0, 29.0, 47.0, 35.0, 56.0, 46.0, 42.0, 46.0, 38.0, 44.0, 45.0, 50.0, 47.0, 34.0, 38.0, 25.0, 27.0, 20.0, 15.0, 19.0, 22.0, 17.0, 15.0, 13.0, 9.0, 8.0, 14.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.5625, -32.52197265625, -31.4814453125, -30.44091796875, -29.400390625, -28.35986328125, -27.3193359375, -26.27880859375, -25.23828125, -24.19775390625, -23.1572265625, -22.11669921875, -21.076171875, -20.03564453125, -18.9951171875, -17.95458984375, -16.9140625, -15.87353515625, -14.8330078125, -13.79248046875, -12.751953125, -11.71142578125, -10.6708984375, -9.63037109375, -8.58984375, -7.54931640625, -6.5087890625, -5.46826171875, -4.427734375, -3.38720703125, -2.3466796875, -1.30615234375, -0.265625, 0.77490234375, 1.8154296875, 2.85595703125, 3.896484375, 4.93701171875, 5.9775390625, 7.01806640625, 8.05859375, 9.09912109375, 10.1396484375, 11.18017578125, 12.220703125, 13.26123046875, 14.3017578125, 15.34228515625, 16.3828125, 17.42333984375, 18.4638671875, 19.50439453125, 20.544921875, 21.58544921875, 22.6259765625, 23.66650390625, 24.70703125, 25.74755859375, 26.7880859375, 27.82861328125, 28.869140625, 29.90966796875, 30.9501953125, 31.99072265625, 33.03125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 7.0, 4.0, 11.0, 10.0, 29.0, 29.0, 42.0, 54.0, 69.0, 91.0, 133.0, 146.0, 201.0, 303.0, 404.0, 554.0, 827.0, 1146.0, 1743.0, 2532.0, 4372.0, 11026.0, 178529.0, 810441.0, 20620.0, 5600.0, 3022.0, 1971.0, 1321.0, 922.0, 656.0, 487.0, 338.0, 245.0, 172.0, 109.0, 108.0, 67.0, 56.0, 48.0, 23.0, 25.0, 16.0, 13.0, 7.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-68.25, -66.12890625, -64.0078125, -61.88671875, -59.765625, -57.64453125, -55.5234375, -53.40234375, -51.28125, -49.16015625, -47.0390625, -44.91796875, -42.796875, -40.67578125, -38.5546875, -36.43359375, -34.3125, -32.19140625, -30.0703125, -27.94921875, -25.828125, -23.70703125, -21.5859375, -19.46484375, -17.34375, -15.22265625, -13.1015625, -10.98046875, -8.859375, -6.73828125, -4.6171875, -2.49609375, -0.375, 1.74609375, 3.8671875, 5.98828125, 8.109375, 10.23046875, 12.3515625, 14.47265625, 16.59375, 18.71484375, 20.8359375, 22.95703125, 25.078125, 27.19921875, 29.3203125, 31.44140625, 33.5625, 35.68359375, 37.8046875, 39.92578125, 42.046875, 44.16796875, 46.2890625, 48.41015625, 50.53125, 52.65234375, 54.7734375, 56.89453125, 59.015625, 61.13671875, 63.2578125, 65.37890625, 67.5]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 9.0, 8.0, 12.0, 15.0, 8.0, 30.0, 18.0, 31.0, 31.0, 49.0, 47.0, 45.0, 46.0, 56.0, 65.0, 104.0, 1792.0, 180.0, 102.0, 45.0, 52.0, 41.0, 37.0, 38.0, 27.0, 21.0, 17.0, 19.0, 21.0, 13.0, 12.0, 9.0, 8.0, 11.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-115.25, -111.5009765625, -107.751953125, -104.0029296875, -100.25390625, -96.5048828125, -92.755859375, -89.0068359375, -85.2578125, -81.5087890625, -77.759765625, -74.0107421875, -70.26171875, -66.5126953125, -62.763671875, -59.0146484375, -55.265625, -51.5166015625, -47.767578125, -44.0185546875, -40.26953125, -36.5205078125, -32.771484375, -29.0224609375, -25.2734375, -21.5244140625, -17.775390625, -14.0263671875, -10.27734375, -6.5283203125, -2.779296875, 0.9697265625, 4.71875, 8.4677734375, 12.216796875, 15.9658203125, 19.71484375, 23.4638671875, 27.212890625, 30.9619140625, 34.7109375, 38.4599609375, 42.208984375, 45.9580078125, 49.70703125, 53.4560546875, 57.205078125, 60.9541015625, 64.703125, 68.4521484375, 72.201171875, 75.9501953125, 79.69921875, 83.4482421875, 87.197265625, 90.9462890625, 94.6953125, 98.4443359375, 102.193359375, 105.9423828125, 109.69140625, 113.4404296875, 117.189453125, 120.9384765625, 124.6875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 7.0, 10.0, 6.0, 12.0, 9.0, 17.0, 30.0, 29.0, 25.0, 26.0, 65.0, 101.0, 159.0, 262.0, 549.0, 1244.0, 3366.0, 14152.0, 2894183.0, 217109.0, 9382.0, 2700.0, 1011.0, 465.0, 252.0, 150.0, 111.0, 73.0, 51.0, 31.0, 25.0, 16.0, 12.0, 13.0, 8.0, 12.0, 6.0, 9.0, 4.0, 4.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-225.25, -218.185546875, -211.12109375, -204.056640625, -196.9921875, -189.927734375, -182.86328125, -175.798828125, -168.734375, -161.669921875, -154.60546875, -147.541015625, -140.4765625, -133.412109375, -126.34765625, -119.283203125, -112.21875, -105.154296875, -98.08984375, -91.025390625, -83.9609375, -76.896484375, -69.83203125, -62.767578125, -55.703125, -48.638671875, -41.57421875, -34.509765625, -27.4453125, -20.380859375, -13.31640625, -6.251953125, 0.8125, 7.876953125, 14.94140625, 22.005859375, 29.0703125, 36.134765625, 43.19921875, 50.263671875, 57.328125, 64.392578125, 71.45703125, 78.521484375, 85.5859375, 92.650390625, 99.71484375, 106.779296875, 113.84375, 120.908203125, 127.97265625, 135.037109375, 142.1015625, 149.166015625, 156.23046875, 163.294921875, 170.359375, 177.423828125, 184.48828125, 191.552734375, 198.6171875, 205.681640625, 212.74609375, 219.810546875, 226.875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 8.0, 5.0, 12.0, 7.0, 17.0, 22.0, 24.0, 26.0, 41.0, 43.0, 82.0, 118.0, 131.0, 134.0, 86.0, 65.0, 40.0, 33.0, 17.0, 16.0, 11.0, 20.0, 10.0, 5.0, 6.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-167.5320281982422, -163.5190887451172, -159.5061492919922, -155.4932098388672, -151.4802703857422, -147.4673309326172, -143.4543914794922, -139.4414520263672, -135.4285125732422, -131.4155731201172, -127.40263366699219, -123.38969421386719, -119.37675476074219, -115.36381530761719, -111.35087585449219, -107.33793640136719, -103.32499694824219, -99.31205749511719, -95.29911804199219, -91.28617858886719, -87.27323913574219, -83.26029968261719, -79.24736022949219, -75.23442077636719, -71.22148132324219, -67.20854187011719, -63.19560241699219, -59.18266296386719, -55.16972351074219, -51.15678405761719, -47.14384460449219, -43.13090515136719, -39.11796569824219, -35.10502624511719, -31.092086791992188, -27.079147338867188, -23.066207885742188, -19.053268432617188, -15.040328979492188, -11.027389526367188, -7.0144500732421875, -3.0015106201171875, 1.0114288330078125, 5.0243682861328125, 9.037307739257812, 13.050247192382812, 17.063186645507812, 21.076126098632812, 25.089065551757812, 29.102005004882812, 33.11494445800781, 37.12788391113281, 41.14082336425781, 45.15376281738281, 49.16670227050781, 53.17964172363281, 57.19258117675781, 61.20552062988281, 65.21846008300781, 69.23139953613281, 73.24433898925781, 77.25727844238281, 81.27021789550781, 85.28315734863281, 89.29609680175781]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 8.0, 5.0, 16.0, 10.0, 12.0, 15.0, 17.0, 20.0, 24.0, 21.0, 26.0, 29.0, 30.0, 29.0, 35.0, 35.0, 43.0, 36.0, 47.0, 45.0, 39.0, 38.0, 49.0, 39.0, 27.0, 32.0, 28.0, 21.0, 23.0, 23.0, 30.0, 22.0, 14.0, 15.0, 19.0, 11.0, 9.0, 13.0, 11.0, 8.0, 5.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0], "bins": [-304.0479431152344, -295.5722351074219, -287.0965576171875, -278.620849609375, -270.1451721191406, -261.6694641113281, -253.1937713623047, -244.71807861328125, -236.24237060546875, -227.7666778564453, -219.29098510742188, -210.81527709960938, -202.33958435058594, -193.8638916015625, -185.38819885253906, -176.91250610351562, -168.4368133544922, -159.96112060546875, -151.4854278564453, -143.00973510742188, -134.53402709960938, -126.05833435058594, -117.5826416015625, -109.10694885253906, -100.6312484741211, -92.15555572509766, -83.67985534667969, -75.20416259765625, -66.72846984863281, -58.252769470214844, -49.777076721191406, -41.3013801574707, -32.82569885253906, -24.35000228881836, -15.874307632446289, -7.398612976074219, 1.0770835876464844, 9.552780151367188, 18.028472900390625, 26.504169464111328, 34.97986602783203, 43.455562591552734, 51.93125915527344, 60.406951904296875, 68.88264465332031, 77.35834503173828, 85.83403778076172, 94.30973815917969, 102.78543090820312, 111.26112365722656, 119.73682403564453, 128.2125244140625, 136.68821716308594, 145.16390991210938, 153.6396026611328, 162.11529541015625, 170.59100341796875, 179.0666961669922, 187.54238891601562, 196.01809692382812, 204.49378967285156, 212.969482421875, 221.44517517089844, 229.92086791992188, 238.3965606689453]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 1.0, 3.0, 5.0, 9.0, 11.0, 8.0, 12.0, 11.0, 22.0, 21.0, 22.0, 26.0, 27.0, 33.0, 39.0, 51.0, 37.0, 44.0, 47.0, 40.0, 38.0, 52.0, 28.0, 51.0, 43.0, 50.0, 37.0, 27.0, 18.0, 24.0, 21.0, 20.0, 21.0, 18.0, 18.0, 12.0, 10.0, 6.0, 13.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.59375, -31.590087890625, -30.58642578125, -29.582763671875, -28.5791015625, -27.575439453125, -26.57177734375, -25.568115234375, -24.564453125, -23.560791015625, -22.55712890625, -21.553466796875, -20.5498046875, -19.546142578125, -18.54248046875, -17.538818359375, -16.53515625, -15.531494140625, -14.52783203125, -13.524169921875, -12.5205078125, -11.516845703125, -10.51318359375, -9.509521484375, -8.505859375, -7.502197265625, -6.49853515625, -5.494873046875, -4.4912109375, -3.487548828125, -2.48388671875, -1.480224609375, -0.4765625, 0.527099609375, 1.53076171875, 2.534423828125, 3.5380859375, 4.541748046875, 5.54541015625, 6.549072265625, 7.552734375, 8.556396484375, 9.56005859375, 10.563720703125, 11.5673828125, 12.571044921875, 13.57470703125, 14.578369140625, 15.58203125, 16.585693359375, 17.58935546875, 18.593017578125, 19.5966796875, 20.600341796875, 21.60400390625, 22.607666015625, 23.611328125, 24.614990234375, 25.61865234375, 26.622314453125, 27.6259765625, 28.629638671875, 29.63330078125, 30.636962890625, 31.640625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 10.0, 7.0, 11.0, 9.0, 13.0, 17.0, 29.0, 37.0, 51.0, 51.0, 83.0, 129.0, 159.0, 198.0, 335.0, 413.0, 641.0, 938.0, 1372.0, 2115.0, 3341.0, 5629.0, 10336.0, 24293.0, 302462.0, 3475968.0, 310761.0, 28333.0, 10817.0, 5846.0, 3436.0, 2212.0, 1349.0, 908.0, 585.0, 412.0, 301.0, 175.0, 141.0, 114.0, 85.0, 44.0, 39.0, 25.0, 25.0, 8.0, 12.0, 6.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0], "bins": [-94.9375, -92.1865234375, -89.435546875, -86.6845703125, -83.93359375, -81.1826171875, -78.431640625, -75.6806640625, -72.9296875, -70.1787109375, -67.427734375, -64.6767578125, -61.92578125, -59.1748046875, -56.423828125, -53.6728515625, -50.921875, -48.1708984375, -45.419921875, -42.6689453125, -39.91796875, -37.1669921875, -34.416015625, -31.6650390625, -28.9140625, -26.1630859375, -23.412109375, -20.6611328125, -17.91015625, -15.1591796875, -12.408203125, -9.6572265625, -6.90625, -4.1552734375, -1.404296875, 1.3466796875, 4.09765625, 6.8486328125, 9.599609375, 12.3505859375, 15.1015625, 17.8525390625, 20.603515625, 23.3544921875, 26.10546875, 28.8564453125, 31.607421875, 34.3583984375, 37.109375, 39.8603515625, 42.611328125, 45.3623046875, 48.11328125, 50.8642578125, 53.615234375, 56.3662109375, 59.1171875, 61.8681640625, 64.619140625, 67.3701171875, 70.12109375, 72.8720703125, 75.623046875, 78.3740234375, 81.125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 11.0, 11.0, 8.0, 6.0, 9.0, 14.0, 20.0, 26.0, 29.0, 42.0, 80.0, 193.0, 600.0, 1555.0, 907.0, 269.0, 75.0, 52.0, 43.0, 22.0, 22.0, 13.0, 9.0, 11.0, 10.0, 5.0, 5.0, 8.0, 2.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.25, -95.7841796875, -92.318359375, -88.8525390625, -85.38671875, -81.9208984375, -78.455078125, -74.9892578125, -71.5234375, -68.0576171875, -64.591796875, -61.1259765625, -57.66015625, -54.1943359375, -50.728515625, -47.2626953125, -43.796875, -40.3310546875, -36.865234375, -33.3994140625, -29.93359375, -26.4677734375, -23.001953125, -19.5361328125, -16.0703125, -12.6044921875, -9.138671875, -5.6728515625, -2.20703125, 1.2587890625, 4.724609375, 8.1904296875, 11.65625, 15.1220703125, 18.587890625, 22.0537109375, 25.51953125, 28.9853515625, 32.451171875, 35.9169921875, 39.3828125, 42.8486328125, 46.314453125, 49.7802734375, 53.24609375, 56.7119140625, 60.177734375, 63.6435546875, 67.109375, 70.5751953125, 74.041015625, 77.5068359375, 80.97265625, 84.4384765625, 87.904296875, 91.3701171875, 94.8359375, 98.3017578125, 101.767578125, 105.2333984375, 108.69921875, 112.1650390625, 115.630859375, 119.0966796875, 122.5625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 9.0, 4.0, 11.0, 20.0, 25.0, 40.0, 100.0, 145.0, 316.0, 597.0, 1240.0, 2592.0, 5877.0, 14847.0, 48501.0, 2089864.0, 1956504.0, 47973.0, 14601.0, 5936.0, 2613.0, 1223.0, 598.0, 276.0, 158.0, 77.0, 52.0, 39.0, 18.0, 16.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-253.875, -246.822265625, -239.76953125, -232.716796875, -225.6640625, -218.611328125, -211.55859375, -204.505859375, -197.453125, -190.400390625, -183.34765625, -176.294921875, -169.2421875, -162.189453125, -155.13671875, -148.083984375, -141.03125, -133.978515625, -126.92578125, -119.873046875, -112.8203125, -105.767578125, -98.71484375, -91.662109375, -84.609375, -77.556640625, -70.50390625, -63.451171875, -56.3984375, -49.345703125, -42.29296875, -35.240234375, -28.1875, -21.134765625, -14.08203125, -7.029296875, 0.0234375, 7.076171875, 14.12890625, 21.181640625, 28.234375, 35.287109375, 42.33984375, 49.392578125, 56.4453125, 63.498046875, 70.55078125, 77.603515625, 84.65625, 91.708984375, 98.76171875, 105.814453125, 112.8671875, 119.919921875, 126.97265625, 134.025390625, 141.078125, 148.130859375, 155.18359375, 162.236328125, 169.2890625, 176.341796875, 183.39453125, 190.447265625, 197.5]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 15.0, 20.0, 29.0, 81.0, 130.0, 334.0, 203.0, 72.0, 45.0, 31.0, 16.0, 11.0, 9.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-627.7488403320312, -603.3330688476562, -578.9172973632812, -554.5015258789062, -530.0857543945312, -505.66998291015625, -481.25421142578125, -456.83843994140625, -432.42266845703125, -408.00689697265625, -383.59112548828125, -359.17535400390625, -334.75958251953125, -310.34381103515625, -285.92803955078125, -261.51226806640625, -237.09646606445312, -212.68069458007812, -188.26492309570312, -163.84915161132812, -139.43338012695312, -115.0176010131836, -90.60182189941406, -66.18605041503906, -41.77027893066406, -17.35450553894043, 7.061267852783203, 31.47704315185547, 55.89281463623047, 80.30858612060547, 104.724365234375, 129.14013671875, 153.555908203125, 177.9716796875, 202.387451171875, 226.80322265625, 251.218994140625, 275.634765625, 300.050537109375, 324.46630859375, 348.882080078125, 373.2978515625, 397.713623046875, 422.12939453125, 446.545166015625, 470.9609375, 495.376708984375, 519.79248046875, 544.208251953125, 568.6240234375, 593.039794921875, 617.45556640625, 641.871337890625, 666.287109375, 690.702880859375, 715.11865234375, 739.5344848632812, 763.9502563476562, 788.3660278320312, 812.7817993164062, 837.1975708007812, 861.6133422851562, 886.0291137695312, 910.4448852539062, 934.8606567382812]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 8.0, 11.0, 5.0, 16.0, 18.0, 21.0, 21.0, 20.0, 23.0, 35.0, 29.0, 39.0, 30.0, 34.0, 41.0, 47.0, 46.0, 46.0, 44.0, 50.0, 42.0, 50.0, 41.0, 48.0, 38.0, 31.0, 23.0, 24.0, 20.0, 20.0, 12.0, 10.0, 11.0, 15.0, 11.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-303.9730224609375, -296.0724792480469, -288.17193603515625, -280.2713623046875, -272.3708190917969, -264.47027587890625, -256.5697326660156, -248.669189453125, -240.7686309814453, -232.8680877685547, -224.967529296875, -217.06698608398438, -209.16644287109375, -201.26588439941406, -193.36534118652344, -185.46478271484375, -177.56423950195312, -169.6636962890625, -161.7631378173828, -153.8625946044922, -145.96205139160156, -138.06149291992188, -130.16094970703125, -122.2603988647461, -114.35986328125, -106.45931243896484, -98.55876922607422, -90.65821838378906, -82.7576675415039, -74.85711669921875, -66.95657348632812, -59.05602264404297, -51.15547180175781, -43.25492477416992, -35.354373931884766, -27.453826904296875, -19.55327796936035, -11.652729034423828, -3.7521820068359375, 4.148368835449219, 12.04891586303711, 19.949464797973633, 27.850013732910156, 35.75056076049805, 43.65110778808594, 51.551658630371094, 59.452205657958984, 67.35275268554688, 75.25330352783203, 83.15385437011719, 91.05439758300781, 98.95494842529297, 106.85549926757812, 114.75604248046875, 122.6565933227539, 130.55714416503906, 138.4576873779297, 146.3582305908203, 154.2587890625, 162.15933227539062, 170.05987548828125, 177.96043395996094, 185.86097717285156, 193.76153564453125, 201.66207885742188]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 7.0, 11.0, 12.0, 24.0, 18.0, 22.0, 24.0, 30.0, 28.0, 31.0, 27.0, 37.0, 44.0, 35.0, 37.0, 44.0, 44.0, 39.0, 41.0, 44.0, 37.0, 31.0, 44.0, 38.0, 27.0, 31.0, 20.0, 21.0, 18.0, 21.0, 21.0, 16.0, 8.0, 15.0, 14.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-34.59375, -33.603271484375, -32.61279296875, -31.622314453125, -30.6318359375, -29.641357421875, -28.65087890625, -27.660400390625, -26.669921875, -25.679443359375, -24.68896484375, -23.698486328125, -22.7080078125, -21.717529296875, -20.72705078125, -19.736572265625, -18.74609375, -17.755615234375, -16.76513671875, -15.774658203125, -14.7841796875, -13.793701171875, -12.80322265625, -11.812744140625, -10.822265625, -9.831787109375, -8.84130859375, -7.850830078125, -6.8603515625, -5.869873046875, -4.87939453125, -3.888916015625, -2.8984375, -1.907958984375, -0.91748046875, 0.072998046875, 1.0634765625, 2.053955078125, 3.04443359375, 4.034912109375, 5.025390625, 6.015869140625, 7.00634765625, 7.996826171875, 8.9873046875, 9.977783203125, 10.96826171875, 11.958740234375, 12.94921875, 13.939697265625, 14.93017578125, 15.920654296875, 16.9111328125, 17.901611328125, 18.89208984375, 19.882568359375, 20.873046875, 21.863525390625, 22.85400390625, 23.844482421875, 24.8349609375, 25.825439453125, 26.81591796875, 27.806396484375, 28.796875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 11.0, 6.0, 11.0, 21.0, 25.0, 44.0, 56.0, 96.0, 134.0, 181.0, 267.0, 406.0, 535.0, 833.0, 1192.0, 1823.0, 2644.0, 3991.0, 5833.0, 8598.0, 12997.0, 19816.0, 30328.0, 47649.0, 77383.0, 141894.0, 316392.0, 151471.0, 81068.0, 49724.0, 31287.0, 20510.0, 13679.0, 9121.0, 6013.0, 4024.0, 2671.0, 1836.0, 1223.0, 830.0, 612.0, 396.0, 286.0, 171.0, 152.0, 103.0, 78.0, 46.0, 27.0, 26.0, 25.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1474609375, -1.109893798828125, -1.07232666015625, -1.034759521484375, -0.9971923828125, -0.959625244140625, -0.92205810546875, -0.884490966796875, -0.846923828125, -0.809356689453125, -0.77178955078125, -0.734222412109375, -0.6966552734375, -0.659088134765625, -0.62152099609375, -0.583953857421875, -0.54638671875, -0.508819580078125, -0.47125244140625, -0.433685302734375, -0.3961181640625, -0.358551025390625, -0.32098388671875, -0.283416748046875, -0.245849609375, -0.208282470703125, -0.17071533203125, -0.133148193359375, -0.0955810546875, -0.058013916015625, -0.02044677734375, 0.017120361328125, 0.0546875, 0.092254638671875, 0.12982177734375, 0.167388916015625, 0.2049560546875, 0.242523193359375, 0.28009033203125, 0.317657470703125, 0.355224609375, 0.392791748046875, 0.43035888671875, 0.467926025390625, 0.5054931640625, 0.543060302734375, 0.58062744140625, 0.618194580078125, 0.65576171875, 0.693328857421875, 0.73089599609375, 0.768463134765625, 0.8060302734375, 0.843597412109375, 0.88116455078125, 0.918731689453125, 0.956298828125, 0.993865966796875, 1.03143310546875, 1.069000244140625, 1.1065673828125, 1.144134521484375, 1.18170166015625, 1.219268798828125, 1.2568359375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 8.0, 5.0, 8.0, 5.0, 8.0, 8.0, 21.0, 11.0, 19.0, 17.0, 20.0, 17.0, 28.0, 18.0, 28.0, 23.0, 39.0, 28.0, 44.0, 47.0, 42.0, 32.0, 1061.0, 29.0, 43.0, 45.0, 34.0, 27.0, 37.0, 34.0, 36.0, 21.0, 22.0, 32.0, 22.0, 9.0, 8.0, 22.0, 4.0, 13.0, 9.0, 10.0, 6.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.703125, -18.10986328125, -17.5166015625, -16.92333984375, -16.330078125, -15.73681640625, -15.1435546875, -14.55029296875, -13.95703125, -13.36376953125, -12.7705078125, -12.17724609375, -11.583984375, -10.99072265625, -10.3974609375, -9.80419921875, -9.2109375, -8.61767578125, -8.0244140625, -7.43115234375, -6.837890625, -6.24462890625, -5.6513671875, -5.05810546875, -4.46484375, -3.87158203125, -3.2783203125, -2.68505859375, -2.091796875, -1.49853515625, -0.9052734375, -0.31201171875, 0.28125, 0.87451171875, 1.4677734375, 2.06103515625, 2.654296875, 3.24755859375, 3.8408203125, 4.43408203125, 5.02734375, 5.62060546875, 6.2138671875, 6.80712890625, 7.400390625, 7.99365234375, 8.5869140625, 9.18017578125, 9.7734375, 10.36669921875, 10.9599609375, 11.55322265625, 12.146484375, 12.73974609375, 13.3330078125, 13.92626953125, 14.51953125, 15.11279296875, 15.7060546875, 16.29931640625, 16.892578125, 17.48583984375, 18.0791015625, 18.67236328125, 19.265625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 3.0, 12.0, 18.0, 23.0, 23.0, 36.0, 64.0, 95.0, 110.0, 160.0, 222.0, 328.0, 441.0, 661.0, 921.0, 1253.0, 1851.0, 2605.0, 3709.0, 5238.0, 7413.0, 10633.0, 15393.0, 22907.0, 34487.0, 53106.0, 86190.0, 165012.0, 1342301.0, 128607.0, 72433.0, 45412.0, 29814.0, 19991.0, 13866.0, 9468.0, 6659.0, 4552.0, 3257.0, 2340.0, 1637.0, 1123.0, 814.0, 547.0, 412.0, 289.0, 214.0, 134.0, 104.0, 80.0, 56.0, 35.0, 23.0, 24.0, 13.0, 5.0, 5.0, 3.0, 4.0, 4.0], "bins": [-0.78857421875, -0.7641830444335938, -0.7397918701171875, -0.7154006958007812, -0.691009521484375, -0.6666183471679688, -0.6422271728515625, -0.6178359985351562, -0.59344482421875, -0.5690536499023438, -0.5446624755859375, -0.5202713012695312, -0.495880126953125, -0.47148895263671875, -0.4470977783203125, -0.42270660400390625, -0.3983154296875, -0.37392425537109375, -0.3495330810546875, -0.32514190673828125, -0.300750732421875, -0.27635955810546875, -0.2519683837890625, -0.22757720947265625, -0.20318603515625, -0.17879486083984375, -0.1544036865234375, -0.13001251220703125, -0.105621337890625, -0.08123016357421875, -0.0568389892578125, -0.03244781494140625, -0.008056640625, 0.01633453369140625, 0.0407257080078125, 0.06511688232421875, 0.089508056640625, 0.11389923095703125, 0.1382904052734375, 0.16268157958984375, 0.18707275390625, 0.21146392822265625, 0.2358551025390625, 0.26024627685546875, 0.284637451171875, 0.30902862548828125, 0.3334197998046875, 0.35781097412109375, 0.3822021484375, 0.40659332275390625, 0.4309844970703125, 0.45537567138671875, 0.479766845703125, 0.5041580200195312, 0.5285491943359375, 0.5529403686523438, 0.57733154296875, 0.6017227172851562, 0.6261138916015625, 0.6505050659179688, 0.674896240234375, 0.6992874145507812, 0.7236785888671875, 0.7480697631835938, 0.7724609375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 8.0, 2.0, 8.0, 9.0, 11.0, 9.0, 9.0, 10.0, 11.0, 21.0, 21.0, 25.0, 28.0, 48.0, 70.0, 128.0, 139.0, 134.0, 81.0, 53.0, 37.0, 20.0, 25.0, 21.0, 15.0, 13.0, 10.0, 6.0, 6.0, 7.0, 5.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.389617919921875e-05, -6.187707185745239e-05, -5.9857964515686035e-05, -5.783885717391968e-05, -5.581974983215332e-05, -5.380064249038696e-05, -5.1781535148620605e-05, -4.976242780685425e-05, -4.774332046508789e-05, -4.572421312332153e-05, -4.3705105781555176e-05, -4.168599843978882e-05, -3.966689109802246e-05, -3.7647783756256104e-05, -3.5628676414489746e-05, -3.360956907272339e-05, -3.159046173095703e-05, -2.9571354389190674e-05, -2.7552247047424316e-05, -2.553313970565796e-05, -2.35140323638916e-05, -2.1494925022125244e-05, -1.9475817680358887e-05, -1.745671033859253e-05, -1.5437602996826172e-05, -1.3418495655059814e-05, -1.1399388313293457e-05, -9.3802809715271e-06, -7.361173629760742e-06, -5.342066287994385e-06, -3.3229589462280273e-06, -1.30385160446167e-06, 7.152557373046875e-07, 2.734363079071045e-06, 4.753470420837402e-06, 6.77257776260376e-06, 8.791685104370117e-06, 1.0810792446136475e-05, 1.2829899787902832e-05, 1.484900712966919e-05, 1.6868114471435547e-05, 1.8887221813201904e-05, 2.0906329154968262e-05, 2.292543649673462e-05, 2.4944543838500977e-05, 2.6963651180267334e-05, 2.898275852203369e-05, 3.100186586380005e-05, 3.3020973205566406e-05, 3.5040080547332764e-05, 3.705918788909912e-05, 3.907829523086548e-05, 4.1097402572631836e-05, 4.311650991439819e-05, 4.513561725616455e-05, 4.715472459793091e-05, 4.9173831939697266e-05, 5.119293928146362e-05, 5.321204662322998e-05, 5.523115396499634e-05, 5.7250261306762695e-05, 5.926936864852905e-05, 6.128847599029541e-05, 6.330758333206177e-05, 6.532669067382812e-05]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 4.0, 9.0, 6.0, 11.0, 15.0, 15.0, 27.0, 46.0, 63.0, 151.0, 399.0, 2523.0, 53044.0, 971231.0, 18962.0, 1463.0, 242.0, 111.0, 67.0, 33.0, 23.0, 16.0, 14.0, 10.0, 8.0, 10.0, 10.0, 10.0, 1.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0010623931884765625, -0.0010295659303665161, -0.0009967386722564697, -0.0009639114141464233, -0.000931084156036377, -0.0008982568979263306, -0.0008654296398162842, -0.0008326023817062378, -0.0007997751235961914, -0.000766947865486145, -0.0007341206073760986, -0.0007012933492660522, -0.0006684660911560059, -0.0006356388330459595, -0.0006028115749359131, -0.0005699843168258667, -0.0005371570587158203, -0.0005043298006057739, -0.00047150254249572754, -0.00043867528438568115, -0.00040584802627563477, -0.0003730207681655884, -0.000340193510055542, -0.0003073662519454956, -0.0002745389938354492, -0.00024171173572540283, -0.00020888447761535645, -0.00017605721950531006, -0.00014322996139526367, -0.00011040270328521729, -7.75754451751709e-05, -4.474818706512451e-05, -1.1920928955078125e-05, 2.0906329154968262e-05, 5.373358726501465e-05, 8.656084537506104e-05, 0.00011938810348510742, 0.0001522153615951538, 0.0001850426197052002, 0.00021786987781524658, 0.00025069713592529297, 0.00028352439403533936, 0.00031635165214538574, 0.00034917891025543213, 0.0003820061683654785, 0.0004148334264755249, 0.0004476606845855713, 0.0004804879426956177, 0.0005133152008056641, 0.0005461424589157104, 0.0005789697170257568, 0.0006117969751358032, 0.0006446242332458496, 0.000677451491355896, 0.0007102787494659424, 0.0007431060075759888, 0.0007759332656860352, 0.0008087605237960815, 0.0008415877819061279, 0.0008744150400161743, 0.0009072422981262207, 0.0009400695562362671, 0.0009728968143463135, 0.0010057240724563599, 0.0010385513305664062]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 19.0, 30.0, 82.0, 381.0, 348.0, 86.0, 33.0, 20.0, 8.0, 4.0, 1.0, 2.0], "bins": [-0.00021893756638746709, -0.00021502682648133487, -0.00021111610112711787, -0.00020720536122098565, -0.00020329462131485343, -0.0001993838814087212, -0.000195473141502589, -0.000191562416148372, -0.00018765167624223977, -0.00018374093633610755, -0.00017983021098189056, -0.00017591947107575834, -0.00017200873116962612, -0.0001680979912634939, -0.00016418725135736167, -0.00016027652600314468, -0.00015636578609701246, -0.00015245504619088024, -0.00014854432083666325, -0.00014463358093053102, -0.0001407228410243988, -0.00013681210111826658, -0.00013290136121213436, -0.00012899063585791737, -0.00012507989595178515, -0.00012116915604565293, -0.00011725842341547832, -0.00011334769078530371, -0.00010943695087917149, -0.00010552621097303927, -0.00010161547834286466, -9.770474571269006e-05, -9.379399853060022e-05, -8.988326590042561e-05, -8.597252599429339e-05, -8.206178608816117e-05, -7.815105345798656e-05, -7.424032082781196e-05, -7.032958092167974e-05, -6.641884101554751e-05, -6.250810838537291e-05, -5.859737211721949e-05, -5.468663584906608e-05, -5.0775899580912665e-05, -4.686516331275925e-05, -4.2954427044605836e-05, -3.904369077645242e-05, -3.513295450829901e-05, -3.1222218240145594e-05, -2.731148197199218e-05, -2.3400745703838766e-05, -1.949000943568535e-05, -1.5579273167531937e-05, -1.1668536899378523e-05, -7.757800631225109e-06, -3.847064363071695e-06, 6.367190508171916e-08, 3.974408173235133e-06, 7.885144441388547e-06, 1.1795880709541962e-05, 1.5706616977695376e-05, 1.961735324584879e-05, 2.3528089514002204e-05, 2.7438825782155618e-05, 3.134956205030903e-05]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 8.0, 4.0, 5.0, 7.0, 12.0, 6.0, 10.0, 16.0, 13.0, 23.0, 22.0, 18.0, 31.0, 33.0, 31.0, 35.0, 41.0, 49.0, 43.0, 56.0, 30.0, 39.0, 37.0, 38.0, 36.0, 38.0, 46.0, 35.0, 30.0, 27.0, 24.0, 16.0, 26.0, 23.0, 12.0, 16.0, 12.0, 11.0, 11.0, 8.0, 6.0, 4.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7835369110107422e-05, -2.7008354663848877e-05, -2.6181340217590332e-05, -2.5354325771331787e-05, -2.4527311325073242e-05, -2.3700296878814697e-05, -2.2873282432556152e-05, -2.2046267986297607e-05, -2.1219253540039062e-05, -2.0392239093780518e-05, -1.9565224647521973e-05, -1.8738210201263428e-05, -1.7911195755004883e-05, -1.7084181308746338e-05, -1.6257166862487793e-05, -1.5430152416229248e-05, -1.4603137969970703e-05, -1.3776123523712158e-05, -1.2949109077453613e-05, -1.2122094631195068e-05, -1.1295080184936523e-05, -1.0468065738677979e-05, -9.641051292419434e-06, -8.814036846160889e-06, -7.987022399902344e-06, -7.160007953643799e-06, -6.332993507385254e-06, -5.505979061126709e-06, -4.678964614868164e-06, -3.851950168609619e-06, -3.0249357223510742e-06, -2.1979212760925293e-06, -1.3709068298339844e-06, -5.438923835754395e-07, 2.8312206268310547e-07, 1.1101365089416504e-06, 1.9371509552001953e-06, 2.7641654014587402e-06, 3.591179847717285e-06, 4.41819429397583e-06, 5.245208740234375e-06, 6.07222318649292e-06, 6.899237632751465e-06, 7.72625207901001e-06, 8.553266525268555e-06, 9.3802809715271e-06, 1.0207295417785645e-05, 1.103430986404419e-05, 1.1861324310302734e-05, 1.268833875656128e-05, 1.3515353202819824e-05, 1.4342367649078369e-05, 1.5169382095336914e-05, 1.599639654159546e-05, 1.6823410987854004e-05, 1.765042543411255e-05, 1.8477439880371094e-05, 1.930445432662964e-05, 2.0131468772888184e-05, 2.095848321914673e-05, 2.1785497665405273e-05, 2.261251211166382e-05, 2.3439526557922363e-05, 2.4266541004180908e-05, 2.5093555450439453e-05]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 7.0, 11.0, 12.0, 24.0, 18.0, 22.0, 24.0, 30.0, 28.0, 31.0, 27.0, 37.0, 44.0, 35.0, 37.0, 44.0, 44.0, 39.0, 41.0, 44.0, 37.0, 31.0, 44.0, 38.0, 27.0, 31.0, 20.0, 21.0, 18.0, 21.0, 21.0, 16.0, 8.0, 15.0, 14.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-34.59375, -33.603271484375, -32.61279296875, -31.622314453125, -30.6318359375, -29.641357421875, -28.65087890625, -27.660400390625, -26.669921875, -25.679443359375, -24.68896484375, -23.698486328125, -22.7080078125, -21.717529296875, -20.72705078125, -19.736572265625, -18.74609375, -17.755615234375, -16.76513671875, -15.774658203125, -14.7841796875, -13.793701171875, -12.80322265625, -11.812744140625, -10.822265625, -9.831787109375, -8.84130859375, -7.850830078125, -6.8603515625, -5.869873046875, -4.87939453125, -3.888916015625, -2.8984375, -1.907958984375, -0.91748046875, 0.072998046875, 1.0634765625, 2.053955078125, 3.04443359375, 4.034912109375, 5.025390625, 6.015869140625, 7.00634765625, 7.996826171875, 8.9873046875, 9.977783203125, 10.96826171875, 11.958740234375, 12.94921875, 13.939697265625, 14.93017578125, 15.920654296875, 16.9111328125, 17.901611328125, 18.89208984375, 19.882568359375, 20.873046875, 21.863525390625, 22.85400390625, 23.844482421875, 24.8349609375, 25.825439453125, 26.81591796875, 27.806396484375, 28.796875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 9.0, 8.0, 12.0, 17.0, 23.0, 29.0, 44.0, 35.0, 71.0, 99.0, 122.0, 164.0, 233.0, 330.0, 427.0, 596.0, 775.0, 1033.0, 1304.0, 1838.0, 2513.0, 3424.0, 5291.0, 8718.0, 19904.0, 128408.0, 754558.0, 77564.0, 16265.0, 7597.0, 4722.0, 3272.0, 2272.0, 1776.0, 1360.0, 956.0, 690.0, 493.0, 414.0, 308.0, 232.0, 154.0, 134.0, 107.0, 74.0, 47.0, 37.0, 30.0, 16.0, 12.0, 11.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-43.0, -41.6728515625, -40.345703125, -39.0185546875, -37.69140625, -36.3642578125, -35.037109375, -33.7099609375, -32.3828125, -31.0556640625, -29.728515625, -28.4013671875, -27.07421875, -25.7470703125, -24.419921875, -23.0927734375, -21.765625, -20.4384765625, -19.111328125, -17.7841796875, -16.45703125, -15.1298828125, -13.802734375, -12.4755859375, -11.1484375, -9.8212890625, -8.494140625, -7.1669921875, -5.83984375, -4.5126953125, -3.185546875, -1.8583984375, -0.53125, 0.7958984375, 2.123046875, 3.4501953125, 4.77734375, 6.1044921875, 7.431640625, 8.7587890625, 10.0859375, 11.4130859375, 12.740234375, 14.0673828125, 15.39453125, 16.7216796875, 18.048828125, 19.3759765625, 20.703125, 22.0302734375, 23.357421875, 24.6845703125, 26.01171875, 27.3388671875, 28.666015625, 29.9931640625, 31.3203125, 32.6474609375, 33.974609375, 35.3017578125, 36.62890625, 37.9560546875, 39.283203125, 40.6103515625, 41.9375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 7.0, 4.0, 5.0, 8.0, 9.0, 17.0, 14.0, 15.0, 15.0, 24.0, 36.0, 38.0, 30.0, 43.0, 39.0, 58.0, 56.0, 66.0, 189.0, 1810.0, 83.0, 70.0, 65.0, 49.0, 48.0, 37.0, 38.0, 36.0, 26.0, 18.0, 17.0, 12.0, 9.0, 13.0, 12.0, 12.0, 5.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.25, -92.72265625, -89.1953125, -85.66796875, -82.140625, -78.61328125, -75.0859375, -71.55859375, -68.03125, -64.50390625, -60.9765625, -57.44921875, -53.921875, -50.39453125, -46.8671875, -43.33984375, -39.8125, -36.28515625, -32.7578125, -29.23046875, -25.703125, -22.17578125, -18.6484375, -15.12109375, -11.59375, -8.06640625, -4.5390625, -1.01171875, 2.515625, 6.04296875, 9.5703125, 13.09765625, 16.625, 20.15234375, 23.6796875, 27.20703125, 30.734375, 34.26171875, 37.7890625, 41.31640625, 44.84375, 48.37109375, 51.8984375, 55.42578125, 58.953125, 62.48046875, 66.0078125, 69.53515625, 73.0625, 76.58984375, 80.1171875, 83.64453125, 87.171875, 90.69921875, 94.2265625, 97.75390625, 101.28125, 104.80859375, 108.3359375, 111.86328125, 115.390625, 118.91796875, 122.4453125, 125.97265625, 129.5]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 8.0, 13.0, 18.0, 34.0, 41.0, 50.0, 93.0, 222.0, 605.0, 2162.0, 14902.0, 3018000.0, 100794.0, 6674.0, 1297.0, 405.0, 164.0, 60.0, 58.0, 27.0, 14.0, 23.0, 8.0, 9.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-364.75, -353.28515625, -341.8203125, -330.35546875, -318.890625, -307.42578125, -295.9609375, -284.49609375, -273.03125, -261.56640625, -250.1015625, -238.63671875, -227.171875, -215.70703125, -204.2421875, -192.77734375, -181.3125, -169.84765625, -158.3828125, -146.91796875, -135.453125, -123.98828125, -112.5234375, -101.05859375, -89.59375, -78.12890625, -66.6640625, -55.19921875, -43.734375, -32.26953125, -20.8046875, -9.33984375, 2.125, 13.58984375, 25.0546875, 36.51953125, 47.984375, 59.44921875, 70.9140625, 82.37890625, 93.84375, 105.30859375, 116.7734375, 128.23828125, 139.703125, 151.16796875, 162.6328125, 174.09765625, 185.5625, 197.02734375, 208.4921875, 219.95703125, 231.421875, 242.88671875, 254.3515625, 265.81640625, 277.28125, 288.74609375, 300.2109375, 311.67578125, 323.140625, 334.60546875, 346.0703125, 357.53515625, 369.0]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 10.0, 14.0, 10.0, 52.0, 53.0, 118.0, 233.0, 209.0, 150.0, 90.0, 36.0, 13.0, 8.0, 5.0, 4.0, 6.0, 0.0, 0.0, 2.0], "bins": [-558.7932739257812, -548.0675048828125, -537.341796875, -526.6160278320312, -515.8903198242188, -505.16455078125, -494.4388122558594, -483.71307373046875, -472.9873352050781, -462.2615966796875, -451.5358581542969, -440.81011962890625, -430.0843505859375, -419.3586120605469, -408.63287353515625, -397.9071350097656, -387.181396484375, -376.4556579589844, -365.72991943359375, -355.0041809082031, -344.2784423828125, -333.55267333984375, -322.8269348144531, -312.1011962890625, -301.3754577636719, -290.64971923828125, -279.9239807128906, -269.1982421875, -258.47247314453125, -247.7467498779297, -237.02099609375, -226.29525756835938, -215.56954956054688, -204.84381103515625, -194.11807250976562, -183.39231872558594, -172.6665802001953, -161.9408416748047, -151.215087890625, -140.48934936523438, -129.76361083984375, -119.03787231445312, -108.31212615966797, -97.58638000488281, -86.86064147949219, -76.13490295410156, -65.4091567993164, -54.68341064453125, -43.957672119140625, -33.231929779052734, -22.506187438964844, -11.780445098876953, -1.0547027587890625, 9.671039581298828, 20.39678192138672, 31.122528076171875, 41.8482666015625, 52.57400894165039, 63.29975128173828, 74.02549743652344, 84.75123596191406, 95.47697448730469, 106.20272064208984, 116.928466796875, 127.65420532226562]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 7.0, 6.0, 6.0, 9.0, 10.0, 10.0, 10.0, 16.0, 8.0, 16.0, 18.0, 18.0, 21.0, 22.0, 16.0, 27.0, 42.0, 34.0, 23.0, 32.0, 40.0, 39.0, 41.0, 34.0, 40.0, 28.0, 31.0, 36.0, 27.0, 33.0, 23.0, 23.0, 31.0, 27.0, 23.0, 21.0, 32.0, 14.0, 26.0, 15.0, 13.0, 6.0, 6.0, 4.0, 5.0, 5.0, 7.0, 7.0, 1.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-256.8808898925781, -248.49310302734375, -240.1053009033203, -231.71749877929688, -223.3297119140625, -214.94192504882812, -206.5541229248047, -198.16632080078125, -189.77853393554688, -181.3907470703125, -173.00294494628906, -164.61514282226562, -156.22735595703125, -147.83956909179688, -139.45176696777344, -131.06396484375, -122.67617797851562, -114.28838348388672, -105.90058898925781, -97.5127944946289, -89.125, -80.7372055053711, -72.34941101074219, -63.96161651611328, -55.573822021484375, -47.18602752685547, -38.79823303222656, -30.410438537597656, -22.02264404296875, -13.634849548339844, -5.2470550537109375, 3.1407394409179688, 11.52850341796875, 19.916297912597656, 28.304092407226562, 36.69188690185547, 45.079681396484375, 53.46747589111328, 61.85527038574219, 70.2430648803711, 78.630859375, 87.0186538696289, 95.40644836425781, 103.79424285888672, 112.18203735351562, 120.56983184814453, 128.95762634277344, 137.34542846679688, 145.73321533203125, 154.12100219726562, 162.50880432128906, 170.8966064453125, 179.28439331054688, 187.67218017578125, 196.0599822998047, 204.44778442382812, 212.8355712890625, 221.22335815429688, 229.6111602783203, 237.99896240234375, 246.38674926757812, 254.7745361328125, 263.162353515625, 271.5501403808594, 279.93792724609375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 3.0, 11.0, 7.0, 13.0, 18.0, 20.0, 20.0, 30.0, 18.0, 21.0, 36.0, 29.0, 35.0, 39.0, 37.0, 34.0, 33.0, 47.0, 37.0, 36.0, 53.0, 43.0, 23.0, 47.0, 33.0, 27.0, 39.0, 23.0, 24.0, 23.0, 21.0, 24.0, 19.0, 11.0, 10.0, 9.0, 8.0, 11.0, 4.0, 2.0, 6.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-35.0625, -34.052978515625, -33.04345703125, -32.033935546875, -31.0244140625, -30.014892578125, -29.00537109375, -27.995849609375, -26.986328125, -25.976806640625, -24.96728515625, -23.957763671875, -22.9482421875, -21.938720703125, -20.92919921875, -19.919677734375, -18.91015625, -17.900634765625, -16.89111328125, -15.881591796875, -14.8720703125, -13.862548828125, -12.85302734375, -11.843505859375, -10.833984375, -9.824462890625, -8.81494140625, -7.805419921875, -6.7958984375, -5.786376953125, -4.77685546875, -3.767333984375, -2.7578125, -1.748291015625, -0.73876953125, 0.270751953125, 1.2802734375, 2.289794921875, 3.29931640625, 4.308837890625, 5.318359375, 6.327880859375, 7.33740234375, 8.346923828125, 9.3564453125, 10.365966796875, 11.37548828125, 12.385009765625, 13.39453125, 14.404052734375, 15.41357421875, 16.423095703125, 17.4326171875, 18.442138671875, 19.45166015625, 20.461181640625, 21.470703125, 22.480224609375, 23.48974609375, 24.499267578125, 25.5087890625, 26.518310546875, 27.52783203125, 28.537353515625, 29.546875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 8.0, 9.0, 16.0, 16.0, 27.0, 21.0, 35.0, 41.0, 61.0, 93.0, 104.0, 146.0, 223.0, 291.0, 385.0, 500.0, 660.0, 876.0, 1323.0, 1875.0, 2636.0, 3778.0, 6198.0, 10447.0, 20423.0, 121684.0, 2164392.0, 1705184.0, 103720.0, 20139.0, 10159.0, 6059.0, 3924.0, 2528.0, 1774.0, 1294.0, 907.0, 619.0, 446.0, 349.0, 252.0, 183.0, 112.0, 109.0, 80.0, 44.0, 27.0, 40.0, 15.0, 12.0, 15.0, 9.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0], "bins": [-79.1875, -76.78515625, -74.3828125, -71.98046875, -69.578125, -67.17578125, -64.7734375, -62.37109375, -59.96875, -57.56640625, -55.1640625, -52.76171875, -50.359375, -47.95703125, -45.5546875, -43.15234375, -40.75, -38.34765625, -35.9453125, -33.54296875, -31.140625, -28.73828125, -26.3359375, -23.93359375, -21.53125, -19.12890625, -16.7265625, -14.32421875, -11.921875, -9.51953125, -7.1171875, -4.71484375, -2.3125, 0.08984375, 2.4921875, 4.89453125, 7.296875, 9.69921875, 12.1015625, 14.50390625, 16.90625, 19.30859375, 21.7109375, 24.11328125, 26.515625, 28.91796875, 31.3203125, 33.72265625, 36.125, 38.52734375, 40.9296875, 43.33203125, 45.734375, 48.13671875, 50.5390625, 52.94140625, 55.34375, 57.74609375, 60.1484375, 62.55078125, 64.953125, 67.35546875, 69.7578125, 72.16015625, 74.5625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 20.0, 10.0, 14.0, 16.0, 35.0, 35.0, 53.0, 84.0, 224.0, 669.0, 1489.0, 844.0, 277.0, 96.0, 40.0, 32.0, 30.0, 21.0, 13.0, 10.0, 8.0, 7.0, 8.0, 8.0, 1.0, 5.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.0, -87.580078125, -84.16015625, -80.740234375, -77.3203125, -73.900390625, -70.48046875, -67.060546875, -63.640625, -60.220703125, -56.80078125, -53.380859375, -49.9609375, -46.541015625, -43.12109375, -39.701171875, -36.28125, -32.861328125, -29.44140625, -26.021484375, -22.6015625, -19.181640625, -15.76171875, -12.341796875, -8.921875, -5.501953125, -2.08203125, 1.337890625, 4.7578125, 8.177734375, 11.59765625, 15.017578125, 18.4375, 21.857421875, 25.27734375, 28.697265625, 32.1171875, 35.537109375, 38.95703125, 42.376953125, 45.796875, 49.216796875, 52.63671875, 56.056640625, 59.4765625, 62.896484375, 66.31640625, 69.736328125, 73.15625, 76.576171875, 79.99609375, 83.416015625, 86.8359375, 90.255859375, 93.67578125, 97.095703125, 100.515625, 103.935546875, 107.35546875, 110.775390625, 114.1953125, 117.615234375, 121.03515625, 124.455078125, 127.875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 6.0, 12.0, 5.0, 20.0, 30.0, 45.0, 58.0, 93.0, 140.0, 214.0, 309.0, 420.0, 726.0, 1142.0, 1929.0, 3503.0, 6073.0, 12006.0, 27030.0, 80995.0, 2166147.0, 1764416.0, 76593.0, 25996.0, 12013.0, 5889.0, 3240.0, 2037.0, 1138.0, 713.0, 421.0, 300.0, 183.0, 131.0, 105.0, 68.0, 34.0, 30.0, 22.0, 15.0, 17.0, 6.0, 2.0, 0.0, 2.0, 1.0, 4.0], "bins": [-157.75, -153.5966796875, -149.443359375, -145.2900390625, -141.13671875, -136.9833984375, -132.830078125, -128.6767578125, -124.5234375, -120.3701171875, -116.216796875, -112.0634765625, -107.91015625, -103.7568359375, -99.603515625, -95.4501953125, -91.296875, -87.1435546875, -82.990234375, -78.8369140625, -74.68359375, -70.5302734375, -66.376953125, -62.2236328125, -58.0703125, -53.9169921875, -49.763671875, -45.6103515625, -41.45703125, -37.3037109375, -33.150390625, -28.9970703125, -24.84375, -20.6904296875, -16.537109375, -12.3837890625, -8.23046875, -4.0771484375, 0.076171875, 4.2294921875, 8.3828125, 12.5361328125, 16.689453125, 20.8427734375, 24.99609375, 29.1494140625, 33.302734375, 37.4560546875, 41.609375, 45.7626953125, 49.916015625, 54.0693359375, 58.22265625, 62.3759765625, 66.529296875, 70.6826171875, 74.8359375, 78.9892578125, 83.142578125, 87.2958984375, 91.44921875, 95.6025390625, 99.755859375, 103.9091796875, 108.0625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 10.0, 8.0, 8.0, 9.0, 14.0, 21.0, 26.0, 38.0, 44.0, 81.0, 104.0, 185.0, 122.0, 97.0, 55.0, 46.0, 32.0, 15.0, 17.0, 8.0, 14.0, 11.0, 9.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-294.21136474609375, -283.2371826171875, -272.2630310058594, -261.28887939453125, -250.314697265625, -239.3405303955078, -228.36636352539062, -217.39219665527344, -206.41802978515625, -195.44386291503906, -184.46969604492188, -173.4955291748047, -162.5213623046875, -151.5471954345703, -140.57302856445312, -129.59886169433594, -118.62469482421875, -107.65052795410156, -96.67636108398438, -85.70219421386719, -74.72802734375, -63.75386047363281, -52.779693603515625, -41.80552673339844, -30.83135986328125, -19.857192993164062, -8.883026123046875, 2.0911407470703125, 13.0653076171875, 24.039474487304688, 35.013641357421875, 45.98780822753906, 56.961944580078125, 67.93611145019531, 78.9102783203125, 89.88444519042969, 100.85861206054688, 111.83277893066406, 122.80694580078125, 133.78111267089844, 144.75527954101562, 155.7294464111328, 166.70361328125, 177.6777801513672, 188.65194702148438, 199.62611389160156, 210.60028076171875, 221.57444763183594, 232.54861450195312, 243.5227813720703, 254.4969482421875, 265.47113037109375, 276.4452819824219, 287.41943359375, 298.39361572265625, 309.3677978515625, 320.3419494628906, 331.31610107421875, 342.290283203125, 353.26446533203125, 364.2386169433594, 375.2127685546875, 386.18695068359375, 397.1611328125, 408.1352844238281]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 1.0, 0.0, 2.0, 6.0, 6.0, 1.0, 9.0, 4.0, 9.0, 10.0, 11.0, 5.0, 22.0, 11.0, 23.0, 16.0, 17.0, 23.0, 29.0, 37.0, 40.0, 35.0, 36.0, 39.0, 37.0, 44.0, 40.0, 35.0, 44.0, 30.0, 32.0, 29.0, 43.0, 37.0, 31.0, 34.0, 23.0, 17.0, 30.0, 18.0, 18.0, 19.0, 12.0, 7.0, 5.0, 5.0, 3.0, 5.0, 4.0, 7.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-200.75729370117188, -194.22927856445312, -187.70126342773438, -181.17324829101562, -174.64523315429688, -168.11721801757812, -161.58920288085938, -155.06117248535156, -148.5331573486328, -142.00514221191406, -135.4771270751953, -128.94911193847656, -122.42108917236328, -115.89307403564453, -109.36505889892578, -102.8370361328125, -96.30902862548828, -89.78101348876953, -83.25299835205078, -76.7249755859375, -70.19696044921875, -63.6689453125, -57.14093017578125, -50.612911224365234, -44.084896087646484, -37.556880950927734, -31.02886199951172, -24.50084686279297, -17.972829818725586, -11.444812774658203, -4.916797637939453, 1.6112213134765625, 8.139236450195312, 14.667253494262695, 21.195270538330078, 27.723285675048828, 34.251304626464844, 40.779319763183594, 47.307334899902344, 53.83535385131836, 60.36336898803711, 66.89138793945312, 73.41940307617188, 79.94741821289062, 86.47543334960938, 93.00344848632812, 99.53146362304688, 106.05948638916016, 112.5875015258789, 119.11551666259766, 125.6435317993164, 132.1715545654297, 138.69956970214844, 145.2275848388672, 151.75559997558594, 158.2836151123047, 164.81163024902344, 171.3396453857422, 177.86766052246094, 184.3956756591797, 190.92369079589844, 197.45172119140625, 203.979736328125, 210.50775146484375, 217.0357666015625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 7.0, 14.0, 19.0, 10.0, 18.0, 18.0, 28.0, 17.0, 26.0, 38.0, 27.0, 27.0, 29.0, 41.0, 38.0, 44.0, 46.0, 45.0, 43.0, 43.0, 36.0, 49.0, 27.0, 31.0, 31.0, 17.0, 28.0, 22.0, 21.0, 25.0, 20.0, 25.0, 16.0, 11.0, 9.0, 11.0, 9.0, 4.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-33.34375, -32.332275390625, -31.32080078125, -30.309326171875, -29.2978515625, -28.286376953125, -27.27490234375, -26.263427734375, -25.251953125, -24.240478515625, -23.22900390625, -22.217529296875, -21.2060546875, -20.194580078125, -19.18310546875, -18.171630859375, -17.16015625, -16.148681640625, -15.13720703125, -14.125732421875, -13.1142578125, -12.102783203125, -11.09130859375, -10.079833984375, -9.068359375, -8.056884765625, -7.04541015625, -6.033935546875, -5.0224609375, -4.010986328125, -2.99951171875, -1.988037109375, -0.9765625, 0.034912109375, 1.04638671875, 2.057861328125, 3.0693359375, 4.080810546875, 5.09228515625, 6.103759765625, 7.115234375, 8.126708984375, 9.13818359375, 10.149658203125, 11.1611328125, 12.172607421875, 13.18408203125, 14.195556640625, 15.20703125, 16.218505859375, 17.22998046875, 18.241455078125, 19.2529296875, 20.264404296875, 21.27587890625, 22.287353515625, 23.298828125, 24.310302734375, 25.32177734375, 26.333251953125, 27.3447265625, 28.356201171875, 29.36767578125, 30.379150390625, 31.390625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [6.0, 6.0, 15.0, 16.0, 22.0, 25.0, 37.0, 45.0, 80.0, 71.0, 96.0, 146.0, 203.0, 276.0, 381.0, 573.0, 815.0, 1088.0, 1499.0, 2090.0, 2898.0, 4120.0, 5794.0, 8470.0, 12227.0, 17487.0, 25857.0, 37875.0, 57692.0, 97707.0, 226233.0, 257183.0, 102827.0, 59510.0, 38532.0, 26354.0, 18132.0, 12532.0, 8664.0, 6037.0, 4231.0, 3095.0, 2174.0, 1526.0, 1105.0, 764.0, 558.0, 398.0, 306.0, 203.0, 159.0, 107.0, 79.0, 71.0, 60.0, 33.0, 27.0, 20.0, 18.0, 8.0, 8.0, 2.0, 2.0, 1.0], "bins": [-1.052734375, -1.0188140869140625, -0.984893798828125, -0.9509735107421875, -0.91705322265625, -0.8831329345703125, -0.849212646484375, -0.8152923583984375, -0.7813720703125, -0.7474517822265625, -0.713531494140625, -0.6796112060546875, -0.64569091796875, -0.6117706298828125, -0.577850341796875, -0.5439300537109375, -0.510009765625, -0.4760894775390625, -0.442169189453125, -0.4082489013671875, -0.37432861328125, -0.3404083251953125, -0.306488037109375, -0.2725677490234375, -0.2386474609375, -0.2047271728515625, -0.170806884765625, -0.1368865966796875, -0.10296630859375, -0.0690460205078125, -0.035125732421875, -0.0012054443359375, 0.03271484375, 0.0666351318359375, 0.100555419921875, 0.1344757080078125, 0.16839599609375, 0.2023162841796875, 0.236236572265625, 0.2701568603515625, 0.3040771484375, 0.3379974365234375, 0.371917724609375, 0.4058380126953125, 0.43975830078125, 0.4736785888671875, 0.507598876953125, 0.5415191650390625, 0.575439453125, 0.6093597412109375, 0.643280029296875, 0.6772003173828125, 0.71112060546875, 0.7450408935546875, 0.778961181640625, 0.8128814697265625, 0.8468017578125, 0.8807220458984375, 0.914642333984375, 0.9485626220703125, 0.98248291015625, 1.0164031982421875, 1.050323486328125, 1.0842437744140625, 1.1181640625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 2.0, 1.0, 3.0, 6.0, 7.0, 13.0, 6.0, 12.0, 8.0, 17.0, 18.0, 9.0, 22.0, 32.0, 26.0, 30.0, 37.0, 34.0, 41.0, 26.0, 39.0, 36.0, 50.0, 1061.0, 39.0, 40.0, 39.0, 29.0, 43.0, 45.0, 24.0, 29.0, 37.0, 29.0, 14.0, 16.0, 19.0, 11.0, 10.0, 9.0, 12.0, 10.0, 11.0, 3.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-21.421875, -20.79052734375, -20.1591796875, -19.52783203125, -18.896484375, -18.26513671875, -17.6337890625, -17.00244140625, -16.37109375, -15.73974609375, -15.1083984375, -14.47705078125, -13.845703125, -13.21435546875, -12.5830078125, -11.95166015625, -11.3203125, -10.68896484375, -10.0576171875, -9.42626953125, -8.794921875, -8.16357421875, -7.5322265625, -6.90087890625, -6.26953125, -5.63818359375, -5.0068359375, -4.37548828125, -3.744140625, -3.11279296875, -2.4814453125, -1.85009765625, -1.21875, -0.58740234375, 0.0439453125, 0.67529296875, 1.306640625, 1.93798828125, 2.5693359375, 3.20068359375, 3.83203125, 4.46337890625, 5.0947265625, 5.72607421875, 6.357421875, 6.98876953125, 7.6201171875, 8.25146484375, 8.8828125, 9.51416015625, 10.1455078125, 10.77685546875, 11.408203125, 12.03955078125, 12.6708984375, 13.30224609375, 13.93359375, 14.56494140625, 15.1962890625, 15.82763671875, 16.458984375, 17.09033203125, 17.7216796875, 18.35302734375, 18.984375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 6.0, 3.0, 6.0, 9.0, 23.0, 37.0, 38.0, 47.0, 75.0, 110.0, 135.0, 213.0, 304.0, 443.0, 565.0, 884.0, 1254.0, 1742.0, 2497.0, 3746.0, 5389.0, 7942.0, 11911.0, 17937.0, 27834.0, 44488.0, 73245.0, 129136.0, 1364709.0, 166071.0, 87362.0, 52491.0, 32876.0, 20968.0, 13570.0, 9073.0, 6163.0, 4279.0, 2830.0, 2029.0, 1439.0, 999.0, 650.0, 489.0, 342.0, 220.0, 158.0, 140.0, 86.0, 46.0, 30.0, 31.0, 31.0, 20.0, 11.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0], "bins": [-0.859375, -0.8322372436523438, -0.8050994873046875, -0.7779617309570312, -0.750823974609375, -0.7236862182617188, -0.6965484619140625, -0.6694107055664062, -0.64227294921875, -0.6151351928710938, -0.5879974365234375, -0.5608596801757812, -0.533721923828125, -0.5065841674804688, -0.4794464111328125, -0.45230865478515625, -0.4251708984375, -0.39803314208984375, -0.3708953857421875, -0.34375762939453125, -0.316619873046875, -0.28948211669921875, -0.2623443603515625, -0.23520660400390625, -0.20806884765625, -0.18093109130859375, -0.1537933349609375, -0.12665557861328125, -0.099517822265625, -0.07238006591796875, -0.0452423095703125, -0.01810455322265625, 0.009033203125, 0.03617095947265625, 0.0633087158203125, 0.09044647216796875, 0.117584228515625, 0.14472198486328125, 0.1718597412109375, 0.19899749755859375, 0.22613525390625, 0.25327301025390625, 0.2804107666015625, 0.30754852294921875, 0.334686279296875, 0.36182403564453125, 0.3889617919921875, 0.41609954833984375, 0.4432373046875, 0.47037506103515625, 0.4975128173828125, 0.5246505737304688, 0.551788330078125, 0.5789260864257812, 0.6060638427734375, 0.6332015991210938, 0.66033935546875, 0.6874771118164062, 0.7146148681640625, 0.7417526245117188, 0.768890380859375, 0.7960281372070312, 0.8231658935546875, 0.8503036499023438, 0.87744140625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 4.0, 14.0, 14.0, 16.0, 28.0, 24.0, 32.0, 46.0, 52.0, 87.0, 185.0, 166.0, 72.0, 53.0, 51.0, 38.0, 30.0, 25.0, 10.0, 10.0, 6.0, 2.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.104873657226562e-05, -6.851088255643845e-05, -6.597302854061127e-05, -6.343517452478409e-05, -6.089732050895691e-05, -5.835946649312973e-05, -5.582161247730255e-05, -5.328375846147537e-05, -5.074590444564819e-05, -4.8208050429821014e-05, -4.5670196413993835e-05, -4.3132342398166656e-05, -4.059448838233948e-05, -3.80566343665123e-05, -3.551878035068512e-05, -3.298092633485794e-05, -3.0443072319030762e-05, -2.7905218303203583e-05, -2.5367364287376404e-05, -2.2829510271549225e-05, -2.0291656255722046e-05, -1.7753802239894867e-05, -1.5215948224067688e-05, -1.2678094208240509e-05, -1.014024019241333e-05, -7.602386176586151e-06, -5.064532160758972e-06, -2.5266781449317932e-06, 1.1175870895385742e-08, 2.5490298867225647e-06, 5.086883902549744e-06, 7.624737918376923e-06, 1.0162591934204102e-05, 1.270044595003128e-05, 1.523829996585846e-05, 1.777615398168564e-05, 2.0314007997512817e-05, 2.2851862013339996e-05, 2.5389716029167175e-05, 2.7927570044994354e-05, 3.0465424060821533e-05, 3.300327807664871e-05, 3.554113209247589e-05, 3.807898610830307e-05, 4.061684012413025e-05, 4.315469413995743e-05, 4.569254815578461e-05, 4.8230402171611786e-05, 5.0768256187438965e-05, 5.3306110203266144e-05, 5.584396421909332e-05, 5.83818182349205e-05, 6.091967225074768e-05, 6.345752626657486e-05, 6.599538028240204e-05, 6.853323429822922e-05, 7.10710883140564e-05, 7.360894232988358e-05, 7.614679634571075e-05, 7.868465036153793e-05, 8.122250437736511e-05, 8.376035839319229e-05, 8.629821240901947e-05, 8.883606642484665e-05, 9.137392044067383e-05]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 3.0, 5.0, 10.0, 21.0, 26.0, 55.0, 82.0, 115.0, 607.0, 5637.0, 347447.0, 686985.0, 6493.0, 694.0, 148.0, 61.0, 37.0, 28.0, 26.0, 13.0, 20.0, 10.0, 6.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0014858245849609375, -0.0014445781707763672, -0.0014033317565917969, -0.0013620853424072266, -0.0013208389282226562, -0.001279592514038086, -0.0012383460998535156, -0.0011970996856689453, -0.001155853271484375, -0.0011146068572998047, -0.0010733604431152344, -0.001032114028930664, -0.0009908676147460938, -0.0009496212005615234, -0.0009083747863769531, -0.0008671283721923828, -0.0008258819580078125, -0.0007846355438232422, -0.0007433891296386719, -0.0007021427154541016, -0.0006608963012695312, -0.0006196498870849609, -0.0005784034729003906, -0.0005371570587158203, -0.00049591064453125, -0.0004546642303466797, -0.0004134178161621094, -0.00037217140197753906, -0.00033092498779296875, -0.00028967857360839844, -0.0002484321594238281, -0.0002071857452392578, -0.0001659393310546875, -0.0001246929168701172, -8.344650268554688e-05, -4.220008850097656e-05, -9.5367431640625e-07, 4.029273986816406e-05, 8.153915405273438e-05, 0.0001227855682373047, 0.000164031982421875, 0.0002052783966064453, 0.0002465248107910156, 0.00028777122497558594, 0.00032901763916015625, 0.00037026405334472656, 0.0004115104675292969, 0.0004527568817138672, 0.0004940032958984375, 0.0005352497100830078, 0.0005764961242675781, 0.0006177425384521484, 0.0006589889526367188, 0.0007002353668212891, 0.0007414817810058594, 0.0007827281951904297, 0.000823974609375, 0.0008652210235595703, 0.0009064674377441406, 0.0009477138519287109, 0.0009889602661132812, 0.0010302066802978516, 0.0010714530944824219, 0.0011126995086669922, 0.0011539459228515625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 7.0, 8.0, 10.0, 13.0, 13.0, 15.0, 37.0, 43.0, 56.0, 98.0, 143.0, 174.0, 121.0, 72.0, 52.0, 33.0, 20.0, 18.0, 10.0, 9.0, 11.0, 5.0, 5.0, 6.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.753056418849155e-05, -4.622126289177686e-05, -4.4911961595062166e-05, -4.360266029834747e-05, -4.229335900163278e-05, -4.0984057704918087e-05, -3.967475640820339e-05, -3.83654551114887e-05, -3.7056153814774007e-05, -3.574685251805931e-05, -3.443755122134462e-05, -3.312824992462993e-05, -3.181894862791523e-05, -3.050964733120054e-05, -2.9200344215496443e-05, -2.789104291878175e-05, -2.6581739803077653e-05, -2.527243850636296e-05, -2.3963137209648266e-05, -2.2653835912933573e-05, -2.134453461621888e-05, -2.0035233319504187e-05, -1.872593020380009e-05, -1.7416628907085396e-05, -1.6107327610370703e-05, -1.479802631365601e-05, -1.3488725016941316e-05, -1.2179422810731921e-05, -1.0870121514017228e-05, -9.560820217302535e-06, -8.25151801109314e-06, -6.942216714378446e-06, -5.632911779684946e-06, -4.323610482970253e-06, -3.0143087315082084e-06, -1.7050069800461642e-06, -3.9570568333147094e-07, 9.135956133832224e-07, 2.2228978195926175e-06, 3.5321991163073108e-06, 4.841500413022004e-06, 6.150801709736697e-06, 7.4601034611987416e-06, 8.769405212660786e-06, 1.0078706509375479e-05, 1.1388007806090172e-05, 1.2697310012299567e-05, 1.400661130901426e-05, 1.5315912605728954e-05, 1.6625213902443647e-05, 1.793451519915834e-05, 1.9243816495873034e-05, 2.0553117792587727e-05, 2.186241908930242e-05, 2.3171722205006517e-05, 2.448102350172121e-05, 2.5790324798435904e-05, 2.7099626095150597e-05, 2.840892739186529e-05, 2.9718230507569388e-05, 3.102753180428408e-05, 3.2336833100998774e-05, 3.364613439771347e-05, 3.495543569442816e-05, 3.6264736991142854e-05]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 4.0, 6.0, 5.0, 8.0, 10.0, 4.0, 4.0, 6.0, 19.0, 7.0, 18.0, 17.0, 32.0, 29.0, 28.0, 24.0, 29.0, 36.0, 26.0, 18.0, 27.0, 44.0, 46.0, 32.0, 50.0, 44.0, 40.0, 39.0, 32.0, 23.0, 29.0, 29.0, 25.0, 29.0, 25.0, 18.0, 18.0, 15.0, 10.0, 14.0, 14.0, 8.0, 16.0, 9.0, 5.0, 8.0, 3.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-2.6881694793701172e-05, -2.6081688702106476e-05, -2.528168261051178e-05, -2.4481676518917084e-05, -2.3681670427322388e-05, -2.288166433572769e-05, -2.2081658244132996e-05, -2.12816521525383e-05, -2.0481646060943604e-05, -1.9681639969348907e-05, -1.888163387775421e-05, -1.8081627786159515e-05, -1.728162169456482e-05, -1.6481615602970123e-05, -1.5681609511375427e-05, -1.4881603419780731e-05, -1.4081597328186035e-05, -1.3281591236591339e-05, -1.2481585144996643e-05, -1.1681579053401947e-05, -1.0881572961807251e-05, -1.0081566870212555e-05, -9.281560778617859e-06, -8.481554687023163e-06, -7.681548595428467e-06, -6.881542503833771e-06, -6.081536412239075e-06, -5.281530320644379e-06, -4.481524229049683e-06, -3.6815181374549866e-06, -2.8815120458602905e-06, -2.0815059542655945e-06, -1.2814998626708984e-06, -4.814937710762024e-07, 3.1851232051849365e-07, 1.1185184121131897e-06, 1.9185245037078857e-06, 2.7185305953025818e-06, 3.518536686897278e-06, 4.318542778491974e-06, 5.11854887008667e-06, 5.918554961681366e-06, 6.718561053276062e-06, 7.518567144870758e-06, 8.318573236465454e-06, 9.11857932806015e-06, 9.918585419654846e-06, 1.0718591511249542e-05, 1.1518597602844238e-05, 1.2318603694438934e-05, 1.311860978603363e-05, 1.3918615877628326e-05, 1.4718621969223022e-05, 1.551862806081772e-05, 1.6318634152412415e-05, 1.711864024400711e-05, 1.7918646335601807e-05, 1.8718652427196503e-05, 1.95186585187912e-05, 2.0318664610385895e-05, 2.111867070198059e-05, 2.1918676793575287e-05, 2.2718682885169983e-05, 2.351868897676468e-05, 2.4318695068359375e-05]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 7.0, 14.0, 19.0, 10.0, 18.0, 18.0, 28.0, 17.0, 26.0, 38.0, 27.0, 27.0, 29.0, 41.0, 38.0, 44.0, 46.0, 45.0, 43.0, 43.0, 36.0, 49.0, 27.0, 31.0, 31.0, 17.0, 28.0, 22.0, 21.0, 25.0, 20.0, 25.0, 16.0, 11.0, 9.0, 11.0, 9.0, 4.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-33.34375, -32.332275390625, -31.32080078125, -30.309326171875, -29.2978515625, -28.286376953125, -27.27490234375, -26.263427734375, -25.251953125, -24.240478515625, -23.22900390625, -22.217529296875, -21.2060546875, -20.194580078125, -19.18310546875, -18.171630859375, -17.16015625, -16.148681640625, -15.13720703125, -14.125732421875, -13.1142578125, -12.102783203125, -11.09130859375, -10.079833984375, -9.068359375, -8.056884765625, -7.04541015625, -6.033935546875, -5.0224609375, -4.010986328125, -2.99951171875, -1.988037109375, -0.9765625, 0.034912109375, 1.04638671875, 2.057861328125, 3.0693359375, 4.080810546875, 5.09228515625, 6.103759765625, 7.115234375, 8.126708984375, 9.13818359375, 10.149658203125, 11.1611328125, 12.172607421875, 13.18408203125, 14.195556640625, 15.20703125, 16.218505859375, 17.22998046875, 18.241455078125, 19.2529296875, 20.264404296875, 21.27587890625, 22.287353515625, 23.298828125, 24.310302734375, 25.32177734375, 26.333251953125, 27.3447265625, 28.356201171875, 29.36767578125, 30.379150390625, 31.390625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 1.0, 6.0, 2.0, 5.0, 3.0, 14.0, 11.0, 19.0, 16.0, 27.0, 38.0, 54.0, 75.0, 89.0, 112.0, 191.0, 296.0, 424.0, 643.0, 973.0, 1502.0, 2372.0, 4009.0, 13342.0, 406454.0, 590686.0, 15936.0, 4173.0, 2409.0, 1546.0, 1017.0, 671.0, 427.0, 288.0, 192.0, 143.0, 98.0, 76.0, 60.0, 29.0, 38.0, 21.0, 12.0, 5.0, 18.0, 7.0, 5.0, 2.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-84.4375, -81.8818359375, -79.326171875, -76.7705078125, -74.21484375, -71.6591796875, -69.103515625, -66.5478515625, -63.9921875, -61.4365234375, -58.880859375, -56.3251953125, -53.76953125, -51.2138671875, -48.658203125, -46.1025390625, -43.546875, -40.9912109375, -38.435546875, -35.8798828125, -33.32421875, -30.7685546875, -28.212890625, -25.6572265625, -23.1015625, -20.5458984375, -17.990234375, -15.4345703125, -12.87890625, -10.3232421875, -7.767578125, -5.2119140625, -2.65625, -0.1005859375, 2.455078125, 5.0107421875, 7.56640625, 10.1220703125, 12.677734375, 15.2333984375, 17.7890625, 20.3447265625, 22.900390625, 25.4560546875, 28.01171875, 30.5673828125, 33.123046875, 35.6787109375, 38.234375, 40.7900390625, 43.345703125, 45.9013671875, 48.45703125, 51.0126953125, 53.568359375, 56.1240234375, 58.6796875, 61.2353515625, 63.791015625, 66.3466796875, 68.90234375, 71.4580078125, 74.013671875, 76.5693359375, 79.125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 8.0, 9.0, 4.0, 10.0, 7.0, 13.0, 16.0, 12.0, 18.0, 15.0, 25.0, 26.0, 22.0, 27.0, 37.0, 42.0, 42.0, 51.0, 50.0, 79.0, 396.0, 1596.0, 91.0, 60.0, 50.0, 38.0, 35.0, 35.0, 35.0, 32.0, 33.0, 23.0, 22.0, 12.0, 11.0, 9.0, 19.0, 10.0, 10.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-102.6875, -99.3837890625, -96.080078125, -92.7763671875, -89.47265625, -86.1689453125, -82.865234375, -79.5615234375, -76.2578125, -72.9541015625, -69.650390625, -66.3466796875, -63.04296875, -59.7392578125, -56.435546875, -53.1318359375, -49.828125, -46.5244140625, -43.220703125, -39.9169921875, -36.61328125, -33.3095703125, -30.005859375, -26.7021484375, -23.3984375, -20.0947265625, -16.791015625, -13.4873046875, -10.18359375, -6.8798828125, -3.576171875, -0.2724609375, 3.03125, 6.3349609375, 9.638671875, 12.9423828125, 16.24609375, 19.5498046875, 22.853515625, 26.1572265625, 29.4609375, 32.7646484375, 36.068359375, 39.3720703125, 42.67578125, 45.9794921875, 49.283203125, 52.5869140625, 55.890625, 59.1943359375, 62.498046875, 65.8017578125, 69.10546875, 72.4091796875, 75.712890625, 79.0166015625, 82.3203125, 85.6240234375, 88.927734375, 92.2314453125, 95.53515625, 98.8388671875, 102.142578125, 105.4462890625, 108.75]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 10.0, 10.0, 12.0, 28.0, 18.0, 20.0, 27.0, 36.0, 60.0, 90.0, 97.0, 143.0, 234.0, 519.0, 1146.0, 3292.0, 15417.0, 3009257.0, 103908.0, 7480.0, 2069.0, 782.0, 364.0, 184.0, 120.0, 78.0, 57.0, 66.0, 35.0, 33.0, 23.0, 20.0, 11.0, 10.0, 7.0, 6.0, 11.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.875, -229.423828125, -221.97265625, -214.521484375, -207.0703125, -199.619140625, -192.16796875, -184.716796875, -177.265625, -169.814453125, -162.36328125, -154.912109375, -147.4609375, -140.009765625, -132.55859375, -125.107421875, -117.65625, -110.205078125, -102.75390625, -95.302734375, -87.8515625, -80.400390625, -72.94921875, -65.498046875, -58.046875, -50.595703125, -43.14453125, -35.693359375, -28.2421875, -20.791015625, -13.33984375, -5.888671875, 1.5625, 9.013671875, 16.46484375, 23.916015625, 31.3671875, 38.818359375, 46.26953125, 53.720703125, 61.171875, 68.623046875, 76.07421875, 83.525390625, 90.9765625, 98.427734375, 105.87890625, 113.330078125, 120.78125, 128.232421875, 135.68359375, 143.134765625, 150.5859375, 158.037109375, 165.48828125, 172.939453125, 180.390625, 187.841796875, 195.29296875, 202.744140625, 210.1953125, 217.646484375, 225.09765625, 232.548828125, 240.0]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 3.0, 8.0, 14.0, 29.0, 40.0, 90.0, 190.0, 271.0, 171.0, 100.0, 43.0, 24.0, 14.0, 5.0, 2.0, 1.0, 4.0, 2.0], "bins": [-488.95184326171875, -479.8100891113281, -470.6683349609375, -461.5265808105469, -452.38482666015625, -443.2430725097656, -434.101318359375, -424.9595642089844, -415.81781005859375, -406.6760559082031, -397.5343017578125, -388.3925476074219, -379.25079345703125, -370.1090393066406, -360.96728515625, -351.8255310058594, -342.68377685546875, -333.5420227050781, -324.4002685546875, -315.2585144042969, -306.11676025390625, -296.9750061035156, -287.833251953125, -278.6914978027344, -269.5497741699219, -260.40802001953125, -251.26626586914062, -242.12451171875, -232.98275756835938, -223.84100341796875, -214.69924926757812, -205.5574951171875, -196.41574096679688, -187.27398681640625, -178.13223266601562, -168.990478515625, -159.84872436523438, -150.70697021484375, -141.56521606445312, -132.4234619140625, -123.28172302246094, -114.13996887207031, -104.99821472167969, -95.85646057128906, -86.71470642089844, -77.57295227050781, -68.43120574951172, -59.289451599121094, -50.14769744873047, -41.005943298339844, -31.86419105529785, -22.72243881225586, -13.580684661865234, -4.438930511474609, 4.70281982421875, 13.844573974609375, 22.986328125, 32.128082275390625, 41.26983642578125, 50.41158676147461, 59.553340911865234, 68.69509887695312, 77.83684539794922, 86.97859954833984, 96.12035369873047]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0, 4.0, 6.0, 8.0, 6.0, 12.0, 13.0, 10.0, 10.0, 12.0, 18.0, 27.0, 24.0, 24.0, 25.0, 36.0, 45.0, 36.0, 36.0, 43.0, 38.0, 42.0, 50.0, 54.0, 44.0, 46.0, 37.0, 30.0, 30.0, 35.0, 31.0, 30.0, 27.0, 20.0, 16.0, 14.0, 15.0, 18.0, 3.0, 5.0, 3.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-261.15704345703125, -252.15626525878906, -243.15548706054688, -234.1547088623047, -225.1539306640625, -216.1531524658203, -207.15237426757812, -198.15159606933594, -189.15081787109375, -180.15003967285156, -171.14926147460938, -162.1484832763672, -153.147705078125, -144.1469268798828, -135.14614868164062, -126.14537048339844, -117.14459228515625, -108.14381408691406, -99.14303588867188, -90.14225769042969, -81.1414794921875, -72.14070129394531, -63.139923095703125, -54.13914489746094, -45.13836669921875, -36.13758850097656, -27.136810302734375, -18.136032104492188, -9.13525390625, -0.1344757080078125, 8.866302490234375, 17.867080688476562, 26.867889404296875, 35.86866760253906, 44.86944580078125, 53.87022399902344, 62.871002197265625, 71.87178039550781, 80.87255859375, 89.87333679199219, 98.87411499023438, 107.87489318847656, 116.87567138671875, 125.87644958496094, 134.87722778320312, 143.8780059814453, 152.8787841796875, 161.8795623779297, 170.88034057617188, 179.88111877441406, 188.88189697265625, 197.88267517089844, 206.88345336914062, 215.8842315673828, 224.885009765625, 233.8857879638672, 242.88656616210938, 251.88734436035156, 260.88812255859375, 269.888916015625, 278.8896789550781, 287.89044189453125, 296.8912353515625, 305.89202880859375, 314.8927917480469]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 11.0, 12.0, 9.0, 14.0, 19.0, 15.0, 19.0, 16.0, 25.0, 28.0, 31.0, 30.0, 43.0, 32.0, 36.0, 32.0, 39.0, 47.0, 38.0, 44.0, 56.0, 32.0, 31.0, 33.0, 27.0, 34.0, 27.0, 15.0, 29.0, 22.0, 23.0, 26.0, 17.0, 17.0, 12.0, 13.0, 8.0, 4.0, 5.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-32.4375, -31.41748046875, -30.3974609375, -29.37744140625, -28.357421875, -27.33740234375, -26.3173828125, -25.29736328125, -24.27734375, -23.25732421875, -22.2373046875, -21.21728515625, -20.197265625, -19.17724609375, -18.1572265625, -17.13720703125, -16.1171875, -15.09716796875, -14.0771484375, -13.05712890625, -12.037109375, -11.01708984375, -9.9970703125, -8.97705078125, -7.95703125, -6.93701171875, -5.9169921875, -4.89697265625, -3.876953125, -2.85693359375, -1.8369140625, -0.81689453125, 0.203125, 1.22314453125, 2.2431640625, 3.26318359375, 4.283203125, 5.30322265625, 6.3232421875, 7.34326171875, 8.36328125, 9.38330078125, 10.4033203125, 11.42333984375, 12.443359375, 13.46337890625, 14.4833984375, 15.50341796875, 16.5234375, 17.54345703125, 18.5634765625, 19.58349609375, 20.603515625, 21.62353515625, 22.6435546875, 23.66357421875, 24.68359375, 25.70361328125, 26.7236328125, 27.74365234375, 28.763671875, 29.78369140625, 30.8037109375, 31.82373046875, 32.84375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 9.0, 7.0, 11.0, 16.0, 14.0, 23.0, 32.0, 40.0, 54.0, 73.0, 97.0, 110.0, 157.0, 206.0, 287.0, 410.0, 526.0, 720.0, 1150.0, 1657.0, 2476.0, 3972.0, 6805.0, 12842.0, 48155.0, 950340.0, 2988085.0, 135308.0, 17735.0, 8577.0, 4849.0, 3089.0, 1961.0, 1247.0, 856.0, 632.0, 460.0, 343.0, 237.0, 182.0, 117.0, 103.0, 74.0, 47.0, 42.0, 40.0, 28.0, 19.0, 16.0, 11.0, 6.0, 11.0, 6.0, 5.0, 4.0, 2.0, 2.0], "bins": [-96.625, -93.7138671875, -90.802734375, -87.8916015625, -84.98046875, -82.0693359375, -79.158203125, -76.2470703125, -73.3359375, -70.4248046875, -67.513671875, -64.6025390625, -61.69140625, -58.7802734375, -55.869140625, -52.9580078125, -50.046875, -47.1357421875, -44.224609375, -41.3134765625, -38.40234375, -35.4912109375, -32.580078125, -29.6689453125, -26.7578125, -23.8466796875, -20.935546875, -18.0244140625, -15.11328125, -12.2021484375, -9.291015625, -6.3798828125, -3.46875, -0.5576171875, 2.353515625, 5.2646484375, 8.17578125, 11.0869140625, 13.998046875, 16.9091796875, 19.8203125, 22.7314453125, 25.642578125, 28.5537109375, 31.46484375, 34.3759765625, 37.287109375, 40.1982421875, 43.109375, 46.0205078125, 48.931640625, 51.8427734375, 54.75390625, 57.6650390625, 60.576171875, 63.4873046875, 66.3984375, 69.3095703125, 72.220703125, 75.1318359375, 78.04296875, 80.9541015625, 83.865234375, 86.7763671875, 89.6875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 5.0, 13.0, 22.0, 22.0, 29.0, 42.0, 79.0, 212.0, 924.0, 1820.0, 602.0, 122.0, 46.0, 35.0, 28.0, 17.0, 16.0, 11.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.875, -160.3359375, -155.796875, -151.2578125, -146.71875, -142.1796875, -137.640625, -133.1015625, -128.5625, -124.0234375, -119.484375, -114.9453125, -110.40625, -105.8671875, -101.328125, -96.7890625, -92.25, -87.7109375, -83.171875, -78.6328125, -74.09375, -69.5546875, -65.015625, -60.4765625, -55.9375, -51.3984375, -46.859375, -42.3203125, -37.78125, -33.2421875, -28.703125, -24.1640625, -19.625, -15.0859375, -10.546875, -6.0078125, -1.46875, 3.0703125, 7.609375, 12.1484375, 16.6875, 21.2265625, 25.765625, 30.3046875, 34.84375, 39.3828125, 43.921875, 48.4609375, 53.0, 57.5390625, 62.078125, 66.6171875, 71.15625, 75.6953125, 80.234375, 84.7734375, 89.3125, 93.8515625, 98.390625, 102.9296875, 107.46875, 112.0078125, 116.546875, 121.0859375, 125.625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 12.0, 13.0, 14.0, 19.0, 18.0, 34.0, 58.0, 96.0, 196.0, 341.0, 551.0, 1164.0, 2705.0, 6947.0, 20817.0, 99405.0, 3870288.0, 152403.0, 25319.0, 7976.0, 3112.0, 1319.0, 670.0, 314.0, 157.0, 113.0, 73.0, 54.0, 39.0, 14.0, 13.0, 3.0, 9.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-185.875, -179.134765625, -172.39453125, -165.654296875, -158.9140625, -152.173828125, -145.43359375, -138.693359375, -131.953125, -125.212890625, -118.47265625, -111.732421875, -104.9921875, -98.251953125, -91.51171875, -84.771484375, -78.03125, -71.291015625, -64.55078125, -57.810546875, -51.0703125, -44.330078125, -37.58984375, -30.849609375, -24.109375, -17.369140625, -10.62890625, -3.888671875, 2.8515625, 9.591796875, 16.33203125, 23.072265625, 29.8125, 36.552734375, 43.29296875, 50.033203125, 56.7734375, 63.513671875, 70.25390625, 76.994140625, 83.734375, 90.474609375, 97.21484375, 103.955078125, 110.6953125, 117.435546875, 124.17578125, 130.916015625, 137.65625, 144.396484375, 151.13671875, 157.876953125, 164.6171875, 171.357421875, 178.09765625, 184.837890625, 191.578125, 198.318359375, 205.05859375, 211.798828125, 218.5390625, 225.279296875, 232.01953125, 238.759765625, 245.5]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 5.0, 5.0, 8.0, 16.0, 26.0, 39.0, 45.0, 87.0, 196.0, 242.0, 125.0, 77.0, 50.0, 22.0, 15.0, 15.0, 10.0, 11.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-709.44775390625, -693.0075073242188, -676.5672607421875, -660.126953125, -643.6867065429688, -627.2464599609375, -610.8062133789062, -594.365966796875, -577.9256591796875, -561.4854125976562, -545.045166015625, -528.6048583984375, -512.1646118164062, -495.724365234375, -479.28411865234375, -462.8438415527344, -446.4035949707031, -429.9633483886719, -413.5230712890625, -397.08282470703125, -380.6425476074219, -364.2023010253906, -347.76202392578125, -331.32177734375, -314.88153076171875, -298.4412841796875, -282.0010070800781, -265.5607604980469, -249.1204833984375, -232.68023681640625, -216.23997497558594, -199.79971313476562, -183.35946655273438, -166.91920471191406, -150.47894287109375, -134.0386962890625, -117.59842681884766, -101.15816497802734, -84.71791076660156, -68.27764892578125, -51.83738708496094, -35.397125244140625, -18.956867218017578, -2.5166091918945312, 13.923652648925781, 30.363914489746094, 46.804168701171875, 63.24443054199219, 79.6846923828125, 96.12495422363281, 112.56521606445312, 129.00546264648438, 145.44573974609375, 161.885986328125, 178.3262481689453, 194.76651000976562, 211.20677185058594, 227.64703369140625, 244.08729553222656, 260.5275573730469, 276.9678039550781, 293.4080810546875, 309.84832763671875, 326.28857421875, 342.7288513183594]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 4.0, 7.0, 8.0, 9.0, 14.0, 13.0, 13.0, 23.0, 18.0, 20.0, 20.0, 29.0, 35.0, 28.0, 33.0, 34.0, 43.0, 46.0, 43.0, 45.0, 49.0, 40.0, 39.0, 39.0, 43.0, 33.0, 36.0, 43.0, 28.0, 14.0, 22.0, 19.0, 27.0, 14.0, 16.0, 14.0, 13.0, 6.0, 10.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-237.5008544921875, -230.16421508789062, -222.82757568359375, -215.4909210205078, -208.15428161621094, -200.81764221191406, -193.48098754882812, -186.14434814453125, -178.80770874023438, -171.4710693359375, -164.13442993164062, -156.7977752685547, -149.4611358642578, -142.12449645996094, -134.787841796875, -127.45120239257812, -120.11456298828125, -112.77792358398438, -105.44127655029297, -98.10462951660156, -90.76799011230469, -83.43135070800781, -76.0947036743164, -68.758056640625, -61.421417236328125, -54.084774017333984, -46.748130798339844, -39.4114875793457, -32.07484436035156, -24.738201141357422, -17.40155792236328, -10.06491470336914, -2.7282562255859375, 4.608386993408203, 11.945030212402344, 19.281673431396484, 26.618316650390625, 33.954959869384766, 41.291603088378906, 48.62824630737305, 55.96488952636719, 63.30153274536133, 70.63817596435547, 77.97482299804688, 85.31146240234375, 92.64810180664062, 99.98474884033203, 107.32139587402344, 114.65803527832031, 121.99467468261719, 129.33132934570312, 136.66796875, 144.00460815429688, 151.34124755859375, 158.67788696289062, 166.01454162597656, 173.35118103027344, 180.6878204345703, 188.02447509765625, 195.36111450195312, 202.69775390625, 210.03439331054688, 217.37103271484375, 224.7076873779297, 232.04432678222656]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 6.0, 1.0, 6.0, 10.0, 11.0, 12.0, 15.0, 8.0, 17.0, 25.0, 23.0, 29.0, 35.0, 22.0, 39.0, 41.0, 46.0, 42.0, 44.0, 46.0, 49.0, 51.0, 29.0, 42.0, 33.0, 42.0, 37.0, 27.0, 38.0, 22.0, 27.0, 28.0, 19.0, 16.0, 13.0, 17.0, 11.0, 9.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.65625, -31.48291015625, -30.3095703125, -29.13623046875, -27.962890625, -26.78955078125, -25.6162109375, -24.44287109375, -23.26953125, -22.09619140625, -20.9228515625, -19.74951171875, -18.576171875, -17.40283203125, -16.2294921875, -15.05615234375, -13.8828125, -12.70947265625, -11.5361328125, -10.36279296875, -9.189453125, -8.01611328125, -6.8427734375, -5.66943359375, -4.49609375, -3.32275390625, -2.1494140625, -0.97607421875, 0.197265625, 1.37060546875, 2.5439453125, 3.71728515625, 4.890625, 6.06396484375, 7.2373046875, 8.41064453125, 9.583984375, 10.75732421875, 11.9306640625, 13.10400390625, 14.27734375, 15.45068359375, 16.6240234375, 17.79736328125, 18.970703125, 20.14404296875, 21.3173828125, 22.49072265625, 23.6640625, 24.83740234375, 26.0107421875, 27.18408203125, 28.357421875, 29.53076171875, 30.7041015625, 31.87744140625, 33.05078125, 34.22412109375, 35.3974609375, 36.57080078125, 37.744140625, 38.91748046875, 40.0908203125, 41.26416015625, 42.4375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 11.0, 16.0, 20.0, 35.0, 49.0, 79.0, 125.0, 157.0, 252.0, 349.0, 551.0, 842.0, 1275.0, 1966.0, 3041.0, 4568.0, 7180.0, 11439.0, 17759.0, 29327.0, 48954.0, 86574.0, 175210.0, 347696.0, 132517.0, 70825.0, 40765.0, 24408.0, 15214.0, 9732.0, 6155.0, 4021.0, 2594.0, 1718.0, 1051.0, 709.0, 430.0, 307.0, 190.0, 138.0, 106.0, 59.0, 42.0, 36.0, 18.0, 11.0, 15.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4609375, -1.415740966796875, -1.37054443359375, -1.325347900390625, -1.2801513671875, -1.234954833984375, -1.18975830078125, -1.144561767578125, -1.099365234375, -1.054168701171875, -1.00897216796875, -0.963775634765625, -0.9185791015625, -0.873382568359375, -0.82818603515625, -0.782989501953125, -0.73779296875, -0.692596435546875, -0.64739990234375, -0.602203369140625, -0.5570068359375, -0.511810302734375, -0.46661376953125, -0.421417236328125, -0.376220703125, -0.331024169921875, -0.28582763671875, -0.240631103515625, -0.1954345703125, -0.150238037109375, -0.10504150390625, -0.059844970703125, -0.0146484375, 0.030548095703125, 0.07574462890625, 0.120941162109375, 0.1661376953125, 0.211334228515625, 0.25653076171875, 0.301727294921875, 0.346923828125, 0.392120361328125, 0.43731689453125, 0.482513427734375, 0.5277099609375, 0.572906494140625, 0.61810302734375, 0.663299560546875, 0.70849609375, 0.753692626953125, 0.79888916015625, 0.844085693359375, 0.8892822265625, 0.934478759765625, 0.97967529296875, 1.024871826171875, 1.070068359375, 1.115264892578125, 1.16046142578125, 1.205657958984375, 1.2508544921875, 1.296051025390625, 1.34124755859375, 1.386444091796875, 1.431640625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 4.0, 6.0, 16.0, 15.0, 13.0, 25.0, 14.0, 20.0, 32.0, 25.0, 34.0, 27.0, 38.0, 56.0, 38.0, 37.0, 36.0, 30.0, 1063.0, 40.0, 44.0, 40.0, 31.0, 33.0, 27.0, 48.0, 30.0, 37.0, 25.0, 14.0, 13.0, 22.0, 16.0, 9.0, 11.0, 9.0, 10.0, 7.0, 4.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.421875, -20.73681640625, -20.0517578125, -19.36669921875, -18.681640625, -17.99658203125, -17.3115234375, -16.62646484375, -15.94140625, -15.25634765625, -14.5712890625, -13.88623046875, -13.201171875, -12.51611328125, -11.8310546875, -11.14599609375, -10.4609375, -9.77587890625, -9.0908203125, -8.40576171875, -7.720703125, -7.03564453125, -6.3505859375, -5.66552734375, -4.98046875, -4.29541015625, -3.6103515625, -2.92529296875, -2.240234375, -1.55517578125, -0.8701171875, -0.18505859375, 0.5, 1.18505859375, 1.8701171875, 2.55517578125, 3.240234375, 3.92529296875, 4.6103515625, 5.29541015625, 5.98046875, 6.66552734375, 7.3505859375, 8.03564453125, 8.720703125, 9.40576171875, 10.0908203125, 10.77587890625, 11.4609375, 12.14599609375, 12.8310546875, 13.51611328125, 14.201171875, 14.88623046875, 15.5712890625, 16.25634765625, 16.94140625, 17.62646484375, 18.3115234375, 18.99658203125, 19.681640625, 20.36669921875, 21.0517578125, 21.73681640625, 22.421875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 10.0, 12.0, 23.0, 26.0, 35.0, 53.0, 67.0, 128.0, 156.0, 201.0, 293.0, 460.0, 618.0, 887.0, 1318.0, 1867.0, 2826.0, 4182.0, 6216.0, 9323.0, 13754.0, 21394.0, 33832.0, 54343.0, 88826.0, 167610.0, 1350347.0, 132094.0, 75806.0, 45473.0, 29221.0, 18572.0, 12100.0, 8091.0, 5403.0, 3549.0, 2487.0, 1667.0, 1183.0, 827.0, 562.0, 392.0, 273.0, 177.0, 136.0, 89.0, 62.0, 45.0, 40.0, 31.0, 14.0, 7.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0], "bins": [-0.91845703125, -0.8900527954101562, -0.8616485595703125, -0.8332443237304688, -0.804840087890625, -0.7764358520507812, -0.7480316162109375, -0.7196273803710938, -0.69122314453125, -0.6628189086914062, -0.6344146728515625, -0.6060104370117188, -0.577606201171875, -0.5492019653320312, -0.5207977294921875, -0.49239349365234375, -0.4639892578125, -0.43558502197265625, -0.4071807861328125, -0.37877655029296875, -0.350372314453125, -0.32196807861328125, -0.2935638427734375, -0.26515960693359375, -0.23675537109375, -0.20835113525390625, -0.1799468994140625, -0.15154266357421875, -0.123138427734375, -0.09473419189453125, -0.0663299560546875, -0.03792572021484375, -0.009521484375, 0.01888275146484375, 0.0472869873046875, 0.07569122314453125, 0.104095458984375, 0.13249969482421875, 0.1609039306640625, 0.18930816650390625, 0.21771240234375, 0.24611663818359375, 0.2745208740234375, 0.30292510986328125, 0.331329345703125, 0.35973358154296875, 0.3881378173828125, 0.41654205322265625, 0.4449462890625, 0.47335052490234375, 0.5017547607421875, 0.5301589965820312, 0.558563232421875, 0.5869674682617188, 0.6153717041015625, 0.6437759399414062, 0.67218017578125, 0.7005844116210938, 0.7289886474609375, 0.7573928833007812, 0.785797119140625, 0.8142013549804688, 0.8426055908203125, 0.8710098266601562, 0.8994140625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 2.0, 2.0, 16.0, 17.0, 23.0, 19.0, 41.0, 68.0, 209.0, 280.0, 107.0, 55.0, 37.0, 25.0, 19.0, 10.0, 10.0, 9.0, 6.0, 6.0, 8.0, 2.0, 0.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.179115295410156e-05, -8.894223719835281e-05, -8.609332144260406e-05, -8.324440568685532e-05, -8.039548993110657e-05, -7.754657417535782e-05, -7.469765841960907e-05, -7.184874266386032e-05, -6.899982690811157e-05, -6.615091115236282e-05, -6.330199539661407e-05, -6.0453079640865326e-05, -5.760416388511658e-05, -5.475524812936783e-05, -5.190633237361908e-05, -4.905741661787033e-05, -4.620850086212158e-05, -4.335958510637283e-05, -4.0510669350624084e-05, -3.7661753594875336e-05, -3.481283783912659e-05, -3.196392208337784e-05, -2.911500632762909e-05, -2.626609057188034e-05, -2.3417174816131592e-05, -2.0568259060382843e-05, -1.7719343304634094e-05, -1.4870427548885345e-05, -1.2021511793136597e-05, -9.172596037387848e-06, -6.323680281639099e-06, -3.4747645258903503e-06, -6.258487701416016e-07, 2.2230669856071472e-06, 5.071982741355896e-06, 7.920898497104645e-06, 1.0769814252853394e-05, 1.3618730008602142e-05, 1.646764576435089e-05, 1.931656152009964e-05, 2.216547727584839e-05, 2.5014393031597137e-05, 2.7863308787345886e-05, 3.0712224543094635e-05, 3.3561140298843384e-05, 3.641005605459213e-05, 3.925897181034088e-05, 4.210788756608963e-05, 4.495680332183838e-05, 4.780571907758713e-05, 5.0654634833335876e-05, 5.3503550589084625e-05, 5.6352466344833374e-05, 5.920138210058212e-05, 6.205029785633087e-05, 6.489921361207962e-05, 6.774812936782837e-05, 7.059704512357712e-05, 7.344596087932587e-05, 7.629487663507462e-05, 7.914379239082336e-05, 8.199270814657211e-05, 8.484162390232086e-05, 8.769053965806961e-05, 9.053945541381836e-05]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 10.0, 12.0, 14.0, 14.0, 21.0, 24.0, 49.0, 91.0, 273.0, 1210.0, 7499.0, 950305.0, 83957.0, 3943.0, 722.0, 187.0, 72.0, 35.0, 25.0, 19.0, 14.0, 10.0, 7.0, 8.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0013303756713867188, -0.00128859281539917, -0.001246809959411621, -0.0012050271034240723, -0.0011632442474365234, -0.0011214613914489746, -0.0010796785354614258, -0.001037895679473877, -0.0009961128234863281, -0.0009543299674987793, -0.0009125471115112305, -0.0008707642555236816, -0.0008289813995361328, -0.000787198543548584, -0.0007454156875610352, -0.0007036328315734863, -0.0006618499755859375, -0.0006200671195983887, -0.0005782842636108398, -0.000536501407623291, -0.0004947185516357422, -0.00045293569564819336, -0.00041115283966064453, -0.0003693699836730957, -0.0003275871276855469, -0.00028580427169799805, -0.00024402141571044922, -0.0002022385597229004, -0.00016045570373535156, -0.00011867284774780273, -7.68899917602539e-05, -3.510713577270508e-05, 6.67572021484375e-06, 4.845857620239258e-05, 9.02414321899414e-05, 0.00013202428817749023, 0.00017380714416503906, 0.0002155900001525879, 0.0002573728561401367, 0.00029915571212768555, 0.0003409385681152344, 0.0003827214241027832, 0.00042450428009033203, 0.00046628713607788086, 0.0005080699920654297, 0.0005498528480529785, 0.0005916357040405273, 0.0006334185600280762, 0.000675201416015625, 0.0007169842720031738, 0.0007587671279907227, 0.0008005499839782715, 0.0008423328399658203, 0.0008841156959533691, 0.000925898551940918, 0.0009676814079284668, 0.0010094642639160156, 0.0010512471199035645, 0.0010930299758911133, 0.0011348128318786621, 0.001176595687866211, 0.0012183785438537598, 0.0012601613998413086, 0.0013019442558288574, 0.0013437271118164062]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 9.0, 7.0, 12.0, 12.0, 20.0, 29.0, 38.0, 72.0, 140.0, 228.0, 162.0, 107.0, 64.0, 34.0, 28.0, 16.0, 7.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-9.389992919750512e-05, -9.204779780702665e-05, -9.019565914059058e-05, -8.834352775011212e-05, -8.649138908367604e-05, -8.463925769319758e-05, -8.278712630271912e-05, -8.093498763628304e-05, -7.908285624580458e-05, -7.723072485532612e-05, -7.537858618889004e-05, -7.352645479841158e-05, -7.16743161319755e-05, -6.982218474149704e-05, -6.797005335101858e-05, -6.61179146845825e-05, -6.426578329410404e-05, -6.241365190362558e-05, -6.05615132371895e-05, -5.870938184671104e-05, -5.685724681825377e-05, -5.50051117897965e-05, -5.315297676133923e-05, -5.130084173288196e-05, -4.9448706704424694e-05, -4.7596571675967425e-05, -4.5744436647510156e-05, -4.3892305257031694e-05, -4.2040170228574425e-05, -4.0188035200117156e-05, -3.833590017165989e-05, -3.6483768781181425e-05, -3.463163739070296e-05, -3.2779502362245694e-05, -3.0927367333788425e-05, -2.907523412432056e-05, -2.7223100914852694e-05, -2.5370965886395425e-05, -2.3518830857938156e-05, -2.166669764847029e-05, -1.9814560801023617e-05, -1.796242577256635e-05, -1.6110292563098483e-05, -1.4258157534641214e-05, -1.2406024325173348e-05, -1.0553889296716079e-05, -8.701755177753512e-06, -6.8496210587909445e-06, -4.997487849323079e-06, -3.1453537303605117e-06, -1.293219384024269e-06, 5.589149623119738e-07, 2.411049081274541e-06, 4.263183654984459e-06, 6.115317773947027e-06, 7.967451892909594e-06, 9.819586011872161e-06, 1.1671720130834728e-05, 1.3523854249797296e-05, 1.5375988368759863e-05, 1.7228123397217132e-05, 1.9080256606684998e-05, 2.0932391635142267e-05, 2.2784526663599536e-05, 2.46366598730674e-05]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 0.0, 0.0, 3.0, 5.0, 8.0, 8.0, 6.0, 5.0, 13.0, 10.0, 19.0, 16.0, 12.0, 29.0, 14.0, 20.0, 18.0, 31.0, 27.0, 46.0, 29.0, 42.0, 29.0, 34.0, 43.0, 35.0, 43.0, 42.0, 47.0, 34.0, 50.0, 35.0, 30.0, 22.0, 38.0, 21.0, 21.0, 24.0, 14.0, 17.0, 6.0, 11.0, 6.0, 15.0, 7.0, 0.0, 8.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-3.057718276977539e-05, -2.9704533517360687e-05, -2.8831884264945984e-05, -2.795923501253128e-05, -2.7086585760116577e-05, -2.6213936507701874e-05, -2.534128725528717e-05, -2.4468638002872467e-05, -2.3595988750457764e-05, -2.272333949804306e-05, -2.1850690245628357e-05, -2.0978040993213654e-05, -2.010539174079895e-05, -1.9232742488384247e-05, -1.8360093235969543e-05, -1.748744398355484e-05, -1.6614794731140137e-05, -1.5742145478725433e-05, -1.486949622631073e-05, -1.3996846973896027e-05, -1.3124197721481323e-05, -1.225154846906662e-05, -1.1378899216651917e-05, -1.0506249964237213e-05, -9.63360071182251e-06, -8.760951459407806e-06, -7.888302206993103e-06, -7.0156529545784e-06, -6.143003702163696e-06, -5.270354449748993e-06, -4.3977051973342896e-06, -3.525055944919586e-06, -2.652406692504883e-06, -1.7797574400901794e-06, -9.071081876754761e-07, -3.4458935260772705e-08, 8.381903171539307e-07, 1.710839569568634e-06, 2.5834888219833374e-06, 3.4561380743980408e-06, 4.328787326812744e-06, 5.2014365792274475e-06, 6.074085831642151e-06, 6.946735084056854e-06, 7.819384336471558e-06, 8.692033588886261e-06, 9.564682841300964e-06, 1.0437332093715668e-05, 1.1309981346130371e-05, 1.2182630598545074e-05, 1.3055279850959778e-05, 1.3927929103374481e-05, 1.4800578355789185e-05, 1.5673227608203888e-05, 1.654587686061859e-05, 1.7418526113033295e-05, 1.8291175365447998e-05, 1.91638246178627e-05, 2.0036473870277405e-05, 2.0909123122692108e-05, 2.178177237510681e-05, 2.2654421627521515e-05, 2.3527070879936218e-05, 2.439972013235092e-05, 2.5272369384765625e-05]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 6.0, 1.0, 6.0, 10.0, 11.0, 12.0, 15.0, 8.0, 17.0, 25.0, 23.0, 29.0, 35.0, 22.0, 39.0, 41.0, 46.0, 42.0, 44.0, 46.0, 49.0, 51.0, 29.0, 42.0, 33.0, 42.0, 37.0, 27.0, 38.0, 22.0, 27.0, 28.0, 19.0, 16.0, 13.0, 17.0, 11.0, 9.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.65625, -31.48291015625, -30.3095703125, -29.13623046875, -27.962890625, -26.78955078125, -25.6162109375, -24.44287109375, -23.26953125, -22.09619140625, -20.9228515625, -19.74951171875, -18.576171875, -17.40283203125, -16.2294921875, -15.05615234375, -13.8828125, -12.70947265625, -11.5361328125, -10.36279296875, -9.189453125, -8.01611328125, -6.8427734375, -5.66943359375, -4.49609375, -3.32275390625, -2.1494140625, -0.97607421875, 0.197265625, 1.37060546875, 2.5439453125, 3.71728515625, 4.890625, 6.06396484375, 7.2373046875, 8.41064453125, 9.583984375, 10.75732421875, 11.9306640625, 13.10400390625, 14.27734375, 15.45068359375, 16.6240234375, 17.79736328125, 18.970703125, 20.14404296875, 21.3173828125, 22.49072265625, 23.6640625, 24.83740234375, 26.0107421875, 27.18408203125, 28.357421875, 29.53076171875, 30.7041015625, 31.87744140625, 33.05078125, 34.22412109375, 35.3974609375, 36.57080078125, 37.744140625, 38.91748046875, 40.0908203125, 41.26416015625, 42.4375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 9.0, 14.0, 9.0, 14.0, 17.0, 23.0, 33.0, 44.0, 59.0, 76.0, 96.0, 142.0, 189.0, 250.0, 378.0, 442.0, 624.0, 842.0, 1107.0, 1563.0, 2348.0, 4294.0, 11985.0, 60328.0, 505009.0, 388034.0, 48362.0, 10406.0, 3929.0, 2195.0, 1486.0, 1077.0, 838.0, 572.0, 456.0, 326.0, 263.0, 196.0, 132.0, 104.0, 75.0, 54.0, 43.0, 29.0, 20.0, 14.0, 11.0, 10.0, 8.0, 5.0, 3.0, 6.0, 2.0, 5.0, 1.0, 0.0, 2.0], "bins": [-29.140625, -28.228271484375, -27.31591796875, -26.403564453125, -25.4912109375, -24.578857421875, -23.66650390625, -22.754150390625, -21.841796875, -20.929443359375, -20.01708984375, -19.104736328125, -18.1923828125, -17.280029296875, -16.36767578125, -15.455322265625, -14.54296875, -13.630615234375, -12.71826171875, -11.805908203125, -10.8935546875, -9.981201171875, -9.06884765625, -8.156494140625, -7.244140625, -6.331787109375, -5.41943359375, -4.507080078125, -3.5947265625, -2.682373046875, -1.77001953125, -0.857666015625, 0.0546875, 0.967041015625, 1.87939453125, 2.791748046875, 3.7041015625, 4.616455078125, 5.52880859375, 6.441162109375, 7.353515625, 8.265869140625, 9.17822265625, 10.090576171875, 11.0029296875, 11.915283203125, 12.82763671875, 13.739990234375, 14.65234375, 15.564697265625, 16.47705078125, 17.389404296875, 18.3017578125, 19.214111328125, 20.12646484375, 21.038818359375, 21.951171875, 22.863525390625, 23.77587890625, 24.688232421875, 25.6005859375, 26.512939453125, 27.42529296875, 28.337646484375, 29.25]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 4.0, 5.0, 7.0, 17.0, 13.0, 14.0, 10.0, 14.0, 10.0, 16.0, 33.0, 26.0, 37.0, 37.0, 40.0, 30.0, 44.0, 45.0, 64.0, 321.0, 1715.0, 75.0, 50.0, 43.0, 44.0, 48.0, 47.0, 33.0, 37.0, 27.0, 34.0, 16.0, 23.0, 11.0, 9.0, 3.0, 8.0, 13.0, 8.0, 7.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.25, -101.8642578125, -98.478515625, -95.0927734375, -91.70703125, -88.3212890625, -84.935546875, -81.5498046875, -78.1640625, -74.7783203125, -71.392578125, -68.0068359375, -64.62109375, -61.2353515625, -57.849609375, -54.4638671875, -51.078125, -47.6923828125, -44.306640625, -40.9208984375, -37.53515625, -34.1494140625, -30.763671875, -27.3779296875, -23.9921875, -20.6064453125, -17.220703125, -13.8349609375, -10.44921875, -7.0634765625, -3.677734375, -0.2919921875, 3.09375, 6.4794921875, 9.865234375, 13.2509765625, 16.63671875, 20.0224609375, 23.408203125, 26.7939453125, 30.1796875, 33.5654296875, 36.951171875, 40.3369140625, 43.72265625, 47.1083984375, 50.494140625, 53.8798828125, 57.265625, 60.6513671875, 64.037109375, 67.4228515625, 70.80859375, 74.1943359375, 77.580078125, 80.9658203125, 84.3515625, 87.7373046875, 91.123046875, 94.5087890625, 97.89453125, 101.2802734375, 104.666015625, 108.0517578125, 111.4375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 10.0, 7.0, 13.0, 9.0, 5.0, 10.0, 11.0, 32.0, 34.0, 52.0, 56.0, 68.0, 75.0, 114.0, 146.0, 194.0, 317.0, 915.0, 5423.0, 2946235.0, 186753.0, 3546.0, 709.0, 257.0, 153.0, 106.0, 83.0, 96.0, 63.0, 51.0, 33.0, 17.0, 20.0, 17.0, 16.0, 10.0, 20.0, 10.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-244.0, -236.58203125, -229.1640625, -221.74609375, -214.328125, -206.91015625, -199.4921875, -192.07421875, -184.65625, -177.23828125, -169.8203125, -162.40234375, -154.984375, -147.56640625, -140.1484375, -132.73046875, -125.3125, -117.89453125, -110.4765625, -103.05859375, -95.640625, -88.22265625, -80.8046875, -73.38671875, -65.96875, -58.55078125, -51.1328125, -43.71484375, -36.296875, -28.87890625, -21.4609375, -14.04296875, -6.625, 0.79296875, 8.2109375, 15.62890625, 23.046875, 30.46484375, 37.8828125, 45.30078125, 52.71875, 60.13671875, 67.5546875, 74.97265625, 82.390625, 89.80859375, 97.2265625, 104.64453125, 112.0625, 119.48046875, 126.8984375, 134.31640625, 141.734375, 149.15234375, 156.5703125, 163.98828125, 171.40625, 178.82421875, 186.2421875, 193.66015625, 201.078125, 208.49609375, 215.9140625, 223.33203125, 230.75]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 18.0, 312.0, 556.0, 114.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-695.890869140625, -680.5185546875, -665.1463012695312, -649.7739868164062, -634.4016723632812, -619.0294189453125, -603.6571044921875, -588.2847900390625, -572.9125366210938, -557.5402221679688, -542.16796875, -526.795654296875, -511.4233703613281, -496.05108642578125, -480.67877197265625, -465.3064880371094, -449.9341735839844, -434.5618896484375, -419.1895751953125, -403.8172912597656, -388.44500732421875, -373.07269287109375, -357.7004089355469, -342.328125, -326.955810546875, -311.5835266113281, -296.2112121582031, -280.83892822265625, -265.4666442871094, -250.09434509277344, -234.7220458984375, -219.34976196289062, -203.97747802734375, -188.6051788330078, -173.23289489746094, -157.860595703125, -142.48831176757812, -127.11601257324219, -111.74371337890625, -96.37142181396484, -80.99913024902344, -65.62683868408203, -50.25454330444336, -34.88224792480469, -19.50995635986328, -4.137664794921875, 11.234634399414062, 26.60692596435547, 41.979217529296875, 57.35150909423828, 72.72380065917969, 88.09609985351562, 103.46839141845703, 118.84068298339844, 134.21298217773438, 149.58526611328125, 164.9575653076172, 180.32986450195312, 195.7021484375, 211.07444763183594, 226.44674682617188, 241.81903076171875, 257.19134521484375, 272.5636291503906, 287.9359130859375]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 6.0, 8.0, 10.0, 14.0, 13.0, 17.0, 23.0, 20.0, 22.0, 28.0, 24.0, 34.0, 24.0, 45.0, 43.0, 46.0, 49.0, 44.0, 46.0, 44.0, 38.0, 46.0, 32.0, 46.0, 45.0, 34.0, 29.0, 30.0, 16.0, 19.0, 17.0, 18.0, 11.0, 13.0, 8.0, 7.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-295.79742431640625, -285.4211730957031, -275.0448913574219, -264.66864013671875, -254.29237365722656, -243.91610717773438, -233.53985595703125, -223.16358947753906, -212.78732299804688, -202.4110565185547, -192.0347900390625, -181.65853881835938, -171.2822723388672, -160.906005859375, -150.52975463867188, -140.1534881591797, -129.7772216796875, -119.40095520019531, -109.02469635009766, -98.6484375, -88.27217102050781, -77.89590454101562, -67.51964569091797, -57.14338684082031, -46.767120361328125, -36.3908576965332, -26.01459503173828, -15.63833236694336, -5.2620697021484375, 5.114192962646484, 15.490455627441406, 25.866714477539062, 36.242950439453125, 46.61921310424805, 56.99547576904297, 67.37173461914062, 77.74800109863281, 88.124267578125, 98.50052642822266, 108.87678527832031, 119.2530517578125, 129.6293182373047, 140.00558471679688, 150.3818359375, 160.7581024169922, 171.13436889648438, 181.5106201171875, 191.8868865966797, 202.26315307617188, 212.63941955566406, 223.01568603515625, 233.39193725585938, 243.76820373535156, 254.14447021484375, 264.5207214355469, 274.89697265625, 285.27325439453125, 295.6495056152344, 306.0257873535156, 316.40203857421875, 326.7783203125, 337.1545715332031, 347.53082275390625, 357.9071044921875, 368.2833557128906]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 9.0, 5.0, 7.0, 13.0, 14.0, 10.0, 15.0, 22.0, 23.0, 28.0, 27.0, 31.0, 37.0, 31.0, 41.0, 44.0, 45.0, 50.0, 42.0, 47.0, 44.0, 37.0, 37.0, 39.0, 34.0, 31.0, 32.0, 27.0, 29.0, 29.0, 22.0, 16.0, 16.0, 20.0, 8.0, 15.0, 7.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.3125, -31.13037109375, -29.9482421875, -28.76611328125, -27.583984375, -26.40185546875, -25.2197265625, -24.03759765625, -22.85546875, -21.67333984375, -20.4912109375, -19.30908203125, -18.126953125, -16.94482421875, -15.7626953125, -14.58056640625, -13.3984375, -12.21630859375, -11.0341796875, -9.85205078125, -8.669921875, -7.48779296875, -6.3056640625, -5.12353515625, -3.94140625, -2.75927734375, -1.5771484375, -0.39501953125, 0.787109375, 1.96923828125, 3.1513671875, 4.33349609375, 5.515625, 6.69775390625, 7.8798828125, 9.06201171875, 10.244140625, 11.42626953125, 12.6083984375, 13.79052734375, 14.97265625, 16.15478515625, 17.3369140625, 18.51904296875, 19.701171875, 20.88330078125, 22.0654296875, 23.24755859375, 24.4296875, 25.61181640625, 26.7939453125, 27.97607421875, 29.158203125, 30.34033203125, 31.5224609375, 32.70458984375, 33.88671875, 35.06884765625, 36.2509765625, 37.43310546875, 38.615234375, 39.79736328125, 40.9794921875, 42.16162109375, 43.34375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 6.0, 13.0, 14.0, 22.0, 31.0, 44.0, 57.0, 67.0, 97.0, 149.0, 206.0, 281.0, 414.0, 630.0, 1000.0, 1701.0, 3209.0, 6550.0, 15923.0, 107923.0, 3344770.0, 661933.0, 28622.0, 9761.0, 4614.0, 2312.0, 1280.0, 806.0, 556.0, 368.0, 255.0, 181.0, 128.0, 88.0, 62.0, 53.0, 34.0, 30.0, 24.0, 14.0, 11.0, 8.0, 13.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-111.25, -107.509765625, -103.76953125, -100.029296875, -96.2890625, -92.548828125, -88.80859375, -85.068359375, -81.328125, -77.587890625, -73.84765625, -70.107421875, -66.3671875, -62.626953125, -58.88671875, -55.146484375, -51.40625, -47.666015625, -43.92578125, -40.185546875, -36.4453125, -32.705078125, -28.96484375, -25.224609375, -21.484375, -17.744140625, -14.00390625, -10.263671875, -6.5234375, -2.783203125, 0.95703125, 4.697265625, 8.4375, 12.177734375, 15.91796875, 19.658203125, 23.3984375, 27.138671875, 30.87890625, 34.619140625, 38.359375, 42.099609375, 45.83984375, 49.580078125, 53.3203125, 57.060546875, 60.80078125, 64.541015625, 68.28125, 72.021484375, 75.76171875, 79.501953125, 83.2421875, 86.982421875, 90.72265625, 94.462890625, 98.203125, 101.943359375, 105.68359375, 109.423828125, 113.1640625, 116.904296875, 120.64453125, 124.384765625, 128.125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 3.0, 6.0, 4.0, 18.0, 12.0, 17.0, 21.0, 30.0, 28.0, 36.0, 43.0, 109.0, 251.0, 673.0, 1360.0, 771.0, 353.0, 120.0, 44.0, 42.0, 26.0, 25.0, 14.0, 12.0, 10.0, 10.0, 4.0, 7.0, 5.0, 6.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.625, -97.4375, -94.25, -91.0625, -87.875, -84.6875, -81.5, -78.3125, -75.125, -71.9375, -68.75, -65.5625, -62.375, -59.1875, -56.0, -52.8125, -49.625, -46.4375, -43.25, -40.0625, -36.875, -33.6875, -30.5, -27.3125, -24.125, -20.9375, -17.75, -14.5625, -11.375, -8.1875, -5.0, -1.8125, 1.375, 4.5625, 7.75, 10.9375, 14.125, 17.3125, 20.5, 23.6875, 26.875, 30.0625, 33.25, 36.4375, 39.625, 42.8125, 46.0, 49.1875, 52.375, 55.5625, 58.75, 61.9375, 65.125, 68.3125, 71.5, 74.6875, 77.875, 81.0625, 84.25, 87.4375, 90.625, 93.8125, 97.0, 100.1875, 103.375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 11.0, 9.0, 17.0, 14.0, 28.0, 51.0, 86.0, 168.0, 412.0, 1004.0, 2404.0, 7092.0, 25398.0, 185188.0, 3862281.0, 84823.0, 16940.0, 5056.0, 1908.0, 664.0, 332.0, 149.0, 84.0, 52.0, 33.0, 29.0, 11.0, 6.0, 7.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-249.75, -242.03125, -234.3125, -226.59375, -218.875, -211.15625, -203.4375, -195.71875, -188.0, -180.28125, -172.5625, -164.84375, -157.125, -149.40625, -141.6875, -133.96875, -126.25, -118.53125, -110.8125, -103.09375, -95.375, -87.65625, -79.9375, -72.21875, -64.5, -56.78125, -49.0625, -41.34375, -33.625, -25.90625, -18.1875, -10.46875, -2.75, 4.96875, 12.6875, 20.40625, 28.125, 35.84375, 43.5625, 51.28125, 59.0, 66.71875, 74.4375, 82.15625, 89.875, 97.59375, 105.3125, 113.03125, 120.75, 128.46875, 136.1875, 143.90625, 151.625, 159.34375, 167.0625, 174.78125, 182.5, 190.21875, 197.9375, 205.65625, 213.375, 221.09375, 228.8125, 236.53125, 244.25]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 8.0, 8.0, 12.0, 24.0, 18.0, 51.0, 70.0, 140.0, 280.0, 203.0, 89.0, 53.0, 21.0, 14.0, 11.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-250.4799346923828, -229.0304412841797, -207.58096313476562, -186.1314697265625, -164.68197631835938, -143.2324981689453, -121.78300476074219, -100.33352661132812, -78.884033203125, -57.434547424316406, -35.98505783081055, -14.535568237304688, 6.913917541503906, 28.3634033203125, 49.812896728515625, 71.26237487792969, 92.71186828613281, 114.1613540649414, 135.61083984375, 157.06033325195312, 178.50982666015625, 199.9593048095703, 221.40879821777344, 242.8582763671875, 264.3077697753906, 285.75726318359375, 307.2067565917969, 328.65625, 350.105712890625, 371.5552062988281, 393.00469970703125, 414.45416259765625, 435.90362548828125, 457.3531188964844, 478.8026123046875, 500.2520751953125, 521.7015991210938, 543.1510620117188, 564.6005859375, 586.050048828125, 607.49951171875, 628.948974609375, 650.3984985351562, 671.8479614257812, 693.2974853515625, 714.7469482421875, 736.1964111328125, 757.6459350585938, 779.095458984375, 800.544921875, 821.9944458007812, 843.4439086914062, 864.8934326171875, 886.3428955078125, 907.7923583984375, 929.2418823242188, 950.6913452148438, 972.1408081054688, 993.59033203125, 1015.039794921875, 1036.4892578125, 1057.938720703125, 1079.3883056640625, 1100.8377685546875, 1122.2872314453125]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 8.0, 3.0, 8.0, 13.0, 11.0, 9.0, 19.0, 17.0, 13.0, 27.0, 23.0, 31.0, 14.0, 38.0, 43.0, 38.0, 42.0, 40.0, 48.0, 43.0, 42.0, 26.0, 35.0, 35.0, 41.0, 24.0, 38.0, 33.0, 26.0, 29.0, 23.0, 21.0, 19.0, 20.0, 16.0, 16.0, 8.0, 8.0, 10.0, 3.0, 8.0, 0.0, 4.0, 6.0, 3.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-208.52981567382812, -201.77549743652344, -195.0211639404297, -188.266845703125, -181.5125274658203, -174.75820922851562, -168.00387573242188, -161.2495574951172, -154.4952392578125, -147.7409210205078, -140.98658752441406, -134.23226928710938, -127.47795104980469, -120.72362518310547, -113.96929931640625, -107.21498107910156, -100.46064758300781, -93.7063217163086, -86.9520034790039, -80.19767761230469, -73.443359375, -66.68903350830078, -59.93470764160156, -53.18038558959961, -46.426063537597656, -39.6717414855957, -32.91741943359375, -26.16309356689453, -19.408771514892578, -12.654449462890625, -5.900123596191406, 0.8541984558105469, 7.6085205078125, 14.36284351348877, 21.11716651916504, 27.871490478515625, 34.62581253051758, 41.38013458251953, 48.13446044921875, 54.8887825012207, 61.643104553222656, 68.39743041992188, 75.15174865722656, 81.90607452392578, 88.660400390625, 95.41471862792969, 102.1690444946289, 108.92337036132812, 115.67768859863281, 122.43201446533203, 129.18634033203125, 135.94065856933594, 142.69497680664062, 149.44931030273438, 156.20362854003906, 162.95794677734375, 169.7122802734375, 176.4665985107422, 183.22093200683594, 189.97525024414062, 196.7295684814453, 203.48388671875, 210.23822021484375, 216.99253845214844, 223.74685668945312]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 11.0, 6.0, 8.0, 14.0, 12.0, 15.0, 20.0, 12.0, 20.0, 28.0, 30.0, 29.0, 43.0, 35.0, 30.0, 50.0, 35.0, 35.0, 52.0, 49.0, 43.0, 43.0, 37.0, 27.0, 38.0, 28.0, 34.0, 38.0, 25.0, 25.0, 16.0, 21.0, 17.0, 12.0, 8.0, 11.0, 10.0, 4.0, 4.0, 4.0, 8.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.46875, -32.3173828125, -31.166015625, -30.0146484375, -28.86328125, -27.7119140625, -26.560546875, -25.4091796875, -24.2578125, -23.1064453125, -21.955078125, -20.8037109375, -19.65234375, -18.5009765625, -17.349609375, -16.1982421875, -15.046875, -13.8955078125, -12.744140625, -11.5927734375, -10.44140625, -9.2900390625, -8.138671875, -6.9873046875, -5.8359375, -4.6845703125, -3.533203125, -2.3818359375, -1.23046875, -0.0791015625, 1.072265625, 2.2236328125, 3.375, 4.5263671875, 5.677734375, 6.8291015625, 7.98046875, 9.1318359375, 10.283203125, 11.4345703125, 12.5859375, 13.7373046875, 14.888671875, 16.0400390625, 17.19140625, 18.3427734375, 19.494140625, 20.6455078125, 21.796875, 22.9482421875, 24.099609375, 25.2509765625, 26.40234375, 27.5537109375, 28.705078125, 29.8564453125, 31.0078125, 32.1591796875, 33.310546875, 34.4619140625, 35.61328125, 36.7646484375, 37.916015625, 39.0673828125, 40.21875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 12.0, 8.0, 11.0, 33.0, 37.0, 59.0, 81.0, 138.0, 190.0, 283.0, 386.0, 601.0, 948.0, 1321.0, 1915.0, 2915.0, 4177.0, 6337.0, 9697.0, 14948.0, 23761.0, 37484.0, 62092.0, 109445.0, 285302.0, 227461.0, 101411.0, 58079.0, 35279.0, 22035.0, 14275.0, 9318.0, 5993.0, 4072.0, 2729.0, 1842.0, 1249.0, 789.0, 576.0, 412.0, 276.0, 185.0, 110.0, 87.0, 53.0, 44.0, 31.0, 23.0, 14.0, 13.0, 7.0, 2.0, 4.0, 4.0], "bins": [-1.4638671875, -1.421966552734375, -1.38006591796875, -1.338165283203125, -1.2962646484375, -1.254364013671875, -1.21246337890625, -1.170562744140625, -1.128662109375, -1.086761474609375, -1.04486083984375, -1.002960205078125, -0.9610595703125, -0.919158935546875, -0.87725830078125, -0.835357666015625, -0.79345703125, -0.751556396484375, -0.70965576171875, -0.667755126953125, -0.6258544921875, -0.583953857421875, -0.54205322265625, -0.500152587890625, -0.458251953125, -0.416351318359375, -0.37445068359375, -0.332550048828125, -0.2906494140625, -0.248748779296875, -0.20684814453125, -0.164947509765625, -0.123046875, -0.081146240234375, -0.03924560546875, 0.002655029296875, 0.0445556640625, 0.086456298828125, 0.12835693359375, 0.170257568359375, 0.212158203125, 0.254058837890625, 0.29595947265625, 0.337860107421875, 0.3797607421875, 0.421661376953125, 0.46356201171875, 0.505462646484375, 0.54736328125, 0.589263916015625, 0.63116455078125, 0.673065185546875, 0.7149658203125, 0.756866455078125, 0.79876708984375, 0.840667724609375, 0.882568359375, 0.924468994140625, 0.96636962890625, 1.008270263671875, 1.0501708984375, 1.092071533203125, 1.13397216796875, 1.175872802734375, 1.2177734375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 3.0, 8.0, 11.0, 10.0, 15.0, 15.0, 21.0, 22.0, 14.0, 24.0, 26.0, 22.0, 33.0, 45.0, 34.0, 35.0, 38.0, 39.0, 39.0, 32.0, 1071.0, 45.0, 33.0, 35.0, 32.0, 34.0, 34.0, 28.0, 29.0, 28.0, 21.0, 23.0, 17.0, 17.0, 10.0, 15.0, 14.0, 9.0, 12.0, 6.0, 5.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.734375, -19.055419921875, -18.37646484375, -17.697509765625, -17.0185546875, -16.339599609375, -15.66064453125, -14.981689453125, -14.302734375, -13.623779296875, -12.94482421875, -12.265869140625, -11.5869140625, -10.907958984375, -10.22900390625, -9.550048828125, -8.87109375, -8.192138671875, -7.51318359375, -6.834228515625, -6.1552734375, -5.476318359375, -4.79736328125, -4.118408203125, -3.439453125, -2.760498046875, -2.08154296875, -1.402587890625, -0.7236328125, -0.044677734375, 0.63427734375, 1.313232421875, 1.9921875, 2.671142578125, 3.35009765625, 4.029052734375, 4.7080078125, 5.386962890625, 6.06591796875, 6.744873046875, 7.423828125, 8.102783203125, 8.78173828125, 9.460693359375, 10.1396484375, 10.818603515625, 11.49755859375, 12.176513671875, 12.85546875, 13.534423828125, 14.21337890625, 14.892333984375, 15.5712890625, 16.250244140625, 16.92919921875, 17.608154296875, 18.287109375, 18.966064453125, 19.64501953125, 20.323974609375, 21.0029296875, 21.681884765625, 22.36083984375, 23.039794921875, 23.71875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 9.0, 11.0, 26.0, 25.0, 26.0, 44.0, 64.0, 88.0, 125.0, 198.0, 276.0, 408.0, 640.0, 886.0, 1249.0, 1803.0, 2607.0, 4059.0, 6044.0, 9091.0, 13531.0, 20978.0, 32871.0, 52618.0, 87603.0, 167808.0, 1365369.0, 129052.0, 73164.0, 44669.0, 27761.0, 18165.0, 11810.0, 7914.0, 5244.0, 3470.0, 2345.0, 1566.0, 1090.0, 725.0, 520.0, 346.0, 269.0, 166.0, 112.0, 76.0, 69.0, 49.0, 29.0, 20.0, 16.0, 13.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.970703125, -0.940673828125, -0.91064453125, -0.880615234375, -0.8505859375, -0.820556640625, -0.79052734375, -0.760498046875, -0.73046875, -0.700439453125, -0.67041015625, -0.640380859375, -0.6103515625, -0.580322265625, -0.55029296875, -0.520263671875, -0.490234375, -0.460205078125, -0.43017578125, -0.400146484375, -0.3701171875, -0.340087890625, -0.31005859375, -0.280029296875, -0.25, -0.219970703125, -0.18994140625, -0.159912109375, -0.1298828125, -0.099853515625, -0.06982421875, -0.039794921875, -0.009765625, 0.020263671875, 0.05029296875, 0.080322265625, 0.1103515625, 0.140380859375, 0.17041015625, 0.200439453125, 0.23046875, 0.260498046875, 0.29052734375, 0.320556640625, 0.3505859375, 0.380615234375, 0.41064453125, 0.440673828125, 0.470703125, 0.500732421875, 0.53076171875, 0.560791015625, 0.5908203125, 0.620849609375, 0.65087890625, 0.680908203125, 0.7109375, 0.740966796875, 0.77099609375, 0.801025390625, 0.8310546875, 0.861083984375, 0.89111328125, 0.921142578125, 0.951171875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 3.0, 9.0, 9.0, 8.0, 26.0, 23.0, 31.0, 42.0, 70.0, 120.0, 332.0, 87.0, 73.0, 31.0, 29.0, 27.0, 14.0, 12.0, 6.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.987022399902344e-05, -7.731374353170395e-05, -7.475726306438446e-05, -7.220078259706497e-05, -6.964430212974548e-05, -6.7087821662426e-05, -6.45313411951065e-05, -6.197486072778702e-05, -5.941838026046753e-05, -5.686189979314804e-05, -5.430541932582855e-05, -5.1748938858509064e-05, -4.9192458391189575e-05, -4.663597792387009e-05, -4.40794974565506e-05, -4.152301698923111e-05, -3.896653652191162e-05, -3.641005605459213e-05, -3.3853575587272644e-05, -3.1297095119953156e-05, -2.8740614652633667e-05, -2.618413418531418e-05, -2.362765371799469e-05, -2.10711732506752e-05, -1.8514692783355713e-05, -1.5958212316036224e-05, -1.3401731848716736e-05, -1.0845251381397247e-05, -8.288770914077759e-06, -5.73229044675827e-06, -3.1758099794387817e-06, -6.193295121192932e-07, 1.9371509552001953e-06, 4.493631422519684e-06, 7.050111889839172e-06, 9.606592357158661e-06, 1.216307282447815e-05, 1.4719553291797638e-05, 1.7276033759117126e-05, 1.9832514226436615e-05, 2.2388994693756104e-05, 2.4945475161075592e-05, 2.750195562839508e-05, 3.005843609571457e-05, 3.261491656303406e-05, 3.5171397030353546e-05, 3.7727877497673035e-05, 4.028435796499252e-05, 4.284083843231201e-05, 4.53973188996315e-05, 4.795379936695099e-05, 5.051027983427048e-05, 5.3066760301589966e-05, 5.5623240768909454e-05, 5.817972123622894e-05, 6.073620170354843e-05, 6.329268217086792e-05, 6.584916263818741e-05, 6.84056431055069e-05, 7.096212357282639e-05, 7.351860404014587e-05, 7.607508450746536e-05, 7.863156497478485e-05, 8.118804544210434e-05, 8.374452590942383e-05]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 8.0, 8.0, 10.0, 19.0, 22.0, 34.0, 60.0, 114.0, 555.0, 6154.0, 986418.0, 53136.0, 1549.0, 247.0, 71.0, 34.0, 32.0, 14.0, 11.0, 10.0, 8.0, 3.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001468658447265625, -0.0014238208532333374, -0.0013789832592010498, -0.0013341456651687622, -0.0012893080711364746, -0.001244470477104187, -0.0011996328830718994, -0.0011547952890396118, -0.0011099576950073242, -0.0010651201009750366, -0.001020282506942749, -0.0009754449129104614, -0.0009306073188781738, -0.0008857697248458862, -0.0008409321308135986, -0.000796094536781311, -0.0007512569427490234, -0.0007064193487167358, -0.0006615817546844482, -0.0006167441606521606, -0.000571906566619873, -0.0005270689725875854, -0.00048223137855529785, -0.00043739378452301025, -0.00039255619049072266, -0.00034771859645843506, -0.00030288100242614746, -0.00025804340839385986, -0.00021320581436157227, -0.00016836822032928467, -0.00012353062629699707, -7.869303226470947e-05, -3.3855438232421875e-05, 1.0982155799865723e-05, 5.581974983215332e-05, 0.00010065734386444092, 0.00014549493789672852, 0.0001903325319290161, 0.0002351701259613037, 0.0002800077199935913, 0.0003248453140258789, 0.0003696829080581665, 0.0004145205020904541, 0.0004593580961227417, 0.0005041956901550293, 0.0005490332841873169, 0.0005938708782196045, 0.0006387084722518921, 0.0006835460662841797, 0.0007283836603164673, 0.0007732212543487549, 0.0008180588483810425, 0.0008628964424133301, 0.0009077340364456177, 0.0009525716304779053, 0.0009974092245101929, 0.0010422468185424805, 0.001087084412574768, 0.0011319220066070557, 0.0011767596006393433, 0.0012215971946716309, 0.0012664347887039185, 0.001311272382736206, 0.0013561099767684937, 0.0014009475708007812]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 24.0, 42.0, 80.0, 246.0, 388.0, 133.0, 39.0, 25.0, 13.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00015841747517697513, -0.00015544008056167513, -0.0001524626713944599, -0.0001494852767791599, -0.0001465078821638599, -0.0001435304875485599, -0.00014055307838134468, -0.00013757568376604468, -0.00013459828915074468, -0.00013162089453544468, -0.00012864348536822945, -0.00012566609075292945, -0.00012268869613762945, -0.00011971129424637184, -0.00011673389235511422, -0.00011375649773981422, -0.000110779088572599, -0.00010780168668134138, -0.00010482429206604138, -0.00010184689017478377, -9.886949555948377e-05, -9.589209366822615e-05, -9.291469177696854e-05, -8.993729716166854e-05, -8.695990254636854e-05, -8.398250065511093e-05, -8.100510603981093e-05, -7.802770414855331e-05, -7.505030953325331e-05, -7.20729076419957e-05, -6.909550575073808e-05, -6.611811113543808e-05, -6.314070924418047e-05, -6.0163310990901664e-05, -5.718591273762286e-05, -5.420851084636524e-05, -5.1231112593086436e-05, -4.825371433980763e-05, -4.527631608652882e-05, -4.2298917833250016e-05, -3.93215159419924e-05, -3.6344117688713595e-05, -3.336671943543479e-05, -3.0389319363166578e-05, -2.7411919290898368e-05, -2.443452103761956e-05, -2.1457122784340754e-05, -1.8479722712072544e-05, -1.550232627778314e-05, -1.2524927115009632e-05, -9.547527952236123e-06, -6.570129698957317e-06, -3.592730536183808e-06, -6.153313734102994e-07, 2.3620668798685074e-06, 5.339466952136718e-06, 8.316865205415525e-06, 1.1294264368189033e-05, 1.4271663530962542e-05, 1.724906178424135e-05, 2.0226460037520155e-05, 2.3203860109788366e-05, 2.6181258363067172e-05, 2.9158658435335383e-05, 3.213605668861419e-05]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 3.0, 11.0, 7.0, 17.0, 7.0, 16.0, 12.0, 17.0, 16.0, 23.0, 23.0, 22.0, 21.0, 29.0, 42.0, 29.0, 34.0, 35.0, 34.0, 38.0, 38.0, 39.0, 34.0, 25.0, 40.0, 39.0, 42.0, 40.0, 29.0, 21.0, 25.0, 22.0, 20.0, 24.0, 17.0, 13.0, 16.0, 13.0, 15.0, 13.0, 4.0, 7.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5093555450439453e-05, -2.4335458874702454e-05, -2.3577362298965454e-05, -2.2819265723228455e-05, -2.2061169147491455e-05, -2.1303072571754456e-05, -2.0544975996017456e-05, -1.9786879420280457e-05, -1.9028782844543457e-05, -1.8270686268806458e-05, -1.7512589693069458e-05, -1.675449311733246e-05, -1.599639654159546e-05, -1.523829996585846e-05, -1.448020339012146e-05, -1.372210681438446e-05, -1.2964010238647461e-05, -1.2205913662910461e-05, -1.1447817087173462e-05, -1.0689720511436462e-05, -9.931623935699463e-06, -9.173527359962463e-06, -8.415430784225464e-06, -7.657334208488464e-06, -6.899237632751465e-06, -6.141141057014465e-06, -5.383044481277466e-06, -4.624947905540466e-06, -3.866851329803467e-06, -3.1087547540664673e-06, -2.3506581783294678e-06, -1.5925616025924683e-06, -8.344650268554688e-07, -7.636845111846924e-08, 6.817281246185303e-07, 1.4398247003555298e-06, 2.1979212760925293e-06, 2.956017851829529e-06, 3.7141144275665283e-06, 4.472211003303528e-06, 5.230307579040527e-06, 5.988404154777527e-06, 6.746500730514526e-06, 7.504597306251526e-06, 8.262693881988525e-06, 9.020790457725525e-06, 9.778887033462524e-06, 1.0536983609199524e-05, 1.1295080184936523e-05, 1.2053176760673523e-05, 1.2811273336410522e-05, 1.3569369912147522e-05, 1.4327466487884521e-05, 1.5085563063621521e-05, 1.584365963935852e-05, 1.660175621509552e-05, 1.735985279083252e-05, 1.811794936656952e-05, 1.887604594230652e-05, 1.9634142518043518e-05, 2.0392239093780518e-05, 2.1150335669517517e-05, 2.1908432245254517e-05, 2.2666528820991516e-05, 2.3424625396728516e-05]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 11.0, 6.0, 8.0, 14.0, 12.0, 15.0, 20.0, 12.0, 20.0, 28.0, 30.0, 29.0, 43.0, 35.0, 30.0, 50.0, 35.0, 35.0, 52.0, 49.0, 43.0, 43.0, 37.0, 27.0, 38.0, 28.0, 34.0, 38.0, 25.0, 25.0, 16.0, 21.0, 17.0, 12.0, 8.0, 11.0, 10.0, 4.0, 4.0, 4.0, 8.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.46875, -32.3173828125, -31.166015625, -30.0146484375, -28.86328125, -27.7119140625, -26.560546875, -25.4091796875, -24.2578125, -23.1064453125, -21.955078125, -20.8037109375, -19.65234375, -18.5009765625, -17.349609375, -16.1982421875, -15.046875, -13.8955078125, -12.744140625, -11.5927734375, -10.44140625, -9.2900390625, -8.138671875, -6.9873046875, -5.8359375, -4.6845703125, -3.533203125, -2.3818359375, -1.23046875, -0.0791015625, 1.072265625, 2.2236328125, 3.375, 4.5263671875, 5.677734375, 6.8291015625, 7.98046875, 9.1318359375, 10.283203125, 11.4345703125, 12.5859375, 13.7373046875, 14.888671875, 16.0400390625, 17.19140625, 18.3427734375, 19.494140625, 20.6455078125, 21.796875, 22.9482421875, 24.099609375, 25.2509765625, 26.40234375, 27.5537109375, 28.705078125, 29.8564453125, 31.0078125, 32.1591796875, 33.310546875, 34.4619140625, 35.61328125, 36.7646484375, 37.916015625, 39.0673828125, 40.21875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 11.0, 11.0, 15.0, 16.0, 23.0, 29.0, 52.0, 56.0, 109.0, 135.0, 215.0, 274.0, 407.0, 598.0, 894.0, 1182.0, 1875.0, 2788.0, 4336.0, 8806.0, 148015.0, 843968.0, 18932.0, 5490.0, 3434.0, 2205.0, 1464.0, 955.0, 644.0, 486.0, 314.0, 231.0, 166.0, 114.0, 82.0, 56.0, 51.0, 39.0, 17.0, 18.0, 10.0, 7.0, 4.0, 10.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.1875, -73.8935546875, -71.599609375, -69.3056640625, -67.01171875, -64.7177734375, -62.423828125, -60.1298828125, -57.8359375, -55.5419921875, -53.248046875, -50.9541015625, -48.66015625, -46.3662109375, -44.072265625, -41.7783203125, -39.484375, -37.1904296875, -34.896484375, -32.6025390625, -30.30859375, -28.0146484375, -25.720703125, -23.4267578125, -21.1328125, -18.8388671875, -16.544921875, -14.2509765625, -11.95703125, -9.6630859375, -7.369140625, -5.0751953125, -2.78125, -0.4873046875, 1.806640625, 4.1005859375, 6.39453125, 8.6884765625, 10.982421875, 13.2763671875, 15.5703125, 17.8642578125, 20.158203125, 22.4521484375, 24.74609375, 27.0400390625, 29.333984375, 31.6279296875, 33.921875, 36.2158203125, 38.509765625, 40.8037109375, 43.09765625, 45.3916015625, 47.685546875, 49.9794921875, 52.2734375, 54.5673828125, 56.861328125, 59.1552734375, 61.44921875, 63.7431640625, 66.037109375, 68.3310546875, 70.625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 9.0, 12.0, 11.0, 12.0, 15.0, 17.0, 19.0, 24.0, 19.0, 24.0, 29.0, 30.0, 33.0, 29.0, 39.0, 55.0, 71.0, 117.0, 1910.0, 79.0, 63.0, 48.0, 45.0, 34.0, 26.0, 30.0, 30.0, 23.0, 26.0, 32.0, 22.0, 17.0, 10.0, 8.0, 5.0, 12.0, 11.0, 9.0, 10.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-101.25, -98.1181640625, -94.986328125, -91.8544921875, -88.72265625, -85.5908203125, -82.458984375, -79.3271484375, -76.1953125, -73.0634765625, -69.931640625, -66.7998046875, -63.66796875, -60.5361328125, -57.404296875, -54.2724609375, -51.140625, -48.0087890625, -44.876953125, -41.7451171875, -38.61328125, -35.4814453125, -32.349609375, -29.2177734375, -26.0859375, -22.9541015625, -19.822265625, -16.6904296875, -13.55859375, -10.4267578125, -7.294921875, -4.1630859375, -1.03125, 2.1005859375, 5.232421875, 8.3642578125, 11.49609375, 14.6279296875, 17.759765625, 20.8916015625, 24.0234375, 27.1552734375, 30.287109375, 33.4189453125, 36.55078125, 39.6826171875, 42.814453125, 45.9462890625, 49.078125, 52.2099609375, 55.341796875, 58.4736328125, 61.60546875, 64.7373046875, 67.869140625, 71.0009765625, 74.1328125, 77.2646484375, 80.396484375, 83.5283203125, 86.66015625, 89.7919921875, 92.923828125, 96.0556640625, 99.1875]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 13.0, 8.0, 28.0, 34.0, 49.0, 67.0, 93.0, 190.0, 306.0, 759.0, 3523.0, 58204.0, 3073650.0, 6689.0, 1180.0, 400.0, 202.0, 103.0, 76.0, 49.0, 23.0, 15.0, 10.0, 6.0, 6.0, 4.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-380.75, -367.6953125, -354.640625, -341.5859375, -328.53125, -315.4765625, -302.421875, -289.3671875, -276.3125, -263.2578125, -250.203125, -237.1484375, -224.09375, -211.0390625, -197.984375, -184.9296875, -171.875, -158.8203125, -145.765625, -132.7109375, -119.65625, -106.6015625, -93.546875, -80.4921875, -67.4375, -54.3828125, -41.328125, -28.2734375, -15.21875, -2.1640625, 10.890625, 23.9453125, 37.0, 50.0546875, 63.109375, 76.1640625, 89.21875, 102.2734375, 115.328125, 128.3828125, 141.4375, 154.4921875, 167.546875, 180.6015625, 193.65625, 206.7109375, 219.765625, 232.8203125, 245.875, 258.9296875, 271.984375, 285.0390625, 298.09375, 311.1484375, 324.203125, 337.2578125, 350.3125, 363.3671875, 376.421875, 389.4765625, 402.53125, 415.5859375, 428.640625, 441.6953125, 454.75]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 13.0, 150.0, 667.0, 159.0, 20.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1370.9456787109375, -1343.770751953125, -1316.5958251953125, -1289.4208984375, -1262.2459716796875, -1235.071044921875, -1207.8961181640625, -1180.72119140625, -1153.5462646484375, -1126.371337890625, -1099.1964111328125, -1072.021484375, -1044.8465576171875, -1017.671630859375, -990.4967041015625, -963.32177734375, -936.1469116210938, -908.9719848632812, -881.7970581054688, -854.6221313476562, -827.4472045898438, -800.2722778320312, -773.097412109375, -745.9224853515625, -718.74755859375, -691.5726318359375, -664.397705078125, -637.2227783203125, -610.0478515625, -582.8729248046875, -555.697998046875, -528.5230712890625, -501.34820556640625, -474.17327880859375, -446.99835205078125, -419.82342529296875, -392.64849853515625, -365.47357177734375, -338.2986755371094, -311.1237487792969, -283.9488220214844, -256.7738952636719, -229.59896850585938, -202.42405700683594, -175.24913024902344, -148.07420349121094, -120.8992919921875, -93.724365234375, -66.5494384765625, -39.374515533447266, -12.199592590332031, 14.975326538085938, 42.15025329589844, 69.32518005371094, 96.50009155273438, 123.67501831054688, 150.84994506835938, 178.02487182617188, 205.19979858398438, 232.3747100830078, 259.54962158203125, 286.72454833984375, 313.89947509765625, 341.07440185546875, 368.24932861328125]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 5.0, 1.0, 6.0, 12.0, 6.0, 12.0, 15.0, 18.0, 16.0, 21.0, 22.0, 31.0, 32.0, 33.0, 47.0, 38.0, 47.0, 36.0, 31.0, 51.0, 52.0, 41.0, 42.0, 41.0, 42.0, 38.0, 31.0, 30.0, 24.0, 25.0, 26.0, 23.0, 20.0, 14.0, 20.0, 11.0, 7.0, 13.0, 9.0, 4.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-287.1763610839844, -277.3305969238281, -267.4848327636719, -257.6390686035156, -247.7932891845703, -237.94752502441406, -228.10174560546875, -218.2559814453125, -208.41021728515625, -198.564453125, -188.71868896484375, -178.87290954589844, -169.0271453857422, -159.18138122558594, -149.33560180664062, -139.48983764648438, -129.64407348632812, -119.79830932617188, -109.9525375366211, -100.10676574707031, -90.26100158691406, -80.41523742675781, -70.56946563720703, -60.72369384765625, -50.8779296875, -41.032161712646484, -31.18639373779297, -21.340625762939453, -11.494857788085938, -1.6490898132324219, 8.196678161621094, 18.042449951171875, 27.888214111328125, 37.73398208618164, 47.579750061035156, 57.42551803588867, 67.27128601074219, 77.11705017089844, 86.96282196044922, 96.80859375, 106.65435791015625, 116.5001220703125, 126.34589385986328, 136.19166564941406, 146.0374298095703, 155.88319396972656, 165.72897338867188, 175.57473754882812, 185.42050170898438, 195.26626586914062, 205.11203002929688, 214.9578094482422, 224.80357360839844, 234.6493377685547, 244.4951171875, 254.34088134765625, 264.1866455078125, 274.03240966796875, 283.878173828125, 293.72393798828125, 303.5697021484375, 313.4154968261719, 323.2612609863281, 333.1070251464844, 342.9527893066406]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 10.0, 5.0, 8.0, 14.0, 9.0, 14.0, 23.0, 21.0, 17.0, 35.0, 27.0, 30.0, 28.0, 35.0, 37.0, 42.0, 47.0, 42.0, 41.0, 48.0, 38.0, 32.0, 50.0, 42.0, 36.0, 24.0, 36.0, 27.0, 29.0, 27.0, 18.0, 16.0, 12.0, 12.0, 16.0, 10.0, 7.0, 4.0, 6.0, 4.0, 7.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-34.40625, -33.22021484375, -32.0341796875, -30.84814453125, -29.662109375, -28.47607421875, -27.2900390625, -26.10400390625, -24.91796875, -23.73193359375, -22.5458984375, -21.35986328125, -20.173828125, -18.98779296875, -17.8017578125, -16.61572265625, -15.4296875, -14.24365234375, -13.0576171875, -11.87158203125, -10.685546875, -9.49951171875, -8.3134765625, -7.12744140625, -5.94140625, -4.75537109375, -3.5693359375, -2.38330078125, -1.197265625, -0.01123046875, 1.1748046875, 2.36083984375, 3.546875, 4.73291015625, 5.9189453125, 7.10498046875, 8.291015625, 9.47705078125, 10.6630859375, 11.84912109375, 13.03515625, 14.22119140625, 15.4072265625, 16.59326171875, 17.779296875, 18.96533203125, 20.1513671875, 21.33740234375, 22.5234375, 23.70947265625, 24.8955078125, 26.08154296875, 27.267578125, 28.45361328125, 29.6396484375, 30.82568359375, 32.01171875, 33.19775390625, 34.3837890625, 35.56982421875, 36.755859375, 37.94189453125, 39.1279296875, 40.31396484375, 41.5]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 10.0, 12.0, 20.0, 32.0, 34.0, 64.0, 94.0, 125.0, 153.0, 242.0, 347.0, 408.0, 612.0, 866.0, 1258.0, 1890.0, 3093.0, 4953.0, 8521.0, 18988.0, 108854.0, 2237765.0, 1679946.0, 87767.0, 16560.0, 8287.0, 4617.0, 2875.0, 1793.0, 1211.0, 841.0, 519.0, 390.0, 322.0, 229.0, 153.0, 109.0, 84.0, 70.0, 55.0, 30.0, 17.0, 24.0, 10.0, 7.0, 12.0, 6.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-92.9375, -90.029296875, -87.12109375, -84.212890625, -81.3046875, -78.396484375, -75.48828125, -72.580078125, -69.671875, -66.763671875, -63.85546875, -60.947265625, -58.0390625, -55.130859375, -52.22265625, -49.314453125, -46.40625, -43.498046875, -40.58984375, -37.681640625, -34.7734375, -31.865234375, -28.95703125, -26.048828125, -23.140625, -20.232421875, -17.32421875, -14.416015625, -11.5078125, -8.599609375, -5.69140625, -2.783203125, 0.125, 3.033203125, 5.94140625, 8.849609375, 11.7578125, 14.666015625, 17.57421875, 20.482421875, 23.390625, 26.298828125, 29.20703125, 32.115234375, 35.0234375, 37.931640625, 40.83984375, 43.748046875, 46.65625, 49.564453125, 52.47265625, 55.380859375, 58.2890625, 61.197265625, 64.10546875, 67.013671875, 69.921875, 72.830078125, 75.73828125, 78.646484375, 81.5546875, 84.462890625, 87.37109375, 90.279296875, 93.1875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 4.0, 7.0, 5.0, 11.0, 14.0, 14.0, 11.0, 19.0, 21.0, 30.0, 44.0, 76.0, 139.0, 291.0, 689.0, 1135.0, 821.0, 315.0, 150.0, 71.0, 49.0, 37.0, 18.0, 19.0, 10.0, 11.0, 13.0, 2.0, 7.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-92.375, -89.6240234375, -86.873046875, -84.1220703125, -81.37109375, -78.6201171875, -75.869140625, -73.1181640625, -70.3671875, -67.6162109375, -64.865234375, -62.1142578125, -59.36328125, -56.6123046875, -53.861328125, -51.1103515625, -48.359375, -45.6083984375, -42.857421875, -40.1064453125, -37.35546875, -34.6044921875, -31.853515625, -29.1025390625, -26.3515625, -23.6005859375, -20.849609375, -18.0986328125, -15.34765625, -12.5966796875, -9.845703125, -7.0947265625, -4.34375, -1.5927734375, 1.158203125, 3.9091796875, 6.66015625, 9.4111328125, 12.162109375, 14.9130859375, 17.6640625, 20.4150390625, 23.166015625, 25.9169921875, 28.66796875, 31.4189453125, 34.169921875, 36.9208984375, 39.671875, 42.4228515625, 45.173828125, 47.9248046875, 50.67578125, 53.4267578125, 56.177734375, 58.9287109375, 61.6796875, 64.4306640625, 67.181640625, 69.9326171875, 72.68359375, 75.4345703125, 78.185546875, 80.9365234375, 83.6875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 3.0, 5.0, 5.0, 4.0, 8.0, 8.0, 15.0, 31.0, 38.0, 102.0, 154.0, 230.0, 418.0, 834.0, 1524.0, 3128.0, 7198.0, 19407.0, 85447.0, 3690900.0, 330569.0, 34235.0, 10951.0, 4500.0, 2113.0, 1120.0, 520.0, 337.0, 162.0, 96.0, 62.0, 43.0, 28.0, 18.0, 12.0, 12.0, 6.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-202.25, -195.875, -189.5, -183.125, -176.75, -170.375, -164.0, -157.625, -151.25, -144.875, -138.5, -132.125, -125.75, -119.375, -113.0, -106.625, -100.25, -93.875, -87.5, -81.125, -74.75, -68.375, -62.0, -55.625, -49.25, -42.875, -36.5, -30.125, -23.75, -17.375, -11.0, -4.625, 1.75, 8.125, 14.5, 20.875, 27.25, 33.625, 40.0, 46.375, 52.75, 59.125, 65.5, 71.875, 78.25, 84.625, 91.0, 97.375, 103.75, 110.125, 116.5, 122.875, 129.25, 135.625, 142.0, 148.375, 154.75, 161.125, 167.5, 173.875, 180.25, 186.625, 193.0, 199.375, 205.75]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 8.0, 9.0, 22.0, 35.0, 69.0, 133.0, 292.0, 225.0, 118.0, 56.0, 26.0, 9.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-259.5345458984375, -233.40792846679688, -207.28131103515625, -181.15467834472656, -155.02806091308594, -128.9014434814453, -102.77481079101562, -76.648193359375, -50.521575927734375, -24.394954681396484, 1.7316665649414062, 27.858291625976562, 53.98490905761719, 80.11152648925781, 106.2381591796875, 132.36477661132812, 158.49139404296875, 184.61801147460938, 210.74462890625, 236.8712615966797, 262.99786376953125, 289.12451171875, 315.2511291503906, 341.37774658203125, 367.5043640136719, 393.6309814453125, 419.7575988769531, 445.88421630859375, 472.0108642578125, 498.137451171875, 524.2640991210938, 550.3907470703125, 576.517333984375, 602.6439819335938, 628.7705688476562, 654.897216796875, 681.0238037109375, 707.1504516601562, 733.277099609375, 759.4036865234375, 785.5302734375, 811.6569213867188, 837.7835083007812, 863.91015625, 890.0367431640625, 916.1633911132812, 942.2900390625, 968.4166259765625, 994.5432739257812, 1020.669921875, 1046.7965087890625, 1072.923095703125, 1099.0498046875, 1125.1763916015625, 1151.302978515625, 1177.4296875, 1203.5562744140625, 1229.682861328125, 1255.8095703125, 1281.9361572265625, 1308.062744140625, 1334.1893310546875, 1360.3160400390625, 1386.442626953125, 1412.5692138671875]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 3.0, 7.0, 8.0, 8.0, 17.0, 14.0, 14.0, 24.0, 29.0, 25.0, 34.0, 41.0, 29.0, 37.0, 30.0, 45.0, 42.0, 41.0, 38.0, 50.0, 44.0, 35.0, 46.0, 32.0, 39.0, 33.0, 36.0, 27.0, 21.0, 26.0, 16.0, 22.0, 9.0, 13.0, 9.0, 9.0, 6.0, 8.0, 6.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 4.0], "bins": [-263.22503662109375, -255.7518310546875, -248.27862548828125, -240.805419921875, -233.33221435546875, -225.8590087890625, -218.38580322265625, -210.91261291503906, -203.4394073486328, -195.96620178222656, -188.4929962158203, -181.01979064941406, -173.5465850830078, -166.07339477539062, -158.60018920898438, -151.12698364257812, -143.65377807617188, -136.18057250976562, -128.70736694335938, -121.23416137695312, -113.7609634399414, -106.28775787353516, -98.8145523071289, -91.34135437011719, -83.86813354492188, -76.39492797851562, -68.92172241210938, -61.44852066040039, -53.975318908691406, -46.502113342285156, -39.028907775878906, -31.555706024169922, -24.082504272460938, -16.60930061340332, -9.136096000671387, -1.6628913879394531, 5.810312271118164, 13.283515930175781, 20.75672149658203, 28.229923248291016, 35.703128814697266, 43.176334381103516, 50.6495361328125, 58.12274169921875, 65.595947265625, 73.06915283203125, 80.5423583984375, 88.01555633544922, 95.48876190185547, 102.96196746826172, 110.43517303466797, 117.90837097167969, 125.38157653808594, 132.8547821044922, 140.32798767089844, 147.8011932373047, 155.27439880371094, 162.7476043701172, 170.22080993652344, 177.6940155029297, 185.16722106933594, 192.64041137695312, 200.11361694335938, 207.58682250976562, 215.06002807617188]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 6.0, 3.0, 4.0, 11.0, 13.0, 8.0, 9.0, 25.0, 27.0, 19.0, 25.0, 34.0, 28.0, 32.0, 46.0, 43.0, 38.0, 44.0, 57.0, 42.0, 47.0, 33.0, 40.0, 44.0, 36.0, 45.0, 33.0, 26.0, 23.0, 20.0, 25.0, 18.0, 17.0, 14.0, 13.0, 12.0, 9.0, 5.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-35.84375, -34.59814453125, -33.3525390625, -32.10693359375, -30.861328125, -29.61572265625, -28.3701171875, -27.12451171875, -25.87890625, -24.63330078125, -23.3876953125, -22.14208984375, -20.896484375, -19.65087890625, -18.4052734375, -17.15966796875, -15.9140625, -14.66845703125, -13.4228515625, -12.17724609375, -10.931640625, -9.68603515625, -8.4404296875, -7.19482421875, -5.94921875, -4.70361328125, -3.4580078125, -2.21240234375, -0.966796875, 0.27880859375, 1.5244140625, 2.77001953125, 4.015625, 5.26123046875, 6.5068359375, 7.75244140625, 8.998046875, 10.24365234375, 11.4892578125, 12.73486328125, 13.98046875, 15.22607421875, 16.4716796875, 17.71728515625, 18.962890625, 20.20849609375, 21.4541015625, 22.69970703125, 23.9453125, 25.19091796875, 26.4365234375, 27.68212890625, 28.927734375, 30.17333984375, 31.4189453125, 32.66455078125, 33.91015625, 35.15576171875, 36.4013671875, 37.64697265625, 38.892578125, 40.13818359375, 41.3837890625, 42.62939453125, 43.875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 3.0, 3.0, 4.0, 14.0, 20.0, 23.0, 34.0, 35.0, 85.0, 107.0, 149.0, 220.0, 358.0, 506.0, 736.0, 1091.0, 1650.0, 2481.0, 3701.0, 5723.0, 8879.0, 13792.0, 21338.0, 34632.0, 57022.0, 100943.0, 221083.0, 293758.0, 112834.0, 63262.0, 37786.0, 23368.0, 14878.0, 9570.0, 6258.0, 4011.0, 2677.0, 1921.0, 1089.0, 832.0, 562.0, 339.0, 243.0, 156.0, 126.0, 75.0, 55.0, 36.0, 23.0, 22.0, 15.0, 11.0, 12.0, 4.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.43359375, -1.385955810546875, -1.33831787109375, -1.290679931640625, -1.2430419921875, -1.195404052734375, -1.14776611328125, -1.100128173828125, -1.052490234375, -1.004852294921875, -0.95721435546875, -0.909576416015625, -0.8619384765625, -0.814300537109375, -0.76666259765625, -0.719024658203125, -0.67138671875, -0.623748779296875, -0.57611083984375, -0.528472900390625, -0.4808349609375, -0.433197021484375, -0.38555908203125, -0.337921142578125, -0.290283203125, -0.242645263671875, -0.19500732421875, -0.147369384765625, -0.0997314453125, -0.052093505859375, -0.00445556640625, 0.043182373046875, 0.0908203125, 0.138458251953125, 0.18609619140625, 0.233734130859375, 0.2813720703125, 0.329010009765625, 0.37664794921875, 0.424285888671875, 0.471923828125, 0.519561767578125, 0.56719970703125, 0.614837646484375, 0.6624755859375, 0.710113525390625, 0.75775146484375, 0.805389404296875, 0.85302734375, 0.900665283203125, 0.94830322265625, 0.995941162109375, 1.0435791015625, 1.091217041015625, 1.13885498046875, 1.186492919921875, 1.234130859375, 1.281768798828125, 1.32940673828125, 1.377044677734375, 1.4246826171875, 1.472320556640625, 1.51995849609375, 1.567596435546875, 1.615234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 2.0, 6.0, 5.0, 4.0, 9.0, 7.0, 5.0, 12.0, 8.0, 16.0, 21.0, 27.0, 17.0, 22.0, 30.0, 38.0, 24.0, 29.0, 34.0, 38.0, 42.0, 37.0, 31.0, 39.0, 1060.0, 34.0, 36.0, 35.0, 37.0, 32.0, 28.0, 32.0, 35.0, 28.0, 17.0, 23.0, 18.0, 15.0, 19.0, 13.0, 11.0, 13.0, 9.0, 6.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-23.0625, -22.370361328125, -21.67822265625, -20.986083984375, -20.2939453125, -19.601806640625, -18.90966796875, -18.217529296875, -17.525390625, -16.833251953125, -16.14111328125, -15.448974609375, -14.7568359375, -14.064697265625, -13.37255859375, -12.680419921875, -11.98828125, -11.296142578125, -10.60400390625, -9.911865234375, -9.2197265625, -8.527587890625, -7.83544921875, -7.143310546875, -6.451171875, -5.759033203125, -5.06689453125, -4.374755859375, -3.6826171875, -2.990478515625, -2.29833984375, -1.606201171875, -0.9140625, -0.221923828125, 0.47021484375, 1.162353515625, 1.8544921875, 2.546630859375, 3.23876953125, 3.930908203125, 4.623046875, 5.315185546875, 6.00732421875, 6.699462890625, 7.3916015625, 8.083740234375, 8.77587890625, 9.468017578125, 10.16015625, 10.852294921875, 11.54443359375, 12.236572265625, 12.9287109375, 13.620849609375, 14.31298828125, 15.005126953125, 15.697265625, 16.389404296875, 17.08154296875, 17.773681640625, 18.4658203125, 19.157958984375, 19.85009765625, 20.542236328125, 21.234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 7.0, 6.0, 5.0, 17.0, 26.0, 31.0, 44.0, 64.0, 91.0, 118.0, 159.0, 241.0, 364.0, 503.0, 682.0, 1006.0, 1402.0, 2053.0, 2872.0, 4264.0, 6293.0, 9172.0, 13536.0, 19917.0, 30335.0, 47117.0, 74390.0, 128081.0, 1342736.0, 161685.0, 88216.0, 54375.0, 35339.0, 23317.0, 15280.0, 10481.0, 6964.0, 4848.0, 3367.0, 2326.0, 1625.0, 1181.0, 775.0, 531.0, 388.0, 253.0, 186.0, 152.0, 92.0, 67.0, 52.0, 30.0, 27.0, 18.0, 17.0, 8.0, 5.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.9248046875, -0.895599365234375, -0.86639404296875, -0.837188720703125, -0.8079833984375, -0.778778076171875, -0.74957275390625, -0.720367431640625, -0.691162109375, -0.661956787109375, -0.63275146484375, -0.603546142578125, -0.5743408203125, -0.545135498046875, -0.51593017578125, -0.486724853515625, -0.45751953125, -0.428314208984375, -0.39910888671875, -0.369903564453125, -0.3406982421875, -0.311492919921875, -0.28228759765625, -0.253082275390625, -0.223876953125, -0.194671630859375, -0.16546630859375, -0.136260986328125, -0.1070556640625, -0.077850341796875, -0.04864501953125, -0.019439697265625, 0.009765625, 0.038970947265625, 0.06817626953125, 0.097381591796875, 0.1265869140625, 0.155792236328125, 0.18499755859375, 0.214202880859375, 0.243408203125, 0.272613525390625, 0.30181884765625, 0.331024169921875, 0.3602294921875, 0.389434814453125, 0.41864013671875, 0.447845458984375, 0.47705078125, 0.506256103515625, 0.53546142578125, 0.564666748046875, 0.5938720703125, 0.623077392578125, 0.65228271484375, 0.681488037109375, 0.710693359375, 0.739898681640625, 0.76910400390625, 0.798309326171875, 0.8275146484375, 0.856719970703125, 0.88592529296875, 0.915130615234375, 0.9443359375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 2.0, 6.0, 8.0, 8.0, 9.0, 17.0, 20.0, 15.0, 13.0, 32.0, 29.0, 48.0, 66.0, 71.0, 137.0, 117.0, 78.0, 72.0, 43.0, 32.0, 36.0, 28.0, 17.0, 9.0, 16.0, 9.0, 12.0, 8.0, 7.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.537271499633789e-05, -5.338899791240692e-05, -5.140528082847595e-05, -4.942156374454498e-05, -4.7437846660614014e-05, -4.5454129576683044e-05, -4.3470412492752075e-05, -4.1486695408821106e-05, -3.950297832489014e-05, -3.751926124095917e-05, -3.55355441570282e-05, -3.355182707309723e-05, -3.156810998916626e-05, -2.958439290523529e-05, -2.760067582130432e-05, -2.5616958737373352e-05, -2.3633241653442383e-05, -2.1649524569511414e-05, -1.9665807485580444e-05, -1.7682090401649475e-05, -1.5698373317718506e-05, -1.3714656233787537e-05, -1.1730939149856567e-05, -9.747222065925598e-06, -7.763504981994629e-06, -5.77978789806366e-06, -3.7960708141326904e-06, -1.8123537302017212e-06, 1.7136335372924805e-07, 2.1550804376602173e-06, 4.1387975215911865e-06, 6.122514605522156e-06, 8.106231689453125e-06, 1.0089948773384094e-05, 1.2073665857315063e-05, 1.4057382941246033e-05, 1.6041100025177002e-05, 1.802481710910797e-05, 2.000853419303894e-05, 2.199225127696991e-05, 2.397596836090088e-05, 2.5959685444831848e-05, 2.7943402528762817e-05, 2.9927119612693787e-05, 3.1910836696624756e-05, 3.3894553780555725e-05, 3.5878270864486694e-05, 3.7861987948417664e-05, 3.984570503234863e-05, 4.18294221162796e-05, 4.381313920021057e-05, 4.579685628414154e-05, 4.778057336807251e-05, 4.976429045200348e-05, 5.174800753593445e-05, 5.373172461986542e-05, 5.571544170379639e-05, 5.7699158787727356e-05, 5.9682875871658325e-05, 6.16665929555893e-05, 6.365031003952026e-05, 6.563402712345123e-05, 6.76177442073822e-05, 6.960146129131317e-05, 7.158517837524414e-05]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 8.0, 11.0, 13.0, 12.0, 18.0, 21.0, 19.0, 34.0, 36.0, 61.0, 95.0, 192.0, 1055.0, 21005.0, 976526.0, 47007.0, 1859.0, 243.0, 100.0, 58.0, 38.0, 25.0, 24.0, 21.0, 12.0, 5.0, 11.0, 7.0, 4.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012416839599609375, -0.0012058019638061523, -0.0011699199676513672, -0.001134037971496582, -0.0010981559753417969, -0.0010622739791870117, -0.0010263919830322266, -0.0009905099868774414, -0.0009546279907226562, -0.0009187459945678711, -0.0008828639984130859, -0.0008469820022583008, -0.0008111000061035156, -0.0007752180099487305, -0.0007393360137939453, -0.0007034540176391602, -0.000667572021484375, -0.0006316900253295898, -0.0005958080291748047, -0.0005599260330200195, -0.0005240440368652344, -0.0004881620407104492, -0.00045228004455566406, -0.0004163980484008789, -0.00038051605224609375, -0.0003446340560913086, -0.00030875205993652344, -0.0002728700637817383, -0.00023698806762695312, -0.00020110607147216797, -0.0001652240753173828, -0.00012934207916259766, -9.34600830078125e-05, -5.7578086853027344e-05, -2.1696090698242188e-05, 1.4185905456542969e-05, 5.0067901611328125e-05, 8.594989776611328e-05, 0.00012183189392089844, 0.0001577138900756836, 0.00019359588623046875, 0.0002294778823852539, 0.00026535987854003906, 0.0003012418746948242, 0.0003371238708496094, 0.00037300586700439453, 0.0004088878631591797, 0.00044476985931396484, 0.00048065185546875, 0.0005165338516235352, 0.0005524158477783203, 0.0005882978439331055, 0.0006241798400878906, 0.0006600618362426758, 0.0006959438323974609, 0.0007318258285522461, 0.0007677078247070312, 0.0008035898208618164, 0.0008394718170166016, 0.0008753538131713867, 0.0009112358093261719, 0.000947117805480957, 0.0009829998016357422, 0.0010188817977905273, 0.0010547637939453125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 8.0, 16.0, 39.0, 98.0, 233.0, 352.0, 157.0, 52.0, 31.0, 14.0, 3.0, 6.0, 1.0, 5.0], "bins": [-0.00018189776164945215, -0.00017860790831036866, -0.00017531805497128516, -0.00017202820163220167, -0.00016873834829311818, -0.00016544849495403469, -0.00016215862706303596, -0.00015886877372395247, -0.00015557892038486898, -0.0001522890670457855, -0.000148999213706702, -0.0001457093603676185, -0.000142419507028535, -0.0001391296391375363, -0.0001358397857984528, -0.0001325499324593693, -0.0001292600791202858, -0.00012597022578120232, -0.00012268037244211882, -0.00011939051182707772, -0.00011610065848799422, -0.00011281080514891073, -0.00010952095180982724, -0.00010623109119478613, -0.00010294124513166025, -9.965139179257676e-05, -9.636153845349327e-05, -9.307167783845216e-05, -8.978182449936867e-05, -8.649197116028517e-05, -8.320211782120168e-05, -7.991226448211819e-05, -7.662240386707708e-05, -7.333255052799359e-05, -7.00426971889101e-05, -6.675283657386899e-05, -6.34629832347855e-05, -6.0173129895702004e-05, -5.688327655661851e-05, -5.359341957955621e-05, -5.030356624047272e-05, -4.7013712901389226e-05, -4.3723855924326926e-05, -4.0434002585243434e-05, -3.7144145608181134e-05, -3.385429226909764e-05, -3.056443529203534e-05, -2.727458195295185e-05, -2.3984726794878952e-05, -2.0694871636806056e-05, -1.740501647873316e-05, -1.4115162230154965e-05, -1.0825307072082069e-05, -7.535452823503874e-06, -4.245597665430978e-06, -9.557425073580816e-07, 2.3341126507148147e-06, 5.623967808787711e-06, 8.913822966860607e-06, 1.2203677215438802e-05, 1.54935332830064e-05, 1.8783386622089893e-05, 2.207324178016279e-05, 2.5363096938235685e-05, 2.865295209630858e-05]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 1.0, 12.0, 12.0, 7.0, 10.0, 11.0, 12.0, 13.0, 19.0, 32.0, 23.0, 26.0, 29.0, 22.0, 42.0, 32.0, 36.0, 43.0, 34.0, 42.0, 47.0, 33.0, 38.0, 29.0, 37.0, 29.0, 30.0, 42.0, 36.0, 35.0, 20.0, 16.0, 22.0, 22.0, 20.0, 17.0, 11.0, 9.0, 9.0, 5.0, 7.0, 8.0, 9.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.568960189819336e-05, -2.4870038032531738e-05, -2.4050474166870117e-05, -2.3230910301208496e-05, -2.2411346435546875e-05, -2.1591782569885254e-05, -2.0772218704223633e-05, -1.9952654838562012e-05, -1.913309097290039e-05, -1.831352710723877e-05, -1.749396324157715e-05, -1.6674399375915527e-05, -1.5854835510253906e-05, -1.5035271644592285e-05, -1.4215707778930664e-05, -1.3396143913269043e-05, -1.2576580047607422e-05, -1.17570161819458e-05, -1.093745231628418e-05, -1.0117888450622559e-05, -9.298324584960938e-06, -8.478760719299316e-06, -7.659196853637695e-06, -6.839632987976074e-06, -6.020069122314453e-06, -5.200505256652832e-06, -4.380941390991211e-06, -3.56137752532959e-06, -2.7418136596679688e-06, -1.9222497940063477e-06, -1.1026859283447266e-06, -2.8312206268310547e-07, 5.364418029785156e-07, 1.3560056686401367e-06, 2.175569534301758e-06, 2.995133399963379e-06, 3.814697265625e-06, 4.634261131286621e-06, 5.453824996948242e-06, 6.273388862609863e-06, 7.092952728271484e-06, 7.912516593933105e-06, 8.732080459594727e-06, 9.551644325256348e-06, 1.0371208190917969e-05, 1.119077205657959e-05, 1.2010335922241211e-05, 1.2829899787902832e-05, 1.3649463653564453e-05, 1.4469027519226074e-05, 1.5288591384887695e-05, 1.6108155250549316e-05, 1.6927719116210938e-05, 1.774728298187256e-05, 1.856684684753418e-05, 1.93864107131958e-05, 2.0205974578857422e-05, 2.1025538444519043e-05, 2.1845102310180664e-05, 2.2664666175842285e-05, 2.3484230041503906e-05, 2.4303793907165527e-05, 2.512335777282715e-05, 2.594292163848877e-05, 2.676248550415039e-05]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 6.0, 3.0, 4.0, 11.0, 13.0, 8.0, 9.0, 25.0, 27.0, 19.0, 25.0, 34.0, 28.0, 32.0, 46.0, 43.0, 38.0, 44.0, 57.0, 42.0, 47.0, 33.0, 40.0, 44.0, 36.0, 45.0, 33.0, 26.0, 23.0, 20.0, 25.0, 18.0, 17.0, 14.0, 13.0, 12.0, 9.0, 5.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-35.84375, -34.59814453125, -33.3525390625, -32.10693359375, -30.861328125, -29.61572265625, -28.3701171875, -27.12451171875, -25.87890625, -24.63330078125, -23.3876953125, -22.14208984375, -20.896484375, -19.65087890625, -18.4052734375, -17.15966796875, -15.9140625, -14.66845703125, -13.4228515625, -12.17724609375, -10.931640625, -9.68603515625, -8.4404296875, -7.19482421875, -5.94921875, -4.70361328125, -3.4580078125, -2.21240234375, -0.966796875, 0.27880859375, 1.5244140625, 2.77001953125, 4.015625, 5.26123046875, 6.5068359375, 7.75244140625, 8.998046875, 10.24365234375, 11.4892578125, 12.73486328125, 13.98046875, 15.22607421875, 16.4716796875, 17.71728515625, 18.962890625, 20.20849609375, 21.4541015625, 22.69970703125, 23.9453125, 25.19091796875, 26.4365234375, 27.68212890625, 28.927734375, 30.17333984375, 31.4189453125, 32.66455078125, 33.91015625, 35.15576171875, 36.4013671875, 37.64697265625, 38.892578125, 40.13818359375, 41.3837890625, 42.62939453125, 43.875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 12.0, 10.0, 10.0, 13.0, 26.0, 37.0, 33.0, 57.0, 83.0, 107.0, 163.0, 241.0, 382.0, 539.0, 845.0, 1421.0, 2307.0, 4389.0, 10803.0, 50042.0, 724192.0, 215026.0, 22566.0, 6812.0, 3322.0, 1874.0, 1101.0, 696.0, 449.0, 309.0, 207.0, 123.0, 93.0, 60.0, 44.0, 48.0, 28.0, 24.0, 17.0, 13.0, 9.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-35.1875, -33.96484375, -32.7421875, -31.51953125, -30.296875, -29.07421875, -27.8515625, -26.62890625, -25.40625, -24.18359375, -22.9609375, -21.73828125, -20.515625, -19.29296875, -18.0703125, -16.84765625, -15.625, -14.40234375, -13.1796875, -11.95703125, -10.734375, -9.51171875, -8.2890625, -7.06640625, -5.84375, -4.62109375, -3.3984375, -2.17578125, -0.953125, 0.26953125, 1.4921875, 2.71484375, 3.9375, 5.16015625, 6.3828125, 7.60546875, 8.828125, 10.05078125, 11.2734375, 12.49609375, 13.71875, 14.94140625, 16.1640625, 17.38671875, 18.609375, 19.83203125, 21.0546875, 22.27734375, 23.5, 24.72265625, 25.9453125, 27.16796875, 28.390625, 29.61328125, 30.8359375, 32.05859375, 33.28125, 34.50390625, 35.7265625, 36.94921875, 38.171875, 39.39453125, 40.6171875, 41.83984375, 43.0625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 8.0, 4.0, 4.0, 3.0, 8.0, 8.0, 22.0, 12.0, 20.0, 26.0, 20.0, 14.0, 31.0, 24.0, 19.0, 34.0, 27.0, 46.0, 38.0, 45.0, 62.0, 1962.0, 129.0, 54.0, 53.0, 36.0, 46.0, 35.0, 31.0, 35.0, 36.0, 16.0, 30.0, 23.0, 24.0, 11.0, 14.0, 8.0, 6.0, 5.0, 7.0, 7.0, 2.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-112.5, -108.958984375, -105.41796875, -101.876953125, -98.3359375, -94.794921875, -91.25390625, -87.712890625, -84.171875, -80.630859375, -77.08984375, -73.548828125, -70.0078125, -66.466796875, -62.92578125, -59.384765625, -55.84375, -52.302734375, -48.76171875, -45.220703125, -41.6796875, -38.138671875, -34.59765625, -31.056640625, -27.515625, -23.974609375, -20.43359375, -16.892578125, -13.3515625, -9.810546875, -6.26953125, -2.728515625, 0.8125, 4.353515625, 7.89453125, 11.435546875, 14.9765625, 18.517578125, 22.05859375, 25.599609375, 29.140625, 32.681640625, 36.22265625, 39.763671875, 43.3046875, 46.845703125, 50.38671875, 53.927734375, 57.46875, 61.009765625, 64.55078125, 68.091796875, 71.6328125, 75.173828125, 78.71484375, 82.255859375, 85.796875, 89.337890625, 92.87890625, 96.419921875, 99.9609375, 103.501953125, 107.04296875, 110.583984375, 114.125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 6.0, 7.0, 9.0, 10.0, 9.0, 15.0, 18.0, 27.0, 51.0, 54.0, 72.0, 87.0, 128.0, 192.0, 279.0, 638.0, 2638.0, 50425.0, 3083123.0, 5880.0, 960.0, 331.0, 199.0, 135.0, 102.0, 71.0, 53.0, 36.0, 41.0, 21.0, 30.0, 16.0, 12.0, 5.0, 7.0, 4.0, 8.0, 0.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-329.25, -320.15234375, -311.0546875, -301.95703125, -292.859375, -283.76171875, -274.6640625, -265.56640625, -256.46875, -247.37109375, -238.2734375, -229.17578125, -220.078125, -210.98046875, -201.8828125, -192.78515625, -183.6875, -174.58984375, -165.4921875, -156.39453125, -147.296875, -138.19921875, -129.1015625, -120.00390625, -110.90625, -101.80859375, -92.7109375, -83.61328125, -74.515625, -65.41796875, -56.3203125, -47.22265625, -38.125, -29.02734375, -19.9296875, -10.83203125, -1.734375, 7.36328125, 16.4609375, 25.55859375, 34.65625, 43.75390625, 52.8515625, 61.94921875, 71.046875, 80.14453125, 89.2421875, 98.33984375, 107.4375, 116.53515625, 125.6328125, 134.73046875, 143.828125, 152.92578125, 162.0234375, 171.12109375, 180.21875, 189.31640625, 198.4140625, 207.51171875, 216.609375, 225.70703125, 234.8046875, 243.90234375, 253.0]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 13.0, 150.0, 682.0, 158.0, 14.0], "bins": [-1178.568359375, -1159.3905029296875, -1140.2127685546875, -1121.034912109375, -1101.857177734375, -1082.6793212890625, -1063.50146484375, -1044.32373046875, -1025.1458740234375, -1005.9680786132812, -986.790283203125, -967.6124267578125, -948.4346313476562, -929.2568359375, -910.0789794921875, -890.9011840820312, -871.723388671875, -852.5455932617188, -833.3677978515625, -814.18994140625, -795.0121459960938, -775.8343505859375, -756.656494140625, -737.4786987304688, -718.3009033203125, -699.1231079101562, -679.9453125, -660.7674560546875, -641.5896606445312, -622.411865234375, -603.2340087890625, -584.0562133789062, -564.8784790039062, -545.70068359375, -526.5228271484375, -507.34503173828125, -488.167236328125, -468.98944091796875, -449.8116149902344, -430.6337890625, -411.45599365234375, -392.2781982421875, -373.1003723144531, -353.92254638671875, -334.7447509765625, -315.56695556640625, -296.3891296386719, -277.2113037109375, -258.03350830078125, -238.85569763183594, -219.67788696289062, -200.5000762939453, -181.322265625, -162.1444549560547, -142.96664428710938, -123.78883361816406, -104.61102294921875, -85.43321228027344, -66.25540161132812, -47.07759094238281, -27.8997802734375, -8.721969604492188, 10.455841064453125, 29.633651733398438, 48.81146240234375]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 6.0, 9.0, 7.0, 10.0, 6.0, 8.0, 25.0, 19.0, 18.0, 21.0, 31.0, 23.0, 33.0, 31.0, 49.0, 42.0, 36.0, 41.0, 39.0, 42.0, 34.0, 43.0, 48.0, 47.0, 40.0, 38.0, 36.0, 34.0, 22.0, 34.0, 15.0, 17.0, 18.0, 18.0, 9.0, 12.0, 11.0, 6.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-281.3603210449219, -271.6579284667969, -261.95550537109375, -252.25311279296875, -242.55072021484375, -232.84832763671875, -223.1459197998047, -213.44351196289062, -203.74111938476562, -194.03872680664062, -184.33631896972656, -174.6339111328125, -164.9315185546875, -155.2291259765625, -145.52671813964844, -135.82431030273438, -126.12191772460938, -116.41951751708984, -106.71711730957031, -97.01471710205078, -87.31231689453125, -77.60991668701172, -67.90751647949219, -58.205116271972656, -48.502716064453125, -38.800315856933594, -29.097915649414062, -19.39551544189453, -9.693115234375, 0.00928497314453125, 9.711685180664062, 19.414085388183594, 29.116485595703125, 38.818885803222656, 48.52128601074219, 58.22368621826172, 67.92608642578125, 77.62848663330078, 87.33088684082031, 97.03328704833984, 106.73568725585938, 116.4380874633789, 126.14048767089844, 135.8428955078125, 145.5452880859375, 155.2476806640625, 164.95008850097656, 174.65249633789062, 184.35488891601562, 194.05728149414062, 203.7596893310547, 213.46209716796875, 223.16448974609375, 232.86688232421875, 242.5692901611328, 252.27169799804688, 261.9740905761719, 271.6764831542969, 281.37890625, 291.081298828125, 300.78369140625, 310.486083984375, 320.1884765625, 329.8908996582031, 339.5932922363281]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 3.0, 8.0, 5.0, 8.0, 8.0, 11.0, 10.0, 21.0, 18.0, 19.0, 29.0, 27.0, 24.0, 39.0, 36.0, 34.0, 49.0, 44.0, 43.0, 48.0, 52.0, 35.0, 40.0, 47.0, 44.0, 38.0, 35.0, 31.0, 17.0, 26.0, 21.0, 23.0, 25.0, 16.0, 10.0, 16.0, 5.0, 12.0, 10.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.375, -35.0986328125, -33.822265625, -32.5458984375, -31.26953125, -29.9931640625, -28.716796875, -27.4404296875, -26.1640625, -24.8876953125, -23.611328125, -22.3349609375, -21.05859375, -19.7822265625, -18.505859375, -17.2294921875, -15.953125, -14.6767578125, -13.400390625, -12.1240234375, -10.84765625, -9.5712890625, -8.294921875, -7.0185546875, -5.7421875, -4.4658203125, -3.189453125, -1.9130859375, -0.63671875, 0.6396484375, 1.916015625, 3.1923828125, 4.46875, 5.7451171875, 7.021484375, 8.2978515625, 9.57421875, 10.8505859375, 12.126953125, 13.4033203125, 14.6796875, 15.9560546875, 17.232421875, 18.5087890625, 19.78515625, 21.0615234375, 22.337890625, 23.6142578125, 24.890625, 26.1669921875, 27.443359375, 28.7197265625, 29.99609375, 31.2724609375, 32.548828125, 33.8251953125, 35.1015625, 36.3779296875, 37.654296875, 38.9306640625, 40.20703125, 41.4833984375, 42.759765625, 44.0361328125, 45.3125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 8.0, 11.0, 9.0, 14.0, 16.0, 28.0, 41.0, 68.0, 108.0, 153.0, 177.0, 287.0, 406.0, 612.0, 1000.0, 1714.0, 2937.0, 5573.0, 11900.0, 51021.0, 886964.0, 3031486.0, 165579.0, 17289.0, 7293.0, 3821.0, 2077.0, 1240.0, 793.0, 508.0, 338.0, 231.0, 163.0, 126.0, 76.0, 63.0, 42.0, 29.0, 18.0, 18.0, 16.0, 10.0, 9.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-86.5625, -83.4951171875, -80.427734375, -77.3603515625, -74.29296875, -71.2255859375, -68.158203125, -65.0908203125, -62.0234375, -58.9560546875, -55.888671875, -52.8212890625, -49.75390625, -46.6865234375, -43.619140625, -40.5517578125, -37.484375, -34.4169921875, -31.349609375, -28.2822265625, -25.21484375, -22.1474609375, -19.080078125, -16.0126953125, -12.9453125, -9.8779296875, -6.810546875, -3.7431640625, -0.67578125, 2.3916015625, 5.458984375, 8.5263671875, 11.59375, 14.6611328125, 17.728515625, 20.7958984375, 23.86328125, 26.9306640625, 29.998046875, 33.0654296875, 36.1328125, 39.2001953125, 42.267578125, 45.3349609375, 48.40234375, 51.4697265625, 54.537109375, 57.6044921875, 60.671875, 63.7392578125, 66.806640625, 69.8740234375, 72.94140625, 76.0087890625, 79.076171875, 82.1435546875, 85.2109375, 88.2783203125, 91.345703125, 94.4130859375, 97.48046875, 100.5478515625, 103.615234375, 106.6826171875, 109.75]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 6.0, 10.0, 18.0, 18.0, 24.0, 26.0, 31.0, 66.0, 141.0, 265.0, 734.0, 1268.0, 775.0, 312.0, 122.0, 64.0, 45.0, 38.0, 18.0, 16.0, 12.0, 14.0, 5.0, 4.0, 3.0, 10.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.4375, -86.41015625, -83.3828125, -80.35546875, -77.328125, -74.30078125, -71.2734375, -68.24609375, -65.21875, -62.19140625, -59.1640625, -56.13671875, -53.109375, -50.08203125, -47.0546875, -44.02734375, -41.0, -37.97265625, -34.9453125, -31.91796875, -28.890625, -25.86328125, -22.8359375, -19.80859375, -16.78125, -13.75390625, -10.7265625, -7.69921875, -4.671875, -1.64453125, 1.3828125, 4.41015625, 7.4375, 10.46484375, 13.4921875, 16.51953125, 19.546875, 22.57421875, 25.6015625, 28.62890625, 31.65625, 34.68359375, 37.7109375, 40.73828125, 43.765625, 46.79296875, 49.8203125, 52.84765625, 55.875, 58.90234375, 61.9296875, 64.95703125, 67.984375, 71.01171875, 74.0390625, 77.06640625, 80.09375, 83.12109375, 86.1484375, 89.17578125, 92.203125, 95.23046875, 98.2578125, 101.28515625, 104.3125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 3.0, 11.0, 4.0, 5.0, 12.0, 16.0, 17.0, 39.0, 70.0, 194.0, 468.0, 1146.0, 3350.0, 13470.0, 136179.0, 3968166.0, 58203.0, 8903.0, 2440.0, 908.0, 370.0, 137.0, 61.0, 33.0, 23.0, 15.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-347.25, -337.14453125, -327.0390625, -316.93359375, -306.828125, -296.72265625, -286.6171875, -276.51171875, -266.40625, -256.30078125, -246.1953125, -236.08984375, -225.984375, -215.87890625, -205.7734375, -195.66796875, -185.5625, -175.45703125, -165.3515625, -155.24609375, -145.140625, -135.03515625, -124.9296875, -114.82421875, -104.71875, -94.61328125, -84.5078125, -74.40234375, -64.296875, -54.19140625, -44.0859375, -33.98046875, -23.875, -13.76953125, -3.6640625, 6.44140625, 16.546875, 26.65234375, 36.7578125, 46.86328125, 56.96875, 67.07421875, 77.1796875, 87.28515625, 97.390625, 107.49609375, 117.6015625, 127.70703125, 137.8125, 147.91796875, 158.0234375, 168.12890625, 178.234375, 188.33984375, 198.4453125, 208.55078125, 218.65625, 228.76171875, 238.8671875, 248.97265625, 259.078125, 269.18359375, 279.2890625, 289.39453125, 299.5]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 11.0, 7.0, 16.0, 24.0, 45.0, 73.0, 176.0, 213.0, 197.0, 97.0, 52.0, 32.0, 21.0, 13.0, 13.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-411.0187072753906, -394.3304748535156, -377.6422119140625, -360.9539794921875, -344.2657470703125, -327.5775146484375, -310.8892822265625, -294.2010192871094, -277.5127868652344, -260.8245544433594, -244.1363067626953, -227.44805908203125, -210.75982666015625, -194.07159423828125, -177.3833465576172, -160.69509887695312, -144.00686645507812, -127.3186264038086, -110.63038635253906, -93.94214630126953, -77.25390625, -60.56566619873047, -43.87742614746094, -27.189186096191406, -10.500946044921875, 6.187294006347656, 22.875534057617188, 39.56377410888672, 56.25201416015625, 72.94025421142578, 89.62849426269531, 106.31673431396484, 123.0050048828125, 139.6932373046875, 156.38148498535156, 173.06973266601562, 189.75796508789062, 206.44619750976562, 223.1344451904297, 239.82269287109375, 256.51092529296875, 273.19915771484375, 289.88739013671875, 306.5756530761719, 323.2638854980469, 339.9521179199219, 356.640380859375, 373.32861328125, 390.016845703125, 406.705078125, 423.393310546875, 440.0815734863281, 456.7698059082031, 473.4580383300781, 490.14630126953125, 506.83453369140625, 523.5227661132812, 540.2109985351562, 556.8992309570312, 573.5874633789062, 590.2757568359375, 606.9639892578125, 623.6522216796875, 640.3404541015625, 657.0286865234375]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 9.0, 4.0, 7.0, 12.0, 5.0, 10.0, 11.0, 21.0, 14.0, 20.0, 16.0, 28.0, 37.0, 20.0, 30.0, 34.0, 32.0, 39.0, 37.0, 31.0, 43.0, 43.0, 46.0, 34.0, 37.0, 43.0, 22.0, 31.0, 39.0, 29.0, 25.0, 29.0, 26.0, 28.0, 14.0, 17.0, 14.0, 12.0, 13.0, 11.0, 4.0, 2.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-195.2861328125, -189.0306396484375, -182.775146484375, -176.51966857910156, -170.26417541503906, -164.00868225097656, -157.75320434570312, -151.49771118164062, -145.24221801757812, -138.98672485351562, -132.73123168945312, -126.47575378417969, -120.22026062011719, -113.96476745605469, -107.70928192138672, -101.45379638671875, -95.19830322265625, -88.94281005859375, -82.68732452392578, -76.43183898925781, -70.17634582519531, -63.92085647583008, -57.665367126464844, -51.40987777709961, -45.154388427734375, -38.89889907836914, -32.643409729003906, -26.387920379638672, -20.132431030273438, -13.876941680908203, -7.621452331542969, -1.3659629821777344, 4.8895263671875, 11.145015716552734, 17.40050506591797, 23.655994415283203, 29.911483764648438, 36.16697311401367, 42.422462463378906, 48.67795181274414, 54.933441162109375, 61.18893051147461, 67.44441986083984, 73.69990539550781, 79.95539855957031, 86.21089172363281, 92.46637725830078, 98.72186279296875, 104.97735595703125, 111.23284912109375, 117.48833465576172, 123.74382019042969, 129.9993133544922, 136.2548065185547, 142.51028442382812, 148.76577758789062, 155.02127075195312, 161.27676391601562, 167.53225708007812, 173.78773498535156, 180.04322814941406, 186.29872131347656, 192.55419921875, 198.8096923828125, 205.065185546875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 9.0, 10.0, 18.0, 11.0, 19.0, 15.0, 29.0, 18.0, 40.0, 37.0, 38.0, 28.0, 43.0, 42.0, 53.0, 48.0, 48.0, 45.0, 42.0, 44.0, 39.0, 38.0, 48.0, 35.0, 28.0, 34.0, 19.0, 25.0, 23.0, 18.0, 14.0, 6.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.84375, -37.45068359375, -36.0576171875, -34.66455078125, -33.271484375, -31.87841796875, -30.4853515625, -29.09228515625, -27.69921875, -26.30615234375, -24.9130859375, -23.52001953125, -22.126953125, -20.73388671875, -19.3408203125, -17.94775390625, -16.5546875, -15.16162109375, -13.7685546875, -12.37548828125, -10.982421875, -9.58935546875, -8.1962890625, -6.80322265625, -5.41015625, -4.01708984375, -2.6240234375, -1.23095703125, 0.162109375, 1.55517578125, 2.9482421875, 4.34130859375, 5.734375, 7.12744140625, 8.5205078125, 9.91357421875, 11.306640625, 12.69970703125, 14.0927734375, 15.48583984375, 16.87890625, 18.27197265625, 19.6650390625, 21.05810546875, 22.451171875, 23.84423828125, 25.2373046875, 26.63037109375, 28.0234375, 29.41650390625, 30.8095703125, 32.20263671875, 33.595703125, 34.98876953125, 36.3818359375, 37.77490234375, 39.16796875, 40.56103515625, 41.9541015625, 43.34716796875, 44.740234375, 46.13330078125, 47.5263671875, 48.91943359375, 50.3125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 10.0, 5.0, 15.0, 15.0, 25.0, 41.0, 58.0, 92.0, 135.0, 174.0, 283.0, 448.0, 677.0, 1117.0, 1696.0, 2798.0, 4456.0, 7290.0, 11867.0, 19730.0, 33352.0, 59518.0, 111470.0, 314561.0, 246962.0, 100212.0, 53389.0, 31241.0, 18229.0, 10916.0, 6631.0, 4131.0, 2532.0, 1666.0, 1030.0, 635.0, 418.0, 265.0, 160.0, 106.0, 51.0, 40.0, 34.0, 21.0, 17.0, 12.0, 8.0, 10.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0], "bins": [-1.8193359375, -1.7657012939453125, -1.712066650390625, -1.6584320068359375, -1.60479736328125, -1.5511627197265625, -1.497528076171875, -1.4438934326171875, -1.3902587890625, -1.3366241455078125, -1.282989501953125, -1.2293548583984375, -1.17572021484375, -1.1220855712890625, -1.068450927734375, -1.0148162841796875, -0.961181640625, -0.9075469970703125, -0.853912353515625, -0.8002777099609375, -0.74664306640625, -0.6930084228515625, -0.639373779296875, -0.5857391357421875, -0.5321044921875, -0.4784698486328125, -0.424835205078125, -0.3712005615234375, -0.31756591796875, -0.2639312744140625, -0.210296630859375, -0.1566619873046875, -0.10302734375, -0.0493927001953125, 0.004241943359375, 0.0578765869140625, 0.11151123046875, 0.1651458740234375, 0.218780517578125, 0.2724151611328125, 0.3260498046875, 0.3796844482421875, 0.433319091796875, 0.4869537353515625, 0.54058837890625, 0.5942230224609375, 0.647857666015625, 0.7014923095703125, 0.755126953125, 0.8087615966796875, 0.862396240234375, 0.9160308837890625, 0.96966552734375, 1.0233001708984375, 1.076934814453125, 1.1305694580078125, 1.1842041015625, 1.2378387451171875, 1.291473388671875, 1.3451080322265625, 1.39874267578125, 1.4523773193359375, 1.506011962890625, 1.5596466064453125, 1.61328125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 5.0, 4.0, 4.0, 11.0, 8.0, 13.0, 14.0, 14.0, 24.0, 23.0, 13.0, 24.0, 21.0, 29.0, 35.0, 41.0, 32.0, 31.0, 44.0, 52.0, 35.0, 1062.0, 30.0, 37.0, 35.0, 33.0, 45.0, 37.0, 38.0, 29.0, 22.0, 20.0, 28.0, 21.0, 21.0, 13.0, 18.0, 15.0, 12.0, 8.0, 4.0, 3.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.921875, -24.114013671875, -23.30615234375, -22.498291015625, -21.6904296875, -20.882568359375, -20.07470703125, -19.266845703125, -18.458984375, -17.651123046875, -16.84326171875, -16.035400390625, -15.2275390625, -14.419677734375, -13.61181640625, -12.803955078125, -11.99609375, -11.188232421875, -10.38037109375, -9.572509765625, -8.7646484375, -7.956787109375, -7.14892578125, -6.341064453125, -5.533203125, -4.725341796875, -3.91748046875, -3.109619140625, -2.3017578125, -1.493896484375, -0.68603515625, 0.121826171875, 0.9296875, 1.737548828125, 2.54541015625, 3.353271484375, 4.1611328125, 4.968994140625, 5.77685546875, 6.584716796875, 7.392578125, 8.200439453125, 9.00830078125, 9.816162109375, 10.6240234375, 11.431884765625, 12.23974609375, 13.047607421875, 13.85546875, 14.663330078125, 15.47119140625, 16.279052734375, 17.0869140625, 17.894775390625, 18.70263671875, 19.510498046875, 20.318359375, 21.126220703125, 21.93408203125, 22.741943359375, 23.5498046875, 24.357666015625, 25.16552734375, 25.973388671875, 26.78125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 12.0, 15.0, 25.0, 30.0, 34.0, 58.0, 86.0, 121.0, 155.0, 236.0, 357.0, 462.0, 710.0, 994.0, 1455.0, 1986.0, 2909.0, 4337.0, 6584.0, 9809.0, 14701.0, 21995.0, 33799.0, 53570.0, 89443.0, 168485.0, 1348478.0, 130062.0, 73576.0, 45521.0, 28933.0, 18802.0, 12589.0, 8514.0, 5805.0, 3803.0, 2731.0, 1809.0, 1282.0, 906.0, 582.0, 411.0, 291.0, 196.0, 129.0, 96.0, 68.0, 57.0, 38.0, 31.0, 17.0, 16.0, 11.0, 6.0, 3.0, 3.0, 2.0, 1.0], "bins": [-1.095703125, -1.061798095703125, -1.02789306640625, -0.993988037109375, -0.9600830078125, -0.926177978515625, -0.89227294921875, -0.858367919921875, -0.824462890625, -0.790557861328125, -0.75665283203125, -0.722747802734375, -0.6888427734375, -0.654937744140625, -0.62103271484375, -0.587127685546875, -0.55322265625, -0.519317626953125, -0.48541259765625, -0.451507568359375, -0.4176025390625, -0.383697509765625, -0.34979248046875, -0.315887451171875, -0.281982421875, -0.248077392578125, -0.21417236328125, -0.180267333984375, -0.1463623046875, -0.112457275390625, -0.07855224609375, -0.044647216796875, -0.0107421875, 0.023162841796875, 0.05706787109375, 0.090972900390625, 0.1248779296875, 0.158782958984375, 0.19268798828125, 0.226593017578125, 0.260498046875, 0.294403076171875, 0.32830810546875, 0.362213134765625, 0.3961181640625, 0.430023193359375, 0.46392822265625, 0.497833251953125, 0.53173828125, 0.565643310546875, 0.59954833984375, 0.633453369140625, 0.6673583984375, 0.701263427734375, 0.73516845703125, 0.769073486328125, 0.802978515625, 0.836883544921875, 0.87078857421875, 0.904693603515625, 0.9385986328125, 0.972503662109375, 1.00640869140625, 1.040313720703125, 1.07421875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 5.0, 7.0, 8.0, 13.0, 10.0, 9.0, 8.0, 25.0, 36.0, 21.0, 38.0, 51.0, 77.0, 216.0, 172.0, 72.0, 45.0, 36.0, 26.0, 27.0, 15.0, 14.0, 13.0, 10.0, 16.0, 5.0, 5.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.759166717529297e-05, -6.540119647979736e-05, -6.321072578430176e-05, -6.102025508880615e-05, -5.882978439331055e-05, -5.663931369781494e-05, -5.4448843002319336e-05, -5.225837230682373e-05, -5.0067901611328125e-05, -4.787743091583252e-05, -4.5686960220336914e-05, -4.349648952484131e-05, -4.13060188293457e-05, -3.91155481338501e-05, -3.692507743835449e-05, -3.473460674285889e-05, -3.254413604736328e-05, -3.0353665351867676e-05, -2.816319465637207e-05, -2.5972723960876465e-05, -2.378225326538086e-05, -2.1591782569885254e-05, -1.940131187438965e-05, -1.7210841178894043e-05, -1.5020370483398438e-05, -1.2829899787902832e-05, -1.0639429092407227e-05, -8.448958396911621e-06, -6.258487701416016e-06, -4.06801700592041e-06, -1.8775463104248047e-06, 3.129243850708008e-07, 2.5033950805664062e-06, 4.693865776062012e-06, 6.884336471557617e-06, 9.074807167053223e-06, 1.1265277862548828e-05, 1.3455748558044434e-05, 1.564621925354004e-05, 1.7836689949035645e-05, 2.002716064453125e-05, 2.2217631340026855e-05, 2.440810203552246e-05, 2.6598572731018066e-05, 2.8789043426513672e-05, 3.097951412200928e-05, 3.316998481750488e-05, 3.536045551300049e-05, 3.7550926208496094e-05, 3.97413969039917e-05, 4.1931867599487305e-05, 4.412233829498291e-05, 4.6312808990478516e-05, 4.850327968597412e-05, 5.0693750381469727e-05, 5.288422107696533e-05, 5.507469177246094e-05, 5.726516246795654e-05, 5.945563316345215e-05, 6.164610385894775e-05, 6.383657455444336e-05, 6.602704524993896e-05, 6.821751594543457e-05, 7.040798664093018e-05, 7.259845733642578e-05]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 8.0, 10.0, 18.0, 13.0, 24.0, 15.0, 51.0, 60.0, 90.0, 198.0, 1090.0, 20304.0, 986601.0, 37998.0, 1462.0, 288.0, 93.0, 61.0, 45.0, 20.0, 26.0, 12.0, 16.0, 7.0, 6.0, 6.0, 6.0, 7.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013179779052734375, -0.0012798607349395752, -0.0012417435646057129, -0.0012036263942718506, -0.0011655092239379883, -0.001127392053604126, -0.0010892748832702637, -0.0010511577129364014, -0.001013040542602539, -0.0009749233722686768, -0.0009368062019348145, -0.0008986890316009521, -0.0008605718612670898, -0.0008224546909332275, -0.0007843375205993652, -0.0007462203502655029, -0.0007081031799316406, -0.0006699860095977783, -0.000631868839263916, -0.0005937516689300537, -0.0005556344985961914, -0.0005175173282623291, -0.0004794001579284668, -0.0004412829875946045, -0.0004031658172607422, -0.0003650486469268799, -0.0003269314765930176, -0.0002888143062591553, -0.00025069713592529297, -0.00021257996559143066, -0.00017446279525756836, -0.00013634562492370605, -9.822845458984375e-05, -6.0111284255981445e-05, -2.199411392211914e-05, 1.6123056411743164e-05, 5.424022674560547e-05, 9.235739707946777e-05, 0.00013047456741333008, 0.00016859173774719238, 0.0002067089080810547, 0.000244826078414917, 0.0002829432487487793, 0.0003210604190826416, 0.0003591775894165039, 0.0003972947597503662, 0.0004354119300842285, 0.0004735291004180908, 0.0005116462707519531, 0.0005497634410858154, 0.0005878806114196777, 0.00062599778175354, 0.0006641149520874023, 0.0007022321224212646, 0.000740349292755127, 0.0007784664630889893, 0.0008165836334228516, 0.0008547008037567139, 0.0008928179740905762, 0.0009309351444244385, 0.0009690523147583008, 0.001007169485092163, 0.0010452866554260254, 0.0010834038257598877, 0.00112152099609375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 8.0, 10.0, 26.0, 45.0, 48.0, 76.0, 161.0, 250.0, 146.0, 92.0, 55.0, 32.0, 18.0, 12.0, 5.0, 11.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.208517440129071e-05, -9.006063919514418e-05, -8.803609671304002e-05, -8.601155423093587e-05, -8.398701902478933e-05, -8.19624838186428e-05, -7.993794133653864e-05, -7.791339885443449e-05, -7.588886364828795e-05, -7.386432844214141e-05, -7.183978596003726e-05, -6.981524347793311e-05, -6.779070827178657e-05, -6.576617306564003e-05, -6.374163058353588e-05, -6.171708810143173e-05, -5.969255289528519e-05, -5.7668014051159844e-05, -5.56434752070345e-05, -5.361893636290915e-05, -5.159439751878381e-05, -4.956985867465846e-05, -4.754531983053312e-05, -4.552078098640777e-05, -4.3496242142282426e-05, -4.147170329815708e-05, -3.9447164454031736e-05, -3.742262560990639e-05, -3.5398086765781045e-05, -3.33735479216557e-05, -3.1349009077530354e-05, -2.932447023340501e-05, -2.7299927751300856e-05, -2.527538890717551e-05, -2.3250850063050166e-05, -2.122631121892482e-05, -1.9201772374799475e-05, -1.717723353067413e-05, -1.5152694686548784e-05, -1.3128155842423439e-05, -1.1103616998298094e-05, -9.079078154172748e-06, -7.054539310047403e-06, -5.030000465922058e-06, -3.0054616217967123e-06, -9.80922777671367e-07, 1.0436160664539784e-06, 3.0681549105793238e-06, 5.092693754704669e-06, 7.1172325988300145e-06, 9.14177144295536e-06, 1.1166310287080705e-05, 1.319084913120605e-05, 1.5215387975331396e-05, 1.723992681945674e-05, 1.9264465663582087e-05, 2.1289004507707432e-05, 2.3313543351832777e-05, 2.5338082195958123e-05, 2.7362621040083468e-05, 2.9387159884208813e-05, 3.141169872833416e-05, 3.3436237572459504e-05, 3.546077641658485e-05, 3.7485315260710195e-05]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 6.0, 7.0, 9.0, 15.0, 8.0, 12.0, 19.0, 8.0, 26.0, 31.0, 23.0, 26.0, 39.0, 27.0, 38.0, 42.0, 28.0, 29.0, 43.0, 38.0, 49.0, 33.0, 36.0, 29.0, 45.0, 27.0, 50.0, 32.0, 18.0, 34.0, 15.0, 23.0, 23.0, 22.0, 14.0, 9.0, 11.0, 14.0, 1.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.485513687133789e-05, -2.406258136034012e-05, -2.3270025849342346e-05, -2.2477470338344574e-05, -2.1684914827346802e-05, -2.089235931634903e-05, -2.0099803805351257e-05, -1.9307248294353485e-05, -1.8514692783355713e-05, -1.772213727235794e-05, -1.692958176136017e-05, -1.6137026250362396e-05, -1.5344470739364624e-05, -1.4551915228366852e-05, -1.375935971736908e-05, -1.2966804206371307e-05, -1.2174248695373535e-05, -1.1381693184375763e-05, -1.058913767337799e-05, -9.796582162380219e-06, -9.004026651382446e-06, -8.211471140384674e-06, -7.418915629386902e-06, -6.62636011838913e-06, -5.833804607391357e-06, -5.041249096393585e-06, -4.248693585395813e-06, -3.4561380743980408e-06, -2.6635825634002686e-06, -1.8710270524024963e-06, -1.0784715414047241e-06, -2.859160304069519e-07, 5.066394805908203e-07, 1.2991949915885925e-06, 2.0917505025863647e-06, 2.884306013584137e-06, 3.676861524581909e-06, 4.469417035579681e-06, 5.261972546577454e-06, 6.054528057575226e-06, 6.847083568572998e-06, 7.63963907957077e-06, 8.432194590568542e-06, 9.224750101566315e-06, 1.0017305612564087e-05, 1.0809861123561859e-05, 1.1602416634559631e-05, 1.2394972145557404e-05, 1.3187527656555176e-05, 1.3980083167552948e-05, 1.477263867855072e-05, 1.5565194189548492e-05, 1.6357749700546265e-05, 1.7150305211544037e-05, 1.794286072254181e-05, 1.873541623353958e-05, 1.9527971744537354e-05, 2.0320527255535126e-05, 2.1113082766532898e-05, 2.190563827753067e-05, 2.2698193788528442e-05, 2.3490749299526215e-05, 2.4283304810523987e-05, 2.507586032152176e-05, 2.586841583251953e-05]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 9.0, 10.0, 18.0, 11.0, 19.0, 15.0, 29.0, 18.0, 40.0, 37.0, 38.0, 28.0, 43.0, 42.0, 53.0, 48.0, 48.0, 45.0, 42.0, 44.0, 39.0, 38.0, 48.0, 35.0, 28.0, 34.0, 19.0, 25.0, 23.0, 18.0, 14.0, 6.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.84375, -37.45068359375, -36.0576171875, -34.66455078125, -33.271484375, -31.87841796875, -30.4853515625, -29.09228515625, -27.69921875, -26.30615234375, -24.9130859375, -23.52001953125, -22.126953125, -20.73388671875, -19.3408203125, -17.94775390625, -16.5546875, -15.16162109375, -13.7685546875, -12.37548828125, -10.982421875, -9.58935546875, -8.1962890625, -6.80322265625, -5.41015625, -4.01708984375, -2.6240234375, -1.23095703125, 0.162109375, 1.55517578125, 2.9482421875, 4.34130859375, 5.734375, 7.12744140625, 8.5205078125, 9.91357421875, 11.306640625, 12.69970703125, 14.0927734375, 15.48583984375, 16.87890625, 18.27197265625, 19.6650390625, 21.05810546875, 22.451171875, 23.84423828125, 25.2373046875, 26.63037109375, 28.0234375, 29.41650390625, 30.8095703125, 32.20263671875, 33.595703125, 34.98876953125, 36.3818359375, 37.77490234375, 39.16796875, 40.56103515625, 41.9541015625, 43.34716796875, 44.740234375, 46.13330078125, 47.5263671875, 48.91943359375, 50.3125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 2.0, 13.0, 16.0, 16.0, 19.0, 31.0, 36.0, 76.0, 120.0, 185.0, 325.0, 554.0, 1190.0, 2268.0, 4898.0, 12892.0, 39410.0, 142655.0, 558944.0, 204445.0, 52006.0, 16658.0, 6154.0, 2705.0, 1273.0, 712.0, 353.0, 215.0, 130.0, 73.0, 55.0, 41.0, 30.0, 16.0, 9.0, 9.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.140625, -19.411376953125, -18.68212890625, -17.952880859375, -17.2236328125, -16.494384765625, -15.76513671875, -15.035888671875, -14.306640625, -13.577392578125, -12.84814453125, -12.118896484375, -11.3896484375, -10.660400390625, -9.93115234375, -9.201904296875, -8.47265625, -7.743408203125, -7.01416015625, -6.284912109375, -5.5556640625, -4.826416015625, -4.09716796875, -3.367919921875, -2.638671875, -1.909423828125, -1.18017578125, -0.450927734375, 0.2783203125, 1.007568359375, 1.73681640625, 2.466064453125, 3.1953125, 3.924560546875, 4.65380859375, 5.383056640625, 6.1123046875, 6.841552734375, 7.57080078125, 8.300048828125, 9.029296875, 9.758544921875, 10.48779296875, 11.217041015625, 11.9462890625, 12.675537109375, 13.40478515625, 14.134033203125, 14.86328125, 15.592529296875, 16.32177734375, 17.051025390625, 17.7802734375, 18.509521484375, 19.23876953125, 19.968017578125, 20.697265625, 21.426513671875, 22.15576171875, 22.885009765625, 23.6142578125, 24.343505859375, 25.07275390625, 25.802001953125, 26.53125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 7.0, 10.0, 9.0, 15.0, 5.0, 6.0, 21.0, 10.0, 23.0, 33.0, 31.0, 29.0, 32.0, 31.0, 39.0, 49.0, 37.0, 43.0, 132.0, 1929.0, 92.0, 56.0, 41.0, 39.0, 40.0, 38.0, 29.0, 23.0, 35.0, 23.0, 22.0, 18.0, 18.0, 12.0, 16.0, 11.0, 3.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-123.25, -119.560546875, -115.87109375, -112.181640625, -108.4921875, -104.802734375, -101.11328125, -97.423828125, -93.734375, -90.044921875, -86.35546875, -82.666015625, -78.9765625, -75.287109375, -71.59765625, -67.908203125, -64.21875, -60.529296875, -56.83984375, -53.150390625, -49.4609375, -45.771484375, -42.08203125, -38.392578125, -34.703125, -31.013671875, -27.32421875, -23.634765625, -19.9453125, -16.255859375, -12.56640625, -8.876953125, -5.1875, -1.498046875, 2.19140625, 5.880859375, 9.5703125, 13.259765625, 16.94921875, 20.638671875, 24.328125, 28.017578125, 31.70703125, 35.396484375, 39.0859375, 42.775390625, 46.46484375, 50.154296875, 53.84375, 57.533203125, 61.22265625, 64.912109375, 68.6015625, 72.291015625, 75.98046875, 79.669921875, 83.359375, 87.048828125, 90.73828125, 94.427734375, 98.1171875, 101.806640625, 105.49609375, 109.185546875, 112.875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 2.0, 6.0, 6.0, 5.0, 7.0, 10.0, 15.0, 20.0, 25.0, 22.0, 37.0, 38.0, 60.0, 62.0, 74.0, 113.0, 136.0, 172.0, 253.0, 496.0, 2205.0, 3085687.0, 53840.0, 1074.0, 353.0, 232.0, 176.0, 119.0, 66.0, 77.0, 66.0, 62.0, 46.0, 31.0, 19.0, 16.0, 12.0, 16.0, 11.0, 9.0, 9.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-272.25, -263.41796875, -254.5859375, -245.75390625, -236.921875, -228.08984375, -219.2578125, -210.42578125, -201.59375, -192.76171875, -183.9296875, -175.09765625, -166.265625, -157.43359375, -148.6015625, -139.76953125, -130.9375, -122.10546875, -113.2734375, -104.44140625, -95.609375, -86.77734375, -77.9453125, -69.11328125, -60.28125, -51.44921875, -42.6171875, -33.78515625, -24.953125, -16.12109375, -7.2890625, 1.54296875, 10.375, 19.20703125, 28.0390625, 36.87109375, 45.703125, 54.53515625, 63.3671875, 72.19921875, 81.03125, 89.86328125, 98.6953125, 107.52734375, 116.359375, 125.19140625, 134.0234375, 142.85546875, 151.6875, 160.51953125, 169.3515625, 178.18359375, 187.015625, 195.84765625, 204.6796875, 213.51171875, 222.34375, 231.17578125, 240.0078125, 248.83984375, 257.671875, 266.50390625, 275.3359375, 284.16796875, 293.0]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 171.0, 755.0, 90.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.08861541748047, -74.3661880493164, -60.64376449584961, -46.92134094238281, -33.19891357421875, -19.476486206054688, -5.754066467285156, 7.968360900878906, 21.69078826904297, 35.41321563720703, 49.13563919067383, 62.858062744140625, 76.58049011230469, 90.30291748046875, 104.02533721923828, 117.74776458740234, 131.47018432617188, 145.19261169433594, 158.9150390625, 172.637451171875, 186.35989379882812, 200.08230590820312, 213.8047332763672, 227.52716064453125, 241.24960327148438, 254.97203063964844, 268.6944580078125, 282.4168701171875, 296.1393127441406, 309.8617248535156, 323.58416748046875, 337.30657958984375, 351.02899169921875, 364.75140380859375, 378.4738464355469, 392.1962585449219, 405.918701171875, 419.64111328125, 433.363525390625, 447.0859680175781, 460.80841064453125, 474.53082275390625, 488.2532653808594, 501.9756774902344, 515.6981201171875, 529.4205322265625, 543.1429443359375, 556.8653564453125, 570.5877685546875, 584.3101806640625, 598.0325927734375, 611.7550659179688, 625.4774780273438, 639.1998901367188, 652.9223022460938, 666.644775390625, 680.3671875, 694.089599609375, 707.81201171875, 721.5344848632812, 735.2568969726562, 748.9793090820312, 762.7017211914062, 776.4241943359375, 790.1466064453125]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 7.0, 3.0, 6.0, 10.0, 10.0, 10.0, 6.0, 16.0, 21.0, 24.0, 21.0, 23.0, 25.0, 38.0, 33.0, 32.0, 40.0, 43.0, 43.0, 32.0, 42.0, 49.0, 44.0, 49.0, 46.0, 40.0, 42.0, 29.0, 35.0, 35.0, 21.0, 25.0, 21.0, 8.0, 12.0, 10.0, 7.0, 11.0, 11.0, 6.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-336.6199645996094, -326.78619384765625, -316.95245361328125, -307.1186828613281, -297.284912109375, -287.451171875, -277.6174011230469, -267.78363037109375, -257.94989013671875, -248.1161346435547, -238.28237915039062, -228.4486083984375, -218.61485290527344, -208.78109741210938, -198.94732666015625, -189.1135711669922, -179.27981567382812, -169.44606018066406, -159.6123046875, -149.77853393554688, -139.9447784423828, -130.11102294921875, -120.27725982666016, -110.44349670410156, -100.6097412109375, -90.77598571777344, -80.94222259521484, -71.10845947265625, -61.27470397949219, -51.44094467163086, -41.60718536376953, -31.773422241210938, -21.939697265625, -12.105937957763672, -2.2721786499023438, 7.561580657958984, 17.395339965820312, 27.22909927368164, 37.06285858154297, 46.89662170410156, 56.730377197265625, 66.56413269042969, 76.39789581298828, 86.23165893554688, 96.06541442871094, 105.899169921875, 115.7329330444336, 125.56669616699219, 135.40045166015625, 145.2342071533203, 155.06796264648438, 164.9017333984375, 174.73548889160156, 184.56924438476562, 194.40301513671875, 204.2367706298828, 214.07052612304688, 223.90428161621094, 233.738037109375, 243.57180786132812, 253.4055633544922, 263.23931884765625, 273.0730895996094, 282.9068603515625, 292.7406005859375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 2.0, 12.0, 9.0, 15.0, 12.0, 17.0, 19.0, 26.0, 32.0, 34.0, 38.0, 35.0, 30.0, 46.0, 40.0, 45.0, 62.0, 44.0, 44.0, 44.0, 41.0, 39.0, 44.0, 43.0, 36.0, 28.0, 28.0, 22.0, 22.0, 30.0, 13.0, 13.0, 8.0, 8.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.34375, -37.92138671875, -36.4990234375, -35.07666015625, -33.654296875, -32.23193359375, -30.8095703125, -29.38720703125, -27.96484375, -26.54248046875, -25.1201171875, -23.69775390625, -22.275390625, -20.85302734375, -19.4306640625, -18.00830078125, -16.5859375, -15.16357421875, -13.7412109375, -12.31884765625, -10.896484375, -9.47412109375, -8.0517578125, -6.62939453125, -5.20703125, -3.78466796875, -2.3623046875, -0.93994140625, 0.482421875, 1.90478515625, 3.3271484375, 4.74951171875, 6.171875, 7.59423828125, 9.0166015625, 10.43896484375, 11.861328125, 13.28369140625, 14.7060546875, 16.12841796875, 17.55078125, 18.97314453125, 20.3955078125, 21.81787109375, 23.240234375, 24.66259765625, 26.0849609375, 27.50732421875, 28.9296875, 30.35205078125, 31.7744140625, 33.19677734375, 34.619140625, 36.04150390625, 37.4638671875, 38.88623046875, 40.30859375, 41.73095703125, 43.1533203125, 44.57568359375, 45.998046875, 47.42041015625, 48.8427734375, 50.26513671875, 51.6875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 6.0, 19.0, 16.0, 29.0, 28.0, 38.0, 67.0, 78.0, 110.0, 175.0, 219.0, 346.0, 450.0, 690.0, 1039.0, 1605.0, 2485.0, 4243.0, 7760.0, 18114.0, 105513.0, 2385307.0, 1556755.0, 76363.0, 14764.0, 7132.0, 3921.0, 2317.0, 1498.0, 953.0, 664.0, 413.0, 351.0, 228.0, 158.0, 113.0, 79.0, 65.0, 50.0, 42.0, 18.0, 17.0, 16.0, 7.0, 8.0, 3.0, 5.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-86.375, -83.283203125, -80.19140625, -77.099609375, -74.0078125, -70.916015625, -67.82421875, -64.732421875, -61.640625, -58.548828125, -55.45703125, -52.365234375, -49.2734375, -46.181640625, -43.08984375, -39.998046875, -36.90625, -33.814453125, -30.72265625, -27.630859375, -24.5390625, -21.447265625, -18.35546875, -15.263671875, -12.171875, -9.080078125, -5.98828125, -2.896484375, 0.1953125, 3.287109375, 6.37890625, 9.470703125, 12.5625, 15.654296875, 18.74609375, 21.837890625, 24.9296875, 28.021484375, 31.11328125, 34.205078125, 37.296875, 40.388671875, 43.48046875, 46.572265625, 49.6640625, 52.755859375, 55.84765625, 58.939453125, 62.03125, 65.123046875, 68.21484375, 71.306640625, 74.3984375, 77.490234375, 80.58203125, 83.673828125, 86.765625, 89.857421875, 92.94921875, 96.041015625, 99.1328125, 102.224609375, 105.31640625, 108.408203125, 111.5]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 11.0, 7.0, 21.0, 29.0, 35.0, 44.0, 56.0, 122.0, 282.0, 747.0, 1340.0, 737.0, 267.0, 118.0, 71.0, 33.0, 37.0, 24.0, 24.0, 10.0, 9.0, 8.0, 8.0, 4.0, 5.0, 7.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.6875, -90.5087890625, -87.330078125, -84.1513671875, -80.97265625, -77.7939453125, -74.615234375, -71.4365234375, -68.2578125, -65.0791015625, -61.900390625, -58.7216796875, -55.54296875, -52.3642578125, -49.185546875, -46.0068359375, -42.828125, -39.6494140625, -36.470703125, -33.2919921875, -30.11328125, -26.9345703125, -23.755859375, -20.5771484375, -17.3984375, -14.2197265625, -11.041015625, -7.8623046875, -4.68359375, -1.5048828125, 1.673828125, 4.8525390625, 8.03125, 11.2099609375, 14.388671875, 17.5673828125, 20.74609375, 23.9248046875, 27.103515625, 30.2822265625, 33.4609375, 36.6396484375, 39.818359375, 42.9970703125, 46.17578125, 49.3544921875, 52.533203125, 55.7119140625, 58.890625, 62.0693359375, 65.248046875, 68.4267578125, 71.60546875, 74.7841796875, 77.962890625, 81.1416015625, 84.3203125, 87.4990234375, 90.677734375, 93.8564453125, 97.03515625, 100.2138671875, 103.392578125, 106.5712890625, 109.75]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 8.0, 12.0, 17.0, 24.0, 23.0, 68.0, 147.0, 324.0, 781.0, 2211.0, 8742.0, 70267.0, 3993676.0, 103162.0, 10700.0, 2608.0, 850.0, 328.0, 140.0, 87.0, 41.0, 17.0, 13.0, 8.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-394.25, -383.1640625, -372.078125, -360.9921875, -349.90625, -338.8203125, -327.734375, -316.6484375, -305.5625, -294.4765625, -283.390625, -272.3046875, -261.21875, -250.1328125, -239.046875, -227.9609375, -216.875, -205.7890625, -194.703125, -183.6171875, -172.53125, -161.4453125, -150.359375, -139.2734375, -128.1875, -117.1015625, -106.015625, -94.9296875, -83.84375, -72.7578125, -61.671875, -50.5859375, -39.5, -28.4140625, -17.328125, -6.2421875, 4.84375, 15.9296875, 27.015625, 38.1015625, 49.1875, 60.2734375, 71.359375, 82.4453125, 93.53125, 104.6171875, 115.703125, 126.7890625, 137.875, 148.9609375, 160.046875, 171.1328125, 182.21875, 193.3046875, 204.390625, 215.4765625, 226.5625, 237.6484375, 248.734375, 259.8203125, 270.90625, 281.9921875, 293.078125, 304.1640625, 315.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 15.0, 26.0, 34.0, 67.0, 99.0, 160.0, 204.0, 154.0, 92.0, 52.0, 30.0, 24.0, 13.0, 9.0, 5.0, 1.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-410.4713439941406, -394.8402404785156, -379.2091369628906, -363.5780334472656, -347.9469299316406, -332.3158264160156, -316.6847229003906, -301.0536193847656, -285.4225158691406, -269.7914123535156, -254.16030883789062, -238.52920532226562, -222.89810180664062, -207.26699829101562, -191.63589477539062, -176.00479125976562, -160.37368774414062, -144.74258422851562, -129.11148071289062, -113.48037719726562, -97.84927368164062, -82.21817016601562, -66.58706665039062, -50.955963134765625, -35.324859619140625, -19.693756103515625, -4.062652587890625, 11.568450927734375, 27.199554443359375, 42.830657958984375, 58.461761474609375, 74.09286499023438, 89.7239990234375, 105.3551025390625, 120.9862060546875, 136.6173095703125, 152.2484130859375, 167.8795166015625, 183.5106201171875, 199.1417236328125, 214.7728271484375, 230.4039306640625, 246.0350341796875, 261.6661376953125, 277.2972412109375, 292.9283447265625, 308.5594482421875, 324.1905517578125, 339.8216552734375, 355.4527587890625, 371.0838623046875, 386.7149658203125, 402.3460693359375, 417.9771728515625, 433.6082763671875, 449.2393798828125, 464.8704833984375, 480.5015869140625, 496.1326904296875, 511.7637939453125, 527.3948974609375, 543.0260009765625, 558.6571044921875, 574.2882080078125, 589.9193115234375]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 14.0, 14.0, 9.0, 8.0, 19.0, 24.0, 13.0, 16.0, 20.0, 25.0, 37.0, 26.0, 34.0, 28.0, 37.0, 32.0, 40.0, 39.0, 37.0, 39.0, 35.0, 28.0, 21.0, 35.0, 29.0, 37.0, 25.0, 29.0, 27.0, 22.0, 27.0, 19.0, 26.0, 20.0, 12.0, 10.0, 18.0, 10.0, 6.0, 11.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-178.1181640625, -172.29171752929688, -166.4652557373047, -160.63880920410156, -154.81236267089844, -148.98590087890625, -143.15945434570312, -137.3330078125, -131.5065460205078, -125.68009185791016, -119.85364532470703, -114.02719116210938, -108.20073699951172, -102.37428283691406, -96.54783630371094, -90.72138214111328, -84.89493560791016, -79.0684814453125, -73.24203491210938, -67.41558074951172, -61.58912658691406, -55.76267623901367, -49.93622589111328, -44.109771728515625, -38.283321380615234, -32.456871032714844, -26.630416870117188, -20.803966522216797, -14.977514266967773, -9.15106201171875, -3.3246116638183594, 2.501842498779297, 8.328292846679688, 14.154745101928711, 19.981197357177734, 25.807647705078125, 31.63409996032715, 37.46055221557617, 43.28700256347656, 49.11345672607422, 54.93990707397461, 60.766357421875, 66.59281158447266, 72.41926574707031, 78.24571228027344, 84.0721664428711, 89.89862060546875, 95.72506713867188, 101.55152130126953, 107.37797546386719, 113.20442199707031, 119.03087615966797, 124.85733032226562, 130.68377685546875, 136.51022338867188, 142.33668518066406, 148.1631317138672, 153.9895782470703, 159.8160400390625, 165.64248657226562, 171.46893310546875, 177.29539489746094, 183.12184143066406, 188.94830322265625, 194.77474975585938]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 7.0, 8.0, 6.0, 16.0, 18.0, 27.0, 21.0, 27.0, 24.0, 36.0, 29.0, 40.0, 43.0, 40.0, 51.0, 46.0, 48.0, 39.0, 46.0, 58.0, 41.0, 33.0, 42.0, 39.0, 26.0, 24.0, 20.0, 29.0, 20.0, 14.0, 20.0, 14.0, 9.0, 7.0, 10.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.625, -37.19775390625, -35.7705078125, -34.34326171875, -32.916015625, -31.48876953125, -30.0615234375, -28.63427734375, -27.20703125, -25.77978515625, -24.3525390625, -22.92529296875, -21.498046875, -20.07080078125, -18.6435546875, -17.21630859375, -15.7890625, -14.36181640625, -12.9345703125, -11.50732421875, -10.080078125, -8.65283203125, -7.2255859375, -5.79833984375, -4.37109375, -2.94384765625, -1.5166015625, -0.08935546875, 1.337890625, 2.76513671875, 4.1923828125, 5.61962890625, 7.046875, 8.47412109375, 9.9013671875, 11.32861328125, 12.755859375, 14.18310546875, 15.6103515625, 17.03759765625, 18.46484375, 19.89208984375, 21.3193359375, 22.74658203125, 24.173828125, 25.60107421875, 27.0283203125, 28.45556640625, 29.8828125, 31.31005859375, 32.7373046875, 34.16455078125, 35.591796875, 37.01904296875, 38.4462890625, 39.87353515625, 41.30078125, 42.72802734375, 44.1552734375, 45.58251953125, 47.009765625, 48.43701171875, 49.8642578125, 51.29150390625, 52.71875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 5.0, 8.0, 15.0, 19.0, 23.0, 36.0, 49.0, 78.0, 101.0, 187.0, 253.0, 363.0, 608.0, 929.0, 1567.0, 2356.0, 3827.0, 6118.0, 9848.0, 16081.0, 26410.0, 42920.0, 75832.0, 154373.0, 355772.0, 159111.0, 77350.0, 44301.0, 26421.0, 16633.0, 10220.0, 6292.0, 3812.0, 2355.0, 1535.0, 973.0, 643.0, 379.0, 276.0, 190.0, 101.0, 59.0, 47.0, 18.0, 17.0, 16.0, 9.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.6943359375, -1.6405792236328125, -1.586822509765625, -1.5330657958984375, -1.47930908203125, -1.4255523681640625, -1.371795654296875, -1.3180389404296875, -1.2642822265625, -1.2105255126953125, -1.156768798828125, -1.1030120849609375, -1.04925537109375, -0.9954986572265625, -0.941741943359375, -0.8879852294921875, -0.834228515625, -0.7804718017578125, -0.726715087890625, -0.6729583740234375, -0.61920166015625, -0.5654449462890625, -0.511688232421875, -0.4579315185546875, -0.4041748046875, -0.3504180908203125, -0.296661376953125, -0.2429046630859375, -0.18914794921875, -0.1353912353515625, -0.081634521484375, -0.0278778076171875, 0.02587890625, 0.0796356201171875, 0.133392333984375, 0.1871490478515625, 0.24090576171875, 0.2946624755859375, 0.348419189453125, 0.4021759033203125, 0.4559326171875, 0.5096893310546875, 0.563446044921875, 0.6172027587890625, 0.67095947265625, 0.7247161865234375, 0.778472900390625, 0.8322296142578125, 0.885986328125, 0.9397430419921875, 0.993499755859375, 1.0472564697265625, 1.10101318359375, 1.1547698974609375, 1.208526611328125, 1.2622833251953125, 1.3160400390625, 1.3697967529296875, 1.423553466796875, 1.4773101806640625, 1.53106689453125, 1.5848236083984375, 1.638580322265625, 1.6923370361328125, 1.74609375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 8.0, 14.0, 20.0, 9.0, 18.0, 18.0, 25.0, 34.0, 25.0, 26.0, 37.0, 31.0, 45.0, 42.0, 43.0, 43.0, 43.0, 1066.0, 49.0, 30.0, 43.0, 34.0, 47.0, 25.0, 33.0, 26.0, 31.0, 26.0, 22.0, 15.0, 17.0, 14.0, 10.0, 3.0, 13.0, 6.0, 1.0, 4.0, 2.0, 5.0, 5.0, 0.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.8125, -22.92431640625, -22.0361328125, -21.14794921875, -20.259765625, -19.37158203125, -18.4833984375, -17.59521484375, -16.70703125, -15.81884765625, -14.9306640625, -14.04248046875, -13.154296875, -12.26611328125, -11.3779296875, -10.48974609375, -9.6015625, -8.71337890625, -7.8251953125, -6.93701171875, -6.048828125, -5.16064453125, -4.2724609375, -3.38427734375, -2.49609375, -1.60791015625, -0.7197265625, 0.16845703125, 1.056640625, 1.94482421875, 2.8330078125, 3.72119140625, 4.609375, 5.49755859375, 6.3857421875, 7.27392578125, 8.162109375, 9.05029296875, 9.9384765625, 10.82666015625, 11.71484375, 12.60302734375, 13.4912109375, 14.37939453125, 15.267578125, 16.15576171875, 17.0439453125, 17.93212890625, 18.8203125, 19.70849609375, 20.5966796875, 21.48486328125, 22.373046875, 23.26123046875, 24.1494140625, 25.03759765625, 25.92578125, 26.81396484375, 27.7021484375, 28.59033203125, 29.478515625, 30.36669921875, 31.2548828125, 32.14306640625, 33.03125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 5.0, 12.0, 25.0, 25.0, 50.0, 64.0, 92.0, 143.0, 206.0, 325.0, 475.0, 773.0, 1169.0, 1751.0, 2857.0, 4215.0, 6679.0, 10753.0, 17261.0, 29032.0, 48966.0, 87404.0, 177258.0, 1395154.0, 135280.0, 71662.0, 40571.0, 24376.0, 15096.0, 9248.0, 5886.0, 3629.0, 2326.0, 1467.0, 1028.0, 582.0, 427.0, 300.0, 172.0, 124.0, 90.0, 60.0, 39.0, 26.0, 22.0, 9.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3525390625, -1.310699462890625, -1.26885986328125, -1.227020263671875, -1.1851806640625, -1.143341064453125, -1.10150146484375, -1.059661865234375, -1.017822265625, -0.975982666015625, -0.93414306640625, -0.892303466796875, -0.8504638671875, -0.808624267578125, -0.76678466796875, -0.724945068359375, -0.68310546875, -0.641265869140625, -0.59942626953125, -0.557586669921875, -0.5157470703125, -0.473907470703125, -0.43206787109375, -0.390228271484375, -0.348388671875, -0.306549072265625, -0.26470947265625, -0.222869873046875, -0.1810302734375, -0.139190673828125, -0.09735107421875, -0.055511474609375, -0.013671875, 0.028167724609375, 0.07000732421875, 0.111846923828125, 0.1536865234375, 0.195526123046875, 0.23736572265625, 0.279205322265625, 0.321044921875, 0.362884521484375, 0.40472412109375, 0.446563720703125, 0.4884033203125, 0.530242919921875, 0.57208251953125, 0.613922119140625, 0.65576171875, 0.697601318359375, 0.73944091796875, 0.781280517578125, 0.8231201171875, 0.864959716796875, 0.90679931640625, 0.948638916015625, 0.990478515625, 1.032318115234375, 1.07415771484375, 1.115997314453125, 1.1578369140625, 1.199676513671875, 1.24151611328125, 1.283355712890625, 1.3251953125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 1.0, 8.0, 6.0, 8.0, 17.0, 22.0, 24.0, 37.0, 47.0, 58.0, 89.0, 89.0, 102.0, 104.0, 97.0, 60.0, 55.0, 51.0, 29.0, 25.0, 13.0, 15.0, 13.0, 12.0, 7.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.649991989135742e-05, -9.365379810333252e-05, -9.080767631530762e-05, -8.796155452728271e-05, -8.511543273925781e-05, -8.226931095123291e-05, -7.942318916320801e-05, -7.65770673751831e-05, -7.37309455871582e-05, -7.08848237991333e-05, -6.80387020111084e-05, -6.51925802230835e-05, -6.23464584350586e-05, -5.950033664703369e-05, -5.665421485900879e-05, -5.380809307098389e-05, -5.0961971282958984e-05, -4.811584949493408e-05, -4.526972770690918e-05, -4.242360591888428e-05, -3.9577484130859375e-05, -3.673136234283447e-05, -3.388524055480957e-05, -3.103911876678467e-05, -2.8192996978759766e-05, -2.5346875190734863e-05, -2.250075340270996e-05, -1.965463161468506e-05, -1.6808509826660156e-05, -1.3962388038635254e-05, -1.1116266250610352e-05, -8.27014446258545e-06, -5.424022674560547e-06, -2.5779008865356445e-06, 2.682209014892578e-07, 3.11434268951416e-06, 5.9604644775390625e-06, 8.806586265563965e-06, 1.1652708053588867e-05, 1.449882984161377e-05, 1.7344951629638672e-05, 2.0191073417663574e-05, 2.3037195205688477e-05, 2.588331699371338e-05, 2.872943878173828e-05, 3.1575560569763184e-05, 3.4421682357788086e-05, 3.726780414581299e-05, 4.011392593383789e-05, 4.296004772186279e-05, 4.5806169509887695e-05, 4.86522912979126e-05, 5.14984130859375e-05, 5.43445348739624e-05, 5.7190656661987305e-05, 6.003677845001221e-05, 6.288290023803711e-05, 6.572902202606201e-05, 6.857514381408691e-05, 7.142126560211182e-05, 7.426738739013672e-05, 7.711350917816162e-05, 7.995963096618652e-05, 8.280575275421143e-05, 8.565187454223633e-05]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 2.0, 7.0, 10.0, 14.0, 15.0, 23.0, 31.0, 47.0, 64.0, 113.0, 213.0, 786.0, 7019.0, 252675.0, 774437.0, 11342.0, 1115.0, 283.0, 106.0, 65.0, 50.0, 37.0, 31.0, 13.0, 17.0, 10.0, 7.0, 0.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012454986572265625, -0.0012041032314300537, -0.001162707805633545, -0.0011213123798370361, -0.0010799169540405273, -0.0010385215282440186, -0.0009971261024475098, -0.000955730676651001, -0.0009143352508544922, -0.0008729398250579834, -0.0008315443992614746, -0.0007901489734649658, -0.000748753547668457, -0.0007073581218719482, -0.0006659626960754395, -0.0006245672702789307, -0.0005831718444824219, -0.0005417764186859131, -0.0005003809928894043, -0.0004589855670928955, -0.0004175901412963867, -0.00037619471549987793, -0.00033479928970336914, -0.00029340386390686035, -0.00025200843811035156, -0.00021061301231384277, -0.00016921758651733398, -0.0001278221607208252, -8.64267349243164e-05, -4.503130912780762e-05, -3.635883331298828e-06, 3.775954246520996e-05, 7.915496826171875e-05, 0.00012055039405822754, 0.00016194581985473633, 0.00020334124565124512, 0.0002447366714477539, 0.0002861320972442627, 0.0003275275230407715, 0.0003689229488372803, 0.00041031837463378906, 0.00045171380043029785, 0.0004931092262268066, 0.0005345046520233154, 0.0005759000778198242, 0.000617295503616333, 0.0006586909294128418, 0.0007000863552093506, 0.0007414817810058594, 0.0007828772068023682, 0.000824272632598877, 0.0008656680583953857, 0.0009070634841918945, 0.0009484589099884033, 0.0009898543357849121, 0.001031249761581421, 0.0010726451873779297, 0.0011140406131744385, 0.0011554360389709473, 0.001196831464767456, 0.0012382268905639648, 0.0012796223163604736, 0.0013210177421569824, 0.0013624131679534912, 0.00140380859375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 12.0, 18.0, 34.0, 49.0, 122.0, 287.0, 240.0, 121.0, 59.0, 28.0, 17.0, 11.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.24573736381717e-05, -3.8906138797756284e-05, -3.5354907595319673e-05, -3.180367639288306e-05, -2.8252441552467644e-05, -2.470120853104163e-05, -2.1149975509615615e-05, -1.75987424881896e-05, -1.4047509466763586e-05, -1.0496276445337571e-05, -6.945043423911557e-06, -3.393810402485542e-06, 1.574226189404726e-07, 3.708655640366487e-06, 7.259888661792502e-06, 1.0811121683218516e-05, 1.4362354704644531e-05, 1.7913587726070546e-05, 2.146482074749656e-05, 2.5016053768922575e-05, 2.856728679034859e-05, 3.211852163076401e-05, 3.566975283320062e-05, 3.922098403563723e-05, 4.277221887605265e-05, 4.6323453716468066e-05, 4.987468491890468e-05, 5.342591612134129e-05, 5.6977150961756706e-05, 6.0528385802172124e-05, 6.407962064258754e-05, 6.763084820704535e-05, 7.118209032341838e-05, 7.47333251638338e-05, 7.828456000424922e-05, 8.183578756870702e-05, 8.538702240912244e-05, 8.893825724953786e-05, 9.248948481399566e-05, 9.604071965441108e-05, 9.95919544948265e-05, 0.00010314318933524191, 0.00010669442417565733, 0.00011024565174011514, 0.00011379688658053055, 0.00011734812142094597, 0.00012089934898540378, 0.0001244505838258192, 0.0001280018186662346, 0.00013155305350665003, 0.00013510428834706545, 0.00013865552318748087, 0.00014220675802789629, 0.00014575797831639647, 0.0001493092131568119, 0.0001528604479972273, 0.00015641168283764273, 0.00015996291767805815, 0.00016351415251847357, 0.00016706538735888898, 0.00017061660764738917, 0.0001741678424878046, 0.00017771907732822, 0.00018127031216863543, 0.00018482154700905085]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 4.0, 5.0, 13.0, 12.0, 11.0, 18.0, 18.0, 11.0, 14.0, 17.0, 35.0, 10.0, 28.0, 32.0, 21.0, 45.0, 42.0, 39.0, 32.0, 43.0, 57.0, 45.0, 32.0, 35.0, 37.0, 44.0, 32.0, 29.0, 36.0, 31.0, 30.0, 22.0, 19.0, 20.0, 16.0, 22.0, 9.0, 5.0, 10.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-3.4868717193603516e-05, -3.383960574865341e-05, -3.281049430370331e-05, -3.1781382858753204e-05, -3.07522714138031e-05, -2.9723159968852997e-05, -2.8694048523902893e-05, -2.766493707895279e-05, -2.6635825634002686e-05, -2.5606714189052582e-05, -2.4577602744102478e-05, -2.3548491299152374e-05, -2.251937985420227e-05, -2.1490268409252167e-05, -2.0461156964302063e-05, -1.943204551935196e-05, -1.8402934074401855e-05, -1.7373822629451752e-05, -1.6344711184501648e-05, -1.5315599739551544e-05, -1.428648829460144e-05, -1.3257376849651337e-05, -1.2228265404701233e-05, -1.1199153959751129e-05, -1.0170042514801025e-05, -9.140931069850922e-06, -8.111819624900818e-06, -7.082708179950714e-06, -6.05359673500061e-06, -5.024485290050507e-06, -3.995373845100403e-06, -2.966262400150299e-06, -1.9371509552001953e-06, -9.080395102500916e-07, 1.210719347000122e-07, 1.150183379650116e-06, 2.1792948246002197e-06, 3.2084062695503235e-06, 4.237517714500427e-06, 5.266629159450531e-06, 6.295740604400635e-06, 7.3248520493507385e-06, 8.353963494300842e-06, 9.383074939250946e-06, 1.041218638420105e-05, 1.1441297829151154e-05, 1.2470409274101257e-05, 1.3499520719051361e-05, 1.4528632164001465e-05, 1.555774360895157e-05, 1.6586855053901672e-05, 1.7615966498851776e-05, 1.864507794380188e-05, 1.9674189388751984e-05, 2.0703300833702087e-05, 2.173241227865219e-05, 2.2761523723602295e-05, 2.37906351685524e-05, 2.4819746613502502e-05, 2.5848858058452606e-05, 2.687796950340271e-05, 2.7907080948352814e-05, 2.8936192393302917e-05, 2.996530383825302e-05, 3.0994415283203125e-05]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 7.0, 8.0, 6.0, 16.0, 18.0, 27.0, 21.0, 27.0, 24.0, 36.0, 29.0, 40.0, 43.0, 40.0, 51.0, 46.0, 48.0, 39.0, 46.0, 58.0, 41.0, 33.0, 42.0, 39.0, 26.0, 24.0, 20.0, 29.0, 20.0, 14.0, 20.0, 14.0, 9.0, 7.0, 10.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.625, -37.19775390625, -35.7705078125, -34.34326171875, -32.916015625, -31.48876953125, -30.0615234375, -28.63427734375, -27.20703125, -25.77978515625, -24.3525390625, -22.92529296875, -21.498046875, -20.07080078125, -18.6435546875, -17.21630859375, -15.7890625, -14.36181640625, -12.9345703125, -11.50732421875, -10.080078125, -8.65283203125, -7.2255859375, -5.79833984375, -4.37109375, -2.94384765625, -1.5166015625, -0.08935546875, 1.337890625, 2.76513671875, 4.1923828125, 5.61962890625, 7.046875, 8.47412109375, 9.9013671875, 11.32861328125, 12.755859375, 14.18310546875, 15.6103515625, 17.03759765625, 18.46484375, 19.89208984375, 21.3193359375, 22.74658203125, 24.173828125, 25.60107421875, 27.0283203125, 28.45556640625, 29.8828125, 31.31005859375, 32.7373046875, 34.16455078125, 35.591796875, 37.01904296875, 38.4462890625, 39.87353515625, 41.30078125, 42.72802734375, 44.1552734375, 45.58251953125, 47.009765625, 48.43701171875, 49.8642578125, 51.29150390625, 52.71875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 4.0, 8.0, 13.0, 11.0, 25.0, 18.0, 33.0, 35.0, 60.0, 70.0, 95.0, 133.0, 202.0, 377.0, 659.0, 1389.0, 3386.0, 12497.0, 100422.0, 799251.0, 109908.0, 13128.0, 3634.0, 1413.0, 680.0, 376.0, 206.0, 134.0, 96.0, 71.0, 48.0, 36.0, 40.0, 27.0, 18.0, 11.0, 18.0, 5.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.6875, -47.8818359375, -46.076171875, -44.2705078125, -42.46484375, -40.6591796875, -38.853515625, -37.0478515625, -35.2421875, -33.4365234375, -31.630859375, -29.8251953125, -28.01953125, -26.2138671875, -24.408203125, -22.6025390625, -20.796875, -18.9912109375, -17.185546875, -15.3798828125, -13.57421875, -11.7685546875, -9.962890625, -8.1572265625, -6.3515625, -4.5458984375, -2.740234375, -0.9345703125, 0.87109375, 2.6767578125, 4.482421875, 6.2880859375, 8.09375, 9.8994140625, 11.705078125, 13.5107421875, 15.31640625, 17.1220703125, 18.927734375, 20.7333984375, 22.5390625, 24.3447265625, 26.150390625, 27.9560546875, 29.76171875, 31.5673828125, 33.373046875, 35.1787109375, 36.984375, 38.7900390625, 40.595703125, 42.4013671875, 44.20703125, 46.0126953125, 47.818359375, 49.6240234375, 51.4296875, 53.2353515625, 55.041015625, 56.8466796875, 58.65234375, 60.4580078125, 62.263671875, 64.0693359375, 65.875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 7.0, 6.0, 5.0, 8.0, 4.0, 12.0, 11.0, 22.0, 24.0, 26.0, 19.0, 13.0, 24.0, 25.0, 30.0, 34.0, 30.0, 39.0, 36.0, 42.0, 49.0, 313.0, 1759.0, 51.0, 42.0, 37.0, 38.0, 41.0, 38.0, 34.0, 24.0, 19.0, 31.0, 17.0, 19.0, 11.0, 13.0, 14.0, 19.0, 11.0, 7.0, 12.0, 6.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0], "bins": [-104.0, -100.8623046875, -97.724609375, -94.5869140625, -91.44921875, -88.3115234375, -85.173828125, -82.0361328125, -78.8984375, -75.7607421875, -72.623046875, -69.4853515625, -66.34765625, -63.2099609375, -60.072265625, -56.9345703125, -53.796875, -50.6591796875, -47.521484375, -44.3837890625, -41.24609375, -38.1083984375, -34.970703125, -31.8330078125, -28.6953125, -25.5576171875, -22.419921875, -19.2822265625, -16.14453125, -13.0068359375, -9.869140625, -6.7314453125, -3.59375, -0.4560546875, 2.681640625, 5.8193359375, 8.95703125, 12.0947265625, 15.232421875, 18.3701171875, 21.5078125, 24.6455078125, 27.783203125, 30.9208984375, 34.05859375, 37.1962890625, 40.333984375, 43.4716796875, 46.609375, 49.7470703125, 52.884765625, 56.0224609375, 59.16015625, 62.2978515625, 65.435546875, 68.5732421875, 71.7109375, 74.8486328125, 77.986328125, 81.1240234375, 84.26171875, 87.3994140625, 90.537109375, 93.6748046875, 96.8125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 3.0, 1.0, 6.0, 13.0, 15.0, 10.0, 18.0, 20.0, 23.0, 17.0, 35.0, 42.0, 48.0, 65.0, 66.0, 86.0, 146.0, 223.0, 379.0, 656.0, 1395.0, 6298.0, 2947743.0, 181947.0, 3673.0, 1149.0, 557.0, 286.0, 204.0, 108.0, 90.0, 81.0, 54.0, 24.0, 40.0, 42.0, 34.0, 22.0, 14.0, 15.0, 9.0, 13.0, 4.0, 10.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-192.125, -185.900390625, -179.67578125, -173.451171875, -167.2265625, -161.001953125, -154.77734375, -148.552734375, -142.328125, -136.103515625, -129.87890625, -123.654296875, -117.4296875, -111.205078125, -104.98046875, -98.755859375, -92.53125, -86.306640625, -80.08203125, -73.857421875, -67.6328125, -61.408203125, -55.18359375, -48.958984375, -42.734375, -36.509765625, -30.28515625, -24.060546875, -17.8359375, -11.611328125, -5.38671875, 0.837890625, 7.0625, 13.287109375, 19.51171875, 25.736328125, 31.9609375, 38.185546875, 44.41015625, 50.634765625, 56.859375, 63.083984375, 69.30859375, 75.533203125, 81.7578125, 87.982421875, 94.20703125, 100.431640625, 106.65625, 112.880859375, 119.10546875, 125.330078125, 131.5546875, 137.779296875, 144.00390625, 150.228515625, 156.453125, 162.677734375, 168.90234375, 175.126953125, 181.3515625, 187.576171875, 193.80078125, 200.025390625, 206.25]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 11.0, 5.0, 22.0, 35.0, 56.0, 103.0, 164.0, 196.0, 164.0, 103.0, 57.0, 46.0, 27.0, 7.0, 8.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.73131561279297, -98.40980529785156, -95.08828735351562, -91.76677703857422, -88.44525909423828, -85.12374877929688, -81.80223083496094, -78.48072052001953, -75.15921020507812, -71.83769989013672, -68.51618194580078, -65.19467163085938, -61.87315368652344, -58.55164337158203, -55.23012924194336, -51.90861511230469, -48.58709716796875, -45.26558303833008, -41.944068908691406, -38.62255859375, -35.30104064941406, -31.979528427124023, -28.658016204833984, -25.336502075195312, -22.01498794555664, -18.69347381591797, -15.371960639953613, -12.050447463989258, -8.728933334350586, -5.407419204711914, -2.085906982421875, 1.2356071472167969, 4.55712890625, 7.878642559051514, 11.200156211853027, 14.521669387817383, 17.843183517456055, 21.164697647094727, 24.486209869384766, 27.807723999023438, 31.12923812866211, 34.45075225830078, 37.77226638793945, 41.093780517578125, 44.41529083251953, 47.73680877685547, 51.058319091796875, 54.37983322143555, 57.70134735107422, 61.02286148071289, 64.34437561035156, 67.66588592529297, 70.9874038696289, 74.30891418457031, 77.63043212890625, 80.95194244384766, 84.27345275878906, 87.59496307373047, 90.9164810180664, 94.23799133300781, 97.55950927734375, 100.88101959228516, 104.20252990722656, 107.5240478515625, 110.84556579589844]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 8.0, 7.0, 9.0, 13.0, 11.0, 19.0, 25.0, 30.0, 15.0, 33.0, 33.0, 39.0, 38.0, 41.0, 53.0, 52.0, 52.0, 46.0, 51.0, 48.0, 49.0, 48.0, 52.0, 32.0, 33.0, 35.0, 20.0, 15.0, 18.0, 23.0, 12.0, 13.0, 7.0, 3.0, 11.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-435.68597412109375, -423.80145263671875, -411.91693115234375, -400.03240966796875, -388.14788818359375, -376.2633361816406, -364.3788146972656, -352.4942932128906, -340.6097717285156, -328.7252502441406, -316.8407287597656, -304.9562072753906, -293.0716552734375, -281.1871337890625, -269.3026123046875, -257.4180908203125, -245.5335693359375, -233.6490478515625, -221.7645263671875, -209.87998962402344, -197.99546813964844, -186.11094665527344, -174.22640991210938, -162.34188842773438, -150.45736694335938, -138.57284545898438, -126.68831634521484, -114.80378723144531, -102.91926574707031, -91.03474426269531, -79.15021514892578, -67.26568603515625, -55.381134033203125, -43.49660873413086, -31.612083435058594, -19.727558135986328, -7.8430328369140625, 4.041492462158203, 15.926017761230469, 27.810546875, 39.695068359375, 51.579593658447266, 63.46411895751953, 75.34864807128906, 87.23316955566406, 99.11769104003906, 111.0022201538086, 122.88674926757812, 134.77127075195312, 146.65579223632812, 158.54031372070312, 170.4248504638672, 182.3093719482422, 194.1938934326172, 206.07843017578125, 217.96295166015625, 229.84747314453125, 241.73199462890625, 253.61651611328125, 265.50103759765625, 277.38555908203125, 289.2701110839844, 301.1546325683594, 313.0391540527344, 324.9236755371094]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 7.0, 13.0, 6.0, 12.0, 14.0, 27.0, 27.0, 21.0, 28.0, 38.0, 34.0, 40.0, 39.0, 45.0, 43.0, 48.0, 57.0, 27.0, 51.0, 57.0, 44.0, 41.0, 45.0, 30.0, 21.0, 31.0, 22.0, 30.0, 22.0, 16.0, 11.0, 10.0, 11.0, 9.0, 8.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.15625, -38.6748046875, -37.193359375, -35.7119140625, -34.23046875, -32.7490234375, -31.267578125, -29.7861328125, -28.3046875, -26.8232421875, -25.341796875, -23.8603515625, -22.37890625, -20.8974609375, -19.416015625, -17.9345703125, -16.453125, -14.9716796875, -13.490234375, -12.0087890625, -10.52734375, -9.0458984375, -7.564453125, -6.0830078125, -4.6015625, -3.1201171875, -1.638671875, -0.1572265625, 1.32421875, 2.8056640625, 4.287109375, 5.7685546875, 7.25, 8.7314453125, 10.212890625, 11.6943359375, 13.17578125, 14.6572265625, 16.138671875, 17.6201171875, 19.1015625, 20.5830078125, 22.064453125, 23.5458984375, 25.02734375, 26.5087890625, 27.990234375, 29.4716796875, 30.953125, 32.4345703125, 33.916015625, 35.3974609375, 36.87890625, 38.3603515625, 39.841796875, 41.3232421875, 42.8046875, 44.2861328125, 45.767578125, 47.2490234375, 48.73046875, 50.2119140625, 51.693359375, 53.1748046875, 54.65625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 7.0, 7.0, 7.0, 17.0, 20.0, 28.0, 33.0, 55.0, 60.0, 84.0, 150.0, 145.0, 287.0, 426.0, 693.0, 1276.0, 2451.0, 4555.0, 9630.0, 29038.0, 718024.0, 3336944.0, 63356.0, 13753.0, 6083.0, 2989.0, 1636.0, 889.0, 516.0, 371.0, 217.0, 158.0, 101.0, 79.0, 54.0, 35.0, 38.0, 22.0, 17.0, 12.0, 11.0, 6.0, 2.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.875, -125.099609375, -120.32421875, -115.548828125, -110.7734375, -105.998046875, -101.22265625, -96.447265625, -91.671875, -86.896484375, -82.12109375, -77.345703125, -72.5703125, -67.794921875, -63.01953125, -58.244140625, -53.46875, -48.693359375, -43.91796875, -39.142578125, -34.3671875, -29.591796875, -24.81640625, -20.041015625, -15.265625, -10.490234375, -5.71484375, -0.939453125, 3.8359375, 8.611328125, 13.38671875, 18.162109375, 22.9375, 27.712890625, 32.48828125, 37.263671875, 42.0390625, 46.814453125, 51.58984375, 56.365234375, 61.140625, 65.916015625, 70.69140625, 75.466796875, 80.2421875, 85.017578125, 89.79296875, 94.568359375, 99.34375, 104.119140625, 108.89453125, 113.669921875, 118.4453125, 123.220703125, 127.99609375, 132.771484375, 137.546875, 142.322265625, 147.09765625, 151.873046875, 156.6484375, 161.423828125, 166.19921875, 170.974609375, 175.75]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 6.0, 8.0, 5.0, 8.0, 14.0, 18.0, 27.0, 22.0, 45.0, 56.0, 99.0, 234.0, 497.0, 1144.0, 979.0, 421.0, 181.0, 89.0, 61.0, 29.0, 31.0, 17.0, 18.0, 10.0, 13.0, 4.0, 6.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-80.8125, -77.69140625, -74.5703125, -71.44921875, -68.328125, -65.20703125, -62.0859375, -58.96484375, -55.84375, -52.72265625, -49.6015625, -46.48046875, -43.359375, -40.23828125, -37.1171875, -33.99609375, -30.875, -27.75390625, -24.6328125, -21.51171875, -18.390625, -15.26953125, -12.1484375, -9.02734375, -5.90625, -2.78515625, 0.3359375, 3.45703125, 6.578125, 9.69921875, 12.8203125, 15.94140625, 19.0625, 22.18359375, 25.3046875, 28.42578125, 31.546875, 34.66796875, 37.7890625, 40.91015625, 44.03125, 47.15234375, 50.2734375, 53.39453125, 56.515625, 59.63671875, 62.7578125, 65.87890625, 69.0, 72.12109375, 75.2421875, 78.36328125, 81.484375, 84.60546875, 87.7265625, 90.84765625, 93.96875, 97.08984375, 100.2109375, 103.33203125, 106.453125, 109.57421875, 112.6953125, 115.81640625, 118.9375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 3.0, 4.0, 7.0, 10.0, 12.0, 26.0, 28.0, 57.0, 110.0, 285.0, 747.0, 2287.0, 9763.0, 78423.0, 3986007.0, 101076.0, 11359.0, 2710.0, 777.0, 307.0, 108.0, 64.0, 36.0, 16.0, 17.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-470.75, -458.2109375, -445.671875, -433.1328125, -420.59375, -408.0546875, -395.515625, -382.9765625, -370.4375, -357.8984375, -345.359375, -332.8203125, -320.28125, -307.7421875, -295.203125, -282.6640625, -270.125, -257.5859375, -245.046875, -232.5078125, -219.96875, -207.4296875, -194.890625, -182.3515625, -169.8125, -157.2734375, -144.734375, -132.1953125, -119.65625, -107.1171875, -94.578125, -82.0390625, -69.5, -56.9609375, -44.421875, -31.8828125, -19.34375, -6.8046875, 5.734375, 18.2734375, 30.8125, 43.3515625, 55.890625, 68.4296875, 80.96875, 93.5078125, 106.046875, 118.5859375, 131.125, 143.6640625, 156.203125, 168.7421875, 181.28125, 193.8203125, 206.359375, 218.8984375, 231.4375, 243.9765625, 256.515625, 269.0546875, 281.59375, 294.1328125, 306.671875, 319.2109375, 331.75]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 10.0, 19.0, 30.0, 51.0, 102.0, 145.0, 213.0, 139.0, 106.0, 60.0, 40.0, 29.0, 21.0, 13.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-726.8011474609375, -710.0838623046875, -693.3665771484375, -676.6492919921875, -659.9320068359375, -643.2147216796875, -626.4974365234375, -609.7801513671875, -593.0628662109375, -576.3455810546875, -559.6282958984375, -542.9110107421875, -526.1937255859375, -509.4764404296875, -492.7591552734375, -476.0418701171875, -459.3245849609375, -442.6072998046875, -425.8900146484375, -409.1727294921875, -392.4554443359375, -375.7381591796875, -359.0208740234375, -342.3035888671875, -325.5863037109375, -308.8690185546875, -292.1517333984375, -275.4344482421875, -258.7171630859375, -241.9998779296875, -225.2825927734375, -208.5653076171875, -191.84796142578125, -175.13067626953125, -158.41339111328125, -141.69610595703125, -124.97882080078125, -108.26153564453125, -91.54425048828125, -74.82696533203125, -58.10968017578125, -41.39239501953125, -24.67510986328125, -7.95782470703125, 8.75946044921875, 25.47674560546875, 42.19403076171875, 58.91131591796875, 75.62860107421875, 92.34588623046875, 109.06317138671875, 125.78045654296875, 142.49774169921875, 159.21502685546875, 175.93231201171875, 192.64959716796875, 209.36688232421875, 226.08416748046875, 242.80145263671875, 259.51873779296875, 276.23602294921875, 292.95330810546875, 309.67059326171875, 326.38787841796875, 343.10516357421875]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 2.0, 10.0, 9.0, 8.0, 11.0, 11.0, 17.0, 20.0, 17.0, 18.0, 15.0, 28.0, 25.0, 30.0, 31.0, 31.0, 38.0, 41.0, 30.0, 35.0, 44.0, 38.0, 49.0, 49.0, 42.0, 38.0, 31.0, 27.0, 34.0, 31.0, 23.0, 27.0, 15.0, 17.0, 19.0, 10.0, 14.0, 16.0, 7.0, 6.0, 9.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-212.0902557373047, -205.22824096679688, -198.36622619628906, -191.50421142578125, -184.64219665527344, -177.78018188476562, -170.91818237304688, -164.05615234375, -157.19415283203125, -150.33213806152344, -143.47012329101562, -136.6081085205078, -129.74609375, -122.88407897949219, -116.0220718383789, -109.1600570678711, -102.29803466796875, -95.43601989746094, -88.57400512695312, -81.71199035644531, -74.8499755859375, -67.98796081542969, -61.125953674316406, -54.263938903808594, -47.40192413330078, -40.53990936279297, -33.677894592285156, -26.81588363647461, -19.953868865966797, -13.091854095458984, -6.2298431396484375, 0.632171630859375, 7.49420166015625, 14.356215476989746, 21.218229293823242, 28.080242156982422, 34.942256927490234, 41.80427169799805, 48.666282653808594, 55.528297424316406, 62.39031219482422, 69.25232696533203, 76.11434173583984, 82.97634887695312, 89.83836364746094, 96.70037841796875, 103.56239318847656, 110.42440795898438, 117.28642272949219, 124.1484375, 131.0104522705078, 137.87246704101562, 144.73448181152344, 151.59649658203125, 158.45849609375, 165.32052612304688, 172.18252563476562, 179.04454040527344, 185.90655517578125, 192.76856994628906, 199.63058471679688, 206.4925994873047, 213.3546142578125, 220.21661376953125, 227.07864379882812]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 6.0, 6.0, 8.0, 14.0, 15.0, 15.0, 22.0, 25.0, 28.0, 36.0, 37.0, 34.0, 44.0, 45.0, 37.0, 46.0, 41.0, 35.0, 55.0, 27.0, 38.0, 37.0, 47.0, 43.0, 34.0, 28.0, 25.0, 20.0, 23.0, 22.0, 17.0, 19.0, 8.0, 11.0, 2.0, 13.0, 8.0, 7.0, 7.0, 2.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.46875, -36.03125, -34.59375, -33.15625, -31.71875, -30.28125, -28.84375, -27.40625, -25.96875, -24.53125, -23.09375, -21.65625, -20.21875, -18.78125, -17.34375, -15.90625, -14.46875, -13.03125, -11.59375, -10.15625, -8.71875, -7.28125, -5.84375, -4.40625, -2.96875, -1.53125, -0.09375, 1.34375, 2.78125, 4.21875, 5.65625, 7.09375, 8.53125, 9.96875, 11.40625, 12.84375, 14.28125, 15.71875, 17.15625, 18.59375, 20.03125, 21.46875, 22.90625, 24.34375, 25.78125, 27.21875, 28.65625, 30.09375, 31.53125, 32.96875, 34.40625, 35.84375, 37.28125, 38.71875, 40.15625, 41.59375, 43.03125, 44.46875, 45.90625, 47.34375, 48.78125, 50.21875, 51.65625, 53.09375, 54.53125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 13.0, 11.0, 22.0, 21.0, 34.0, 41.0, 84.0, 152.0, 193.0, 348.0, 589.0, 1056.0, 1912.0, 3281.0, 5715.0, 10644.0, 19953.0, 38879.0, 78988.0, 184937.0, 417892.0, 146812.0, 65572.0, 32965.0, 17299.0, 9201.0, 5170.0, 2865.0, 1596.0, 923.0, 586.0, 301.0, 173.0, 130.0, 64.0, 42.0, 25.0, 21.0, 16.0, 6.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-2.802734375, -2.727752685546875, -2.65277099609375, -2.577789306640625, -2.5028076171875, -2.427825927734375, -2.35284423828125, -2.277862548828125, -2.202880859375, -2.127899169921875, -2.05291748046875, -1.977935791015625, -1.9029541015625, -1.827972412109375, -1.75299072265625, -1.678009033203125, -1.60302734375, -1.528045654296875, -1.45306396484375, -1.378082275390625, -1.3031005859375, -1.228118896484375, -1.15313720703125, -1.078155517578125, -1.003173828125, -0.928192138671875, -0.85321044921875, -0.778228759765625, -0.7032470703125, -0.628265380859375, -0.55328369140625, -0.478302001953125, -0.4033203125, -0.328338623046875, -0.25335693359375, -0.178375244140625, -0.1033935546875, -0.028411865234375, 0.04656982421875, 0.121551513671875, 0.196533203125, 0.271514892578125, 0.34649658203125, 0.421478271484375, 0.4964599609375, 0.571441650390625, 0.64642333984375, 0.721405029296875, 0.79638671875, 0.871368408203125, 0.94635009765625, 1.021331787109375, 1.0963134765625, 1.171295166015625, 1.24627685546875, 1.321258544921875, 1.396240234375, 1.471221923828125, 1.54620361328125, 1.621185302734375, 1.6961669921875, 1.771148681640625, 1.84613037109375, 1.921112060546875, 1.99609375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 8.0, 5.0, 8.0, 7.0, 22.0, 12.0, 17.0, 20.0, 21.0, 17.0, 19.0, 25.0, 33.0, 31.0, 31.0, 35.0, 49.0, 36.0, 36.0, 39.0, 50.0, 1060.0, 34.0, 39.0, 28.0, 31.0, 33.0, 34.0, 33.0, 35.0, 23.0, 28.0, 20.0, 19.0, 13.0, 15.0, 15.0, 12.0, 3.0, 8.0, 6.0, 4.0, 5.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.546875, -27.6826171875, -26.818359375, -25.9541015625, -25.08984375, -24.2255859375, -23.361328125, -22.4970703125, -21.6328125, -20.7685546875, -19.904296875, -19.0400390625, -18.17578125, -17.3115234375, -16.447265625, -15.5830078125, -14.71875, -13.8544921875, -12.990234375, -12.1259765625, -11.26171875, -10.3974609375, -9.533203125, -8.6689453125, -7.8046875, -6.9404296875, -6.076171875, -5.2119140625, -4.34765625, -3.4833984375, -2.619140625, -1.7548828125, -0.890625, -0.0263671875, 0.837890625, 1.7021484375, 2.56640625, 3.4306640625, 4.294921875, 5.1591796875, 6.0234375, 6.8876953125, 7.751953125, 8.6162109375, 9.48046875, 10.3447265625, 11.208984375, 12.0732421875, 12.9375, 13.8017578125, 14.666015625, 15.5302734375, 16.39453125, 17.2587890625, 18.123046875, 18.9873046875, 19.8515625, 20.7158203125, 21.580078125, 22.4443359375, 23.30859375, 24.1728515625, 25.037109375, 25.9013671875, 26.765625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 8.0, 9.0, 18.0, 17.0, 23.0, 43.0, 68.0, 88.0, 121.0, 153.0, 256.0, 417.0, 551.0, 833.0, 1237.0, 1782.0, 2636.0, 3860.0, 5647.0, 8581.0, 12599.0, 19202.0, 29719.0, 46214.0, 73357.0, 127017.0, 1353649.0, 164343.0, 88542.0, 54187.0, 34319.0, 22307.0, 14755.0, 10023.0, 6723.0, 4504.0, 3001.0, 1991.0, 1361.0, 951.0, 607.0, 414.0, 334.0, 218.0, 141.0, 94.0, 77.0, 52.0, 24.0, 24.0, 18.0, 8.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.1455078125, -1.109344482421875, -1.07318115234375, -1.037017822265625, -1.0008544921875, -0.964691162109375, -0.92852783203125, -0.892364501953125, -0.856201171875, -0.820037841796875, -0.78387451171875, -0.747711181640625, -0.7115478515625, -0.675384521484375, -0.63922119140625, -0.603057861328125, -0.56689453125, -0.530731201171875, -0.49456787109375, -0.458404541015625, -0.4222412109375, -0.386077880859375, -0.34991455078125, -0.313751220703125, -0.277587890625, -0.241424560546875, -0.20526123046875, -0.169097900390625, -0.1329345703125, -0.096771240234375, -0.06060791015625, -0.024444580078125, 0.01171875, 0.047882080078125, 0.08404541015625, 0.120208740234375, 0.1563720703125, 0.192535400390625, 0.22869873046875, 0.264862060546875, 0.301025390625, 0.337188720703125, 0.37335205078125, 0.409515380859375, 0.4456787109375, 0.481842041015625, 0.51800537109375, 0.554168701171875, 0.59033203125, 0.626495361328125, 0.66265869140625, 0.698822021484375, 0.7349853515625, 0.771148681640625, 0.80731201171875, 0.843475341796875, 0.879638671875, 0.915802001953125, 0.95196533203125, 0.988128662109375, 1.0242919921875, 1.060455322265625, 1.09661865234375, 1.132781982421875, 1.1689453125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 11.0, 5.0, 4.0, 5.0, 4.0, 7.0, 6.0, 11.0, 12.0, 18.0, 20.0, 14.0, 23.0, 47.0, 77.0, 141.0, 199.0, 132.0, 63.0, 44.0, 21.0, 28.0, 20.0, 13.0, 10.0, 10.0, 10.0, 7.0, 5.0, 3.0, 4.0, 8.0, 2.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.337331771850586e-05, -7.103756070137024e-05, -6.870180368423462e-05, -6.6366046667099e-05, -6.403028964996338e-05, -6.169453263282776e-05, -5.935877561569214e-05, -5.702301859855652e-05, -5.46872615814209e-05, -5.235150456428528e-05, -5.001574754714966e-05, -4.767999053001404e-05, -4.534423351287842e-05, -4.30084764957428e-05, -4.067271947860718e-05, -3.833696246147156e-05, -3.600120544433594e-05, -3.366544842720032e-05, -3.13296914100647e-05, -2.8993934392929077e-05, -2.6658177375793457e-05, -2.4322420358657837e-05, -2.1986663341522217e-05, -1.9650906324386597e-05, -1.7315149307250977e-05, -1.4979392290115356e-05, -1.2643635272979736e-05, -1.0307878255844116e-05, -7.972121238708496e-06, -5.636364221572876e-06, -3.300607204437256e-06, -9.648501873016357e-07, 1.3709068298339844e-06, 3.7066638469696045e-06, 6.042420864105225e-06, 8.378177881240845e-06, 1.0713934898376465e-05, 1.3049691915512085e-05, 1.5385448932647705e-05, 1.7721205949783325e-05, 2.0056962966918945e-05, 2.2392719984054565e-05, 2.4728477001190186e-05, 2.7064234018325806e-05, 2.9399991035461426e-05, 3.1735748052597046e-05, 3.4071505069732666e-05, 3.6407262086868286e-05, 3.8743019104003906e-05, 4.1078776121139526e-05, 4.3414533138275146e-05, 4.5750290155410767e-05, 4.808604717254639e-05, 5.042180418968201e-05, 5.275756120681763e-05, 5.509331822395325e-05, 5.742907524108887e-05, 5.976483225822449e-05, 6.210058927536011e-05, 6.443634629249573e-05, 6.677210330963135e-05, 6.910786032676697e-05, 7.144361734390259e-05, 7.377937436103821e-05, 7.611513137817383e-05]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 9.0, 3.0, 6.0, 8.0, 8.0, 5.0, 22.0, 23.0, 26.0, 40.0, 74.0, 71.0, 219.0, 1326.0, 17663.0, 976298.0, 49673.0, 2390.0, 336.0, 97.0, 68.0, 41.0, 25.0, 26.0, 18.0, 7.0, 13.0, 7.0, 8.0, 6.0, 8.0, 9.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013227462768554688, -0.0012822151184082031, -0.0012416839599609375, -0.0012011528015136719, -0.0011606216430664062, -0.0011200904846191406, -0.001079559326171875, -0.0010390281677246094, -0.0009984970092773438, -0.0009579658508300781, -0.0009174346923828125, -0.0008769035339355469, -0.0008363723754882812, -0.0007958412170410156, -0.00075531005859375, -0.0007147789001464844, -0.0006742477416992188, -0.0006337165832519531, -0.0005931854248046875, -0.0005526542663574219, -0.0005121231079101562, -0.0004715919494628906, -0.000431060791015625, -0.0003905296325683594, -0.00034999847412109375, -0.0003094673156738281, -0.0002689361572265625, -0.00022840499877929688, -0.00018787384033203125, -0.00014734268188476562, -0.0001068115234375, -6.628036499023438e-05, -2.574920654296875e-05, 1.4781951904296875e-05, 5.53131103515625e-05, 9.584426879882812e-05, 0.00013637542724609375, 0.00017690658569335938, 0.000217437744140625, 0.0002579689025878906, 0.00029850006103515625, 0.0003390312194824219, 0.0003795623779296875, 0.0004200935363769531, 0.00046062469482421875, 0.0005011558532714844, 0.00054168701171875, 0.0005822181701660156, 0.0006227493286132812, 0.0006632804870605469, 0.0007038116455078125, 0.0007443428039550781, 0.0007848739624023438, 0.0008254051208496094, 0.000865936279296875, 0.0009064674377441406, 0.0009469985961914062, 0.0009875297546386719, 0.0010280609130859375, 0.0010685920715332031, 0.0011091232299804688, 0.0011496543884277344, 0.001190185546875, 0.0012307167053222656, 0.0012712478637695312]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 16.0, 73.0, 419.0, 416.0, 73.0, 13.0, 5.0, 1.0, 1.0], "bins": [-0.0004778263682965189, -0.0004695859388448298, -0.0004613454802893102, -0.0004531050508376211, -0.0004448645922821015, -0.0004366241628304124, -0.0004283837042748928, -0.0004201432748232037, -0.0004119028162676841, -0.000403662386815995, -0.0003954219282604754, -0.0003871814988087863, -0.0003789410402532667, -0.00037070061080157757, -0.000362460152246058, -0.00035421972279436886, -0.00034597929334267974, -0.0003377388638909906, -0.00032949840533547103, -0.0003212579758837819, -0.00031301751732826233, -0.0003047770878765732, -0.0002965366293210536, -0.0002882961998693645, -0.0002800557413138449, -0.0002718153118621558, -0.0002635748533066362, -0.0002553344238549471, -0.0002470939652994275, -0.00023885352129582316, -0.0002306130772922188, -0.00022237264784052968, -0.0002141321892850101, -0.00020589174528140575, -0.0001976513012778014, -0.00018941085727419704, -0.0001811704132705927, -0.00017292996926698834, -0.00016468952526338398, -0.00015644909581169486, -0.0001482086518080905, -0.00013996820780448616, -0.0001317277638008818, -0.00012348731979727745, -0.0001152468757936731, -0.00010700643179006875, -9.876599506242201e-05, -9.052555105881765e-05, -8.22851070552133e-05, -7.404466305160895e-05, -6.58042190480046e-05, -5.756377868237905e-05, -4.93233346787747e-05, -4.108289067517035e-05, -3.28424503095448e-05, -2.460200630594045e-05, -1.6361562302336097e-05, -8.121119208226446e-06, 1.1932388588320464e-07, 8.359766070498154e-06, 1.6600210074102506e-05, 2.484065407770686e-05, 3.3081094443332404e-05, 4.1321538446936756e-05, 4.956198245054111e-05]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 10.0, 12.0, 11.0, 12.0, 20.0, 19.0, 15.0, 28.0, 24.0, 24.0, 33.0, 36.0, 30.0, 31.0, 27.0, 33.0, 30.0, 47.0, 45.0, 31.0, 50.0, 43.0, 52.0, 31.0, 27.0, 25.0, 30.0, 20.0, 24.0, 22.0, 29.0, 16.0, 20.0, 16.0, 12.0, 13.0, 7.0, 8.0, 9.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0], "bins": [-3.1948089599609375e-05, -3.098789602518082e-05, -3.0027702450752258e-05, -2.90675088763237e-05, -2.810731530189514e-05, -2.7147121727466583e-05, -2.6186928153038025e-05, -2.5226734578609467e-05, -2.4266541004180908e-05, -2.330634742975235e-05, -2.234615385532379e-05, -2.1385960280895233e-05, -2.0425766706466675e-05, -1.9465573132038116e-05, -1.8505379557609558e-05, -1.7545185983181e-05, -1.658499240875244e-05, -1.5624798834323883e-05, -1.4664605259895325e-05, -1.3704411685466766e-05, -1.2744218111038208e-05, -1.178402453660965e-05, -1.0823830962181091e-05, -9.863637387752533e-06, -8.903443813323975e-06, -7.943250238895416e-06, -6.983056664466858e-06, -6.0228630900382996e-06, -5.062669515609741e-06, -4.102475941181183e-06, -3.1422823667526245e-06, -2.182088792324066e-06, -1.2218952178955078e-06, -2.6170164346694946e-07, 6.984919309616089e-07, 1.6586855053901672e-06, 2.6188790798187256e-06, 3.579072654247284e-06, 4.539266228675842e-06, 5.499459803104401e-06, 6.459653377532959e-06, 7.419846951961517e-06, 8.380040526390076e-06, 9.340234100818634e-06, 1.0300427675247192e-05, 1.126062124967575e-05, 1.2220814824104309e-05, 1.3181008398532867e-05, 1.4141201972961426e-05, 1.5101395547389984e-05, 1.6061589121818542e-05, 1.70217826962471e-05, 1.798197627067566e-05, 1.8942169845104218e-05, 1.9902363419532776e-05, 2.0862556993961334e-05, 2.1822750568389893e-05, 2.278294414281845e-05, 2.374313771724701e-05, 2.4703331291675568e-05, 2.5663524866104126e-05, 2.6623718440532684e-05, 2.7583912014961243e-05, 2.85441055893898e-05, 2.950429916381836e-05]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 6.0, 6.0, 8.0, 14.0, 15.0, 15.0, 22.0, 25.0, 28.0, 36.0, 37.0, 34.0, 44.0, 45.0, 37.0, 46.0, 41.0, 35.0, 55.0, 27.0, 38.0, 37.0, 47.0, 43.0, 34.0, 28.0, 25.0, 20.0, 23.0, 22.0, 17.0, 19.0, 8.0, 11.0, 2.0, 13.0, 8.0, 7.0, 7.0, 2.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.46875, -36.03125, -34.59375, -33.15625, -31.71875, -30.28125, -28.84375, -27.40625, -25.96875, -24.53125, -23.09375, -21.65625, -20.21875, -18.78125, -17.34375, -15.90625, -14.46875, -13.03125, -11.59375, -10.15625, -8.71875, -7.28125, -5.84375, -4.40625, -2.96875, -1.53125, -0.09375, 1.34375, 2.78125, 4.21875, 5.65625, 7.09375, 8.53125, 9.96875, 11.40625, 12.84375, 14.28125, 15.71875, 17.15625, 18.59375, 20.03125, 21.46875, 22.90625, 24.34375, 25.78125, 27.21875, 28.65625, 30.09375, 31.53125, 32.96875, 34.40625, 35.84375, 37.28125, 38.71875, 40.15625, 41.59375, 43.03125, 44.46875, 45.90625, 47.34375, 48.78125, 50.21875, 51.65625, 53.09375, 54.53125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 8.0, 5.0, 15.0, 19.0, 27.0, 53.0, 51.0, 78.0, 100.0, 139.0, 214.0, 273.0, 387.0, 519.0, 790.0, 1098.0, 1630.0, 2539.0, 4106.0, 7662.0, 18490.0, 98478.0, 764987.0, 107666.0, 19190.0, 7767.0, 4360.0, 2451.0, 1613.0, 1140.0, 758.0, 519.0, 390.0, 291.0, 209.0, 169.0, 109.0, 68.0, 49.0, 41.0, 31.0, 26.0, 7.0, 10.0, 7.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.25, -62.9619140625, -60.673828125, -58.3857421875, -56.09765625, -53.8095703125, -51.521484375, -49.2333984375, -46.9453125, -44.6572265625, -42.369140625, -40.0810546875, -37.79296875, -35.5048828125, -33.216796875, -30.9287109375, -28.640625, -26.3525390625, -24.064453125, -21.7763671875, -19.48828125, -17.2001953125, -14.912109375, -12.6240234375, -10.3359375, -8.0478515625, -5.759765625, -3.4716796875, -1.18359375, 1.1044921875, 3.392578125, 5.6806640625, 7.96875, 10.2568359375, 12.544921875, 14.8330078125, 17.12109375, 19.4091796875, 21.697265625, 23.9853515625, 26.2734375, 28.5615234375, 30.849609375, 33.1376953125, 35.42578125, 37.7138671875, 40.001953125, 42.2900390625, 44.578125, 46.8662109375, 49.154296875, 51.4423828125, 53.73046875, 56.0185546875, 58.306640625, 60.5947265625, 62.8828125, 65.1708984375, 67.458984375, 69.7470703125, 72.03515625, 74.3232421875, 76.611328125, 78.8994140625, 81.1875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 5.0, 1.0, 12.0, 6.0, 11.0, 9.0, 11.0, 19.0, 26.0, 32.0, 18.0, 34.0, 32.0, 41.0, 36.0, 48.0, 47.0, 73.0, 99.0, 232.0, 1678.0, 126.0, 76.0, 58.0, 43.0, 48.0, 26.0, 30.0, 30.0, 26.0, 21.0, 22.0, 10.0, 11.0, 13.0, 14.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-158.75, -153.9609375, -149.171875, -144.3828125, -139.59375, -134.8046875, -130.015625, -125.2265625, -120.4375, -115.6484375, -110.859375, -106.0703125, -101.28125, -96.4921875, -91.703125, -86.9140625, -82.125, -77.3359375, -72.546875, -67.7578125, -62.96875, -58.1796875, -53.390625, -48.6015625, -43.8125, -39.0234375, -34.234375, -29.4453125, -24.65625, -19.8671875, -15.078125, -10.2890625, -5.5, -0.7109375, 4.078125, 8.8671875, 13.65625, 18.4453125, 23.234375, 28.0234375, 32.8125, 37.6015625, 42.390625, 47.1796875, 51.96875, 56.7578125, 61.546875, 66.3359375, 71.125, 75.9140625, 80.703125, 85.4921875, 90.28125, 95.0703125, 99.859375, 104.6484375, 109.4375, 114.2265625, 119.015625, 123.8046875, 128.59375, 133.3828125, 138.171875, 142.9609375, 147.75]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 5.0, 6.0, 13.0, 14.0, 12.0, 19.0, 26.0, 31.0, 37.0, 41.0, 68.0, 99.0, 219.0, 456.0, 1172.0, 4545.0, 66551.0, 3040014.0, 27402.0, 2966.0, 986.0, 420.0, 187.0, 93.0, 64.0, 58.0, 35.0, 28.0, 25.0, 22.0, 17.0, 13.0, 9.0, 8.0, 8.0, 8.0, 4.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-386.25, -373.53515625, -360.8203125, -348.10546875, -335.390625, -322.67578125, -309.9609375, -297.24609375, -284.53125, -271.81640625, -259.1015625, -246.38671875, -233.671875, -220.95703125, -208.2421875, -195.52734375, -182.8125, -170.09765625, -157.3828125, -144.66796875, -131.953125, -119.23828125, -106.5234375, -93.80859375, -81.09375, -68.37890625, -55.6640625, -42.94921875, -30.234375, -17.51953125, -4.8046875, 7.91015625, 20.625, 33.33984375, 46.0546875, 58.76953125, 71.484375, 84.19921875, 96.9140625, 109.62890625, 122.34375, 135.05859375, 147.7734375, 160.48828125, 173.203125, 185.91796875, 198.6328125, 211.34765625, 224.0625, 236.77734375, 249.4921875, 262.20703125, 274.921875, 287.63671875, 300.3515625, 313.06640625, 325.78125, 338.49609375, 351.2109375, 363.92578125, 376.640625, 389.35546875, 402.0703125, 414.78515625, 427.5]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 11.0, 27.0, 146.0, 527.0, 236.0, 47.0, 16.0, 5.0], "bins": [-1364.74169921875, -1341.8203125, -1318.89892578125, -1295.9775390625, -1273.05615234375, -1250.134765625, -1227.21337890625, -1204.2919921875, -1181.37060546875, -1158.44921875, -1135.52783203125, -1112.6064453125, -1089.68505859375, -1066.763671875, -1043.84228515625, -1020.9208374023438, -997.9993896484375, -975.0780029296875, -952.1566162109375, -929.2352294921875, -906.3138427734375, -883.3923950195312, -860.4710083007812, -837.5496215820312, -814.6282348632812, -791.7068481445312, -768.7854614257812, -745.8640747070312, -722.942626953125, -700.021240234375, -677.099853515625, -654.178466796875, -631.257080078125, -608.335693359375, -585.414306640625, -562.492919921875, -539.571533203125, -516.6500854492188, -493.72869873046875, -470.80731201171875, -447.88592529296875, -424.96453857421875, -402.04315185546875, -379.1217346191406, -356.2003479003906, -333.2789611816406, -310.3575439453125, -287.4361572265625, -264.5147705078125, -241.5933837890625, -218.67198181152344, -195.75057983398438, -172.82919311523438, -149.90780639648438, -126.98640441894531, -104.06500244140625, -81.14360809326172, -58.22221374511719, -35.300819396972656, -12.379425048828125, 10.541969299316406, 33.46336364746094, 56.38475799560547, 79.30615997314453, 102.22754669189453]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 5.0, 7.0, 10.0, 5.0, 12.0, 8.0, 11.0, 12.0, 24.0, 15.0, 16.0, 22.0, 20.0, 26.0, 39.0, 25.0, 36.0, 42.0, 33.0, 44.0, 29.0, 36.0, 36.0, 29.0, 42.0, 37.0, 30.0, 35.0, 27.0, 27.0, 31.0, 29.0, 20.0, 21.0, 25.0, 22.0, 19.0, 14.0, 11.0, 8.0, 6.0, 11.0, 9.0, 8.0, 4.0, 2.0, 5.0, 2.0, 2.0, 4.0, 4.0, 0.0, 3.0, 1.0], "bins": [-371.7740173339844, -360.10107421875, -348.4281311035156, -336.75518798828125, -325.0822448730469, -313.4093017578125, -301.73638916015625, -290.06341552734375, -278.3905029296875, -266.7175598144531, -255.04461669921875, -243.37167358398438, -231.69873046875, -220.02578735351562, -208.3528594970703, -196.67991638183594, -185.0069580078125, -173.33401489257812, -161.66107177734375, -149.98812866210938, -138.315185546875, -126.64225006103516, -114.96931457519531, -103.29637145996094, -91.62342834472656, -79.95048522949219, -68.27754211425781, -56.60460662841797, -44.931663513183594, -33.25872039794922, -21.585784912109375, -9.912841796875, 1.7601318359375, 13.433073043823242, 25.106014251708984, 36.778953552246094, 48.45189666748047, 60.124839782714844, 71.79777526855469, 83.47071838378906, 95.14366149902344, 106.81660461425781, 118.48954772949219, 130.1624755859375, 141.83541870117188, 153.50836181640625, 165.18130493164062, 176.854248046875, 188.52719116210938, 200.20013427734375, 211.87307739257812, 223.5460205078125, 235.21896362304688, 246.89190673828125, 258.5648193359375, 270.23779296875, 281.91070556640625, 293.5836486816406, 305.256591796875, 316.9295349121094, 328.60247802734375, 340.2754211425781, 351.9483642578125, 363.62127685546875, 375.29425048828125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 3.0, 7.0, 8.0, 5.0, 6.0, 12.0, 17.0, 16.0, 16.0, 20.0, 33.0, 28.0, 29.0, 35.0, 33.0, 42.0, 37.0, 44.0, 43.0, 54.0, 36.0, 41.0, 50.0, 46.0, 36.0, 30.0, 31.0, 37.0, 32.0, 27.0, 30.0, 15.0, 17.0, 13.0, 14.0, 12.0, 10.0, 11.0, 6.0, 10.0, 3.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.90625, -40.33935546875, -38.7724609375, -37.20556640625, -35.638671875, -34.07177734375, -32.5048828125, -30.93798828125, -29.37109375, -27.80419921875, -26.2373046875, -24.67041015625, -23.103515625, -21.53662109375, -19.9697265625, -18.40283203125, -16.8359375, -15.26904296875, -13.7021484375, -12.13525390625, -10.568359375, -9.00146484375, -7.4345703125, -5.86767578125, -4.30078125, -2.73388671875, -1.1669921875, 0.39990234375, 1.966796875, 3.53369140625, 5.1005859375, 6.66748046875, 8.234375, 9.80126953125, 11.3681640625, 12.93505859375, 14.501953125, 16.06884765625, 17.6357421875, 19.20263671875, 20.76953125, 22.33642578125, 23.9033203125, 25.47021484375, 27.037109375, 28.60400390625, 30.1708984375, 31.73779296875, 33.3046875, 34.87158203125, 36.4384765625, 38.00537109375, 39.572265625, 41.13916015625, 42.7060546875, 44.27294921875, 45.83984375, 47.40673828125, 48.9736328125, 50.54052734375, 52.107421875, 53.67431640625, 55.2412109375, 56.80810546875, 58.375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 8.0, 9.0, 14.0, 32.0, 28.0, 36.0, 56.0, 105.0, 110.0, 175.0, 214.0, 317.0, 445.0, 576.0, 888.0, 1310.0, 1850.0, 2919.0, 4660.0, 8186.0, 16518.0, 71574.0, 818059.0, 2936858.0, 270086.0, 29059.0, 11881.0, 6311.0, 3918.0, 2444.0, 1681.0, 1107.0, 793.0, 588.0, 381.0, 278.0, 232.0, 150.0, 116.0, 83.0, 59.0, 50.0, 39.0, 23.0, 18.0, 13.0, 8.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-92.5625, -89.40234375, -86.2421875, -83.08203125, -79.921875, -76.76171875, -73.6015625, -70.44140625, -67.28125, -64.12109375, -60.9609375, -57.80078125, -54.640625, -51.48046875, -48.3203125, -45.16015625, -42.0, -38.83984375, -35.6796875, -32.51953125, -29.359375, -26.19921875, -23.0390625, -19.87890625, -16.71875, -13.55859375, -10.3984375, -7.23828125, -4.078125, -0.91796875, 2.2421875, 5.40234375, 8.5625, 11.72265625, 14.8828125, 18.04296875, 21.203125, 24.36328125, 27.5234375, 30.68359375, 33.84375, 37.00390625, 40.1640625, 43.32421875, 46.484375, 49.64453125, 52.8046875, 55.96484375, 59.125, 62.28515625, 65.4453125, 68.60546875, 71.765625, 74.92578125, 78.0859375, 81.24609375, 84.40625, 87.56640625, 90.7265625, 93.88671875, 97.046875, 100.20703125, 103.3671875, 106.52734375, 109.6875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 11.0, 11.0, 13.0, 19.0, 20.0, 25.0, 35.0, 44.0, 60.0, 93.0, 192.0, 425.0, 854.0, 1128.0, 579.0, 236.0, 110.0, 62.0, 34.0, 37.0, 20.0, 9.0, 13.0, 7.0, 6.0, 3.0, 9.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.6875, -100.138671875, -96.58984375, -93.041015625, -89.4921875, -85.943359375, -82.39453125, -78.845703125, -75.296875, -71.748046875, -68.19921875, -64.650390625, -61.1015625, -57.552734375, -54.00390625, -50.455078125, -46.90625, -43.357421875, -39.80859375, -36.259765625, -32.7109375, -29.162109375, -25.61328125, -22.064453125, -18.515625, -14.966796875, -11.41796875, -7.869140625, -4.3203125, -0.771484375, 2.77734375, 6.326171875, 9.875, 13.423828125, 16.97265625, 20.521484375, 24.0703125, 27.619140625, 31.16796875, 34.716796875, 38.265625, 41.814453125, 45.36328125, 48.912109375, 52.4609375, 56.009765625, 59.55859375, 63.107421875, 66.65625, 70.205078125, 73.75390625, 77.302734375, 80.8515625, 84.400390625, 87.94921875, 91.498046875, 95.046875, 98.595703125, 102.14453125, 105.693359375, 109.2421875, 112.791015625, 116.33984375, 119.888671875, 123.4375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 9.0, 18.0, 15.0, 40.0, 59.0, 92.0, 181.0, 354.0, 737.0, 1859.0, 5568.0, 21110.0, 149051.0, 3867147.0, 120922.0, 18771.0, 5060.0, 1743.0, 708.0, 327.0, 204.0, 110.0, 49.0, 38.0, 28.0, 18.0, 16.0, 11.0, 13.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-329.0, -319.72265625, -310.4453125, -301.16796875, -291.890625, -282.61328125, -273.3359375, -264.05859375, -254.78125, -245.50390625, -236.2265625, -226.94921875, -217.671875, -208.39453125, -199.1171875, -189.83984375, -180.5625, -171.28515625, -162.0078125, -152.73046875, -143.453125, -134.17578125, -124.8984375, -115.62109375, -106.34375, -97.06640625, -87.7890625, -78.51171875, -69.234375, -59.95703125, -50.6796875, -41.40234375, -32.125, -22.84765625, -13.5703125, -4.29296875, 4.984375, 14.26171875, 23.5390625, 32.81640625, 42.09375, 51.37109375, 60.6484375, 69.92578125, 79.203125, 88.48046875, 97.7578125, 107.03515625, 116.3125, 125.58984375, 134.8671875, 144.14453125, 153.421875, 162.69921875, 171.9765625, 181.25390625, 190.53125, 199.80859375, 209.0859375, 218.36328125, 227.640625, 236.91796875, 246.1953125, 255.47265625, 264.75]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 28.0, 263.0, 639.0, 75.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3861.946044921875, -3776.6220703125, -3691.298095703125, -3605.973876953125, -3520.64990234375, -3435.325927734375, -3350.001953125, -3264.677978515625, -3179.35400390625, -3094.030029296875, -3008.7060546875, -2923.3818359375, -2838.057861328125, -2752.73388671875, -2667.409912109375, -2582.0859375, -2496.76171875, -2411.437744140625, -2326.11376953125, -2240.78955078125, -2155.465576171875, -2070.1416015625, -1984.817626953125, -1899.49365234375, -1814.1695556640625, -1728.8455810546875, -1643.521484375, -1558.197509765625, -1472.87353515625, -1387.5494384765625, -1302.2254638671875, -1216.9013671875, -1131.5771484375, -1046.253173828125, -960.9290771484375, -875.6051025390625, -790.2810668945312, -704.95703125, -619.633056640625, -534.3090209960938, -448.9849853515625, -363.66094970703125, -278.3369445800781, -193.01292419433594, -107.68890380859375, -22.3648681640625, 62.959136962890625, 148.28314208984375, 233.607177734375, 318.93121337890625, 404.2552185058594, 489.5792236328125, 574.9032592773438, 660.227294921875, 745.55126953125, 830.8753051757812, 916.1993408203125, 1001.5233764648438, 1086.847412109375, 1172.17138671875, 1257.495361328125, 1342.8194580078125, 1428.1434326171875, 1513.467529296875, 1598.79150390625]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 5.0, 13.0, 18.0, 19.0, 21.0, 31.0, 34.0, 28.0, 35.0, 42.0, 53.0, 41.0, 48.0, 54.0, 44.0, 66.0, 52.0, 45.0, 38.0, 43.0, 51.0, 37.0, 40.0, 30.0, 26.0, 22.0, 16.0, 9.0, 7.0, 14.0, 5.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-280.37890625, -270.19659423828125, -260.0142517089844, -249.83192443847656, -239.64959716796875, -229.46728515625, -219.2849578857422, -209.10263061523438, -198.92030334472656, -188.73797607421875, -178.55564880371094, -168.37332153320312, -158.19100952148438, -148.0086669921875, -137.82635498046875, -127.64402770996094, -117.46170043945312, -107.27937316894531, -97.0970458984375, -86.91472625732422, -76.7323989868164, -66.5500717163086, -56.36774826049805, -46.1854248046875, -36.00309753417969, -25.820772171020508, -15.638446807861328, -5.456121444702148, 4.726203918457031, 14.908531188964844, 25.09085464477539, 35.27317810058594, 45.455535888671875, 55.63786315917969, 65.8201904296875, 76.00251007080078, 86.1848373413086, 96.3671646118164, 106.54948425292969, 116.7318115234375, 126.91413879394531, 137.09646606445312, 147.27879333496094, 157.46112060546875, 167.6434326171875, 177.82577514648438, 188.00808715820312, 198.19041442871094, 208.37274169921875, 218.55506896972656, 228.73739624023438, 238.9197235107422, 249.10205078125, 259.28436279296875, 269.4667053222656, 279.6490173339844, 289.83135986328125, 300.013671875, 310.1960144042969, 320.3783264160156, 330.5606689453125, 340.74298095703125, 350.9253234863281, 361.1076354980469, 371.2899475097656]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 5.0, 14.0, 15.0, 12.0, 10.0, 16.0, 20.0, 22.0, 22.0, 26.0, 24.0, 37.0, 28.0, 36.0, 43.0, 44.0, 38.0, 48.0, 40.0, 35.0, 30.0, 33.0, 42.0, 45.0, 45.0, 35.0, 17.0, 36.0, 21.0, 20.0, 19.0, 14.0, 16.0, 11.0, 11.0, 9.0, 10.0, 8.0, 10.0, 4.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-39.96875, -38.54443359375, -37.1201171875, -35.69580078125, -34.271484375, -32.84716796875, -31.4228515625, -29.99853515625, -28.57421875, -27.14990234375, -25.7255859375, -24.30126953125, -22.876953125, -21.45263671875, -20.0283203125, -18.60400390625, -17.1796875, -15.75537109375, -14.3310546875, -12.90673828125, -11.482421875, -10.05810546875, -8.6337890625, -7.20947265625, -5.78515625, -4.36083984375, -2.9365234375, -1.51220703125, -0.087890625, 1.33642578125, 2.7607421875, 4.18505859375, 5.609375, 7.03369140625, 8.4580078125, 9.88232421875, 11.306640625, 12.73095703125, 14.1552734375, 15.57958984375, 17.00390625, 18.42822265625, 19.8525390625, 21.27685546875, 22.701171875, 24.12548828125, 25.5498046875, 26.97412109375, 28.3984375, 29.82275390625, 31.2470703125, 32.67138671875, 34.095703125, 35.52001953125, 36.9443359375, 38.36865234375, 39.79296875, 41.21728515625, 42.6416015625, 44.06591796875, 45.490234375, 46.91455078125, 48.3388671875, 49.76318359375, 51.1875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 8.0, 12.0, 19.0, 21.0, 36.0, 56.0, 69.0, 102.0, 175.0, 226.0, 324.0, 475.0, 660.0, 967.0, 1432.0, 2052.0, 3039.0, 4422.0, 6514.0, 9768.0, 14783.0, 22506.0, 35497.0, 58800.0, 104776.0, 230998.0, 268616.0, 111786.0, 62457.0, 37240.0, 23542.0, 15413.0, 10190.0, 6788.0, 4649.0, 3179.0, 2118.0, 1476.0, 1031.0, 692.0, 510.0, 311.0, 248.0, 176.0, 107.0, 79.0, 76.0, 36.0, 25.0, 24.0, 21.0, 12.0, 5.0, 5.0, 11.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.482421875, -1.4295806884765625, -1.376739501953125, -1.3238983154296875, -1.27105712890625, -1.2182159423828125, -1.165374755859375, -1.1125335693359375, -1.0596923828125, -1.0068511962890625, -0.954010009765625, -0.9011688232421875, -0.84832763671875, -0.7954864501953125, -0.742645263671875, -0.6898040771484375, -0.636962890625, -0.5841217041015625, -0.531280517578125, -0.4784393310546875, -0.42559814453125, -0.3727569580078125, -0.319915771484375, -0.2670745849609375, -0.2142333984375, -0.1613922119140625, -0.108551025390625, -0.0557098388671875, -0.00286865234375, 0.0499725341796875, 0.102813720703125, 0.1556549072265625, 0.20849609375, 0.2613372802734375, 0.314178466796875, 0.3670196533203125, 0.41986083984375, 0.4727020263671875, 0.525543212890625, 0.5783843994140625, 0.6312255859375, 0.6840667724609375, 0.736907958984375, 0.7897491455078125, 0.84259033203125, 0.8954315185546875, 0.948272705078125, 1.0011138916015625, 1.053955078125, 1.1067962646484375, 1.159637451171875, 1.2124786376953125, 1.26531982421875, 1.3181610107421875, 1.371002197265625, 1.4238433837890625, 1.4766845703125, 1.5295257568359375, 1.582366943359375, 1.6352081298828125, 1.68804931640625, 1.7408905029296875, 1.793731689453125, 1.8465728759765625, 1.8994140625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 14.0, 10.0, 14.0, 17.0, 22.0, 13.0, 26.0, 27.0, 29.0, 41.0, 35.0, 42.0, 49.0, 45.0, 45.0, 36.0, 1062.0, 48.0, 46.0, 43.0, 32.0, 38.0, 36.0, 31.0, 25.0, 28.0, 23.0, 22.0, 28.0, 20.0, 13.0, 13.0, 12.0, 7.0, 9.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.15625, -32.10888671875, -31.0615234375, -30.01416015625, -28.966796875, -27.91943359375, -26.8720703125, -25.82470703125, -24.77734375, -23.72998046875, -22.6826171875, -21.63525390625, -20.587890625, -19.54052734375, -18.4931640625, -17.44580078125, -16.3984375, -15.35107421875, -14.3037109375, -13.25634765625, -12.208984375, -11.16162109375, -10.1142578125, -9.06689453125, -8.01953125, -6.97216796875, -5.9248046875, -4.87744140625, -3.830078125, -2.78271484375, -1.7353515625, -0.68798828125, 0.359375, 1.40673828125, 2.4541015625, 3.50146484375, 4.548828125, 5.59619140625, 6.6435546875, 7.69091796875, 8.73828125, 9.78564453125, 10.8330078125, 11.88037109375, 12.927734375, 13.97509765625, 15.0224609375, 16.06982421875, 17.1171875, 18.16455078125, 19.2119140625, 20.25927734375, 21.306640625, 22.35400390625, 23.4013671875, 24.44873046875, 25.49609375, 26.54345703125, 27.5908203125, 28.63818359375, 29.685546875, 30.73291015625, 31.7802734375, 32.82763671875, 33.875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 10.0, 11.0, 14.0, 34.0, 38.0, 59.0, 94.0, 138.0, 203.0, 302.0, 406.0, 627.0, 1002.0, 1466.0, 2340.0, 3555.0, 5451.0, 8455.0, 13199.0, 20497.0, 32032.0, 52411.0, 88782.0, 173436.0, 1367159.0, 131839.0, 73256.0, 43890.0, 27241.0, 17162.0, 11194.0, 7203.0, 4735.0, 3030.0, 2011.0, 1271.0, 884.0, 549.0, 393.0, 230.0, 178.0, 106.0, 73.0, 53.0, 39.0, 22.0, 13.0, 8.0, 11.0, 5.0, 7.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-1.38671875, -1.34381103515625, -1.3009033203125, -1.25799560546875, -1.215087890625, -1.17218017578125, -1.1292724609375, -1.08636474609375, -1.04345703125, -1.00054931640625, -0.9576416015625, -0.91473388671875, -0.871826171875, -0.82891845703125, -0.7860107421875, -0.74310302734375, -0.7001953125, -0.65728759765625, -0.6143798828125, -0.57147216796875, -0.528564453125, -0.48565673828125, -0.4427490234375, -0.39984130859375, -0.35693359375, -0.31402587890625, -0.2711181640625, -0.22821044921875, -0.185302734375, -0.14239501953125, -0.0994873046875, -0.05657958984375, -0.013671875, 0.02923583984375, 0.0721435546875, 0.11505126953125, 0.157958984375, 0.20086669921875, 0.2437744140625, 0.28668212890625, 0.32958984375, 0.37249755859375, 0.4154052734375, 0.45831298828125, 0.501220703125, 0.54412841796875, 0.5870361328125, 0.62994384765625, 0.6728515625, 0.71575927734375, 0.7586669921875, 0.80157470703125, 0.844482421875, 0.88739013671875, 0.9302978515625, 0.97320556640625, 1.01611328125, 1.05902099609375, 1.1019287109375, 1.14483642578125, 1.187744140625, 1.23065185546875, 1.2735595703125, 1.31646728515625, 1.359375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 11.0, 10.0, 12.0, 9.0, 16.0, 21.0, 35.0, 33.0, 47.0, 57.0, 63.0, 71.0, 202.0, 75.0, 78.0, 49.0, 38.0, 32.0, 30.0, 28.0, 19.0, 16.0, 9.0, 11.0, 3.0, 2.0, 5.0, 3.0, 6.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.641315460205078e-05, -7.391534745693207e-05, -7.141754031181335e-05, -6.891973316669464e-05, -6.642192602157593e-05, -6.392411887645721e-05, -6.14263117313385e-05, -5.892850458621979e-05, -5.6430697441101074e-05, -5.393289029598236e-05, -5.143508315086365e-05, -4.8937276005744934e-05, -4.643946886062622e-05, -4.394166171550751e-05, -4.1443854570388794e-05, -3.894604742527008e-05, -3.644824028015137e-05, -3.3950433135032654e-05, -3.145262598991394e-05, -2.8954818844795227e-05, -2.6457011699676514e-05, -2.39592045545578e-05, -2.1461397409439087e-05, -1.8963590264320374e-05, -1.646578311920166e-05, -1.3967975974082947e-05, -1.1470168828964233e-05, -8.97236168384552e-06, -6.474554538726807e-06, -3.976747393608093e-06, -1.4789402484893799e-06, 1.0188668966293335e-06, 3.516674041748047e-06, 6.01448118686676e-06, 8.512288331985474e-06, 1.1010095477104187e-05, 1.35079026222229e-05, 1.6005709767341614e-05, 1.8503516912460327e-05, 2.100132405757904e-05, 2.3499131202697754e-05, 2.5996938347816467e-05, 2.849474549293518e-05, 3.0992552638053894e-05, 3.349035978317261e-05, 3.598816692829132e-05, 3.8485974073410034e-05, 4.098378121852875e-05, 4.348158836364746e-05, 4.5979395508766174e-05, 4.847720265388489e-05, 5.09750097990036e-05, 5.3472816944122314e-05, 5.597062408924103e-05, 5.846843123435974e-05, 6.0966238379478455e-05, 6.346404552459717e-05, 6.596185266971588e-05, 6.84596598148346e-05, 7.095746695995331e-05, 7.345527410507202e-05, 7.595308125019073e-05, 7.845088839530945e-05, 8.094869554042816e-05, 8.344650268554688e-05]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 4.0, 9.0, 9.0, 19.0, 15.0, 21.0, 26.0, 34.0, 62.0, 64.0, 136.0, 359.0, 2048.0, 38318.0, 987083.0, 18280.0, 1389.0, 296.0, 108.0, 84.0, 37.0, 38.0, 29.0, 24.0, 14.0, 8.0, 11.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014324188232421875, -0.001389533281326294, -0.0013466477394104004, -0.0013037621974945068, -0.0012608766555786133, -0.0012179911136627197, -0.0011751055717468262, -0.0011322200298309326, -0.001089334487915039, -0.0010464489459991455, -0.001003563404083252, -0.0009606778621673584, -0.0009177923202514648, -0.0008749067783355713, -0.0008320212364196777, -0.0007891356945037842, -0.0007462501525878906, -0.0007033646106719971, -0.0006604790687561035, -0.00061759352684021, -0.0005747079849243164, -0.0005318224430084229, -0.0004889369010925293, -0.00044605135917663574, -0.0004031658172607422, -0.00036028027534484863, -0.0003173947334289551, -0.0002745091915130615, -0.00023162364959716797, -0.00018873810768127441, -0.00014585256576538086, -0.0001029670238494873, -6.008148193359375e-05, -1.7195940017700195e-05, 2.568960189819336e-05, 6.857514381408691e-05, 0.00011146068572998047, 0.00015434622764587402, 0.00019723176956176758, 0.00024011731147766113, 0.0002830028533935547, 0.00032588839530944824, 0.0003687739372253418, 0.00041165947914123535, 0.0004545450210571289, 0.0004974305629730225, 0.000540316104888916, 0.0005832016468048096, 0.0006260871887207031, 0.0006689727306365967, 0.0007118582725524902, 0.0007547438144683838, 0.0007976293563842773, 0.0008405148983001709, 0.0008834004402160645, 0.000926285982131958, 0.0009691715240478516, 0.0010120570659637451, 0.0010549426078796387, 0.0010978281497955322, 0.0011407136917114258, 0.0011835992336273193, 0.0012264847755432129, 0.0012693703174591064, 0.001312255859375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 3.0, 3.0, 12.0, 18.0, 7.0, 12.0, 31.0, 24.0, 60.0, 76.0, 86.0, 138.0, 124.0, 101.0, 78.0, 54.0, 39.0, 34.0, 24.0, 18.0, 7.0, 5.0, 6.0, 6.0, 2.0, 7.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-4.7277906560339034e-05, -4.6032557293074206e-05, -4.478720438783057e-05, -4.354185512056574e-05, -4.229650221532211e-05, -4.105115294805728e-05, -3.980580368079245e-05, -3.8560450775548816e-05, -3.731510150828399e-05, -3.606975224101916e-05, -3.4824399335775524e-05, -3.3579050068510696e-05, -3.233369716326706e-05, -3.108834789600223e-05, -2.9842996809748e-05, -2.859764572349377e-05, -2.7352294637239538e-05, -2.6106943550985307e-05, -2.4861592464731075e-05, -2.3616241378476843e-05, -2.2370892111212015e-05, -2.1125541024957784e-05, -1.9880189938703552e-05, -1.8634840671438724e-05, -1.738948776619509e-05, -1.6144136679940857e-05, -1.4898786503181327e-05, -1.3653435416927096e-05, -1.2408085240167566e-05, -1.1162734153913334e-05, -9.917383067659102e-06, -8.672032890899573e-06, -7.426682714140043e-06, -6.181332082633162e-06, -4.935981451126281e-06, -3.6906303648720495e-06, -2.445279733365169e-06, -1.199929101858288e-06, 4.542198439594358e-08, 1.2907721611554734e-06, 2.536123247409705e-06, 3.781473878916586e-06, 5.0268245104234666e-06, 6.272175596677698e-06, 7.517526228184579e-06, 8.76287685969146e-06, 1.0008227945945691e-05, 1.1253578122705221e-05, 1.2498929208959453e-05, 1.3744280295213684e-05, 1.4989630471973214e-05, 1.6234982467722148e-05, 1.7480331734986976e-05, 1.8725682821241207e-05, 1.997103390749544e-05, 2.1216383174760267e-05, 2.2461736080003902e-05, 2.3707087166258134e-05, 2.4952438252512366e-05, 2.6197787519777194e-05, 2.7443138606031425e-05, 2.8688489692285657e-05, 2.993384077853989e-05, 3.117919186479412e-05, 3.242454113205895e-05]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 8.0, 9.0, 4.0, 11.0, 4.0, 9.0, 22.0, 22.0, 25.0, 25.0, 27.0, 23.0, 32.0, 37.0, 33.0, 39.0, 36.0, 42.0, 39.0, 41.0, 48.0, 34.0, 46.0, 41.0, 32.0, 33.0, 48.0, 28.0, 29.0, 19.0, 19.0, 19.0, 21.0, 18.0, 9.0, 17.0, 9.0, 11.0, 11.0, 5.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.9802322387695312e-05, -2.884306013584137e-05, -2.7883797883987427e-05, -2.6924535632133484e-05, -2.596527338027954e-05, -2.5006011128425598e-05, -2.4046748876571655e-05, -2.3087486624717712e-05, -2.212822437286377e-05, -2.1168962121009827e-05, -2.0209699869155884e-05, -1.925043761730194e-05, -1.8291175365447998e-05, -1.7331913113594055e-05, -1.6372650861740112e-05, -1.541338860988617e-05, -1.4454126358032227e-05, -1.3494864106178284e-05, -1.253560185432434e-05, -1.1576339602470398e-05, -1.0617077350616455e-05, -9.657815098762512e-06, -8.69855284690857e-06, -7.739290595054626e-06, -6.780028343200684e-06, -5.820766091346741e-06, -4.861503839492798e-06, -3.902241587638855e-06, -2.942979335784912e-06, -1.9837170839309692e-06, -1.0244548320770264e-06, -6.51925802230835e-08, 8.940696716308594e-07, 1.8533319234848022e-06, 2.812594175338745e-06, 3.771856427192688e-06, 4.731118679046631e-06, 5.690380930900574e-06, 6.649643182754517e-06, 7.6089054346084595e-06, 8.568167686462402e-06, 9.527429938316345e-06, 1.0486692190170288e-05, 1.1445954442024231e-05, 1.2405216693878174e-05, 1.3364478945732117e-05, 1.432374119758606e-05, 1.5283003449440002e-05, 1.6242265701293945e-05, 1.7201527953147888e-05, 1.816079020500183e-05, 1.9120052456855774e-05, 2.0079314708709717e-05, 2.103857696056366e-05, 2.1997839212417603e-05, 2.2957101464271545e-05, 2.3916363716125488e-05, 2.487562596797943e-05, 2.5834888219833374e-05, 2.6794150471687317e-05, 2.775341272354126e-05, 2.8712674975395203e-05, 2.9671937227249146e-05, 3.063119947910309e-05, 3.159046173095703e-05]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 5.0, 14.0, 15.0, 12.0, 10.0, 16.0, 20.0, 22.0, 22.0, 26.0, 24.0, 37.0, 28.0, 36.0, 43.0, 44.0, 38.0, 48.0, 40.0, 35.0, 30.0, 33.0, 42.0, 45.0, 45.0, 35.0, 17.0, 36.0, 21.0, 20.0, 19.0, 14.0, 16.0, 11.0, 11.0, 9.0, 10.0, 8.0, 10.0, 4.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-39.96875, -38.54443359375, -37.1201171875, -35.69580078125, -34.271484375, -32.84716796875, -31.4228515625, -29.99853515625, -28.57421875, -27.14990234375, -25.7255859375, -24.30126953125, -22.876953125, -21.45263671875, -20.0283203125, -18.60400390625, -17.1796875, -15.75537109375, -14.3310546875, -12.90673828125, -11.482421875, -10.05810546875, -8.6337890625, -7.20947265625, -5.78515625, -4.36083984375, -2.9365234375, -1.51220703125, -0.087890625, 1.33642578125, 2.7607421875, 4.18505859375, 5.609375, 7.03369140625, 8.4580078125, 9.88232421875, 11.306640625, 12.73095703125, 14.1552734375, 15.57958984375, 17.00390625, 18.42822265625, 19.8525390625, 21.27685546875, 22.701171875, 24.12548828125, 25.5498046875, 26.97412109375, 28.3984375, 29.82275390625, 31.2470703125, 32.67138671875, 34.095703125, 35.52001953125, 36.9443359375, 38.36865234375, 39.79296875, 41.21728515625, 42.6416015625, 44.06591796875, 45.490234375, 46.91455078125, 48.3388671875, 49.76318359375, 51.1875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 2.0, 9.0, 5.0, 6.0, 11.0, 14.0, 24.0, 25.0, 34.0, 49.0, 62.0, 99.0, 100.0, 136.0, 173.0, 267.0, 356.0, 452.0, 612.0, 771.0, 1101.0, 1579.0, 2589.0, 4505.0, 9867.0, 30216.0, 145480.0, 657475.0, 140492.0, 29572.0, 9703.0, 4395.0, 2454.0, 1603.0, 1073.0, 814.0, 606.0, 443.0, 331.0, 271.0, 203.0, 154.0, 104.0, 87.0, 58.0, 46.0, 44.0, 18.0, 20.0, 12.0, 12.0, 11.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-55.25, -53.43798828125, -51.6259765625, -49.81396484375, -48.001953125, -46.18994140625, -44.3779296875, -42.56591796875, -40.75390625, -38.94189453125, -37.1298828125, -35.31787109375, -33.505859375, -31.69384765625, -29.8818359375, -28.06982421875, -26.2578125, -24.44580078125, -22.6337890625, -20.82177734375, -19.009765625, -17.19775390625, -15.3857421875, -13.57373046875, -11.76171875, -9.94970703125, -8.1376953125, -6.32568359375, -4.513671875, -2.70166015625, -0.8896484375, 0.92236328125, 2.734375, 4.54638671875, 6.3583984375, 8.17041015625, 9.982421875, 11.79443359375, 13.6064453125, 15.41845703125, 17.23046875, 19.04248046875, 20.8544921875, 22.66650390625, 24.478515625, 26.29052734375, 28.1025390625, 29.91455078125, 31.7265625, 33.53857421875, 35.3505859375, 37.16259765625, 38.974609375, 40.78662109375, 42.5986328125, 44.41064453125, 46.22265625, 48.03466796875, 49.8466796875, 51.65869140625, 53.470703125, 55.28271484375, 57.0947265625, 58.90673828125, 60.71875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 10.0, 8.0, 11.0, 11.0, 17.0, 12.0, 8.0, 17.0, 22.0, 18.0, 24.0, 16.0, 37.0, 27.0, 34.0, 35.0, 40.0, 46.0, 53.0, 157.0, 1812.0, 150.0, 52.0, 50.0, 34.0, 35.0, 32.0, 32.0, 30.0, 34.0, 22.0, 17.0, 15.0, 16.0, 14.0, 15.0, 12.0, 9.0, 6.0, 12.0, 12.0, 8.0, 6.0, 2.0, 8.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-119.125, -115.080078125, -111.03515625, -106.990234375, -102.9453125, -98.900390625, -94.85546875, -90.810546875, -86.765625, -82.720703125, -78.67578125, -74.630859375, -70.5859375, -66.541015625, -62.49609375, -58.451171875, -54.40625, -50.361328125, -46.31640625, -42.271484375, -38.2265625, -34.181640625, -30.13671875, -26.091796875, -22.046875, -18.001953125, -13.95703125, -9.912109375, -5.8671875, -1.822265625, 2.22265625, 6.267578125, 10.3125, 14.357421875, 18.40234375, 22.447265625, 26.4921875, 30.537109375, 34.58203125, 38.626953125, 42.671875, 46.716796875, 50.76171875, 54.806640625, 58.8515625, 62.896484375, 66.94140625, 70.986328125, 75.03125, 79.076171875, 83.12109375, 87.166015625, 91.2109375, 95.255859375, 99.30078125, 103.345703125, 107.390625, 111.435546875, 115.48046875, 119.525390625, 123.5703125, 127.615234375, 131.66015625, 135.705078125, 139.75]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 8.0, 9.0, 10.0, 12.0, 7.0, 13.0, 23.0, 29.0, 26.0, 35.0, 59.0, 64.0, 86.0, 106.0, 141.0, 231.0, 469.0, 1224.0, 5899.0, 106187.0, 3007092.0, 19581.0, 2577.0, 757.0, 338.0, 165.0, 128.0, 92.0, 76.0, 57.0, 51.0, 29.0, 22.0, 16.0, 15.0, 17.0, 14.0, 11.0, 6.0, 4.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-228.75, -221.43359375, -214.1171875, -206.80078125, -199.484375, -192.16796875, -184.8515625, -177.53515625, -170.21875, -162.90234375, -155.5859375, -148.26953125, -140.953125, -133.63671875, -126.3203125, -119.00390625, -111.6875, -104.37109375, -97.0546875, -89.73828125, -82.421875, -75.10546875, -67.7890625, -60.47265625, -53.15625, -45.83984375, -38.5234375, -31.20703125, -23.890625, -16.57421875, -9.2578125, -1.94140625, 5.375, 12.69140625, 20.0078125, 27.32421875, 34.640625, 41.95703125, 49.2734375, 56.58984375, 63.90625, 71.22265625, 78.5390625, 85.85546875, 93.171875, 100.48828125, 107.8046875, 115.12109375, 122.4375, 129.75390625, 137.0703125, 144.38671875, 151.703125, 159.01953125, 166.3359375, 173.65234375, 180.96875, 188.28515625, 195.6015625, 202.91796875, 210.234375, 217.55078125, 224.8671875, 232.18359375, 239.5]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 19.0, 924.0, 77.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-343.4330139160156, -291.4416198730469, -239.45022583007812, -187.45884704589844, -135.4674530029297, -83.47607421875, -31.48468017578125, 20.5067138671875, 72.49810791015625, 124.489501953125, 176.48089599609375, 228.47227478027344, 280.46368408203125, 332.4550476074219, 384.4464416503906, 436.4378356933594, 488.4292297363281, 540.4205932617188, 592.4119873046875, 644.4033813476562, 696.394775390625, 748.3861694335938, 800.3775634765625, 852.3689575195312, 904.3603515625, 956.3517456054688, 1008.3431396484375, 1060.33447265625, 1112.325927734375, 1164.3172607421875, 1216.3087158203125, 1268.300048828125, 1320.2913818359375, 1372.28271484375, 1424.274169921875, 1476.2655029296875, 1528.2569580078125, 1580.248291015625, 1632.23974609375, 1684.2310791015625, 1736.2225341796875, 1788.2138671875, 1840.205322265625, 1892.1966552734375, 1944.1881103515625, 1996.179443359375, 2048.1708984375, 2100.162353515625, 2152.153564453125, 2204.14501953125, 2256.13623046875, 2308.127685546875, 2360.119140625, 2412.110595703125, 2464.101806640625, 2516.09326171875, 2568.084716796875, 2620.076171875, 2672.0673828125, 2724.058837890625, 2776.05029296875, 2828.041748046875, 2880.032958984375, 2932.0244140625, 2984.015869140625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 10.0, 6.0, 8.0, 7.0, 6.0, 13.0, 16.0, 13.0, 17.0, 17.0, 20.0, 27.0, 34.0, 28.0, 29.0, 34.0, 38.0, 29.0, 32.0, 37.0, 46.0, 58.0, 45.0, 40.0, 42.0, 28.0, 39.0, 35.0, 31.0, 23.0, 21.0, 24.0, 14.0, 10.0, 22.0, 20.0, 15.0, 8.0, 12.0, 10.0, 7.0, 13.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-393.0500793457031, -381.58319091796875, -370.11627197265625, -358.64935302734375, -347.1824645996094, -335.715576171875, -324.2486572265625, -312.78173828125, -301.3148498535156, -289.84796142578125, -278.38104248046875, -266.91412353515625, -255.44723510742188, -243.98033142089844, -232.513427734375, -221.04652404785156, -209.57962036132812, -198.1127166748047, -186.64581298828125, -175.1789093017578, -163.71200561523438, -152.24510192871094, -140.7781982421875, -129.31129455566406, -117.84439086914062, -106.37748718261719, -94.91058349609375, -83.44367980957031, -71.97677612304688, -60.50987243652344, -49.04296875, -37.57606506347656, -26.109161376953125, -14.642257690429688, -3.17535400390625, 8.291549682617188, 19.758453369140625, 31.225357055664062, 42.6922607421875, 54.15916442871094, 65.62606811523438, 77.09297180175781, 88.55987548828125, 100.02677917480469, 111.49368286132812, 122.96058654785156, 134.427490234375, 145.89439392089844, 157.36129760742188, 168.8282012939453, 180.29510498046875, 191.7620086669922, 203.22891235351562, 214.69581604003906, 226.1627197265625, 237.62962341308594, 249.09652709960938, 260.56341552734375, 272.03033447265625, 283.49725341796875, 294.9641418457031, 306.4310302734375, 317.89794921875, 329.3648681640625, 340.8317565917969]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0, 8.0, 10.0, 12.0, 13.0, 10.0, 10.0, 15.0, 24.0, 21.0, 18.0, 25.0, 34.0, 27.0, 36.0, 37.0, 43.0, 38.0, 59.0, 44.0, 23.0, 37.0, 42.0, 33.0, 34.0, 30.0, 49.0, 32.0, 32.0, 23.0, 26.0, 18.0, 20.0, 17.0, 16.0, 9.0, 8.0, 12.0, 14.0, 5.0, 4.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-40.34375, -38.90087890625, -37.4580078125, -36.01513671875, -34.572265625, -33.12939453125, -31.6865234375, -30.24365234375, -28.80078125, -27.35791015625, -25.9150390625, -24.47216796875, -23.029296875, -21.58642578125, -20.1435546875, -18.70068359375, -17.2578125, -15.81494140625, -14.3720703125, -12.92919921875, -11.486328125, -10.04345703125, -8.6005859375, -7.15771484375, -5.71484375, -4.27197265625, -2.8291015625, -1.38623046875, 0.056640625, 1.49951171875, 2.9423828125, 4.38525390625, 5.828125, 7.27099609375, 8.7138671875, 10.15673828125, 11.599609375, 13.04248046875, 14.4853515625, 15.92822265625, 17.37109375, 18.81396484375, 20.2568359375, 21.69970703125, 23.142578125, 24.58544921875, 26.0283203125, 27.47119140625, 28.9140625, 30.35693359375, 31.7998046875, 33.24267578125, 34.685546875, 36.12841796875, 37.5712890625, 39.01416015625, 40.45703125, 41.89990234375, 43.3427734375, 44.78564453125, 46.228515625, 47.67138671875, 49.1142578125, 50.55712890625, 52.0]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 7.0, 5.0, 12.0, 15.0, 27.0, 24.0, 40.0, 65.0, 68.0, 117.0, 134.0, 159.0, 234.0, 303.0, 377.0, 513.0, 663.0, 891.0, 1228.0, 1743.0, 2424.0, 3718.0, 5806.0, 10246.0, 19695.0, 75021.0, 834474.0, 2969918.0, 199795.0, 29684.0, 13645.0, 7594.0, 4644.0, 3019.0, 2072.0, 1481.0, 1067.0, 791.0, 622.0, 457.0, 345.0, 242.0, 208.0, 158.0, 118.0, 105.0, 70.0, 57.0, 56.0, 27.0, 27.0, 21.0, 13.0, 17.0, 10.0, 7.0, 6.0, 3.0, 3.0, 1.0, 5.0], "bins": [-96.6875, -93.490234375, -90.29296875, -87.095703125, -83.8984375, -80.701171875, -77.50390625, -74.306640625, -71.109375, -67.912109375, -64.71484375, -61.517578125, -58.3203125, -55.123046875, -51.92578125, -48.728515625, -45.53125, -42.333984375, -39.13671875, -35.939453125, -32.7421875, -29.544921875, -26.34765625, -23.150390625, -19.953125, -16.755859375, -13.55859375, -10.361328125, -7.1640625, -3.966796875, -0.76953125, 2.427734375, 5.625, 8.822265625, 12.01953125, 15.216796875, 18.4140625, 21.611328125, 24.80859375, 28.005859375, 31.203125, 34.400390625, 37.59765625, 40.794921875, 43.9921875, 47.189453125, 50.38671875, 53.583984375, 56.78125, 59.978515625, 63.17578125, 66.373046875, 69.5703125, 72.767578125, 75.96484375, 79.162109375, 82.359375, 85.556640625, 88.75390625, 91.951171875, 95.1484375, 98.345703125, 101.54296875, 104.740234375, 107.9375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 12.0, 10.0, 14.0, 19.0, 35.0, 49.0, 73.0, 132.0, 350.0, 910.0, 1457.0, 534.0, 190.0, 92.0, 64.0, 31.0, 25.0, 17.0, 14.0, 8.0, 5.0, 7.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.25, -95.53515625, -90.8203125, -86.10546875, -81.390625, -76.67578125, -71.9609375, -67.24609375, -62.53125, -57.81640625, -53.1015625, -48.38671875, -43.671875, -38.95703125, -34.2421875, -29.52734375, -24.8125, -20.09765625, -15.3828125, -10.66796875, -5.953125, -1.23828125, 3.4765625, 8.19140625, 12.90625, 17.62109375, 22.3359375, 27.05078125, 31.765625, 36.48046875, 41.1953125, 45.91015625, 50.625, 55.33984375, 60.0546875, 64.76953125, 69.484375, 74.19921875, 78.9140625, 83.62890625, 88.34375, 93.05859375, 97.7734375, 102.48828125, 107.203125, 111.91796875, 116.6328125, 121.34765625, 126.0625, 130.77734375, 135.4921875, 140.20703125, 144.921875, 149.63671875, 154.3515625, 159.06640625, 163.78125, 168.49609375, 173.2109375, 177.92578125, 182.640625, 187.35546875, 192.0703125, 196.78515625, 201.5]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 8.0, 9.0, 8.0, 22.0, 34.0, 42.0, 79.0, 151.0, 271.0, 590.0, 1475.0, 4567.0, 17940.0, 167039.0, 3907541.0, 76902.0, 11962.0, 3404.0, 1155.0, 525.0, 269.0, 123.0, 63.0, 51.0, 22.0, 13.0, 7.0, 8.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-543.5, -530.671875, -517.84375, -505.015625, -492.1875, -479.359375, -466.53125, -453.703125, -440.875, -428.046875, -415.21875, -402.390625, -389.5625, -376.734375, -363.90625, -351.078125, -338.25, -325.421875, -312.59375, -299.765625, -286.9375, -274.109375, -261.28125, -248.453125, -235.625, -222.796875, -209.96875, -197.140625, -184.3125, -171.484375, -158.65625, -145.828125, -133.0, -120.171875, -107.34375, -94.515625, -81.6875, -68.859375, -56.03125, -43.203125, -30.375, -17.546875, -4.71875, 8.109375, 20.9375, 33.765625, 46.59375, 59.421875, 72.25, 85.078125, 97.90625, 110.734375, 123.5625, 136.390625, 149.21875, 162.046875, 174.875, 187.703125, 200.53125, 213.359375, 226.1875, 239.015625, 251.84375, 264.671875, 277.5]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 12.0, 11.0, 15.0, 29.0, 42.0, 73.0, 118.0, 147.0, 181.0, 122.0, 87.0, 63.0, 37.0, 19.0, 16.0, 17.0, 6.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-500.73388671875, -482.9439392089844, -465.15399169921875, -447.3640441894531, -429.5740966796875, -411.78411865234375, -393.9941711425781, -376.2042236328125, -358.4142761230469, -340.62432861328125, -322.8343811035156, -305.04443359375, -287.25445556640625, -269.46453857421875, -251.674560546875, -233.88461303710938, -216.09466552734375, -198.30471801757812, -180.5147705078125, -162.7248077392578, -144.9348602294922, -127.14491271972656, -109.3549575805664, -91.56500244140625, -73.77505493164062, -55.985103607177734, -38.195152282714844, -20.405200958251953, -2.6152496337890625, 15.174697875976562, 32.96465301513672, 50.754608154296875, 68.54461669921875, 86.33456420898438, 104.12451934814453, 121.91447448730469, 139.7044219970703, 157.49436950683594, 175.28433227539062, 193.07427978515625, 210.86422729492188, 228.6541748046875, 246.44412231445312, 264.23406982421875, 282.0240478515625, 299.81396484375, 317.60394287109375, 335.3938903808594, 353.183837890625, 370.9737854003906, 388.76373291015625, 406.5536804199219, 424.3436279296875, 442.13360595703125, 459.9235534667969, 477.7135009765625, 495.5034484863281, 513.2933959960938, 531.0833740234375, 548.873291015625, 566.6632690429688, 584.4531860351562, 602.2431640625, 620.0330810546875, 637.8230590820312]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 4.0, 21.0, 11.0, 12.0, 13.0, 25.0, 12.0, 17.0, 14.0, 28.0, 30.0, 29.0, 39.0, 46.0, 35.0, 44.0, 44.0, 49.0, 50.0, 36.0, 46.0, 38.0, 37.0, 34.0, 36.0, 35.0, 28.0, 23.0, 30.0, 21.0, 27.0, 17.0, 14.0, 11.0, 10.0, 5.0, 7.0, 3.0, 3.0, 1.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-278.71942138671875, -269.37646484375, -260.03350830078125, -250.69053649902344, -241.34756469726562, -232.00460815429688, -222.66165161132812, -213.31869506835938, -203.97572326660156, -194.6327667236328, -185.289794921875, -175.94683837890625, -166.6038818359375, -157.2609100341797, -147.91795349121094, -138.57498168945312, -129.23202514648438, -119.8890609741211, -110.54609680175781, -101.20314025878906, -91.86017608642578, -82.5172119140625, -73.17425537109375, -63.83129119873047, -54.48832702636719, -45.145362854003906, -35.80240249633789, -26.459440231323242, -17.116477966308594, -7.7735137939453125, 1.5694465637207031, 10.912406921386719, 20.25537109375, 29.59833335876465, 38.9412956237793, 48.28425598144531, 57.627220153808594, 66.97018432617188, 76.31314086914062, 85.6561050415039, 94.99906921386719, 104.34203338623047, 113.68499755859375, 123.0279541015625, 132.37091064453125, 141.71388244628906, 151.0568389892578, 160.39981079101562, 169.74276733398438, 179.08572387695312, 188.42869567871094, 197.7716522216797, 207.1146240234375, 216.45758056640625, 225.800537109375, 235.14349365234375, 244.48646545410156, 253.8294219970703, 263.1723937988281, 272.5153503417969, 281.8583068847656, 291.2012939453125, 300.54425048828125, 309.88720703125, 319.23016357421875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 7.0, 3.0, 6.0, 4.0, 2.0, 13.0, 18.0, 12.0, 15.0, 24.0, 29.0, 27.0, 31.0, 34.0, 38.0, 40.0, 47.0, 47.0, 53.0, 42.0, 53.0, 51.0, 51.0, 44.0, 46.0, 38.0, 32.0, 27.0, 26.0, 27.0, 30.0, 17.0, 17.0, 13.0, 11.0, 3.0, 9.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.3125, -45.361328125, -43.41015625, -41.458984375, -39.5078125, -37.556640625, -35.60546875, -33.654296875, -31.703125, -29.751953125, -27.80078125, -25.849609375, -23.8984375, -21.947265625, -19.99609375, -18.044921875, -16.09375, -14.142578125, -12.19140625, -10.240234375, -8.2890625, -6.337890625, -4.38671875, -2.435546875, -0.484375, 1.466796875, 3.41796875, 5.369140625, 7.3203125, 9.271484375, 11.22265625, 13.173828125, 15.125, 17.076171875, 19.02734375, 20.978515625, 22.9296875, 24.880859375, 26.83203125, 28.783203125, 30.734375, 32.685546875, 34.63671875, 36.587890625, 38.5390625, 40.490234375, 42.44140625, 44.392578125, 46.34375, 48.294921875, 50.24609375, 52.197265625, 54.1484375, 56.099609375, 58.05078125, 60.001953125, 61.953125, 63.904296875, 65.85546875, 67.806640625, 69.7578125, 71.708984375, 73.66015625, 75.611328125, 77.5625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 8.0, 15.0, 11.0, 26.0, 40.0, 56.0, 84.0, 162.0, 257.0, 422.0, 640.0, 1167.0, 1905.0, 3167.0, 5255.0, 9261.0, 16167.0, 28529.0, 53241.0, 107737.0, 294324.0, 297553.0, 107690.0, 53411.0, 28612.0, 16266.0, 9267.0, 5259.0, 3152.0, 1943.0, 1117.0, 720.0, 433.0, 231.0, 149.0, 93.0, 64.0, 28.0, 21.0, 23.0, 11.0, 7.0, 11.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.578125, -2.494964599609375, -2.41180419921875, -2.328643798828125, -2.2454833984375, -2.162322998046875, -2.07916259765625, -1.996002197265625, -1.912841796875, -1.829681396484375, -1.74652099609375, -1.663360595703125, -1.5802001953125, -1.497039794921875, -1.41387939453125, -1.330718994140625, -1.24755859375, -1.164398193359375, -1.08123779296875, -0.998077392578125, -0.9149169921875, -0.831756591796875, -0.74859619140625, -0.665435791015625, -0.582275390625, -0.499114990234375, -0.41595458984375, -0.332794189453125, -0.2496337890625, -0.166473388671875, -0.08331298828125, -0.000152587890625, 0.0830078125, 0.166168212890625, 0.24932861328125, 0.332489013671875, 0.4156494140625, 0.498809814453125, 0.58197021484375, 0.665130615234375, 0.748291015625, 0.831451416015625, 0.91461181640625, 0.997772216796875, 1.0809326171875, 1.164093017578125, 1.24725341796875, 1.330413818359375, 1.41357421875, 1.496734619140625, 1.57989501953125, 1.663055419921875, 1.7462158203125, 1.829376220703125, 1.91253662109375, 1.995697021484375, 2.078857421875, 2.162017822265625, 2.24517822265625, 2.328338623046875, 2.4114990234375, 2.494659423828125, 2.57781982421875, 2.660980224609375, 2.744140625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 2.0, 4.0, 9.0, 5.0, 7.0, 9.0, 13.0, 17.0, 13.0, 24.0, 32.0, 30.0, 22.0, 39.0, 29.0, 40.0, 34.0, 38.0, 39.0, 60.0, 1076.0, 41.0, 44.0, 39.0, 41.0, 39.0, 34.0, 33.0, 36.0, 17.0, 26.0, 24.0, 24.0, 13.0, 18.0, 13.0, 13.0, 5.0, 4.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-41.625, -40.44580078125, -39.2666015625, -38.08740234375, -36.908203125, -35.72900390625, -34.5498046875, -33.37060546875, -32.19140625, -31.01220703125, -29.8330078125, -28.65380859375, -27.474609375, -26.29541015625, -25.1162109375, -23.93701171875, -22.7578125, -21.57861328125, -20.3994140625, -19.22021484375, -18.041015625, -16.86181640625, -15.6826171875, -14.50341796875, -13.32421875, -12.14501953125, -10.9658203125, -9.78662109375, -8.607421875, -7.42822265625, -6.2490234375, -5.06982421875, -3.890625, -2.71142578125, -1.5322265625, -0.35302734375, 0.826171875, 2.00537109375, 3.1845703125, 4.36376953125, 5.54296875, 6.72216796875, 7.9013671875, 9.08056640625, 10.259765625, 11.43896484375, 12.6181640625, 13.79736328125, 14.9765625, 16.15576171875, 17.3349609375, 18.51416015625, 19.693359375, 20.87255859375, 22.0517578125, 23.23095703125, 24.41015625, 25.58935546875, 26.7685546875, 27.94775390625, 29.126953125, 30.30615234375, 31.4853515625, 32.66455078125, 33.84375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 10.0, 13.0, 21.0, 33.0, 46.0, 71.0, 86.0, 131.0, 219.0, 322.0, 438.0, 706.0, 1071.0, 1590.0, 2479.0, 3819.0, 6049.0, 9701.0, 15522.0, 24903.0, 41175.0, 70426.0, 129262.0, 1403433.0, 171482.0, 85571.0, 49511.0, 29644.0, 18121.0, 11217.0, 7001.0, 4514.0, 2963.0, 1943.0, 1191.0, 840.0, 536.0, 344.0, 221.0, 172.0, 110.0, 69.0, 53.0, 38.0, 24.0, 10.0, 11.0, 10.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.669921875, -1.6172027587890625, -1.564483642578125, -1.5117645263671875, -1.45904541015625, -1.4063262939453125, -1.353607177734375, -1.3008880615234375, -1.2481689453125, -1.1954498291015625, -1.142730712890625, -1.0900115966796875, -1.03729248046875, -0.9845733642578125, -0.931854248046875, -0.8791351318359375, -0.826416015625, -0.7736968994140625, -0.720977783203125, -0.6682586669921875, -0.61553955078125, -0.5628204345703125, -0.510101318359375, -0.4573822021484375, -0.4046630859375, -0.3519439697265625, -0.299224853515625, -0.2465057373046875, -0.19378662109375, -0.1410675048828125, -0.088348388671875, -0.0356292724609375, 0.01708984375, 0.0698089599609375, 0.122528076171875, 0.1752471923828125, 0.22796630859375, 0.2806854248046875, 0.333404541015625, 0.3861236572265625, 0.4388427734375, 0.4915618896484375, 0.544281005859375, 0.5970001220703125, 0.64971923828125, 0.7024383544921875, 0.755157470703125, 0.8078765869140625, 0.860595703125, 0.9133148193359375, 0.966033935546875, 1.0187530517578125, 1.07147216796875, 1.1241912841796875, 1.176910400390625, 1.2296295166015625, 1.2823486328125, 1.3350677490234375, 1.387786865234375, 1.4405059814453125, 1.49322509765625, 1.5459442138671875, 1.598663330078125, 1.6513824462890625, 1.7041015625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 14.0, 11.0, 13.0, 25.0, 30.0, 48.0, 66.0, 90.0, 122.0, 159.0, 121.0, 90.0, 59.0, 37.0, 22.0, 26.0, 14.0, 19.0, 5.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010418891906738281, -0.0001010717824101448, -9.79546457529068e-05, -9.483750909566879e-05, -9.172037243843079e-05, -8.860323578119278e-05, -8.548609912395477e-05, -8.236896246671677e-05, -7.925182580947876e-05, -7.613468915224075e-05, -7.301755249500275e-05, -6.990041583776474e-05, -6.678327918052673e-05, -6.366614252328873e-05, -6.054900586605072e-05, -5.7431869208812714e-05, -5.431473255157471e-05, -5.11975958943367e-05, -4.8080459237098694e-05, -4.496332257986069e-05, -4.184618592262268e-05, -3.8729049265384674e-05, -3.561191260814667e-05, -3.249477595090866e-05, -2.9377639293670654e-05, -2.6260502636432648e-05, -2.314336597919464e-05, -2.0026229321956635e-05, -1.6909092664718628e-05, -1.3791956007480621e-05, -1.0674819350242615e-05, -7.557682693004608e-06, -4.4405460357666016e-06, -1.323409378528595e-06, 1.7937272787094116e-06, 4.910863935947418e-06, 8.028000593185425e-06, 1.1145137250423431e-05, 1.4262273907661438e-05, 1.7379410564899445e-05, 2.049654722213745e-05, 2.3613683879375458e-05, 2.6730820536613464e-05, 2.984795719385147e-05, 3.296509385108948e-05, 3.6082230508327484e-05, 3.919936716556549e-05, 4.23165038228035e-05, 4.5433640480041504e-05, 4.855077713727951e-05, 5.166791379451752e-05, 5.4785050451755524e-05, 5.790218710899353e-05, 6.101932376623154e-05, 6.413646042346954e-05, 6.725359708070755e-05, 7.037073373794556e-05, 7.348787039518356e-05, 7.660500705242157e-05, 7.972214370965958e-05, 8.283928036689758e-05, 8.595641702413559e-05, 8.90735536813736e-05, 9.21906903386116e-05, 9.530782699584961e-05]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 8.0, 11.0, 24.0, 41.0, 49.0, 81.0, 167.0, 502.0, 15132.0, 1005100.0, 26279.0, 689.0, 191.0, 87.0, 66.0, 37.0, 17.0, 18.0, 5.0, 7.0, 0.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001735687255859375, -0.0016788989305496216, -0.0016221106052398682, -0.0015653222799301147, -0.0015085339546203613, -0.001451745629310608, -0.0013949573040008545, -0.001338168978691101, -0.0012813806533813477, -0.0012245923280715942, -0.0011678040027618408, -0.0011110156774520874, -0.001054227352142334, -0.0009974390268325806, -0.0009406507015228271, -0.0008838623762130737, -0.0008270740509033203, -0.0007702857255935669, -0.0007134974002838135, -0.0006567090749740601, -0.0005999207496643066, -0.0005431324243545532, -0.0004863440990447998, -0.0004295557737350464, -0.00037276744842529297, -0.00031597912311553955, -0.00025919079780578613, -0.00020240247249603271, -0.0001456141471862793, -8.882582187652588e-05, -3.203749656677246e-05, 2.4750828742980957e-05, 8.153915405273438e-05, 0.0001383274793624878, 0.0001951158046722412, 0.00025190412998199463, 0.00030869245529174805, 0.00036548078060150146, 0.0004222691059112549, 0.0004790574312210083, 0.0005358457565307617, 0.0005926340818405151, 0.0006494224071502686, 0.000706210732460022, 0.0007629990577697754, 0.0008197873830795288, 0.0008765757083892822, 0.0009333640336990356, 0.000990152359008789, 0.0010469406843185425, 0.001103729009628296, 0.0011605173349380493, 0.0012173056602478027, 0.0012740939855575562, 0.0013308823108673096, 0.001387670636177063, 0.0014444589614868164, 0.0015012472867965698, 0.0015580356121063232, 0.0016148239374160767, 0.00167161226272583, 0.0017284005880355835, 0.001785188913345337, 0.0018419772386550903, 0.0018987655639648438]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 7.0, 8.0, 10.0, 19.0, 19.0, 32.0, 34.0, 47.0, 49.0, 72.0, 108.0, 108.0, 101.0, 79.0, 64.0, 51.0, 43.0, 29.0, 24.0, 22.0, 11.0, 10.0, 9.0, 4.0, 1.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.5213266275823116e-05, -4.4011838326696306e-05, -4.281040673959069e-05, -4.160897879046388e-05, -4.040755084133707e-05, -3.920611925423145e-05, -3.800469130510464e-05, -3.680326335597783e-05, -3.5601835406851023e-05, -3.4400407457724214e-05, -3.31989758706186e-05, -3.199754792149179e-05, -3.079611997236498e-05, -2.9594690204248764e-05, -2.839326043613255e-05, -2.719183248700574e-05, -2.5990400899900123e-05, -2.478897113178391e-05, -2.35875431826571e-05, -2.2386113414540887e-05, -2.1184685465414077e-05, -1.9983255697297864e-05, -1.878182592918165e-05, -1.758039798005484e-05, -1.6378968211938627e-05, -1.5177539353317115e-05, -1.3976110494695604e-05, -1.277468072657939e-05, -1.1573251867957879e-05, -1.0371823009336367e-05, -9.170393241220154e-06, -7.968964382598642e-06, -6.767535523977131e-06, -5.566106665355619e-06, -4.3646773519867565e-06, -3.1632482659915695e-06, -1.9618191799963824e-06, -7.603903213748708e-07, 4.4103899199399166e-07, 1.6424683053628542e-06, 2.8438971639843658e-06, 4.045326022605877e-06, 5.24675533597474e-06, 6.448184649343602e-06, 7.649613507965114e-06, 8.851042366586626e-06, 1.0052472134702839e-05, 1.125390099332435e-05, 1.2455329851945862e-05, 1.3656758710567374e-05, 1.4858187569188885e-05, 1.60596173373051e-05, 1.726104528643191e-05, 1.8462475054548122e-05, 1.9663904822664335e-05, 2.0865332771791145e-05, 2.206676253990736e-05, 2.3268192308023572e-05, 2.4469620257150382e-05, 2.5671050025266595e-05, 2.687247979338281e-05, 2.807390774250962e-05, 2.9275337510625832e-05, 3.0476767278742045e-05, 3.1678195227868855e-05]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 6.0, 9.0, 9.0, 7.0, 8.0, 10.0, 13.0, 16.0, 15.0, 18.0, 22.0, 26.0, 28.0, 39.0, 39.0, 37.0, 44.0, 49.0, 46.0, 42.0, 36.0, 43.0, 52.0, 41.0, 32.0, 37.0, 31.0, 36.0, 34.0, 24.0, 27.0, 21.0, 20.0, 16.0, 20.0, 9.0, 13.0, 12.0, 3.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.629922866821289e-05, -3.52468341588974e-05, -3.419443964958191e-05, -3.314204514026642e-05, -3.208965063095093e-05, -3.103725612163544e-05, -2.9984861612319946e-05, -2.8932467103004456e-05, -2.7880072593688965e-05, -2.6827678084373474e-05, -2.5775283575057983e-05, -2.4722889065742493e-05, -2.3670494556427002e-05, -2.261810004711151e-05, -2.156570553779602e-05, -2.051331102848053e-05, -1.946091651916504e-05, -1.840852200984955e-05, -1.7356127500534058e-05, -1.6303732991218567e-05, -1.5251338481903076e-05, -1.4198943972587585e-05, -1.3146549463272095e-05, -1.2094154953956604e-05, -1.1041760444641113e-05, -9.989365935325623e-06, -8.936971426010132e-06, -7.884576916694641e-06, -6.83218240737915e-06, -5.77978789806366e-06, -4.727393388748169e-06, -3.6749988794326782e-06, -2.6226043701171875e-06, -1.5702098608016968e-06, -5.178153514862061e-07, 5.345791578292847e-07, 1.5869736671447754e-06, 2.639368176460266e-06, 3.691762685775757e-06, 4.7441571950912476e-06, 5.796551704406738e-06, 6.848946213722229e-06, 7.90134072303772e-06, 8.95373523235321e-06, 1.0006129741668701e-05, 1.1058524250984192e-05, 1.2110918760299683e-05, 1.3163313269615173e-05, 1.4215707778930664e-05, 1.5268102288246155e-05, 1.6320496797561646e-05, 1.7372891306877136e-05, 1.8425285816192627e-05, 1.9477680325508118e-05, 2.053007483482361e-05, 2.15824693441391e-05, 2.263486385345459e-05, 2.368725836277008e-05, 2.473965287208557e-05, 2.5792047381401062e-05, 2.6844441890716553e-05, 2.7896836400032043e-05, 2.8949230909347534e-05, 3.0001625418663025e-05, 3.1054019927978516e-05]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 7.0, 3.0, 6.0, 4.0, 2.0, 13.0, 18.0, 12.0, 15.0, 24.0, 29.0, 27.0, 31.0, 34.0, 38.0, 40.0, 47.0, 47.0, 53.0, 42.0, 53.0, 51.0, 51.0, 44.0, 46.0, 38.0, 32.0, 27.0, 26.0, 27.0, 30.0, 17.0, 17.0, 13.0, 11.0, 3.0, 9.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.3125, -45.361328125, -43.41015625, -41.458984375, -39.5078125, -37.556640625, -35.60546875, -33.654296875, -31.703125, -29.751953125, -27.80078125, -25.849609375, -23.8984375, -21.947265625, -19.99609375, -18.044921875, -16.09375, -14.142578125, -12.19140625, -10.240234375, -8.2890625, -6.337890625, -4.38671875, -2.435546875, -0.484375, 1.466796875, 3.41796875, 5.369140625, 7.3203125, 9.271484375, 11.22265625, 13.173828125, 15.125, 17.076171875, 19.02734375, 20.978515625, 22.9296875, 24.880859375, 26.83203125, 28.783203125, 30.734375, 32.685546875, 34.63671875, 36.587890625, 38.5390625, 40.490234375, 42.44140625, 44.392578125, 46.34375, 48.294921875, 50.24609375, 52.197265625, 54.1484375, 56.099609375, 58.05078125, 60.001953125, 61.953125, 63.904296875, 65.85546875, 67.806640625, 69.7578125, 71.708984375, 73.66015625, 75.611328125, 77.5625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 7.0, 4.0, 7.0, 8.0, 12.0, 31.0, 35.0, 46.0, 73.0, 135.0, 174.0, 271.0, 425.0, 689.0, 1102.0, 2209.0, 5029.0, 15276.0, 100492.0, 855428.0, 48136.0, 10591.0, 3921.0, 1843.0, 941.0, 565.0, 387.0, 239.0, 176.0, 100.0, 60.0, 47.0, 33.0, 16.0, 12.0, 12.0, 10.0, 3.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.625, -92.814453125, -89.00390625, -85.193359375, -81.3828125, -77.572265625, -73.76171875, -69.951171875, -66.140625, -62.330078125, -58.51953125, -54.708984375, -50.8984375, -47.087890625, -43.27734375, -39.466796875, -35.65625, -31.845703125, -28.03515625, -24.224609375, -20.4140625, -16.603515625, -12.79296875, -8.982421875, -5.171875, -1.361328125, 2.44921875, 6.259765625, 10.0703125, 13.880859375, 17.69140625, 21.501953125, 25.3125, 29.123046875, 32.93359375, 36.744140625, 40.5546875, 44.365234375, 48.17578125, 51.986328125, 55.796875, 59.607421875, 63.41796875, 67.228515625, 71.0390625, 74.849609375, 78.66015625, 82.470703125, 86.28125, 90.091796875, 93.90234375, 97.712890625, 101.5234375, 105.333984375, 109.14453125, 112.955078125, 116.765625, 120.576171875, 124.38671875, 128.197265625, 132.0078125, 135.818359375, 139.62890625, 143.439453125, 147.25]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 3.0, 8.0, 5.0, 7.0, 8.0, 14.0, 16.0, 11.0, 17.0, 16.0, 27.0, 32.0, 25.0, 25.0, 40.0, 47.0, 56.0, 61.0, 63.0, 91.0, 1876.0, 88.0, 68.0, 44.0, 45.0, 49.0, 37.0, 38.0, 33.0, 22.0, 31.0, 20.0, 15.0, 19.0, 23.0, 18.0, 9.0, 11.0, 2.0, 10.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.375, -136.23046875, -131.0859375, -125.94140625, -120.796875, -115.65234375, -110.5078125, -105.36328125, -100.21875, -95.07421875, -89.9296875, -84.78515625, -79.640625, -74.49609375, -69.3515625, -64.20703125, -59.0625, -53.91796875, -48.7734375, -43.62890625, -38.484375, -33.33984375, -28.1953125, -23.05078125, -17.90625, -12.76171875, -7.6171875, -2.47265625, 2.671875, 7.81640625, 12.9609375, 18.10546875, 23.25, 28.39453125, 33.5390625, 38.68359375, 43.828125, 48.97265625, 54.1171875, 59.26171875, 64.40625, 69.55078125, 74.6953125, 79.83984375, 84.984375, 90.12890625, 95.2734375, 100.41796875, 105.5625, 110.70703125, 115.8515625, 120.99609375, 126.140625, 131.28515625, 136.4296875, 141.57421875, 146.71875, 151.86328125, 157.0078125, 162.15234375, 167.296875, 172.44140625, 177.5859375, 182.73046875, 187.875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 8.0, 6.0, 12.0, 8.0, 18.0, 16.0, 22.0, 20.0, 29.0, 35.0, 46.0, 76.0, 104.0, 158.0, 238.0, 566.0, 1481.0, 5486.0, 41483.0, 3025471.0, 60406.0, 6896.0, 1688.0, 588.0, 284.0, 168.0, 87.0, 56.0, 62.0, 45.0, 34.0, 26.0, 11.0, 10.0, 15.0, 7.0, 8.0, 5.0, 4.0, 4.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-415.5, -404.13671875, -392.7734375, -381.41015625, -370.046875, -358.68359375, -347.3203125, -335.95703125, -324.59375, -313.23046875, -301.8671875, -290.50390625, -279.140625, -267.77734375, -256.4140625, -245.05078125, -233.6875, -222.32421875, -210.9609375, -199.59765625, -188.234375, -176.87109375, -165.5078125, -154.14453125, -142.78125, -131.41796875, -120.0546875, -108.69140625, -97.328125, -85.96484375, -74.6015625, -63.23828125, -51.875, -40.51171875, -29.1484375, -17.78515625, -6.421875, 4.94140625, 16.3046875, 27.66796875, 39.03125, 50.39453125, 61.7578125, 73.12109375, 84.484375, 95.84765625, 107.2109375, 118.57421875, 129.9375, 141.30078125, 152.6640625, 164.02734375, 175.390625, 186.75390625, 198.1171875, 209.48046875, 220.84375, 232.20703125, 243.5703125, 254.93359375, 266.296875, 277.66015625, 289.0234375, 300.38671875, 311.75]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 10.0, 33.0, 226.0, 593.0, 124.0, 34.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-226.96212768554688, -191.27572631835938, -155.58934020996094, -119.90294647216797, -84.216552734375, -48.5301513671875, -12.843765258789062, 22.842620849609375, 58.529022216796875, 94.21541595458984, 129.9018096923828, 165.58819580078125, 201.27459716796875, 236.96099853515625, 272.64739990234375, 308.3337707519531, 344.0201721191406, 379.7065734863281, 415.3929443359375, 451.079345703125, 486.7657470703125, 522.4521484375, 558.1385498046875, 593.824951171875, 629.5113525390625, 665.19775390625, 700.8841552734375, 736.570556640625, 772.2569580078125, 807.943359375, 843.6296997070312, 879.3161010742188, 915.00244140625, 950.6888427734375, 986.375244140625, 1022.0616455078125, 1057.748046875, 1093.4344482421875, 1129.120849609375, 1164.80712890625, 1200.49365234375, 1236.1800537109375, 1271.866455078125, 1307.5528564453125, 1343.2392578125, 1378.9256591796875, 1414.612060546875, 1450.29833984375, 1485.9847412109375, 1521.671142578125, 1557.3575439453125, 1593.0439453125, 1628.7303466796875, 1664.416748046875, 1700.1031494140625, 1735.78955078125, 1771.475830078125, 1807.1622314453125, 1842.8486328125, 1878.5350341796875, 1914.221435546875, 1949.9078369140625, 1985.59423828125, 2021.280517578125, 2056.967041015625]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 6.0, 6.0, 6.0, 11.0, 10.0, 20.0, 13.0, 17.0, 14.0, 24.0, 26.0, 32.0, 37.0, 34.0, 48.0, 35.0, 42.0, 37.0, 45.0, 31.0, 38.0, 38.0, 43.0, 35.0, 40.0, 33.0, 33.0, 19.0, 29.0, 34.0, 21.0, 18.0, 20.0, 16.0, 22.0, 9.0, 3.0, 10.0, 5.0, 3.0, 3.0, 7.0, 8.0, 8.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-391.8494873046875, -378.2784423828125, -364.7074279785156, -351.1363830566406, -337.56536865234375, -323.99432373046875, -310.42327880859375, -296.85223388671875, -283.2812194824219, -269.7101745605469, -256.13916015625, -242.568115234375, -228.99708557128906, -215.42605590820312, -201.85501098632812, -188.2839813232422, -174.71295166015625, -161.1419219970703, -147.57089233398438, -133.99984741210938, -120.42881774902344, -106.8577880859375, -93.28675079345703, -79.71571350097656, -66.14468383789062, -52.57365036010742, -39.00261688232422, -25.431583404541016, -11.860549926757812, 1.710479736328125, 15.281517028808594, 28.852554321289062, 42.423553466796875, 55.99458694458008, 69.56562042236328, 83.13665771484375, 96.70768737792969, 110.27871704101562, 123.8497543334961, 137.42079162597656, 150.9918212890625, 164.56285095214844, 178.13388061523438, 191.70492553710938, 205.2759552001953, 218.84698486328125, 232.41802978515625, 245.9890594482422, 259.5600891113281, 273.1311340332031, 286.7021484375, 300.273193359375, 313.84423828125, 327.4152526855469, 340.9862976074219, 354.55731201171875, 368.12835693359375, 381.69940185546875, 395.2704162597656, 408.8414611816406, 422.4124755859375, 435.9835205078125, 449.5545654296875, 463.1256103515625, 476.6966247558594]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 5.0, 6.0, 8.0, 5.0, 7.0, 17.0, 11.0, 15.0, 26.0, 29.0, 26.0, 30.0, 38.0, 44.0, 37.0, 46.0, 49.0, 45.0, 49.0, 61.0, 43.0, 51.0, 44.0, 41.0, 41.0, 34.0, 28.0, 25.0, 28.0, 25.0, 15.0, 16.0, 12.0, 15.0, 6.0, 4.0, 4.0, 5.0, 6.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.1875, -48.19140625, -46.1953125, -44.19921875, -42.203125, -40.20703125, -38.2109375, -36.21484375, -34.21875, -32.22265625, -30.2265625, -28.23046875, -26.234375, -24.23828125, -22.2421875, -20.24609375, -18.25, -16.25390625, -14.2578125, -12.26171875, -10.265625, -8.26953125, -6.2734375, -4.27734375, -2.28125, -0.28515625, 1.7109375, 3.70703125, 5.703125, 7.69921875, 9.6953125, 11.69140625, 13.6875, 15.68359375, 17.6796875, 19.67578125, 21.671875, 23.66796875, 25.6640625, 27.66015625, 29.65625, 31.65234375, 33.6484375, 35.64453125, 37.640625, 39.63671875, 41.6328125, 43.62890625, 45.625, 47.62109375, 49.6171875, 51.61328125, 53.609375, 55.60546875, 57.6015625, 59.59765625, 61.59375, 63.58984375, 65.5859375, 67.58203125, 69.578125, 71.57421875, 73.5703125, 75.56640625, 77.5625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 11.0, 17.0, 37.0, 42.0, 58.0, 114.0, 161.0, 273.0, 480.0, 751.0, 1197.0, 2056.0, 3639.0, 6587.0, 13314.0, 31853.0, 197945.0, 3677950.0, 197387.0, 31404.0, 13403.0, 6732.0, 3622.0, 2045.0, 1179.0, 734.0, 459.0, 279.0, 177.0, 126.0, 74.0, 60.0, 27.0, 23.0, 12.0, 16.0, 11.0, 4.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.5, -161.1796875, -154.859375, -148.5390625, -142.21875, -135.8984375, -129.578125, -123.2578125, -116.9375, -110.6171875, -104.296875, -97.9765625, -91.65625, -85.3359375, -79.015625, -72.6953125, -66.375, -60.0546875, -53.734375, -47.4140625, -41.09375, -34.7734375, -28.453125, -22.1328125, -15.8125, -9.4921875, -3.171875, 3.1484375, 9.46875, 15.7890625, 22.109375, 28.4296875, 34.75, 41.0703125, 47.390625, 53.7109375, 60.03125, 66.3515625, 72.671875, 78.9921875, 85.3125, 91.6328125, 97.953125, 104.2734375, 110.59375, 116.9140625, 123.234375, 129.5546875, 135.875, 142.1953125, 148.515625, 154.8359375, 161.15625, 167.4765625, 173.796875, 180.1171875, 186.4375, 192.7578125, 199.078125, 205.3984375, 211.71875, 218.0390625, 224.359375, 230.6796875, 237.0]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 13.0, 7.0, 13.0, 10.0, 17.0, 36.0, 42.0, 59.0, 96.0, 198.0, 526.0, 1382.0, 993.0, 323.0, 132.0, 66.0, 31.0, 19.0, 25.0, 27.0, 9.0, 10.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.125, -132.767578125, -127.41015625, -122.052734375, -116.6953125, -111.337890625, -105.98046875, -100.623046875, -95.265625, -89.908203125, -84.55078125, -79.193359375, -73.8359375, -68.478515625, -63.12109375, -57.763671875, -52.40625, -47.048828125, -41.69140625, -36.333984375, -30.9765625, -25.619140625, -20.26171875, -14.904296875, -9.546875, -4.189453125, 1.16796875, 6.525390625, 11.8828125, 17.240234375, 22.59765625, 27.955078125, 33.3125, 38.669921875, 44.02734375, 49.384765625, 54.7421875, 60.099609375, 65.45703125, 70.814453125, 76.171875, 81.529296875, 86.88671875, 92.244140625, 97.6015625, 102.958984375, 108.31640625, 113.673828125, 119.03125, 124.388671875, 129.74609375, 135.103515625, 140.4609375, 145.818359375, 151.17578125, 156.533203125, 161.890625, 167.248046875, 172.60546875, 177.962890625, 183.3203125, 188.677734375, 194.03515625, 199.392578125, 204.75]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 8.0, 5.0, 11.0, 11.0, 29.0, 47.0, 62.0, 110.0, 209.0, 411.0, 733.0, 1334.0, 2781.0, 6129.0, 15328.0, 49409.0, 405732.0, 3564452.0, 104003.0, 26050.0, 9338.0, 4060.0, 1906.0, 954.0, 535.0, 273.0, 129.0, 106.0, 53.0, 24.0, 14.0, 13.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-365.0, -355.19921875, -345.3984375, -335.59765625, -325.796875, -315.99609375, -306.1953125, -296.39453125, -286.59375, -276.79296875, -266.9921875, -257.19140625, -247.390625, -237.58984375, -227.7890625, -217.98828125, -208.1875, -198.38671875, -188.5859375, -178.78515625, -168.984375, -159.18359375, -149.3828125, -139.58203125, -129.78125, -119.98046875, -110.1796875, -100.37890625, -90.578125, -80.77734375, -70.9765625, -61.17578125, -51.375, -41.57421875, -31.7734375, -21.97265625, -12.171875, -2.37109375, 7.4296875, 17.23046875, 27.03125, 36.83203125, 46.6328125, 56.43359375, 66.234375, 76.03515625, 85.8359375, 95.63671875, 105.4375, 115.23828125, 125.0390625, 134.83984375, 144.640625, 154.44140625, 164.2421875, 174.04296875, 183.84375, 193.64453125, 203.4453125, 213.24609375, 223.046875, 232.84765625, 242.6484375, 252.44921875, 262.25]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 11.0, 14.0, 17.0, 37.0, 50.0, 101.0, 137.0, 166.0, 171.0, 93.0, 73.0, 44.0, 20.0, 20.0, 15.0, 13.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-461.546630859375, -439.4291687011719, -417.3117370605469, -395.19427490234375, -373.07684326171875, -350.9593811035156, -328.8419189453125, -306.7244873046875, -284.6070251464844, -262.48956298828125, -240.37213134765625, -218.25466918945312, -196.13722229003906, -174.019775390625, -151.90231323242188, -129.7848663330078, -107.66741943359375, -85.54997253417969, -63.432518005371094, -41.3150634765625, -19.197616577148438, 2.919830322265625, 25.03729248046875, 47.15473937988281, 69.27218627929688, 91.38963317871094, 113.50708770751953, 135.62454223632812, 157.7419891357422, 179.85943603515625, 201.97689819335938, 224.09434509277344, 246.21173095703125, 268.3291931152344, 290.4466247558594, 312.5640869140625, 334.6815185546875, 356.7989807128906, 378.91644287109375, 401.03387451171875, 423.1513366699219, 445.268798828125, 467.38623046875, 489.5036926269531, 511.62115478515625, 533.7385864257812, 555.8560791015625, 577.9735107421875, 600.0909423828125, 622.2083740234375, 644.3258666992188, 666.4432983398438, 688.5607299804688, 710.67822265625, 732.795654296875, 754.9130859375, 777.030517578125, 799.14794921875, 821.2654418945312, 843.3828735351562, 865.5003051757812, 887.6177978515625, 909.7352294921875, 931.8526611328125, 953.9701538085938]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 6.0, 7.0, 6.0, 9.0, 13.0, 12.0, 18.0, 11.0, 24.0, 22.0, 25.0, 23.0, 30.0, 26.0, 40.0, 31.0, 35.0, 37.0, 30.0, 34.0, 40.0, 49.0, 38.0, 50.0, 36.0, 36.0, 33.0, 38.0, 44.0, 23.0, 28.0, 22.0, 20.0, 18.0, 15.0, 13.0, 9.0, 11.0, 9.0, 6.0, 8.0, 7.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-311.7288818359375, -301.2641296386719, -290.79937744140625, -280.3345947265625, -269.8698425292969, -259.40509033203125, -248.94033813476562, -238.4755859375, -228.0108184814453, -217.5460662841797, -207.081298828125, -196.61654663085938, -186.15179443359375, -175.68702697753906, -165.22227478027344, -154.75750732421875, -144.29275512695312, -133.8280029296875, -123.36323547363281, -112.89848327636719, -102.43372344970703, -91.96896362304688, -81.50421142578125, -71.0394515991211, -60.57469177246094, -50.10993194580078, -39.64517593383789, -29.180418014526367, -18.715660095214844, -8.250900268554688, 2.213855743408203, 12.678611755371094, 23.143341064453125, 33.60810089111328, 44.07285690307617, 54.53761291503906, 65.00237274169922, 75.46713256835938, 85.931884765625, 96.39664459228516, 106.86140441894531, 117.32616424560547, 127.79092407226562, 138.25567626953125, 148.72042846679688, 159.18519592285156, 169.6499481201172, 180.11471557617188, 190.5794677734375, 201.04421997070312, 211.5089874267578, 221.97373962402344, 232.43850708007812, 242.90325927734375, 253.36801147460938, 263.832763671875, 274.29754638671875, 284.7622985839844, 295.22705078125, 305.69183349609375, 316.1565856933594, 326.621337890625, 337.0860900878906, 347.55084228515625, 358.0155944824219]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 7.0, 13.0, 6.0, 15.0, 13.0, 12.0, 15.0, 27.0, 20.0, 21.0, 17.0, 28.0, 26.0, 35.0, 43.0, 40.0, 29.0, 34.0, 39.0, 35.0, 38.0, 44.0, 38.0, 48.0, 28.0, 40.0, 23.0, 34.0, 22.0, 22.0, 30.0, 14.0, 24.0, 16.0, 14.0, 21.0, 10.0, 9.0, 8.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-51.09375, -49.39599609375, -47.6982421875, -46.00048828125, -44.302734375, -42.60498046875, -40.9072265625, -39.20947265625, -37.51171875, -35.81396484375, -34.1162109375, -32.41845703125, -30.720703125, -29.02294921875, -27.3251953125, -25.62744140625, -23.9296875, -22.23193359375, -20.5341796875, -18.83642578125, -17.138671875, -15.44091796875, -13.7431640625, -12.04541015625, -10.34765625, -8.64990234375, -6.9521484375, -5.25439453125, -3.556640625, -1.85888671875, -0.1611328125, 1.53662109375, 3.234375, 4.93212890625, 6.6298828125, 8.32763671875, 10.025390625, 11.72314453125, 13.4208984375, 15.11865234375, 16.81640625, 18.51416015625, 20.2119140625, 21.90966796875, 23.607421875, 25.30517578125, 27.0029296875, 28.70068359375, 30.3984375, 32.09619140625, 33.7939453125, 35.49169921875, 37.189453125, 38.88720703125, 40.5849609375, 42.28271484375, 43.98046875, 45.67822265625, 47.3759765625, 49.07373046875, 50.771484375, 52.46923828125, 54.1669921875, 55.86474609375, 57.5625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 6.0, 23.0, 31.0, 69.0, 83.0, 142.0, 168.0, 262.0, 408.0, 679.0, 1024.0, 1447.0, 2237.0, 3501.0, 5433.0, 8270.0, 12824.0, 19894.0, 31986.0, 53018.0, 97708.0, 227924.0, 314887.0, 110486.0, 59468.0, 35102.0, 21778.0, 13767.0, 9053.0, 5934.0, 3740.0, 2447.0, 1599.0, 1095.0, 729.0, 454.0, 290.0, 211.0, 122.0, 94.0, 57.0, 37.0, 22.0, 19.0, 8.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.20703125, -2.133697509765625, -2.06036376953125, -1.987030029296875, -1.9136962890625, -1.840362548828125, -1.76702880859375, -1.693695068359375, -1.620361328125, -1.547027587890625, -1.47369384765625, -1.400360107421875, -1.3270263671875, -1.253692626953125, -1.18035888671875, -1.107025146484375, -1.03369140625, -0.960357666015625, -0.88702392578125, -0.813690185546875, -0.7403564453125, -0.667022705078125, -0.59368896484375, -0.520355224609375, -0.447021484375, -0.373687744140625, -0.30035400390625, -0.227020263671875, -0.1536865234375, -0.080352783203125, -0.00701904296875, 0.066314697265625, 0.1396484375, 0.212982177734375, 0.28631591796875, 0.359649658203125, 0.4329833984375, 0.506317138671875, 0.57965087890625, 0.652984619140625, 0.726318359375, 0.799652099609375, 0.87298583984375, 0.946319580078125, 1.0196533203125, 1.092987060546875, 1.16632080078125, 1.239654541015625, 1.31298828125, 1.386322021484375, 1.45965576171875, 1.532989501953125, 1.6063232421875, 1.679656982421875, 1.75299072265625, 1.826324462890625, 1.899658203125, 1.972991943359375, 2.04632568359375, 2.119659423828125, 2.1929931640625, 2.266326904296875, 2.33966064453125, 2.412994384765625, 2.486328125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 7.0, 2.0, 5.0, 8.0, 6.0, 13.0, 16.0, 15.0, 15.0, 21.0, 20.0, 25.0, 30.0, 27.0, 26.0, 31.0, 35.0, 30.0, 30.0, 32.0, 37.0, 30.0, 42.0, 1069.0, 37.0, 31.0, 26.0, 42.0, 40.0, 35.0, 27.0, 24.0, 19.0, 18.0, 24.0, 27.0, 19.0, 18.0, 13.0, 12.0, 12.0, 5.0, 10.0, 7.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.28125, -29.2158203125, -28.150390625, -27.0849609375, -26.01953125, -24.9541015625, -23.888671875, -22.8232421875, -21.7578125, -20.6923828125, -19.626953125, -18.5615234375, -17.49609375, -16.4306640625, -15.365234375, -14.2998046875, -13.234375, -12.1689453125, -11.103515625, -10.0380859375, -8.97265625, -7.9072265625, -6.841796875, -5.7763671875, -4.7109375, -3.6455078125, -2.580078125, -1.5146484375, -0.44921875, 0.6162109375, 1.681640625, 2.7470703125, 3.8125, 4.8779296875, 5.943359375, 7.0087890625, 8.07421875, 9.1396484375, 10.205078125, 11.2705078125, 12.3359375, 13.4013671875, 14.466796875, 15.5322265625, 16.59765625, 17.6630859375, 18.728515625, 19.7939453125, 20.859375, 21.9248046875, 22.990234375, 24.0556640625, 25.12109375, 26.1865234375, 27.251953125, 28.3173828125, 29.3828125, 30.4482421875, 31.513671875, 32.5791015625, 33.64453125, 34.7099609375, 35.775390625, 36.8408203125, 37.90625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 3.0, 6.0, 20.0, 27.0, 28.0, 42.0, 48.0, 76.0, 149.0, 183.0, 239.0, 411.0, 628.0, 839.0, 1277.0, 1900.0, 2764.0, 4219.0, 6270.0, 9590.0, 14603.0, 22226.0, 34100.0, 53661.0, 88102.0, 163185.0, 1358802.0, 127239.0, 73643.0, 46236.0, 29574.0, 19229.0, 12722.0, 8447.0, 5612.0, 3620.0, 2399.0, 1592.0, 1121.0, 691.0, 488.0, 347.0, 233.0, 169.0, 110.0, 81.0, 48.0, 53.0, 30.0, 17.0, 10.0, 7.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.5517578125, -1.503753662109375, -1.45574951171875, -1.407745361328125, -1.3597412109375, -1.311737060546875, -1.26373291015625, -1.215728759765625, -1.167724609375, -1.119720458984375, -1.07171630859375, -1.023712158203125, -0.9757080078125, -0.927703857421875, -0.87969970703125, -0.831695556640625, -0.78369140625, -0.735687255859375, -0.68768310546875, -0.639678955078125, -0.5916748046875, -0.543670654296875, -0.49566650390625, -0.447662353515625, -0.399658203125, -0.351654052734375, -0.30364990234375, -0.255645751953125, -0.2076416015625, -0.159637451171875, -0.11163330078125, -0.063629150390625, -0.015625, 0.032379150390625, 0.08038330078125, 0.128387451171875, 0.1763916015625, 0.224395751953125, 0.27239990234375, 0.320404052734375, 0.368408203125, 0.416412353515625, 0.46441650390625, 0.512420654296875, 0.5604248046875, 0.608428955078125, 0.65643310546875, 0.704437255859375, 0.75244140625, 0.800445556640625, 0.84844970703125, 0.896453857421875, 0.9444580078125, 0.992462158203125, 1.04046630859375, 1.088470458984375, 1.136474609375, 1.184478759765625, 1.23248291015625, 1.280487060546875, 1.3284912109375, 1.376495361328125, 1.42449951171875, 1.472503662109375, 1.5205078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 8.0, 13.0, 11.0, 19.0, 19.0, 26.0, 35.0, 48.0, 82.0, 132.0, 228.0, 109.0, 49.0, 46.0, 29.0, 33.0, 20.0, 24.0, 12.0, 10.0, 2.0, 3.0, 8.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011795759201049805, -0.00011380109935998917, -0.00010964460670948029, -0.0001054881140589714, -0.00010133162140846252, -9.717512875795364e-05, -9.301863610744476e-05, -8.886214345693588e-05, -8.4705650806427e-05, -8.054915815591812e-05, -7.639266550540924e-05, -7.223617285490036e-05, -6.807968020439148e-05, -6.39231875538826e-05, -5.976669490337372e-05, -5.561020225286484e-05, -5.145370960235596e-05, -4.7297216951847076e-05, -4.3140724301338196e-05, -3.8984231650829315e-05, -3.4827739000320435e-05, -3.0671246349811554e-05, -2.6514753699302673e-05, -2.2358261048793793e-05, -1.8201768398284912e-05, -1.4045275747776031e-05, -9.888783097267151e-06, -5.73229044675827e-06, -1.5757977962493896e-06, 2.580694854259491e-06, 6.737187504768372e-06, 1.0893680155277252e-05, 1.5050172805786133e-05, 1.9206665456295013e-05, 2.3363158106803894e-05, 2.7519650757312775e-05, 3.1676143407821655e-05, 3.5832636058330536e-05, 3.9989128708839417e-05, 4.41456213593483e-05, 4.830211400985718e-05, 5.245860666036606e-05, 5.661509931087494e-05, 6.077159196138382e-05, 6.49280846118927e-05, 6.908457726240158e-05, 7.324106991291046e-05, 7.739756256341934e-05, 8.155405521392822e-05, 8.57105478644371e-05, 8.986704051494598e-05, 9.402353316545486e-05, 9.818002581596375e-05, 0.00010233651846647263, 0.0001064930111169815, 0.00011064950376749039, 0.00011480599641799927, 0.00011896248906850815, 0.00012311898171901703, 0.0001272754743695259, 0.0001314319670200348, 0.00013558845967054367, 0.00013974495232105255, 0.00014390144497156143, 0.0001480579376220703]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 6.0, 9.0, 24.0, 20.0, 27.0, 42.0, 72.0, 91.0, 143.0, 598.0, 11952.0, 996239.0, 37514.0, 1261.0, 208.0, 105.0, 66.0, 37.0, 30.0, 23.0, 19.0, 17.0, 12.0, 9.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0025234222412109375, -0.0024526119232177734, -0.0023818016052246094, -0.0023109912872314453, -0.0022401809692382812, -0.002169370651245117, -0.002098560333251953, -0.002027750015258789, -0.001956939697265625, -0.001886129379272461, -0.0018153190612792969, -0.0017445087432861328, -0.0016736984252929688, -0.0016028881072998047, -0.0015320777893066406, -0.0014612674713134766, -0.0013904571533203125, -0.0013196468353271484, -0.0012488365173339844, -0.0011780261993408203, -0.0011072158813476562, -0.0010364055633544922, -0.0009655952453613281, -0.0008947849273681641, -0.000823974609375, -0.0007531642913818359, -0.0006823539733886719, -0.0006115436553955078, -0.0005407333374023438, -0.0004699230194091797, -0.0003991127014160156, -0.00032830238342285156, -0.0002574920654296875, -0.00018668174743652344, -0.00011587142944335938, -4.506111145019531e-05, 2.574920654296875e-05, 9.655952453613281e-05, 0.00016736984252929688, 0.00023818016052246094, 0.000308990478515625, 0.00037980079650878906, 0.0004506111145019531, 0.0005214214324951172, 0.0005922317504882812, 0.0006630420684814453, 0.0007338523864746094, 0.0008046627044677734, 0.0008754730224609375, 0.0009462833404541016, 0.0010170936584472656, 0.0010879039764404297, 0.0011587142944335938, 0.0012295246124267578, 0.0013003349304199219, 0.001371145248413086, 0.00144195556640625, 0.001512765884399414, 0.0015835762023925781, 0.0016543865203857422, 0.0017251968383789062, 0.0017960071563720703, 0.0018668174743652344, 0.0019376277923583984, 0.0020084381103515625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 11.0, 14.0, 20.0, 34.0, 36.0, 61.0, 101.0, 182.0, 173.0, 148.0, 75.0, 53.0, 31.0, 18.0, 12.0, 12.0, 8.0, 2.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.00013911361747886986, -0.00013616749492939562, -0.00013322137237992138, -0.00013027524983044714, -0.0001273291272809729, -0.0001243830192834139, -0.00012143688945798203, -0.0001184907669085078, -0.00011554465163499117, -0.00011259852908551693, -0.00010965240653604269, -0.00010670628398656845, -0.00010376016871305183, -0.00010081404616357759, -9.786792361410335e-05, -9.492180106462911e-05, -9.197567851515487e-05, -8.902955596568063e-05, -8.608343341620639e-05, -8.313731814268976e-05, -8.019119559321553e-05, -7.724507304374129e-05, -7.429895049426705e-05, -7.135282794479281e-05, -6.840670539531857e-05, -6.546058284584433e-05, -6.251446029637009e-05, -5.956834138487466e-05, -5.6622222473379225e-05, -5.3676099923904985e-05, -5.0729977374430746e-05, -4.7783854824956506e-05, -4.483774318941869e-05, -4.189162063994445e-05, -3.894550172844902e-05, -3.599937917897478e-05, -3.305325662950054e-05, -3.0107137718005106e-05, -2.7161015168530867e-05, -2.421489443804603e-05, -2.1268773707561195e-05, -1.832265297707636e-05, -1.5376532246591523e-05, -1.2430409697117284e-05, -9.484288966632448e-06, -6.538168236147612e-06, -3.592045686673373e-06, -6.459249561885372e-07, 2.3001957742962986e-06, 5.246316959528485e-06, 8.192438144760672e-06, 1.113855978474021e-05, 1.4084680515225045e-05, 1.703080124570988e-05, 1.997692379518412e-05, 2.2923044525668956e-05, 2.5869165256153792e-05, 2.8815285986638628e-05, 3.1761406717123464e-05, 3.47075292665977e-05, 3.7653648178093135e-05, 4.0599770727567375e-05, 4.3545893277041614e-05, 4.6492015826515853e-05, 4.9438134738011286e-05]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 11.0, 3.0, 4.0, 15.0, 14.0, 11.0, 21.0, 19.0, 26.0, 33.0, 27.0, 23.0, 33.0, 27.0, 42.0, 36.0, 39.0, 40.0, 36.0, 45.0, 28.0, 43.0, 40.0, 32.0, 38.0, 33.0, 37.0, 29.0, 28.0, 28.0, 22.0, 17.0, 20.0, 19.0, 13.0, 10.0, 13.0, 13.0, 3.0, 6.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64320182800293e-05, -4.494842141866684e-05, -4.346482455730438e-05, -4.1981227695941925e-05, -4.049763083457947e-05, -3.901403397321701e-05, -3.753043711185455e-05, -3.6046840250492096e-05, -3.456324338912964e-05, -3.307964652776718e-05, -3.1596049666404724e-05, -3.0112452805042267e-05, -2.862885594367981e-05, -2.7145259082317352e-05, -2.5661662220954895e-05, -2.4178065359592438e-05, -2.269446849822998e-05, -2.1210871636867523e-05, -1.9727274775505066e-05, -1.824367791414261e-05, -1.676008105278015e-05, -1.5276484191417694e-05, -1.3792887330055237e-05, -1.230929046869278e-05, -1.0825693607330322e-05, -9.342096745967865e-06, -7.858499884605408e-06, -6.3749030232429504e-06, -4.891306161880493e-06, -3.407709300518036e-06, -1.9241124391555786e-06, -4.4051557779312134e-07, 1.043081283569336e-06, 2.5266781449317932e-06, 4.0102750062942505e-06, 5.493871867656708e-06, 6.977468729019165e-06, 8.461065590381622e-06, 9.94466245174408e-06, 1.1428259313106537e-05, 1.2911856174468994e-05, 1.4395453035831451e-05, 1.587904989719391e-05, 1.7362646758556366e-05, 1.8846243619918823e-05, 2.032984048128128e-05, 2.1813437342643738e-05, 2.3297034204006195e-05, 2.4780631065368652e-05, 2.626422792673111e-05, 2.7747824788093567e-05, 2.9231421649456024e-05, 3.071501851081848e-05, 3.219861537218094e-05, 3.3682212233543396e-05, 3.516580909490585e-05, 3.664940595626831e-05, 3.813300281763077e-05, 3.9616599678993225e-05, 4.110019654035568e-05, 4.258379340171814e-05, 4.40673902630806e-05, 4.5550987124443054e-05, 4.703458398580551e-05, 4.851818084716797e-05]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 7.0, 13.0, 6.0, 15.0, 13.0, 12.0, 15.0, 27.0, 20.0, 21.0, 17.0, 28.0, 26.0, 35.0, 43.0, 40.0, 29.0, 34.0, 39.0, 35.0, 38.0, 44.0, 38.0, 48.0, 28.0, 40.0, 23.0, 34.0, 22.0, 22.0, 30.0, 14.0, 24.0, 16.0, 14.0, 21.0, 10.0, 9.0, 8.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-51.09375, -49.39599609375, -47.6982421875, -46.00048828125, -44.302734375, -42.60498046875, -40.9072265625, -39.20947265625, -37.51171875, -35.81396484375, -34.1162109375, -32.41845703125, -30.720703125, -29.02294921875, -27.3251953125, -25.62744140625, -23.9296875, -22.23193359375, -20.5341796875, -18.83642578125, -17.138671875, -15.44091796875, -13.7431640625, -12.04541015625, -10.34765625, -8.64990234375, -6.9521484375, -5.25439453125, -3.556640625, -1.85888671875, -0.1611328125, 1.53662109375, 3.234375, 4.93212890625, 6.6298828125, 8.32763671875, 10.025390625, 11.72314453125, 13.4208984375, 15.11865234375, 16.81640625, 18.51416015625, 20.2119140625, 21.90966796875, 23.607421875, 25.30517578125, 27.0029296875, 28.70068359375, 30.3984375, 32.09619140625, 33.7939453125, 35.49169921875, 37.189453125, 38.88720703125, 40.5849609375, 42.28271484375, 43.98046875, 45.67822265625, 47.3759765625, 49.07373046875, 50.771484375, 52.46923828125, 54.1669921875, 55.86474609375, 57.5625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 5.0, 3.0, 5.0, 7.0, 3.0, 1.0, 5.0, 10.0, 16.0, 24.0, 23.0, 22.0, 30.0, 42.0, 50.0, 77.0, 89.0, 146.0, 186.0, 289.0, 460.0, 779.0, 1259.0, 2178.0, 3874.0, 7653.0, 19279.0, 251311.0, 714271.0, 26164.0, 9276.0, 4603.0, 2489.0, 1448.0, 829.0, 537.0, 323.0, 202.0, 149.0, 114.0, 71.0, 47.0, 51.0, 35.0, 27.0, 19.0, 18.0, 13.0, 11.0, 12.0, 5.0, 6.0, 2.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-117.0, -113.115234375, -109.23046875, -105.345703125, -101.4609375, -97.576171875, -93.69140625, -89.806640625, -85.921875, -82.037109375, -78.15234375, -74.267578125, -70.3828125, -66.498046875, -62.61328125, -58.728515625, -54.84375, -50.958984375, -47.07421875, -43.189453125, -39.3046875, -35.419921875, -31.53515625, -27.650390625, -23.765625, -19.880859375, -15.99609375, -12.111328125, -8.2265625, -4.341796875, -0.45703125, 3.427734375, 7.3125, 11.197265625, 15.08203125, 18.966796875, 22.8515625, 26.736328125, 30.62109375, 34.505859375, 38.390625, 42.275390625, 46.16015625, 50.044921875, 53.9296875, 57.814453125, 61.69921875, 65.583984375, 69.46875, 73.353515625, 77.23828125, 81.123046875, 85.0078125, 88.892578125, 92.77734375, 96.662109375, 100.546875, 104.431640625, 108.31640625, 112.201171875, 116.0859375, 119.970703125, 123.85546875, 127.740234375, 131.625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 7.0, 4.0, 7.0, 4.0, 8.0, 14.0, 11.0, 17.0, 19.0, 20.0, 26.0, 25.0, 37.0, 24.0, 39.0, 29.0, 41.0, 56.0, 36.0, 63.0, 1563.0, 473.0, 70.0, 56.0, 41.0, 52.0, 43.0, 18.0, 28.0, 33.0, 29.0, 33.0, 20.0, 19.0, 13.0, 18.0, 13.0, 4.0, 9.0, 7.0, 9.0, 8.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.5, -129.515625, -124.53125, -119.546875, -114.5625, -109.578125, -104.59375, -99.609375, -94.625, -89.640625, -84.65625, -79.671875, -74.6875, -69.703125, -64.71875, -59.734375, -54.75, -49.765625, -44.78125, -39.796875, -34.8125, -29.828125, -24.84375, -19.859375, -14.875, -9.890625, -4.90625, 0.078125, 5.0625, 10.046875, 15.03125, 20.015625, 25.0, 29.984375, 34.96875, 39.953125, 44.9375, 49.921875, 54.90625, 59.890625, 64.875, 69.859375, 74.84375, 79.828125, 84.8125, 89.796875, 94.78125, 99.765625, 104.75, 109.734375, 114.71875, 119.703125, 124.6875, 129.671875, 134.65625, 139.640625, 144.625, 149.609375, 154.59375, 159.578125, 164.5625, 169.546875, 174.53125, 179.515625, 184.5]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 10.0, 6.0, 9.0, 11.0, 10.0, 21.0, 25.0, 26.0, 49.0, 63.0, 116.0, 165.0, 302.0, 566.0, 1119.0, 2033.0, 4390.0, 9987.0, 41351.0, 3027413.0, 39278.0, 9998.0, 4257.0, 2141.0, 1043.0, 578.0, 263.0, 158.0, 91.0, 73.0, 36.0, 34.0, 17.0, 19.0, 7.0, 11.0, 7.0, 7.0, 2.0, 0.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-452.75, -439.23046875, -425.7109375, -412.19140625, -398.671875, -385.15234375, -371.6328125, -358.11328125, -344.59375, -331.07421875, -317.5546875, -304.03515625, -290.515625, -276.99609375, -263.4765625, -249.95703125, -236.4375, -222.91796875, -209.3984375, -195.87890625, -182.359375, -168.83984375, -155.3203125, -141.80078125, -128.28125, -114.76171875, -101.2421875, -87.72265625, -74.203125, -60.68359375, -47.1640625, -33.64453125, -20.125, -6.60546875, 6.9140625, 20.43359375, 33.953125, 47.47265625, 60.9921875, 74.51171875, 88.03125, 101.55078125, 115.0703125, 128.58984375, 142.109375, 155.62890625, 169.1484375, 182.66796875, 196.1875, 209.70703125, 223.2265625, 236.74609375, 250.265625, 263.78515625, 277.3046875, 290.82421875, 304.34375, 317.86328125, 331.3828125, 344.90234375, 358.421875, 371.94140625, 385.4609375, 398.98046875, 412.5]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 13.0, 11.0, 18.0, 15.0, 26.0, 37.0, 55.0, 69.0, 75.0, 107.0, 146.0, 109.0, 70.0, 66.0, 36.0, 28.0, 27.0, 18.0, 10.0, 15.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-338.05255126953125, -326.4740295410156, -314.8955383300781, -303.3170166015625, -291.738525390625, -280.1600036621094, -268.58148193359375, -257.00299072265625, -245.42446899414062, -233.84596252441406, -222.2674560546875, -210.68893432617188, -199.1104278564453, -187.53192138671875, -175.95339965820312, -164.37489318847656, -152.79638671875, -141.21788024902344, -129.63937377929688, -118.06085205078125, -106.48234558105469, -94.90383911132812, -83.32532501220703, -71.74681091308594, -60.168304443359375, -48.58979415893555, -37.01128387451172, -25.43277359008789, -13.854263305664062, -2.2757530212402344, 9.302757263183594, 20.881271362304688, 32.45977783203125, 44.03828811645508, 55.616798400878906, 67.1953125, 78.77381896972656, 90.35232543945312, 101.93083953857422, 113.50935363769531, 125.08786010742188, 136.66636657714844, 148.244873046875, 159.82339477539062, 171.4019012451172, 182.98040771484375, 194.55892944335938, 206.13743591308594, 217.7159423828125, 229.29444885253906, 240.87295532226562, 252.45147705078125, 264.02996826171875, 275.6084899902344, 287.18701171875, 298.7655029296875, 310.3440246582031, 321.92254638671875, 333.50103759765625, 345.0795593261719, 356.6580810546875, 368.236572265625, 379.8150939941406, 391.39361572265625, 402.97210693359375]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 5.0, 11.0, 9.0, 12.0, 15.0, 14.0, 24.0, 27.0, 17.0, 36.0, 26.0, 38.0, 39.0, 41.0, 50.0, 41.0, 49.0, 47.0, 42.0, 53.0, 55.0, 35.0, 48.0, 29.0, 42.0, 28.0, 26.0, 14.0, 18.0, 20.0, 14.0, 15.0, 12.0, 10.0, 11.0, 4.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-521.4607543945312, -506.02197265625, -490.58319091796875, -475.1444091796875, -459.70562744140625, -444.266845703125, -428.8280944824219, -413.3893127441406, -397.9505310058594, -382.5117492675781, -367.0729675292969, -351.6341857910156, -336.1954345703125, -320.75665283203125, -305.31787109375, -289.87908935546875, -274.4403076171875, -259.00152587890625, -243.562744140625, -228.1239776611328, -212.68519592285156, -197.2464141845703, -181.80764770507812, -166.36886596679688, -150.93008422851562, -135.49130249023438, -120.05252838134766, -104.61375427246094, -89.17497253417969, -73.73619079589844, -58.29741668701172, -42.858642578125, -27.419891357421875, -11.98111343383789, 3.4576644897460938, 18.896442413330078, 34.33522033691406, 49.77400207519531, 65.21277618408203, 80.65155029296875, 96.09033203125, 111.52911376953125, 126.96788787841797, 142.4066619873047, 157.84544372558594, 173.2842254638672, 188.72299194335938, 204.16177368164062, 219.60055541992188, 235.03933715820312, 250.47811889648438, 265.9169006347656, 281.35565185546875, 296.79443359375, 312.23321533203125, 327.6719970703125, 343.11077880859375, 358.549560546875, 373.98834228515625, 389.4271240234375, 404.86590576171875, 420.3046875, 435.7434387207031, 451.1822204589844, 466.6210021972656]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 9.0, 7.0, 9.0, 16.0, 17.0, 20.0, 21.0, 17.0, 23.0, 21.0, 17.0, 28.0, 36.0, 32.0, 44.0, 33.0, 41.0, 41.0, 50.0, 31.0, 43.0, 39.0, 30.0, 38.0, 30.0, 27.0, 34.0, 36.0, 29.0, 29.0, 24.0, 22.0, 14.0, 17.0, 16.0, 9.0, 9.0, 2.0, 8.0, 5.0, 2.0, 5.0, 7.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.75, -56.8779296875, -55.005859375, -53.1337890625, -51.26171875, -49.3896484375, -47.517578125, -45.6455078125, -43.7734375, -41.9013671875, -40.029296875, -38.1572265625, -36.28515625, -34.4130859375, -32.541015625, -30.6689453125, -28.796875, -26.9248046875, -25.052734375, -23.1806640625, -21.30859375, -19.4365234375, -17.564453125, -15.6923828125, -13.8203125, -11.9482421875, -10.076171875, -8.2041015625, -6.33203125, -4.4599609375, -2.587890625, -0.7158203125, 1.15625, 3.0283203125, 4.900390625, 6.7724609375, 8.64453125, 10.5166015625, 12.388671875, 14.2607421875, 16.1328125, 18.0048828125, 19.876953125, 21.7490234375, 23.62109375, 25.4931640625, 27.365234375, 29.2373046875, 31.109375, 32.9814453125, 34.853515625, 36.7255859375, 38.59765625, 40.4697265625, 42.341796875, 44.2138671875, 46.0859375, 47.9580078125, 49.830078125, 51.7021484375, 53.57421875, 55.4462890625, 57.318359375, 59.1904296875, 61.0625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 10.0, 6.0, 13.0, 17.0, 17.0, 33.0, 47.0, 56.0, 69.0, 83.0, 141.0, 186.0, 241.0, 293.0, 430.0, 614.0, 839.0, 1173.0, 1770.0, 2563.0, 3952.0, 6550.0, 10984.0, 20086.0, 46648.0, 431247.0, 3302189.0, 278464.0, 39358.0, 18230.0, 10101.0, 5902.0, 3778.0, 2459.0, 1609.0, 1101.0, 816.0, 550.0, 438.0, 279.0, 262.0, 162.0, 136.0, 87.0, 78.0, 69.0, 36.0, 38.0, 20.0, 12.0, 17.0, 13.0, 3.0, 6.0, 5.0], "bins": [-168.125, -163.37890625, -158.6328125, -153.88671875, -149.140625, -144.39453125, -139.6484375, -134.90234375, -130.15625, -125.41015625, -120.6640625, -115.91796875, -111.171875, -106.42578125, -101.6796875, -96.93359375, -92.1875, -87.44140625, -82.6953125, -77.94921875, -73.203125, -68.45703125, -63.7109375, -58.96484375, -54.21875, -49.47265625, -44.7265625, -39.98046875, -35.234375, -30.48828125, -25.7421875, -20.99609375, -16.25, -11.50390625, -6.7578125, -2.01171875, 2.734375, 7.48046875, 12.2265625, 16.97265625, 21.71875, 26.46484375, 31.2109375, 35.95703125, 40.703125, 45.44921875, 50.1953125, 54.94140625, 59.6875, 64.43359375, 69.1796875, 73.92578125, 78.671875, 83.41796875, 88.1640625, 92.91015625, 97.65625, 102.40234375, 107.1484375, 111.89453125, 116.640625, 121.38671875, 126.1328125, 130.87890625, 135.625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 9.0, 5.0, 8.0, 17.0, 16.0, 15.0, 34.0, 47.0, 63.0, 97.0, 214.0, 556.0, 1429.0, 874.0, 304.0, 123.0, 71.0, 44.0, 43.0, 21.0, 15.0, 18.0, 8.0, 6.0, 11.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-217.625, -212.4052734375, -207.185546875, -201.9658203125, -196.74609375, -191.5263671875, -186.306640625, -181.0869140625, -175.8671875, -170.6474609375, -165.427734375, -160.2080078125, -154.98828125, -149.7685546875, -144.548828125, -139.3291015625, -134.109375, -128.8896484375, -123.669921875, -118.4501953125, -113.23046875, -108.0107421875, -102.791015625, -97.5712890625, -92.3515625, -87.1318359375, -81.912109375, -76.6923828125, -71.47265625, -66.2529296875, -61.033203125, -55.8134765625, -50.59375, -45.3740234375, -40.154296875, -34.9345703125, -29.71484375, -24.4951171875, -19.275390625, -14.0556640625, -8.8359375, -3.6162109375, 1.603515625, 6.8232421875, 12.04296875, 17.2626953125, 22.482421875, 27.7021484375, 32.921875, 38.1416015625, 43.361328125, 48.5810546875, 53.80078125, 59.0205078125, 64.240234375, 69.4599609375, 74.6796875, 79.8994140625, 85.119140625, 90.3388671875, 95.55859375, 100.7783203125, 105.998046875, 111.2177734375, 116.4375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 8.0, 8.0, 9.0, 15.0, 20.0, 29.0, 34.0, 54.0, 90.0, 126.0, 228.0, 495.0, 1056.0, 2270.0, 5228.0, 13715.0, 46977.0, 627373.0, 3389391.0, 76061.0, 18764.0, 6858.0, 2835.0, 1222.0, 625.0, 306.0, 183.0, 94.0, 52.0, 39.0, 26.0, 22.0, 14.0, 17.0, 11.0, 10.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-327.25, -316.39453125, -305.5390625, -294.68359375, -283.828125, -272.97265625, -262.1171875, -251.26171875, -240.40625, -229.55078125, -218.6953125, -207.83984375, -196.984375, -186.12890625, -175.2734375, -164.41796875, -153.5625, -142.70703125, -131.8515625, -120.99609375, -110.140625, -99.28515625, -88.4296875, -77.57421875, -66.71875, -55.86328125, -45.0078125, -34.15234375, -23.296875, -12.44140625, -1.5859375, 9.26953125, 20.125, 30.98046875, 41.8359375, 52.69140625, 63.546875, 74.40234375, 85.2578125, 96.11328125, 106.96875, 117.82421875, 128.6796875, 139.53515625, 150.390625, 161.24609375, 172.1015625, 182.95703125, 193.8125, 204.66796875, 215.5234375, 226.37890625, 237.234375, 248.08984375, 258.9453125, 269.80078125, 280.65625, 291.51171875, 302.3671875, 313.22265625, 324.078125, 334.93359375, 345.7890625, 356.64453125, 367.5]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 10.0, 6.0, 7.0, 12.0, 26.0, 25.0, 43.0, 46.0, 74.0, 114.0, 147.0, 123.0, 123.0, 73.0, 62.0, 34.0, 29.0, 19.0, 13.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-885.46875, -866.6326904296875, -847.796630859375, -828.9605712890625, -810.12451171875, -791.2884521484375, -772.452392578125, -753.6163330078125, -734.7802734375, -715.9442138671875, -697.108154296875, -678.2720947265625, -659.43603515625, -640.5999755859375, -621.763916015625, -602.9278564453125, -584.0918579101562, -565.2557983398438, -546.4197387695312, -527.5836791992188, -508.74761962890625, -489.91156005859375, -471.0755310058594, -452.2394714355469, -433.4034118652344, -414.5673522949219, -395.7312927246094, -376.8952331542969, -358.0592041015625, -339.22314453125, -320.3870849609375, -301.551025390625, -282.71490478515625, -263.87884521484375, -245.04278564453125, -226.2067413330078, -207.3706817626953, -188.5346221923828, -169.69857788085938, -150.86251831054688, -132.02645874023438, -113.19039916992188, -94.3543472290039, -75.51829528808594, -56.68223571777344, -37.84617614746094, -19.01012420654297, -0.174072265625, 18.6619873046875, 37.498043060302734, 56.33409881591797, 75.17015075683594, 94.00621032714844, 112.84226989746094, 131.67831420898438, 150.51437377929688, 169.35043334960938, 188.18649291992188, 207.02255249023438, 225.8585968017578, 244.6946563720703, 263.53070068359375, 282.36676025390625, 301.20281982421875, 320.03887939453125]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 5.0, 11.0, 11.0, 6.0, 20.0, 15.0, 28.0, 23.0, 22.0, 34.0, 25.0, 34.0, 30.0, 40.0, 38.0, 31.0, 44.0, 31.0, 43.0, 38.0, 47.0, 37.0, 39.0, 39.0, 37.0, 27.0, 21.0, 31.0, 37.0, 26.0, 20.0, 23.0, 12.0, 15.0, 9.0, 7.0, 14.0, 7.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-360.9302673339844, -349.7471008300781, -338.5639343261719, -327.3807678222656, -316.1976013183594, -305.0144348144531, -293.831298828125, -282.64813232421875, -271.4649658203125, -260.28179931640625, -249.0986328125, -237.91546630859375, -226.7322998046875, -215.54913330078125, -204.36598205566406, -193.1828155517578, -181.9996337890625, -170.81646728515625, -159.63330078125, -148.45013427734375, -137.2669677734375, -126.08380889892578, -114.90065002441406, -103.71748352050781, -92.53431701660156, -81.35115051269531, -70.16798400878906, -58.984825134277344, -47.801658630371094, -36.618492126464844, -25.435333251953125, -14.252166748046875, -3.069000244140625, 8.114164352416992, 19.29732894897461, 30.480491638183594, 41.663658142089844, 52.846824645996094, 64.02998352050781, 75.21315002441406, 86.39631652832031, 97.57948303222656, 108.76264953613281, 119.94580841064453, 131.12896728515625, 142.3121337890625, 153.49530029296875, 164.678466796875, 175.86163330078125, 187.0447998046875, 198.22796630859375, 209.4111328125, 220.59429931640625, 231.7774658203125, 242.9606170654297, 254.14378356933594, 265.32696533203125, 276.5101318359375, 287.69329833984375, 298.87646484375, 310.05963134765625, 321.2427978515625, 332.42596435546875, 343.609130859375, 354.7922668457031]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 8.0, 7.0, 10.0, 10.0, 11.0, 15.0, 22.0, 23.0, 25.0, 20.0, 32.0, 30.0, 40.0, 27.0, 30.0, 51.0, 45.0, 56.0, 50.0, 32.0, 51.0, 45.0, 43.0, 32.0, 27.0, 33.0, 33.0, 35.0, 22.0, 24.0, 22.0, 20.0, 15.0, 10.0, 8.0, 9.0, 4.0, 6.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.8125, -64.716796875, -62.62109375, -60.525390625, -58.4296875, -56.333984375, -54.23828125, -52.142578125, -50.046875, -47.951171875, -45.85546875, -43.759765625, -41.6640625, -39.568359375, -37.47265625, -35.376953125, -33.28125, -31.185546875, -29.08984375, -26.994140625, -24.8984375, -22.802734375, -20.70703125, -18.611328125, -16.515625, -14.419921875, -12.32421875, -10.228515625, -8.1328125, -6.037109375, -3.94140625, -1.845703125, 0.25, 2.345703125, 4.44140625, 6.537109375, 8.6328125, 10.728515625, 12.82421875, 14.919921875, 17.015625, 19.111328125, 21.20703125, 23.302734375, 25.3984375, 27.494140625, 29.58984375, 31.685546875, 33.78125, 35.876953125, 37.97265625, 40.068359375, 42.1640625, 44.259765625, 46.35546875, 48.451171875, 50.546875, 52.642578125, 54.73828125, 56.833984375, 58.9296875, 61.025390625, 63.12109375, 65.216796875, 67.3125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 12.0, 19.0, 24.0, 36.0, 48.0, 90.0, 113.0, 162.0, 287.0, 345.0, 568.0, 829.0, 1308.0, 1938.0, 3044.0, 4827.0, 7705.0, 12470.0, 20419.0, 33880.0, 57471.0, 109673.0, 334256.0, 236755.0, 92667.0, 50644.0, 30197.0, 18307.0, 11131.0, 6927.0, 4401.0, 2737.0, 1759.0, 1178.0, 771.0, 482.0, 365.0, 201.0, 164.0, 101.0, 72.0, 60.0, 26.0, 30.0, 17.0, 5.0, 15.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.744140625, -2.6580810546875, -2.572021484375, -2.4859619140625, -2.39990234375, -2.3138427734375, -2.227783203125, -2.1417236328125, -2.0556640625, -1.9696044921875, -1.883544921875, -1.7974853515625, -1.71142578125, -1.6253662109375, -1.539306640625, -1.4532470703125, -1.3671875, -1.2811279296875, -1.195068359375, -1.1090087890625, -1.02294921875, -0.9368896484375, -0.850830078125, -0.7647705078125, -0.6787109375, -0.5926513671875, -0.506591796875, -0.4205322265625, -0.33447265625, -0.2484130859375, -0.162353515625, -0.0762939453125, 0.009765625, 0.0958251953125, 0.181884765625, 0.2679443359375, 0.35400390625, 0.4400634765625, 0.526123046875, 0.6121826171875, 0.6982421875, 0.7843017578125, 0.870361328125, 0.9564208984375, 1.04248046875, 1.1285400390625, 1.214599609375, 1.3006591796875, 1.38671875, 1.4727783203125, 1.558837890625, 1.6448974609375, 1.73095703125, 1.8170166015625, 1.903076171875, 1.9891357421875, 2.0751953125, 2.1612548828125, 2.247314453125, 2.3333740234375, 2.41943359375, 2.5054931640625, 2.591552734375, 2.6776123046875, 2.763671875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 3.0, 6.0, 5.0, 8.0, 6.0, 7.0, 14.0, 8.0, 12.0, 14.0, 25.0, 19.0, 27.0, 29.0, 34.0, 29.0, 28.0, 25.0, 38.0, 41.0, 31.0, 41.0, 33.0, 1057.0, 54.0, 44.0, 48.0, 42.0, 32.0, 36.0, 23.0, 30.0, 32.0, 22.0, 20.0, 17.0, 18.0, 12.0, 7.0, 8.0, 14.0, 9.0, 10.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.21875, -37.01220703125, -35.8056640625, -34.59912109375, -33.392578125, -32.18603515625, -30.9794921875, -29.77294921875, -28.56640625, -27.35986328125, -26.1533203125, -24.94677734375, -23.740234375, -22.53369140625, -21.3271484375, -20.12060546875, -18.9140625, -17.70751953125, -16.5009765625, -15.29443359375, -14.087890625, -12.88134765625, -11.6748046875, -10.46826171875, -9.26171875, -8.05517578125, -6.8486328125, -5.64208984375, -4.435546875, -3.22900390625, -2.0224609375, -0.81591796875, 0.390625, 1.59716796875, 2.8037109375, 4.01025390625, 5.216796875, 6.42333984375, 7.6298828125, 8.83642578125, 10.04296875, 11.24951171875, 12.4560546875, 13.66259765625, 14.869140625, 16.07568359375, 17.2822265625, 18.48876953125, 19.6953125, 20.90185546875, 22.1083984375, 23.31494140625, 24.521484375, 25.72802734375, 26.9345703125, 28.14111328125, 29.34765625, 30.55419921875, 31.7607421875, 32.96728515625, 34.173828125, 35.38037109375, 36.5869140625, 37.79345703125, 39.0]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 7.0, 8.0, 9.0, 7.0, 25.0, 29.0, 43.0, 61.0, 80.0, 133.0, 175.0, 243.0, 366.0, 498.0, 728.0, 1010.0, 1402.0, 2144.0, 3087.0, 4689.0, 6621.0, 9931.0, 14635.0, 22313.0, 33756.0, 52998.0, 86383.0, 167470.0, 1356335.0, 126259.0, 71855.0, 44794.0, 29346.0, 19439.0, 12798.0, 8494.0, 5940.0, 4022.0, 2813.0, 1913.0, 1308.0, 891.0, 629.0, 424.0, 302.0, 213.0, 164.0, 106.0, 66.0, 47.0, 39.0, 34.0, 21.0, 8.0, 9.0, 5.0, 6.0, 4.0, 4.0, 3.0], "bins": [-1.595703125, -1.54632568359375, -1.4969482421875, -1.44757080078125, -1.398193359375, -1.34881591796875, -1.2994384765625, -1.25006103515625, -1.20068359375, -1.15130615234375, -1.1019287109375, -1.05255126953125, -1.003173828125, -0.95379638671875, -0.9044189453125, -0.85504150390625, -0.8056640625, -0.75628662109375, -0.7069091796875, -0.65753173828125, -0.608154296875, -0.55877685546875, -0.5093994140625, -0.46002197265625, -0.41064453125, -0.36126708984375, -0.3118896484375, -0.26251220703125, -0.213134765625, -0.16375732421875, -0.1143798828125, -0.06500244140625, -0.015625, 0.03375244140625, 0.0831298828125, 0.13250732421875, 0.181884765625, 0.23126220703125, 0.2806396484375, 0.33001708984375, 0.37939453125, 0.42877197265625, 0.4781494140625, 0.52752685546875, 0.576904296875, 0.62628173828125, 0.6756591796875, 0.72503662109375, 0.7744140625, 0.82379150390625, 0.8731689453125, 0.92254638671875, 0.971923828125, 1.02130126953125, 1.0706787109375, 1.12005615234375, 1.16943359375, 1.21881103515625, 1.2681884765625, 1.31756591796875, 1.366943359375, 1.41632080078125, 1.4656982421875, 1.51507568359375, 1.564453125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 6.0, 6.0, 11.0, 8.0, 8.0, 16.0, 11.0, 27.0, 27.0, 28.0, 42.0, 51.0, 54.0, 69.0, 150.0, 142.0, 81.0, 45.0, 35.0, 29.0, 25.0, 15.0, 15.0, 19.0, 17.0, 5.0, 12.0, 7.0, 7.0, 7.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.693601608276367e-05, -6.444007158279419e-05, -6.194412708282471e-05, -5.9448182582855225e-05, -5.695223808288574e-05, -5.445629358291626e-05, -5.196034908294678e-05, -4.9464404582977295e-05, -4.696846008300781e-05, -4.447251558303833e-05, -4.197657108306885e-05, -3.9480626583099365e-05, -3.698468208312988e-05, -3.44887375831604e-05, -3.199279308319092e-05, -2.9496848583221436e-05, -2.7000904083251953e-05, -2.450495958328247e-05, -2.2009015083312988e-05, -1.9513070583343506e-05, -1.7017126083374023e-05, -1.4521181583404541e-05, -1.2025237083435059e-05, -9.529292583465576e-06, -7.033348083496094e-06, -4.537403583526611e-06, -2.041459083557129e-06, 4.544854164123535e-07, 2.950429916381836e-06, 5.446374416351318e-06, 7.9423189163208e-06, 1.0438263416290283e-05, 1.2934207916259766e-05, 1.5430152416229248e-05, 1.792609691619873e-05, 2.0422041416168213e-05, 2.2917985916137695e-05, 2.5413930416107178e-05, 2.790987491607666e-05, 3.0405819416046143e-05, 3.2901763916015625e-05, 3.539770841598511e-05, 3.789365291595459e-05, 4.038959741592407e-05, 4.2885541915893555e-05, 4.538148641586304e-05, 4.787743091583252e-05, 5.0373375415802e-05, 5.2869319915771484e-05, 5.536526441574097e-05, 5.786120891571045e-05, 6.035715341567993e-05, 6.285309791564941e-05, 6.53490424156189e-05, 6.784498691558838e-05, 7.034093141555786e-05, 7.283687591552734e-05, 7.533282041549683e-05, 7.782876491546631e-05, 8.032470941543579e-05, 8.282065391540527e-05, 8.531659841537476e-05, 8.781254291534424e-05, 9.030848741531372e-05, 9.28044319152832e-05]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 6.0, 6.0, 6.0, 11.0, 7.0, 18.0, 15.0, 15.0, 25.0, 41.0, 31.0, 67.0, 96.0, 219.0, 929.0, 7687.0, 189630.0, 831399.0, 16078.0, 1536.0, 319.0, 145.0, 62.0, 46.0, 35.0, 27.0, 18.0, 23.0, 12.0, 9.0, 4.0, 6.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0017156600952148438, -0.001669466495513916, -0.0016232728958129883, -0.0015770792961120605, -0.0015308856964111328, -0.001484692096710205, -0.0014384984970092773, -0.0013923048973083496, -0.0013461112976074219, -0.0012999176979064941, -0.0012537240982055664, -0.0012075304985046387, -0.001161336898803711, -0.0011151432991027832, -0.0010689496994018555, -0.0010227560997009277, -0.0009765625, -0.0009303689002990723, -0.0008841753005981445, -0.0008379817008972168, -0.0007917881011962891, -0.0007455945014953613, -0.0006994009017944336, -0.0006532073020935059, -0.0006070137023925781, -0.0005608201026916504, -0.0005146265029907227, -0.0004684329032897949, -0.0004222393035888672, -0.00037604570388793945, -0.0003298521041870117, -0.000283658504486084, -0.00023746490478515625, -0.00019127130508422852, -0.00014507770538330078, -9.888410568237305e-05, -5.269050598144531e-05, -6.496906280517578e-06, 3.9696693420410156e-05, 8.589029312133789e-05, 0.00013208389282226562, 0.00017827749252319336, 0.0002244710922241211, 0.00027066469192504883, 0.00031685829162597656, 0.0003630518913269043, 0.00040924549102783203, 0.00045543909072875977, 0.0005016326904296875, 0.0005478262901306152, 0.000594019889831543, 0.0006402134895324707, 0.0006864070892333984, 0.0007326006889343262, 0.0007787942886352539, 0.0008249878883361816, 0.0008711814880371094, 0.0009173750877380371, 0.0009635686874389648, 0.0010097622871398926, 0.0010559558868408203, 0.001102149486541748, 0.0011483430862426758, 0.0011945366859436035, 0.0012407302856445312]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 8.0, 10.0, 19.0, 55.0, 132.0, 330.0, 259.0, 104.0, 47.0, 15.0, 18.0, 7.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002329054696019739, -0.00022747441835235804, -0.0002220433671027422, -0.00021661231585312635, -0.0002111812646035105, -0.00020575022790580988, -0.0002003191621042788, -0.00019488812540657818, -0.00018945707415696234, -0.0001840260229073465, -0.00017859497165773064, -0.0001731639204081148, -0.00016773286915849894, -0.0001623018179088831, -0.00015687078121118248, -0.00015143972996156663, -0.00014600867871195078, -0.00014057762746233493, -0.00013514657621271908, -0.00012971552496310323, -0.0001242844737134874, -0.00011885342973982915, -0.0001134223784902133, -0.00010799133451655507, -0.000102560268715024, -9.712921746540815e-05, -9.16981662157923e-05, -8.626711496617645e-05, -8.083607099251822e-05, -7.540501974290237e-05, -6.997396849328652e-05, -6.454292451962829e-05, -5.9111865994054824e-05, -5.3680814744438976e-05, -4.8249767132801935e-05, -4.281871588318609e-05, -3.7387668271549046e-05, -3.19566170219332e-05, -2.652556577231735e-05, -2.109451816068031e-05, -1.566346691106446e-05, -1.0232417480438016e-05, -4.80136714031687e-06, 6.296831998042762e-07, 6.060732630430721e-06, 1.1491782061057165e-05, 1.6922833310673013e-05, 2.2353880922310054e-05, 2.7784932171925902e-05, 3.321598342154175e-05, 3.864703103317879e-05, 4.407808228279464e-05, 4.950912989443168e-05, 5.494018114404753e-05, 6.0371232393663377e-05, 6.580227636732161e-05, 7.123332761693746e-05, 7.66643788665533e-05, 8.209543011616915e-05, 8.7526481365785e-05, 9.295752533944324e-05, 9.838857658905908e-05, 0.00010381962783867493, 0.00010925067181233317, 0.00011468173033790663]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 12.0, 13.0, 9.0, 14.0, 17.0, 21.0, 23.0, 21.0, 26.0, 30.0, 31.0, 28.0, 23.0, 50.0, 44.0, 39.0, 32.0, 34.0, 34.0, 45.0, 46.0, 41.0, 33.0, 32.0, 33.0, 31.0, 33.0, 30.0, 29.0, 24.0, 21.0, 10.0, 13.0, 19.0, 9.0, 6.0, 7.0, 4.0, 3.0, 7.0, 1.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.4689903259277344e-05, -3.354158252477646e-05, -3.2393261790275574e-05, -3.124494105577469e-05, -3.0096620321273804e-05, -2.894829958677292e-05, -2.7799978852272034e-05, -2.665165811777115e-05, -2.5503337383270264e-05, -2.435501664876938e-05, -2.3206695914268494e-05, -2.205837517976761e-05, -2.0910054445266724e-05, -1.976173371076584e-05, -1.8613412976264954e-05, -1.746509224176407e-05, -1.6316771507263184e-05, -1.5168450772762299e-05, -1.4020130038261414e-05, -1.2871809303760529e-05, -1.1723488569259644e-05, -1.0575167834758759e-05, -9.426847100257874e-06, -8.278526365756989e-06, -7.1302056312561035e-06, -5.9818848967552185e-06, -4.8335641622543335e-06, -3.6852434277534485e-06, -2.5369226932525635e-06, -1.3886019587516785e-06, -2.4028122425079346e-07, 9.080395102500916e-07, 2.0563602447509766e-06, 3.2046809792518616e-06, 4.353001713752747e-06, 5.501322448253632e-06, 6.649643182754517e-06, 7.797963917255402e-06, 8.946284651756287e-06, 1.0094605386257172e-05, 1.1242926120758057e-05, 1.2391246855258942e-05, 1.3539567589759827e-05, 1.4687888324260712e-05, 1.5836209058761597e-05, 1.698452979326248e-05, 1.8132850527763367e-05, 1.9281171262264252e-05, 2.0429491996765137e-05, 2.1577812731266022e-05, 2.2726133465766907e-05, 2.3874454200267792e-05, 2.5022774934768677e-05, 2.6171095669269562e-05, 2.7319416403770447e-05, 2.8467737138271332e-05, 2.9616057872772217e-05, 3.07643786072731e-05, 3.191269934177399e-05, 3.306102007627487e-05, 3.420934081077576e-05, 3.535766154527664e-05, 3.650598227977753e-05, 3.765430301427841e-05, 3.88026237487793e-05]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 8.0, 7.0, 10.0, 10.0, 11.0, 15.0, 22.0, 23.0, 25.0, 20.0, 32.0, 30.0, 40.0, 27.0, 30.0, 51.0, 45.0, 56.0, 50.0, 32.0, 51.0, 45.0, 43.0, 32.0, 27.0, 33.0, 33.0, 35.0, 22.0, 24.0, 22.0, 20.0, 15.0, 10.0, 8.0, 9.0, 4.0, 6.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.8125, -64.716796875, -62.62109375, -60.525390625, -58.4296875, -56.333984375, -54.23828125, -52.142578125, -50.046875, -47.951171875, -45.85546875, -43.759765625, -41.6640625, -39.568359375, -37.47265625, -35.376953125, -33.28125, -31.185546875, -29.08984375, -26.994140625, -24.8984375, -22.802734375, -20.70703125, -18.611328125, -16.515625, -14.419921875, -12.32421875, -10.228515625, -8.1328125, -6.037109375, -3.94140625, -1.845703125, 0.25, 2.345703125, 4.44140625, 6.537109375, 8.6328125, 10.728515625, 12.82421875, 14.919921875, 17.015625, 19.111328125, 21.20703125, 23.302734375, 25.3984375, 27.494140625, 29.58984375, 31.685546875, 33.78125, 35.876953125, 37.97265625, 40.068359375, 42.1640625, 44.259765625, 46.35546875, 48.451171875, 50.546875, 52.642578125, 54.73828125, 56.833984375, 58.9296875, 61.025390625, 63.12109375, 65.216796875, 67.3125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 10.0, 10.0, 17.0, 15.0, 37.0, 55.0, 56.0, 93.0, 111.0, 178.0, 235.0, 326.0, 431.0, 726.0, 1119.0, 1782.0, 2962.0, 5496.0, 11577.0, 31714.0, 164171.0, 681321.0, 100603.0, 24099.0, 9394.0, 4550.0, 2643.0, 1647.0, 1018.0, 669.0, 437.0, 295.0, 230.0, 116.0, 110.0, 70.0, 57.0, 38.0, 33.0, 25.0, 17.0, 9.0, 16.0, 5.0, 10.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-96.75, -93.8515625, -90.953125, -88.0546875, -85.15625, -82.2578125, -79.359375, -76.4609375, -73.5625, -70.6640625, -67.765625, -64.8671875, -61.96875, -59.0703125, -56.171875, -53.2734375, -50.375, -47.4765625, -44.578125, -41.6796875, -38.78125, -35.8828125, -32.984375, -30.0859375, -27.1875, -24.2890625, -21.390625, -18.4921875, -15.59375, -12.6953125, -9.796875, -6.8984375, -4.0, -1.1015625, 1.796875, 4.6953125, 7.59375, 10.4921875, 13.390625, 16.2890625, 19.1875, 22.0859375, 24.984375, 27.8828125, 30.78125, 33.6796875, 36.578125, 39.4765625, 42.375, 45.2734375, 48.171875, 51.0703125, 53.96875, 56.8671875, 59.765625, 62.6640625, 65.5625, 68.4609375, 71.359375, 74.2578125, 77.15625, 80.0546875, 82.953125, 85.8515625, 88.75]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 2.0, 6.0, 9.0, 16.0, 5.0, 18.0, 16.0, 19.0, 18.0, 29.0, 19.0, 22.0, 28.0, 26.0, 33.0, 36.0, 40.0, 49.0, 65.0, 79.0, 138.0, 1716.0, 154.0, 67.0, 50.0, 55.0, 44.0, 39.0, 30.0, 26.0, 28.0, 23.0, 25.0, 18.0, 25.0, 12.0, 12.0, 8.0, 10.0, 12.0, 4.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-163.375, -158.490234375, -153.60546875, -148.720703125, -143.8359375, -138.951171875, -134.06640625, -129.181640625, -124.296875, -119.412109375, -114.52734375, -109.642578125, -104.7578125, -99.873046875, -94.98828125, -90.103515625, -85.21875, -80.333984375, -75.44921875, -70.564453125, -65.6796875, -60.794921875, -55.91015625, -51.025390625, -46.140625, -41.255859375, -36.37109375, -31.486328125, -26.6015625, -21.716796875, -16.83203125, -11.947265625, -7.0625, -2.177734375, 2.70703125, 7.591796875, 12.4765625, 17.361328125, 22.24609375, 27.130859375, 32.015625, 36.900390625, 41.78515625, 46.669921875, 51.5546875, 56.439453125, 61.32421875, 66.208984375, 71.09375, 75.978515625, 80.86328125, 85.748046875, 90.6328125, 95.517578125, 100.40234375, 105.287109375, 110.171875, 115.056640625, 119.94140625, 124.826171875, 129.7109375, 134.595703125, 139.48046875, 144.365234375, 149.25]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 9.0, 10.0, 6.0, 12.0, 23.0, 37.0, 49.0, 70.0, 72.0, 128.0, 191.0, 356.0, 667.0, 1747.0, 5795.0, 25429.0, 422089.0, 2633479.0, 43255.0, 7986.0, 2289.0, 904.0, 404.0, 194.0, 141.0, 104.0, 65.0, 55.0, 37.0, 28.0, 21.0, 15.0, 9.0, 8.0, 8.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-250.875, -243.734375, -236.59375, -229.453125, -222.3125, -215.171875, -208.03125, -200.890625, -193.75, -186.609375, -179.46875, -172.328125, -165.1875, -158.046875, -150.90625, -143.765625, -136.625, -129.484375, -122.34375, -115.203125, -108.0625, -100.921875, -93.78125, -86.640625, -79.5, -72.359375, -65.21875, -58.078125, -50.9375, -43.796875, -36.65625, -29.515625, -22.375, -15.234375, -8.09375, -0.953125, 6.1875, 13.328125, 20.46875, 27.609375, 34.75, 41.890625, 49.03125, 56.171875, 63.3125, 70.453125, 77.59375, 84.734375, 91.875, 99.015625, 106.15625, 113.296875, 120.4375, 127.578125, 134.71875, 141.859375, 149.0, 156.140625, 163.28125, 170.421875, 177.5625, 184.703125, 191.84375, 198.984375, 206.125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 24.0, 897.0, 96.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2094.220947265625, -2001.781005859375, -1909.3411865234375, -1816.9013671875, -1724.46142578125, -1632.021484375, -1539.5816650390625, -1447.141845703125, -1354.701904296875, -1262.261962890625, -1169.8221435546875, -1077.38232421875, -984.9423828125, -892.5025024414062, -800.0626220703125, -707.6227416992188, -615.182861328125, -522.7429809570312, -430.3031005859375, -337.86322021484375, -245.42333984375, -152.98345947265625, -60.5435791015625, 31.89630126953125, 124.336181640625, 216.77606201171875, 309.2159423828125, 401.65582275390625, 494.095703125, 586.5355834960938, 678.9754638671875, 771.4153442382812, 863.855224609375, 956.2951049804688, 1048.7349853515625, 1141.1748046875, 1233.61474609375, 1326.0546875, 1418.4945068359375, 1510.934326171875, 1603.374267578125, 1695.814208984375, 1788.2540283203125, 1880.69384765625, 1973.1337890625, 2065.57373046875, 2158.013671875, 2250.453369140625, 2342.893310546875, 2435.333251953125, 2527.77294921875, 2620.212890625, 2712.65283203125, 2805.0927734375, 2897.53271484375, 2989.972412109375, 3082.412353515625, 3174.852294921875, 3267.2919921875, 3359.73193359375, 3452.171875, 3544.61181640625, 3637.0517578125, 3729.491455078125, 3821.931396484375]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 7.0, 4.0, 4.0, 6.0, 11.0, 10.0, 24.0, 16.0, 17.0, 18.0, 13.0, 38.0, 28.0, 40.0, 23.0, 47.0, 34.0, 31.0, 41.0, 49.0, 40.0, 46.0, 49.0, 49.0, 38.0, 35.0, 38.0, 31.0, 26.0, 26.0, 23.0, 26.0, 16.0, 20.0, 24.0, 11.0, 8.0, 4.0, 5.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-418.1995544433594, -405.60662841796875, -393.013671875, -380.4207458496094, -367.82781982421875, -355.23486328125, -342.6419372558594, -330.04901123046875, -317.4560546875, -304.8631286621094, -292.2701721191406, -279.67724609375, -267.0843200683594, -254.49136352539062, -241.8984375, -229.3054962158203, -216.7125701904297, -204.11962890625, -191.52670288085938, -178.9337615966797, -166.3408203125, -153.74789428710938, -141.1549530029297, -128.56201171875, -115.96907806396484, -103.37614440917969, -90.783203125, -78.19026947021484, -65.59733581542969, -53.00439453125, -40.411460876464844, -27.818519592285156, -15.2255859375, -2.6326494216918945, 9.960287094116211, 22.55322265625, 35.14616012573242, 47.739097595214844, 60.33203125, 72.92497253417969, 85.51790618896484, 98.11083984375, 110.70378112792969, 123.29671478271484, 135.8896484375, 148.4825897216797, 161.07553100585938, 173.66845703125, 186.2613983154297, 198.85433959960938, 211.447265625, 224.0402069091797, 236.63314819335938, 249.22607421875, 261.81903076171875, 274.4119567871094, 287.0048828125, 299.5978088378906, 312.1907653808594, 324.78369140625, 337.3766174316406, 349.9695739746094, 362.5625, 375.15545654296875, 387.7483825683594]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 8.0, 16.0, 18.0, 15.0, 12.0, 28.0, 26.0, 19.0, 27.0, 30.0, 51.0, 48.0, 47.0, 29.0, 50.0, 41.0, 52.0, 59.0, 44.0, 35.0, 31.0, 40.0, 31.0, 27.0, 29.0, 36.0, 28.0, 20.0, 22.0, 10.0, 7.0, 11.0, 15.0, 8.0, 4.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.8125, -69.5927734375, -67.373046875, -65.1533203125, -62.93359375, -60.7138671875, -58.494140625, -56.2744140625, -54.0546875, -51.8349609375, -49.615234375, -47.3955078125, -45.17578125, -42.9560546875, -40.736328125, -38.5166015625, -36.296875, -34.0771484375, -31.857421875, -29.6376953125, -27.41796875, -25.1982421875, -22.978515625, -20.7587890625, -18.5390625, -16.3193359375, -14.099609375, -11.8798828125, -9.66015625, -7.4404296875, -5.220703125, -3.0009765625, -0.78125, 1.4384765625, 3.658203125, 5.8779296875, 8.09765625, 10.3173828125, 12.537109375, 14.7568359375, 16.9765625, 19.1962890625, 21.416015625, 23.6357421875, 25.85546875, 28.0751953125, 30.294921875, 32.5146484375, 34.734375, 36.9541015625, 39.173828125, 41.3935546875, 43.61328125, 45.8330078125, 48.052734375, 50.2724609375, 52.4921875, 54.7119140625, 56.931640625, 59.1513671875, 61.37109375, 63.5908203125, 65.810546875, 68.0302734375, 70.25]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 10.0, 10.0, 20.0, 23.0, 33.0, 42.0, 69.0, 77.0, 112.0, 162.0, 238.0, 333.0, 499.0, 830.0, 1481.0, 2627.0, 4701.0, 9154.0, 21458.0, 70282.0, 3229283.0, 774018.0, 45478.0, 16270.0, 7540.0, 3998.0, 2114.0, 1258.0, 740.0, 480.0, 281.0, 191.0, 137.0, 90.0, 58.0, 61.0, 21.0, 25.0, 17.0, 16.0, 11.0, 6.0, 10.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-279.25, -271.0, -262.75, -254.5, -246.25, -238.0, -229.75, -221.5, -213.25, -205.0, -196.75, -188.5, -180.25, -172.0, -163.75, -155.5, -147.25, -139.0, -130.75, -122.5, -114.25, -106.0, -97.75, -89.5, -81.25, -73.0, -64.75, -56.5, -48.25, -40.0, -31.75, -23.5, -15.25, -7.0, 1.25, 9.5, 17.75, 26.0, 34.25, 42.5, 50.75, 59.0, 67.25, 75.5, 83.75, 92.0, 100.25, 108.5, 116.75, 125.0, 133.25, 141.5, 149.75, 158.0, 166.25, 174.5, 182.75, 191.0, 199.25, 207.5, 215.75, 224.0, 232.25, 240.5, 248.75]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 10.0, 11.0, 8.0, 13.0, 19.0, 15.0, 23.0, 18.0, 28.0, 41.0, 44.0, 74.0, 98.0, 229.0, 694.0, 1345.0, 733.0, 241.0, 125.0, 58.0, 51.0, 46.0, 27.0, 26.0, 19.0, 12.0, 12.0, 10.0, 8.0, 7.0, 8.0, 1.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.875, -128.521484375, -124.16796875, -119.814453125, -115.4609375, -111.107421875, -106.75390625, -102.400390625, -98.046875, -93.693359375, -89.33984375, -84.986328125, -80.6328125, -76.279296875, -71.92578125, -67.572265625, -63.21875, -58.865234375, -54.51171875, -50.158203125, -45.8046875, -41.451171875, -37.09765625, -32.744140625, -28.390625, -24.037109375, -19.68359375, -15.330078125, -10.9765625, -6.623046875, -2.26953125, 2.083984375, 6.4375, 10.791015625, 15.14453125, 19.498046875, 23.8515625, 28.205078125, 32.55859375, 36.912109375, 41.265625, 45.619140625, 49.97265625, 54.326171875, 58.6796875, 63.033203125, 67.38671875, 71.740234375, 76.09375, 80.447265625, 84.80078125, 89.154296875, 93.5078125, 97.861328125, 102.21484375, 106.568359375, 110.921875, 115.275390625, 119.62890625, 123.982421875, 128.3359375, 132.689453125, 137.04296875, 141.396484375, 145.75]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 7.0, 6.0, 11.0, 15.0, 30.0, 38.0, 54.0, 61.0, 117.0, 159.0, 229.0, 350.0, 459.0, 623.0, 1015.0, 1505.0, 2261.0, 3364.0, 5370.0, 8910.0, 15547.0, 28534.0, 60125.0, 191288.0, 3150198.0, 544294.0, 91006.0, 38433.0, 20142.0, 11173.0, 6645.0, 4182.0, 2706.0, 1709.0, 1123.0, 843.0, 532.0, 367.0, 259.0, 154.0, 142.0, 101.0, 51.0, 46.0, 42.0, 17.0, 15.0, 7.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-176.0, -170.62109375, -165.2421875, -159.86328125, -154.484375, -149.10546875, -143.7265625, -138.34765625, -132.96875, -127.58984375, -122.2109375, -116.83203125, -111.453125, -106.07421875, -100.6953125, -95.31640625, -89.9375, -84.55859375, -79.1796875, -73.80078125, -68.421875, -63.04296875, -57.6640625, -52.28515625, -46.90625, -41.52734375, -36.1484375, -30.76953125, -25.390625, -20.01171875, -14.6328125, -9.25390625, -3.875, 1.50390625, 6.8828125, 12.26171875, 17.640625, 23.01953125, 28.3984375, 33.77734375, 39.15625, 44.53515625, 49.9140625, 55.29296875, 60.671875, 66.05078125, 71.4296875, 76.80859375, 82.1875, 87.56640625, 92.9453125, 98.32421875, 103.703125, 109.08203125, 114.4609375, 119.83984375, 125.21875, 130.59765625, 135.9765625, 141.35546875, 146.734375, 152.11328125, 157.4921875, 162.87109375, 168.25]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 9.0, 15.0, 40.0, 31.0, 71.0, 110.0, 165.0, 170.0, 159.0, 87.0, 56.0, 29.0, 21.0, 14.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-530.7828979492188, -506.9376220703125, -483.09234619140625, -459.2470703125, -435.40179443359375, -411.5565185546875, -387.7112731933594, -363.8659973144531, -340.0207214355469, -316.1754455566406, -292.3301696777344, -268.48492431640625, -244.63963317871094, -220.7943572998047, -196.9490966796875, -173.10382080078125, -149.258544921875, -125.41326904296875, -101.56800079345703, -77.72273254394531, -53.87745666503906, -30.032180786132812, -6.186920166015625, 17.658355712890625, 41.503631591796875, 65.34890747070312, 89.19417572021484, 113.03944396972656, 136.8847198486328, 160.72999572753906, 184.57525634765625, 208.4205322265625, 232.2657470703125, 256.11102294921875, 279.956298828125, 303.80157470703125, 327.6468505859375, 351.49212646484375, 375.3373718261719, 399.1826477050781, 423.0279235839844, 446.8731994628906, 470.7184753417969, 494.563720703125, 518.4089965820312, 542.2542724609375, 566.0995483398438, 589.94482421875, 613.7901000976562, 637.6353759765625, 661.4806518554688, 685.325927734375, 709.1712036132812, 733.0164794921875, 756.8616943359375, 780.70703125, 804.55224609375, 828.3975219726562, 852.2427978515625, 876.0880737304688, 899.933349609375, 923.7786254882812, 947.6239013671875, 971.4691162109375, 995.314453125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 4.0, 12.0, 5.0, 14.0, 12.0, 17.0, 19.0, 22.0, 11.0, 34.0, 23.0, 43.0, 30.0, 52.0, 35.0, 43.0, 41.0, 38.0, 34.0, 42.0, 33.0, 50.0, 34.0, 42.0, 30.0, 24.0, 37.0, 25.0, 31.0, 31.0, 28.0, 18.0, 20.0, 12.0, 9.0, 8.0, 7.0, 3.0, 9.0, 4.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-332.7120361328125, -321.55078125, -310.3895263671875, -299.228271484375, -288.0669860839844, -276.9057312011719, -265.7444763183594, -254.58322143554688, -243.42196655273438, -232.26071166992188, -221.0994415283203, -209.9381866455078, -198.7769317626953, -187.61566162109375, -176.45440673828125, -165.29315185546875, -154.1318817138672, -142.9706268310547, -131.80935668945312, -120.64810180664062, -109.48684692382812, -98.3255844116211, -87.16432189941406, -76.00306701660156, -64.84180450439453, -53.680545806884766, -42.519287109375, -31.35802459716797, -20.196765899658203, -9.035507202148438, 2.1257553100585938, 13.287010192871094, 24.448272705078125, 35.60953140258789, 46.770790100097656, 57.93205261230469, 69.09330749511719, 80.25457000732422, 91.41583251953125, 102.57708740234375, 113.73834991455078, 124.89961242675781, 136.0608673095703, 147.22213745117188, 158.38339233398438, 169.54464721679688, 180.70590209960938, 191.86715698242188, 203.02842712402344, 214.18968200683594, 225.3509521484375, 236.51220703125, 247.6734619140625, 258.834716796875, 269.9959716796875, 281.1572265625, 292.3185119628906, 303.4797668457031, 314.6410217285156, 325.80230712890625, 336.96356201171875, 348.12481689453125, 359.28607177734375, 370.44732666015625, 381.60858154296875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 6.0, 3.0, 6.0, 7.0, 8.0, 7.0, 11.0, 12.0, 18.0, 16.0, 16.0, 18.0, 25.0, 31.0, 31.0, 30.0, 34.0, 46.0, 35.0, 32.0, 42.0, 40.0, 46.0, 43.0, 30.0, 52.0, 37.0, 31.0, 35.0, 27.0, 25.0, 26.0, 24.0, 20.0, 21.0, 20.0, 13.0, 18.0, 12.0, 13.0, 11.0, 11.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-66.875, -64.7587890625, -62.642578125, -60.5263671875, -58.41015625, -56.2939453125, -54.177734375, -52.0615234375, -49.9453125, -47.8291015625, -45.712890625, -43.5966796875, -41.48046875, -39.3642578125, -37.248046875, -35.1318359375, -33.015625, -30.8994140625, -28.783203125, -26.6669921875, -24.55078125, -22.4345703125, -20.318359375, -18.2021484375, -16.0859375, -13.9697265625, -11.853515625, -9.7373046875, -7.62109375, -5.5048828125, -3.388671875, -1.2724609375, 0.84375, 2.9599609375, 5.076171875, 7.1923828125, 9.30859375, 11.4248046875, 13.541015625, 15.6572265625, 17.7734375, 19.8896484375, 22.005859375, 24.1220703125, 26.23828125, 28.3544921875, 30.470703125, 32.5869140625, 34.703125, 36.8193359375, 38.935546875, 41.0517578125, 43.16796875, 45.2841796875, 47.400390625, 49.5166015625, 51.6328125, 53.7490234375, 55.865234375, 57.9814453125, 60.09765625, 62.2138671875, 64.330078125, 66.4462890625, 68.5625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [7.0, 5.0, 3.0, 11.0, 12.0, 18.0, 18.0, 37.0, 41.0, 56.0, 69.0, 90.0, 120.0, 199.0, 266.0, 365.0, 501.0, 703.0, 938.0, 1422.0, 1952.0, 2843.0, 4113.0, 6071.0, 8978.0, 13043.0, 19651.0, 29890.0, 45331.0, 72635.0, 126800.0, 307491.0, 161301.0, 86335.0, 53042.0, 34294.0, 22521.0, 14917.0, 10056.0, 6810.0, 4643.0, 3362.0, 2097.0, 1580.0, 1062.0, 855.0, 571.0, 415.0, 263.0, 231.0, 150.0, 94.0, 67.0, 61.0, 52.0, 37.0, 25.0, 10.0, 15.0, 12.0, 8.0, 3.0, 6.0, 2.0], "bins": [-2.322265625, -2.248931884765625, -2.17559814453125, -2.102264404296875, -2.0289306640625, -1.955596923828125, -1.88226318359375, -1.808929443359375, -1.735595703125, -1.662261962890625, -1.58892822265625, -1.515594482421875, -1.4422607421875, -1.368927001953125, -1.29559326171875, -1.222259521484375, -1.14892578125, -1.075592041015625, -1.00225830078125, -0.928924560546875, -0.8555908203125, -0.782257080078125, -0.70892333984375, -0.635589599609375, -0.562255859375, -0.488922119140625, -0.41558837890625, -0.342254638671875, -0.2689208984375, -0.195587158203125, -0.12225341796875, -0.048919677734375, 0.0244140625, 0.097747802734375, 0.17108154296875, 0.244415283203125, 0.3177490234375, 0.391082763671875, 0.46441650390625, 0.537750244140625, 0.611083984375, 0.684417724609375, 0.75775146484375, 0.831085205078125, 0.9044189453125, 0.977752685546875, 1.05108642578125, 1.124420166015625, 1.19775390625, 1.271087646484375, 1.34442138671875, 1.417755126953125, 1.4910888671875, 1.564422607421875, 1.63775634765625, 1.711090087890625, 1.784423828125, 1.857757568359375, 1.93109130859375, 2.004425048828125, 2.0777587890625, 2.151092529296875, 2.22442626953125, 2.297760009765625, 2.37109375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 8.0, 3.0, 9.0, 7.0, 11.0, 12.0, 18.0, 22.0, 16.0, 23.0, 26.0, 35.0, 39.0, 19.0, 39.0, 44.0, 39.0, 39.0, 50.0, 1071.0, 50.0, 52.0, 50.0, 45.0, 39.0, 31.0, 36.0, 36.0, 23.0, 18.0, 18.0, 15.0, 10.0, 16.0, 11.0, 8.0, 10.0, 5.0, 5.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.5, -47.97265625, -46.4453125, -44.91796875, -43.390625, -41.86328125, -40.3359375, -38.80859375, -37.28125, -35.75390625, -34.2265625, -32.69921875, -31.171875, -29.64453125, -28.1171875, -26.58984375, -25.0625, -23.53515625, -22.0078125, -20.48046875, -18.953125, -17.42578125, -15.8984375, -14.37109375, -12.84375, -11.31640625, -9.7890625, -8.26171875, -6.734375, -5.20703125, -3.6796875, -2.15234375, -0.625, 0.90234375, 2.4296875, 3.95703125, 5.484375, 7.01171875, 8.5390625, 10.06640625, 11.59375, 13.12109375, 14.6484375, 16.17578125, 17.703125, 19.23046875, 20.7578125, 22.28515625, 23.8125, 25.33984375, 26.8671875, 28.39453125, 29.921875, 31.44921875, 32.9765625, 34.50390625, 36.03125, 37.55859375, 39.0859375, 40.61328125, 42.140625, 43.66796875, 45.1953125, 46.72265625, 48.25]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 4.0, 2.0, 6.0, 11.0, 9.0, 18.0, 24.0, 37.0, 59.0, 71.0, 103.0, 158.0, 217.0, 317.0, 446.0, 635.0, 982.0, 1470.0, 2122.0, 3135.0, 4751.0, 7017.0, 10487.0, 16153.0, 25702.0, 41317.0, 69667.0, 129483.0, 1387828.0, 173191.0, 85595.0, 49500.0, 30334.0, 19259.0, 12351.0, 8073.0, 5377.0, 3538.0, 2493.0, 1600.0, 1119.0, 752.0, 531.0, 363.0, 273.0, 168.0, 108.0, 98.0, 63.0, 42.0, 21.0, 18.0, 11.0, 11.0, 10.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0], "bins": [-1.9853515625, -1.9226837158203125, -1.860015869140625, -1.7973480224609375, -1.73468017578125, -1.6720123291015625, -1.609344482421875, -1.5466766357421875, -1.4840087890625, -1.4213409423828125, -1.358673095703125, -1.2960052490234375, -1.23333740234375, -1.1706695556640625, -1.108001708984375, -1.0453338623046875, -0.982666015625, -0.9199981689453125, -0.857330322265625, -0.7946624755859375, -0.73199462890625, -0.6693267822265625, -0.606658935546875, -0.5439910888671875, -0.4813232421875, -0.4186553955078125, -0.355987548828125, -0.2933197021484375, -0.23065185546875, -0.1679840087890625, -0.105316162109375, -0.0426483154296875, 0.02001953125, 0.0826873779296875, 0.145355224609375, 0.2080230712890625, 0.27069091796875, 0.3333587646484375, 0.396026611328125, 0.4586944580078125, 0.5213623046875, 0.5840301513671875, 0.646697998046875, 0.7093658447265625, 0.77203369140625, 0.8347015380859375, 0.897369384765625, 0.9600372314453125, 1.022705078125, 1.0853729248046875, 1.148040771484375, 1.2107086181640625, 1.27337646484375, 1.3360443115234375, 1.398712158203125, 1.4613800048828125, 1.5240478515625, 1.5867156982421875, 1.649383544921875, 1.7120513916015625, 1.77471923828125, 1.8373870849609375, 1.900054931640625, 1.9627227783203125, 2.025390625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 12.0, 9.0, 10.0, 8.0, 15.0, 18.0, 37.0, 50.0, 84.0, 221.0, 180.0, 109.0, 50.0, 32.0, 22.0, 24.0, 12.0, 17.0, 10.0, 11.0, 9.0, 5.0, 7.0, 9.0, 8.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011360645294189453, -0.00010992772877216339, -0.00010624900460243225, -0.00010257028043270111, -9.889155626296997e-05, -9.521283209323883e-05, -9.153410792350769e-05, -8.785538375377655e-05, -8.417665958404541e-05, -8.049793541431427e-05, -7.681921124458313e-05, -7.314048707485199e-05, -6.946176290512085e-05, -6.578303873538971e-05, -6.210431456565857e-05, -5.842559039592743e-05, -5.474686622619629e-05, -5.106814205646515e-05, -4.738941788673401e-05, -4.371069371700287e-05, -4.003196954727173e-05, -3.635324537754059e-05, -3.267452120780945e-05, -2.8995797038078308e-05, -2.5317072868347168e-05, -2.1638348698616028e-05, -1.7959624528884888e-05, -1.4280900359153748e-05, -1.0602176189422607e-05, -6.923452019691467e-06, -3.244727849960327e-06, 4.33996319770813e-07, 4.112720489501953e-06, 7.791444659233093e-06, 1.1470168828964233e-05, 1.5148892998695374e-05, 1.8827617168426514e-05, 2.2506341338157654e-05, 2.6185065507888794e-05, 2.9863789677619934e-05, 3.3542513847351074e-05, 3.7221238017082214e-05, 4.0899962186813354e-05, 4.4578686356544495e-05, 4.8257410526275635e-05, 5.1936134696006775e-05, 5.5614858865737915e-05, 5.9293583035469055e-05, 6.29723072052002e-05, 6.665103137493134e-05, 7.032975554466248e-05, 7.400847971439362e-05, 7.768720388412476e-05, 8.13659280538559e-05, 8.504465222358704e-05, 8.872337639331818e-05, 9.240210056304932e-05, 9.608082473278046e-05, 9.97595489025116e-05, 0.00010343827307224274, 0.00010711699724197388, 0.00011079572141170502, 0.00011447444558143616, 0.0001181531697511673, 0.00012183189392089844]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 8.0, 11.0, 16.0, 17.0, 10.0, 28.0, 18.0, 34.0, 26.0, 54.0, 86.0, 133.0, 338.0, 3205.0, 158652.0, 878354.0, 6702.0, 465.0, 138.0, 70.0, 41.0, 41.0, 21.0, 16.0, 19.0, 10.0, 10.0, 3.0, 5.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0021724700927734375, -0.00210687518119812, -0.0020412802696228027, -0.0019756853580474854, -0.001910090446472168, -0.0018444955348968506, -0.0017789006233215332, -0.0017133057117462158, -0.0016477108001708984, -0.001582115888595581, -0.0015165209770202637, -0.0014509260654449463, -0.001385331153869629, -0.0013197362422943115, -0.0012541413307189941, -0.0011885464191436768, -0.0011229515075683594, -0.001057356595993042, -0.0009917616844177246, -0.0009261667728424072, -0.0008605718612670898, -0.0007949769496917725, -0.0007293820381164551, -0.0006637871265411377, -0.0005981922149658203, -0.0005325973033905029, -0.00046700239181518555, -0.00040140748023986816, -0.0003358125686645508, -0.0002702176570892334, -0.00020462274551391602, -0.00013902783393859863, -7.343292236328125e-05, -7.838010787963867e-06, 5.7756900787353516e-05, 0.0001233518123626709, 0.00018894672393798828, 0.00025454163551330566, 0.00032013654708862305, 0.00038573145866394043, 0.0004513263702392578, 0.0005169212818145752, 0.0005825161933898926, 0.00064811110496521, 0.0007137060165405273, 0.0007793009281158447, 0.0008448958396911621, 0.0009104907512664795, 0.0009760856628417969, 0.0010416805744171143, 0.0011072754859924316, 0.001172870397567749, 0.0012384653091430664, 0.0013040602207183838, 0.0013696551322937012, 0.0014352500438690186, 0.001500844955444336, 0.0015664398670196533, 0.0016320347785949707, 0.001697629690170288, 0.0017632246017456055, 0.0018288195133209229, 0.0018944144248962402, 0.0019600093364715576, 0.002025604248046875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 25.0, 60.0, 148.0, 265.0, 297.0, 120.0, 48.0, 18.0, 17.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7190707593690604e-05, -5.1480183174135163e-05, -4.576965875457972e-05, -4.0059130697045475e-05, -3.434860991546884e-05, -2.8638083676923998e-05, -2.2927557438379154e-05, -1.7217033018823713e-05, -1.1506508599268273e-05, -5.795983724965481e-06, -8.545885066268966e-08, 5.625066478387453e-06, 1.1335590897942893e-05, 1.7046115317498334e-05, 2.2756641556043178e-05, 2.846716597559862e-05, 3.417769039515406e-05, 3.98882148147095e-05, 4.559873923426494e-05, 5.130926729179919e-05, 5.701978807337582e-05, 6.273031613091007e-05, 6.844084418844432e-05, 7.415136497002095e-05, 7.986188575159758e-05, 8.557241380913183e-05, 9.128293459070846e-05, 9.699346264824271e-05, 0.00010270398342981935, 0.00010841451148735359, 0.00011412503954488784, 0.00011983556032646447, 0.0001255460811080411, 0.00013125660188961774, 0.0001369671372231096, 0.00014267765800468624, 0.00014838817878626287, 0.0001540986995678395, 0.00015980923490133137, 0.000165519755682908, 0.00017123027646448463, 0.00017694079724606127, 0.00018265133257955313, 0.00018836185336112976, 0.0001940723741427064, 0.00019978289492428303, 0.0002054934302577749, 0.00021120395103935152, 0.00021691448637284338, 0.00022262500715442002, 0.00022833554248791188, 0.0002340460632694885, 0.00023975658405106515, 0.000245467119384557, 0.00025117764016613364, 0.0002568881609477103, 0.0002625986817292869, 0.00026830920251086354, 0.0002740197232924402, 0.0002797302440740168, 0.0002854407939594239, 0.00029115131474100053, 0.00029686183552257717, 0.0003025723563041538, 0.00030828287708573043]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 6.0, 6.0, 8.0, 5.0, 15.0, 14.0, 7.0, 15.0, 12.0, 19.0, 18.0, 15.0, 20.0, 17.0, 22.0, 31.0, 38.0, 38.0, 38.0, 29.0, 36.0, 41.0, 24.0, 34.0, 38.0, 28.0, 40.0, 22.0, 54.0, 36.0, 28.0, 32.0, 27.0, 28.0, 28.0, 22.0, 19.0, 14.0, 13.0, 19.0, 13.0, 14.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.190206527709961e-05, -4.0628015995025635e-05, -3.935396671295166e-05, -3.8079917430877686e-05, -3.680586814880371e-05, -3.5531818866729736e-05, -3.425776958465576e-05, -3.298372030258179e-05, -3.170967102050781e-05, -3.0435621738433838e-05, -2.9161572456359863e-05, -2.788752317428589e-05, -2.6613473892211914e-05, -2.533942461013794e-05, -2.4065375328063965e-05, -2.279132604598999e-05, -2.1517276763916016e-05, -2.024322748184204e-05, -1.8969178199768066e-05, -1.7695128917694092e-05, -1.6421079635620117e-05, -1.5147030353546143e-05, -1.3872981071472168e-05, -1.2598931789398193e-05, -1.1324882507324219e-05, -1.0050833225250244e-05, -8.77678394317627e-06, -7.502734661102295e-06, -6.22868537902832e-06, -4.954636096954346e-06, -3.680586814880371e-06, -2.4065375328063965e-06, -1.1324882507324219e-06, 1.4156103134155273e-07, 1.4156103134155273e-06, 2.689659595489502e-06, 3.9637088775634766e-06, 5.237758159637451e-06, 6.511807441711426e-06, 7.7858567237854e-06, 9.059906005859375e-06, 1.033395528793335e-05, 1.1608004570007324e-05, 1.2882053852081299e-05, 1.4156103134155273e-05, 1.5430152416229248e-05, 1.6704201698303223e-05, 1.7978250980377197e-05, 1.9252300262451172e-05, 2.0526349544525146e-05, 2.180039882659912e-05, 2.3074448108673096e-05, 2.434849739074707e-05, 2.5622546672821045e-05, 2.689659595489502e-05, 2.8170645236968994e-05, 2.944469451904297e-05, 3.071874380111694e-05, 3.199279308319092e-05, 3.326684236526489e-05, 3.454089164733887e-05, 3.581494092941284e-05, 3.7088990211486816e-05, 3.836303949356079e-05, 3.9637088775634766e-05]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 6.0, 3.0, 6.0, 7.0, 8.0, 7.0, 11.0, 12.0, 18.0, 16.0, 16.0, 18.0, 25.0, 31.0, 31.0, 30.0, 34.0, 46.0, 35.0, 32.0, 42.0, 40.0, 46.0, 43.0, 30.0, 52.0, 37.0, 31.0, 35.0, 27.0, 25.0, 26.0, 24.0, 20.0, 21.0, 20.0, 13.0, 18.0, 12.0, 13.0, 11.0, 11.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-66.875, -64.7587890625, -62.642578125, -60.5263671875, -58.41015625, -56.2939453125, -54.177734375, -52.0615234375, -49.9453125, -47.8291015625, -45.712890625, -43.5966796875, -41.48046875, -39.3642578125, -37.248046875, -35.1318359375, -33.015625, -30.8994140625, -28.783203125, -26.6669921875, -24.55078125, -22.4345703125, -20.318359375, -18.2021484375, -16.0859375, -13.9697265625, -11.853515625, -9.7373046875, -7.62109375, -5.5048828125, -3.388671875, -1.2724609375, 0.84375, 2.9599609375, 5.076171875, 7.1923828125, 9.30859375, 11.4248046875, 13.541015625, 15.6572265625, 17.7734375, 19.8896484375, 22.005859375, 24.1220703125, 26.23828125, 28.3544921875, 30.470703125, 32.5869140625, 34.703125, 36.8193359375, 38.935546875, 41.0517578125, 43.16796875, 45.2841796875, 47.400390625, 49.5166015625, 51.6328125, 53.7490234375, 55.865234375, 57.9814453125, 60.09765625, 62.2138671875, 64.330078125, 66.4462890625, 68.5625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 10.0, 13.0, 20.0, 25.0, 35.0, 47.0, 73.0, 91.0, 147.0, 193.0, 270.0, 376.0, 540.0, 718.0, 1038.0, 1485.0, 2048.0, 3003.0, 4672.0, 6930.0, 11527.0, 19534.0, 39042.0, 137256.0, 628873.0, 106528.0, 34832.0, 17935.0, 10702.0, 6611.0, 4285.0, 2929.0, 1969.0, 1386.0, 955.0, 706.0, 485.0, 360.0, 248.0, 200.0, 138.0, 85.0, 61.0, 53.0, 32.0, 31.0, 15.0, 17.0, 8.0, 6.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-101.3125, -98.0888671875, -94.865234375, -91.6416015625, -88.41796875, -85.1943359375, -81.970703125, -78.7470703125, -75.5234375, -72.2998046875, -69.076171875, -65.8525390625, -62.62890625, -59.4052734375, -56.181640625, -52.9580078125, -49.734375, -46.5107421875, -43.287109375, -40.0634765625, -36.83984375, -33.6162109375, -30.392578125, -27.1689453125, -23.9453125, -20.7216796875, -17.498046875, -14.2744140625, -11.05078125, -7.8271484375, -4.603515625, -1.3798828125, 1.84375, 5.0673828125, 8.291015625, 11.5146484375, 14.73828125, 17.9619140625, 21.185546875, 24.4091796875, 27.6328125, 30.8564453125, 34.080078125, 37.3037109375, 40.52734375, 43.7509765625, 46.974609375, 50.1982421875, 53.421875, 56.6455078125, 59.869140625, 63.0927734375, 66.31640625, 69.5400390625, 72.763671875, 75.9873046875, 79.2109375, 82.4345703125, 85.658203125, 88.8818359375, 92.10546875, 95.3291015625, 98.552734375, 101.7763671875, 105.0]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 15.0, 17.0, 15.0, 14.0, 11.0, 28.0, 17.0, 27.0, 42.0, 45.0, 47.0, 56.0, 66.0, 94.0, 195.0, 1708.0, 213.0, 69.0, 57.0, 38.0, 37.0, 31.0, 48.0, 27.0, 31.0, 18.0, 24.0, 11.0, 15.0, 9.0, 4.0, 5.0, 5.0, 5.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.125, -158.908203125, -152.69140625, -146.474609375, -140.2578125, -134.041015625, -127.82421875, -121.607421875, -115.390625, -109.173828125, -102.95703125, -96.740234375, -90.5234375, -84.306640625, -78.08984375, -71.873046875, -65.65625, -59.439453125, -53.22265625, -47.005859375, -40.7890625, -34.572265625, -28.35546875, -22.138671875, -15.921875, -9.705078125, -3.48828125, 2.728515625, 8.9453125, 15.162109375, 21.37890625, 27.595703125, 33.8125, 40.029296875, 46.24609375, 52.462890625, 58.6796875, 64.896484375, 71.11328125, 77.330078125, 83.546875, 89.763671875, 95.98046875, 102.197265625, 108.4140625, 114.630859375, 120.84765625, 127.064453125, 133.28125, 139.498046875, 145.71484375, 151.931640625, 158.1484375, 164.365234375, 170.58203125, 176.798828125, 183.015625, 189.232421875, 195.44921875, 201.666015625, 207.8828125, 214.099609375, 220.31640625, 226.533203125, 232.75]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 10.0, 12.0, 5.0, 10.0, 16.0, 22.0, 21.0, 45.0, 38.0, 60.0, 118.0, 252.0, 539.0, 1415.0, 5534.0, 29564.0, 2577258.0, 501921.0, 22089.0, 4455.0, 1238.0, 511.0, 209.0, 115.0, 75.0, 52.0, 44.0, 23.0, 23.0, 2.0, 4.0, 5.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-310.0, -299.640625, -289.28125, -278.921875, -268.5625, -258.203125, -247.84375, -237.484375, -227.125, -216.765625, -206.40625, -196.046875, -185.6875, -175.328125, -164.96875, -154.609375, -144.25, -133.890625, -123.53125, -113.171875, -102.8125, -92.453125, -82.09375, -71.734375, -61.375, -51.015625, -40.65625, -30.296875, -19.9375, -9.578125, 0.78125, 11.140625, 21.5, 31.859375, 42.21875, 52.578125, 62.9375, 73.296875, 83.65625, 94.015625, 104.375, 114.734375, 125.09375, 135.453125, 145.8125, 156.171875, 166.53125, 176.890625, 187.25, 197.609375, 207.96875, 218.328125, 228.6875, 239.046875, 249.40625, 259.765625, 270.125, 280.484375, 290.84375, 301.203125, 311.5625, 321.921875, 332.28125, 342.640625, 353.0]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 33.0, 185.0, 486.0, 243.0, 53.0, 11.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-704.7377319335938, -670.683837890625, -636.6298828125, -602.5759887695312, -568.5220947265625, -534.4682006835938, -500.4142761230469, -466.3603515625, -432.30645751953125, -398.2525634765625, -364.1986389160156, -330.14471435546875, -296.0908203125, -262.03692626953125, -227.98300170898438, -193.92909240722656, -159.87518310546875, -125.82127380371094, -91.76736450195312, -57.71345520019531, -23.6595458984375, 10.394363403320312, 44.448272705078125, 78.50218200683594, 112.55609130859375, 146.61000061035156, 180.66390991210938, 214.7178192138672, 248.771728515625, 282.82562255859375, 316.8795471191406, 350.9334716796875, 384.9874267578125, 419.04132080078125, 453.0952453613281, 487.149169921875, 521.2030639648438, 555.2569580078125, 589.3109130859375, 623.3648071289062, 657.418701171875, 691.4725952148438, 725.5264892578125, 759.5804443359375, 793.6343383789062, 827.688232421875, 861.7421875, 895.7960815429688, 929.8499755859375, 963.9038696289062, 997.957763671875, 1032.01171875, 1066.065673828125, 1100.1195068359375, 1134.1734619140625, 1168.227294921875, 1202.28125, 1236.335205078125, 1270.3890380859375, 1304.4429931640625, 1338.496826171875, 1372.55078125, 1406.604736328125, 1440.6585693359375, 1474.7125244140625]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 10.0, 3.0, 12.0, 8.0, 17.0, 11.0, 16.0, 20.0, 14.0, 26.0, 21.0, 24.0, 29.0, 30.0, 34.0, 38.0, 51.0, 42.0, 34.0, 45.0, 43.0, 35.0, 45.0, 41.0, 30.0, 29.0, 31.0, 35.0, 30.0, 40.0, 28.0, 20.0, 21.0, 20.0, 10.0, 12.0, 9.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-327.2459411621094, -316.4234313964844, -305.60089111328125, -294.77838134765625, -283.95587158203125, -273.13336181640625, -262.31085205078125, -251.48831176757812, -240.66580200195312, -229.84329223632812, -219.02076721191406, -208.1982421875, -197.375732421875, -186.55322265625, -175.73069763183594, -164.90817260742188, -154.08566284179688, -143.26315307617188, -132.4406280517578, -121.61811065673828, -110.79559326171875, -99.97307586669922, -89.15055847167969, -78.32804107666016, -67.50552368164062, -56.683006286621094, -45.86048889160156, -35.03797149658203, -24.2154541015625, -13.392936706542969, -2.5704193115234375, 8.252098083496094, 19.074615478515625, 29.897132873535156, 40.71965026855469, 51.54216766357422, 62.36468505859375, 73.18720245361328, 84.00971984863281, 94.83223724365234, 105.65475463867188, 116.4772720336914, 127.29978942871094, 138.122314453125, 148.94482421875, 159.767333984375, 170.58985900878906, 181.41238403320312, 192.23489379882812, 203.05740356445312, 213.8799285888672, 224.70245361328125, 235.52496337890625, 246.34747314453125, 257.16998291015625, 267.9925231933594, 278.8150329589844, 289.6375427246094, 300.4600830078125, 311.2825927734375, 322.1051025390625, 332.9276123046875, 343.7501220703125, 354.5726623535156, 365.3951721191406]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 1.0, 2.0, 8.0, 9.0, 2.0, 9.0, 10.0, 14.0, 15.0, 16.0, 16.0, 23.0, 22.0, 28.0, 33.0, 33.0, 41.0, 35.0, 35.0, 41.0, 43.0, 41.0, 38.0, 47.0, 55.0, 35.0, 23.0, 36.0, 30.0, 32.0, 33.0, 22.0, 23.0, 17.0, 24.0, 21.0, 16.0, 13.0, 13.0, 13.0, 7.0, 7.0, 3.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-67.8125, -65.6669921875, -63.521484375, -61.3759765625, -59.23046875, -57.0849609375, -54.939453125, -52.7939453125, -50.6484375, -48.5029296875, -46.357421875, -44.2119140625, -42.06640625, -39.9208984375, -37.775390625, -35.6298828125, -33.484375, -31.3388671875, -29.193359375, -27.0478515625, -24.90234375, -22.7568359375, -20.611328125, -18.4658203125, -16.3203125, -14.1748046875, -12.029296875, -9.8837890625, -7.73828125, -5.5927734375, -3.447265625, -1.3017578125, 0.84375, 2.9892578125, 5.134765625, 7.2802734375, 9.42578125, 11.5712890625, 13.716796875, 15.8623046875, 18.0078125, 20.1533203125, 22.298828125, 24.4443359375, 26.58984375, 28.7353515625, 30.880859375, 33.0263671875, 35.171875, 37.3173828125, 39.462890625, 41.6083984375, 43.75390625, 45.8994140625, 48.044921875, 50.1904296875, 52.3359375, 54.4814453125, 56.626953125, 58.7724609375, 60.91796875, 63.0634765625, 65.208984375, 67.3544921875, 69.5]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 10.0, 12.0, 5.0, 19.0, 17.0, 19.0, 20.0, 31.0, 35.0, 45.0, 69.0, 79.0, 125.0, 220.0, 413.0, 804.0, 1964.0, 5959.0, 30710.0, 4016625.0, 120930.0, 10551.0, 3045.0, 1181.0, 535.0, 259.0, 177.0, 95.0, 61.0, 55.0, 46.0, 27.0, 28.0, 9.0, 19.0, 17.0, 13.0, 15.0, 7.0, 7.0, 7.0, 7.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-590.0, -571.390625, -552.78125, -534.171875, -515.5625, -496.953125, -478.34375, -459.734375, -441.125, -422.515625, -403.90625, -385.296875, -366.6875, -348.078125, -329.46875, -310.859375, -292.25, -273.640625, -255.03125, -236.421875, -217.8125, -199.203125, -180.59375, -161.984375, -143.375, -124.765625, -106.15625, -87.546875, -68.9375, -50.328125, -31.71875, -13.109375, 5.5, 24.109375, 42.71875, 61.328125, 79.9375, 98.546875, 117.15625, 135.765625, 154.375, 172.984375, 191.59375, 210.203125, 228.8125, 247.421875, 266.03125, 284.640625, 303.25, 321.859375, 340.46875, 359.078125, 377.6875, 396.296875, 414.90625, 433.515625, 452.125, 470.734375, 489.34375, 507.953125, 526.5625, 545.171875, 563.78125, 582.390625, 601.0]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 2.0, 4.0, 9.0, 9.0, 15.0, 19.0, 13.0, 27.0, 17.0, 36.0, 39.0, 66.0, 132.0, 274.0, 820.0, 1318.0, 617.0, 247.0, 108.0, 83.0, 48.0, 41.0, 21.0, 18.0, 21.0, 15.0, 11.0, 5.0, 6.0, 4.0, 6.0, 4.0, 3.0, 0.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.25, -118.904296875, -114.55859375, -110.212890625, -105.8671875, -101.521484375, -97.17578125, -92.830078125, -88.484375, -84.138671875, -79.79296875, -75.447265625, -71.1015625, -66.755859375, -62.41015625, -58.064453125, -53.71875, -49.373046875, -45.02734375, -40.681640625, -36.3359375, -31.990234375, -27.64453125, -23.298828125, -18.953125, -14.607421875, -10.26171875, -5.916015625, -1.5703125, 2.775390625, 7.12109375, 11.466796875, 15.8125, 20.158203125, 24.50390625, 28.849609375, 33.1953125, 37.541015625, 41.88671875, 46.232421875, 50.578125, 54.923828125, 59.26953125, 63.615234375, 67.9609375, 72.306640625, 76.65234375, 80.998046875, 85.34375, 89.689453125, 94.03515625, 98.380859375, 102.7265625, 107.072265625, 111.41796875, 115.763671875, 120.109375, 124.455078125, 128.80078125, 133.146484375, 137.4921875, 141.837890625, 146.18359375, 150.529296875, 154.875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 3.0, 16.0, 13.0, 22.0, 35.0, 47.0, 114.0, 163.0, 314.0, 685.0, 1462.0, 3394.0, 8928.0, 27804.0, 142512.0, 3791198.0, 170852.0, 30358.0, 9591.0, 3727.0, 1541.0, 707.0, 375.0, 178.0, 87.0, 60.0, 26.0, 23.0, 12.0, 8.0, 10.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.0, -261.34765625, -250.6953125, -240.04296875, -229.390625, -218.73828125, -208.0859375, -197.43359375, -186.78125, -176.12890625, -165.4765625, -154.82421875, -144.171875, -133.51953125, -122.8671875, -112.21484375, -101.5625, -90.91015625, -80.2578125, -69.60546875, -58.953125, -48.30078125, -37.6484375, -26.99609375, -16.34375, -5.69140625, 4.9609375, 15.61328125, 26.265625, 36.91796875, 47.5703125, 58.22265625, 68.875, 79.52734375, 90.1796875, 100.83203125, 111.484375, 122.13671875, 132.7890625, 143.44140625, 154.09375, 164.74609375, 175.3984375, 186.05078125, 196.703125, 207.35546875, 218.0078125, 228.66015625, 239.3125, 249.96484375, 260.6171875, 271.26953125, 281.921875, 292.57421875, 303.2265625, 313.87890625, 324.53125, 335.18359375, 345.8359375, 356.48828125, 367.140625, 377.79296875, 388.4453125, 399.09765625, 409.75]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 17.0, 49.0, 69.0, 222.0, 367.0, 185.0, 59.0, 20.0, 14.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2131.30419921875, -2089.8017578125, -2048.29931640625, -2006.796875, -1965.29443359375, -1923.7919921875, -1882.28955078125, -1840.787109375, -1799.28466796875, -1757.7822265625, -1716.27978515625, -1674.77734375, -1633.27490234375, -1591.7724609375, -1550.27001953125, -1508.767578125, -1467.2650146484375, -1425.7625732421875, -1384.2601318359375, -1342.7576904296875, -1301.2552490234375, -1259.7528076171875, -1218.2503662109375, -1176.747802734375, -1135.245361328125, -1093.742919921875, -1052.240478515625, -1010.738037109375, -969.235595703125, -927.733154296875, -886.2306518554688, -844.7282104492188, -803.225830078125, -761.723388671875, -720.220947265625, -678.718505859375, -637.216064453125, -595.713623046875, -554.2111206054688, -512.7086791992188, -471.20623779296875, -429.70379638671875, -388.20135498046875, -346.6988830566406, -305.1964416503906, -263.6940002441406, -222.19154357910156, -180.6890869140625, -139.1866455078125, -97.68419647216797, -56.18174743652344, -14.679298400878906, 26.823150634765625, 68.32559204101562, 109.82804870605469, 151.33050537109375, 192.83294677734375, 234.33538818359375, 275.83782958984375, 317.3403015136719, 358.8427429199219, 400.3451843261719, 441.84765625, 483.35009765625, 524.8525390625]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 9.0, 4.0, 5.0, 4.0, 8.0, 10.0, 15.0, 20.0, 18.0, 12.0, 29.0, 23.0, 38.0, 36.0, 30.0, 35.0, 36.0, 35.0, 47.0, 38.0, 45.0, 40.0, 48.0, 38.0, 43.0, 42.0, 37.0, 31.0, 29.0, 26.0, 25.0, 25.0, 15.0, 15.0, 19.0, 11.0, 11.0, 6.0, 9.0, 8.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-319.42138671875, -308.74334716796875, -298.0653076171875, -287.38726806640625, -276.709228515625, -266.03118896484375, -255.3531494140625, -244.67510986328125, -233.9970703125, -223.31903076171875, -212.6409912109375, -201.96295166015625, -191.284912109375, -180.60687255859375, -169.9288330078125, -159.25079345703125, -148.57273864746094, -137.8946990966797, -127.21665954589844, -116.53861999511719, -105.86058044433594, -95.18254089355469, -84.5044937133789, -73.82645416259766, -63.148414611816406, -52.470375061035156, -41.792335510253906, -31.11429214477539, -20.43625259399414, -9.75821304321289, 0.919830322265625, 11.597869873046875, 22.275909423828125, 32.953948974609375, 43.631988525390625, 54.31003189086914, 64.98806762695312, 75.66610717773438, 86.34415435791016, 97.0221939086914, 107.70023345947266, 118.3782730102539, 129.0563201904297, 139.73435974121094, 150.4123992919922, 161.09043884277344, 171.7684783935547, 182.44651794433594, 193.1245574951172, 203.80259704589844, 214.4806365966797, 225.15867614746094, 235.8367156982422, 246.51475524902344, 257.19281005859375, 267.870849609375, 278.54888916015625, 289.2269287109375, 299.90496826171875, 310.5830078125, 321.26104736328125, 331.9390869140625, 342.61712646484375, 353.295166015625, 363.97320556640625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 7.0, 10.0, 9.0, 4.0, 10.0, 5.0, 10.0, 15.0, 23.0, 30.0, 18.0, 33.0, 30.0, 30.0, 35.0, 36.0, 31.0, 38.0, 50.0, 29.0, 44.0, 30.0, 53.0, 37.0, 43.0, 39.0, 44.0, 22.0, 31.0, 32.0, 19.0, 25.0, 22.0, 12.0, 20.0, 7.0, 15.0, 13.0, 7.0, 10.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-71.125, -68.962890625, -66.80078125, -64.638671875, -62.4765625, -60.314453125, -58.15234375, -55.990234375, -53.828125, -51.666015625, -49.50390625, -47.341796875, -45.1796875, -43.017578125, -40.85546875, -38.693359375, -36.53125, -34.369140625, -32.20703125, -30.044921875, -27.8828125, -25.720703125, -23.55859375, -21.396484375, -19.234375, -17.072265625, -14.91015625, -12.748046875, -10.5859375, -8.423828125, -6.26171875, -4.099609375, -1.9375, 0.224609375, 2.38671875, 4.548828125, 6.7109375, 8.873046875, 11.03515625, 13.197265625, 15.359375, 17.521484375, 19.68359375, 21.845703125, 24.0078125, 26.169921875, 28.33203125, 30.494140625, 32.65625, 34.818359375, 36.98046875, 39.142578125, 41.3046875, 43.466796875, 45.62890625, 47.791015625, 49.953125, 52.115234375, 54.27734375, 56.439453125, 58.6015625, 60.763671875, 62.92578125, 65.087890625, 67.25]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 5.0, 7.0, 13.0, 18.0, 24.0, 28.0, 45.0, 70.0, 92.0, 140.0, 196.0, 304.0, 376.0, 548.0, 789.0, 1071.0, 1568.0, 2209.0, 3186.0, 4395.0, 6736.0, 9806.0, 14510.0, 22297.0, 34660.0, 55823.0, 96733.0, 211033.0, 291966.0, 112775.0, 63265.0, 38687.0, 24404.0, 16158.0, 10694.0, 7353.0, 5035.0, 3447.0, 2330.0, 1706.0, 1232.0, 864.0, 543.0, 427.0, 273.0, 198.0, 188.0, 99.0, 65.0, 59.0, 41.0, 18.0, 9.0, 15.0, 13.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.517578125, -2.436676025390625, -2.35577392578125, -2.274871826171875, -2.1939697265625, -2.113067626953125, -2.03216552734375, -1.951263427734375, -1.870361328125, -1.789459228515625, -1.70855712890625, -1.627655029296875, -1.5467529296875, -1.465850830078125, -1.38494873046875, -1.304046630859375, -1.22314453125, -1.142242431640625, -1.06134033203125, -0.980438232421875, -0.8995361328125, -0.818634033203125, -0.73773193359375, -0.656829833984375, -0.575927734375, -0.495025634765625, -0.41412353515625, -0.333221435546875, -0.2523193359375, -0.171417236328125, -0.09051513671875, -0.009613037109375, 0.0712890625, 0.152191162109375, 0.23309326171875, 0.313995361328125, 0.3948974609375, 0.475799560546875, 0.55670166015625, 0.637603759765625, 0.718505859375, 0.799407958984375, 0.88031005859375, 0.961212158203125, 1.0421142578125, 1.123016357421875, 1.20391845703125, 1.284820556640625, 1.36572265625, 1.446624755859375, 1.52752685546875, 1.608428955078125, 1.6893310546875, 1.770233154296875, 1.85113525390625, 1.932037353515625, 2.012939453125, 2.093841552734375, 2.17474365234375, 2.255645751953125, 2.3365478515625, 2.417449951171875, 2.49835205078125, 2.579254150390625, 2.66015625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 4.0, 5.0, 12.0, 6.0, 7.0, 19.0, 15.0, 13.0, 15.0, 21.0, 21.0, 37.0, 36.0, 35.0, 31.0, 39.0, 48.0, 46.0, 51.0, 34.0, 1066.0, 39.0, 37.0, 41.0, 30.0, 29.0, 31.0, 31.0, 28.0, 32.0, 27.0, 21.0, 17.0, 20.0, 10.0, 12.0, 9.0, 9.0, 9.0, 9.0, 6.0, 6.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-46.9375, -45.49951171875, -44.0615234375, -42.62353515625, -41.185546875, -39.74755859375, -38.3095703125, -36.87158203125, -35.43359375, -33.99560546875, -32.5576171875, -31.11962890625, -29.681640625, -28.24365234375, -26.8056640625, -25.36767578125, -23.9296875, -22.49169921875, -21.0537109375, -19.61572265625, -18.177734375, -16.73974609375, -15.3017578125, -13.86376953125, -12.42578125, -10.98779296875, -9.5498046875, -8.11181640625, -6.673828125, -5.23583984375, -3.7978515625, -2.35986328125, -0.921875, 0.51611328125, 1.9541015625, 3.39208984375, 4.830078125, 6.26806640625, 7.7060546875, 9.14404296875, 10.58203125, 12.02001953125, 13.4580078125, 14.89599609375, 16.333984375, 17.77197265625, 19.2099609375, 20.64794921875, 22.0859375, 23.52392578125, 24.9619140625, 26.39990234375, 27.837890625, 29.27587890625, 30.7138671875, 32.15185546875, 33.58984375, 35.02783203125, 36.4658203125, 37.90380859375, 39.341796875, 40.77978515625, 42.2177734375, 43.65576171875, 45.09375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 4.0, 8.0, 11.0, 11.0, 10.0, 28.0, 35.0, 57.0, 79.0, 85.0, 144.0, 208.0, 317.0, 377.0, 609.0, 832.0, 1128.0, 1770.0, 2576.0, 3761.0, 5483.0, 8023.0, 11941.0, 18491.0, 28416.0, 44506.0, 72216.0, 130092.0, 1359963.0, 168103.0, 87721.0, 52414.0, 33221.0, 21463.0, 13834.0, 9282.0, 6213.0, 4262.0, 2927.0, 1918.0, 1421.0, 930.0, 682.0, 486.0, 302.0, 223.0, 171.0, 119.0, 84.0, 63.0, 26.0, 22.0, 24.0, 16.0, 14.0, 8.0, 2.0, 3.0, 3.0, 3.0, 2.0], "bins": [-1.8828125, -1.8233642578125, -1.763916015625, -1.7044677734375, -1.64501953125, -1.5855712890625, -1.526123046875, -1.4666748046875, -1.4072265625, -1.3477783203125, -1.288330078125, -1.2288818359375, -1.16943359375, -1.1099853515625, -1.050537109375, -0.9910888671875, -0.931640625, -0.8721923828125, -0.812744140625, -0.7532958984375, -0.69384765625, -0.6343994140625, -0.574951171875, -0.5155029296875, -0.4560546875, -0.3966064453125, -0.337158203125, -0.2777099609375, -0.21826171875, -0.1588134765625, -0.099365234375, -0.0399169921875, 0.01953125, 0.0789794921875, 0.138427734375, 0.1978759765625, 0.25732421875, 0.3167724609375, 0.376220703125, 0.4356689453125, 0.4951171875, 0.5545654296875, 0.614013671875, 0.6734619140625, 0.73291015625, 0.7923583984375, 0.851806640625, 0.9112548828125, 0.970703125, 1.0301513671875, 1.089599609375, 1.1490478515625, 1.20849609375, 1.2679443359375, 1.327392578125, 1.3868408203125, 1.4462890625, 1.5057373046875, 1.565185546875, 1.6246337890625, 1.68408203125, 1.7435302734375, 1.802978515625, 1.8624267578125, 1.921875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 7.0, 5.0, 10.0, 8.0, 8.0, 18.0, 9.0, 17.0, 19.0, 26.0, 33.0, 41.0, 55.0, 77.0, 98.0, 128.0, 98.0, 69.0, 45.0, 42.0, 28.0, 36.0, 15.0, 12.0, 15.0, 10.0, 8.0, 13.0, 8.0, 4.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.679794311523438e-05, -9.380653500556946e-05, -9.081512689590454e-05, -8.782371878623962e-05, -8.483231067657471e-05, -8.184090256690979e-05, -7.884949445724487e-05, -7.585808634757996e-05, -7.286667823791504e-05, -6.987527012825012e-05, -6.68838620185852e-05, -6.389245390892029e-05, -6.090104579925537e-05, -5.7909637689590454e-05, -5.491822957992554e-05, -5.192682147026062e-05, -4.89354133605957e-05, -4.5944005250930786e-05, -4.295259714126587e-05, -3.996118903160095e-05, -3.6969780921936035e-05, -3.397837281227112e-05, -3.09869647026062e-05, -2.7995556592941284e-05, -2.5004148483276367e-05, -2.201274037361145e-05, -1.9021332263946533e-05, -1.6029924154281616e-05, -1.30385160446167e-05, -1.0047107934951782e-05, -7.055699825286865e-06, -4.064291715621948e-06, -1.0728836059570312e-06, 1.9185245037078857e-06, 4.909932613372803e-06, 7.90134072303772e-06, 1.0892748832702637e-05, 1.3884156942367554e-05, 1.687556505203247e-05, 1.9866973161697388e-05, 2.2858381271362305e-05, 2.584978938102722e-05, 2.884119749069214e-05, 3.1832605600357056e-05, 3.482401371002197e-05, 3.781542181968689e-05, 4.080682992935181e-05, 4.3798238039016724e-05, 4.678964614868164e-05, 4.978105425834656e-05, 5.2772462368011475e-05, 5.576387047767639e-05, 5.875527858734131e-05, 6.174668669700623e-05, 6.473809480667114e-05, 6.772950291633606e-05, 7.072091102600098e-05, 7.37123191356659e-05, 7.670372724533081e-05, 7.969513535499573e-05, 8.268654346466064e-05, 8.567795157432556e-05, 8.866935968399048e-05, 9.16607677936554e-05, 9.465217590332031e-05]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 8.0, 9.0, 19.0, 16.0, 15.0, 20.0, 25.0, 28.0, 40.0, 54.0, 66.0, 142.0, 220.0, 456.0, 2275.0, 27441.0, 943688.0, 68616.0, 3986.0, 648.0, 235.0, 139.0, 90.0, 52.0, 44.0, 43.0, 25.0, 24.0, 18.0, 12.0, 15.0, 13.0, 12.0, 2.0, 5.0, 6.0, 4.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0015115737915039062, -0.0014637857675552368, -0.0014159977436065674, -0.001368209719657898, -0.0013204216957092285, -0.001272633671760559, -0.0012248456478118896, -0.0011770576238632202, -0.0011292695999145508, -0.0010814815759658813, -0.001033693552017212, -0.0009859055280685425, -0.000938117504119873, -0.0008903294801712036, -0.0008425414562225342, -0.0007947534322738647, -0.0007469654083251953, -0.0006991773843765259, -0.0006513893604278564, -0.000603601336479187, -0.0005558133125305176, -0.0005080252885818481, -0.0004602372646331787, -0.0004124492406845093, -0.00036466121673583984, -0.0003168731927871704, -0.000269085168838501, -0.00022129714488983154, -0.0001735091209411621, -0.00012572109699249268, -7.793307304382324e-05, -3.014504909515381e-05, 1.7642974853515625e-05, 6.543099880218506e-05, 0.00011321902275085449, 0.00016100704669952393, 0.00020879507064819336, 0.0002565830945968628, 0.0003043711185455322, 0.00035215914249420166, 0.0003999471664428711, 0.00044773519039154053, 0.00049552321434021, 0.0005433112382888794, 0.0005910992622375488, 0.0006388872861862183, 0.0006866753101348877, 0.0007344633340835571, 0.0007822513580322266, 0.000830039381980896, 0.0008778274059295654, 0.0009256154298782349, 0.0009734034538269043, 0.0010211914777755737, 0.0010689795017242432, 0.0011167675256729126, 0.001164555549621582, 0.0012123435735702515, 0.001260131597518921, 0.0013079196214675903, 0.0013557076454162598, 0.0014034956693649292, 0.0014512836933135986, 0.001499071717262268, 0.0015468597412109375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 13.0, 29.0, 39.0, 59.0, 116.0, 253.0, 249.0, 124.0, 59.0, 25.0, 18.0, 12.0, 9.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00020603692973963916, -0.00020183276501484215, -0.00019762858573812991, -0.0001934244210133329, -0.00018922024173662066, -0.00018501607701182365, -0.00018081189773511142, -0.0001766077330103144, -0.00017240355373360217, -0.00016819938900880516, -0.00016399520973209292, -0.0001597910450072959, -0.00015558686573058367, -0.00015138270100578666, -0.00014717852172907442, -0.0001429743570042774, -0.00013877017772756517, -0.00013456601300276816, -0.00013036183372605592, -0.0001261576690012589, -0.00012195348972454667, -0.00011774931772379205, -0.00011354514572303742, -0.00010934098099824041, -0.0001051368162734434, -0.00010093264427268878, -9.672847227193415e-05, -9.252430027117953e-05, -8.83201282704249e-05, -8.411595626967028e-05, -7.991178426891565e-05, -7.570761954411864e-05, -7.150344754336402e-05, -6.72992755426094e-05, -6.309510354185477e-05, -5.8890931541100144e-05, -5.468675954034552e-05, -5.0482587539590895e-05, -4.627841917681508e-05, -4.207424717606045e-05, -3.787007517530583e-05, -3.3665903174551204e-05, -2.946173117379658e-05, -2.5257560992031358e-05, -2.1053388991276734e-05, -1.684921699052211e-05, -1.2645046808756888e-05, -8.440874808002263e-06, -4.236702807247639e-06, -3.2531261240364984e-08, 4.171640284766909e-06, 8.375811376026832e-06, 1.2579983376781456e-05, 1.678415537753608e-05, 2.0988325559301302e-05, 2.5192497560055926e-05, 2.939666956081055e-05, 3.3600841561565176e-05, 3.78050135623198e-05, 4.200918192509562e-05, 4.621335392585024e-05, 5.041752592660487e-05, 5.462169792735949e-05, 5.8825869928114116e-05, 6.303004192886874e-05]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 9.0, 3.0, 5.0, 6.0, 7.0, 8.0, 7.0, 15.0, 11.0, 17.0, 23.0, 26.0, 22.0, 21.0, 35.0, 26.0, 30.0, 44.0, 32.0, 43.0, 30.0, 41.0, 34.0, 41.0, 35.0, 40.0, 29.0, 37.0, 46.0, 32.0, 29.0, 22.0, 29.0, 28.0, 23.0, 16.0, 17.0, 18.0, 11.0, 11.0, 8.0, 9.0, 9.0, 6.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.202127456665039e-05, -4.06680628657341e-05, -3.931485116481781e-05, -3.796163946390152e-05, -3.660842776298523e-05, -3.525521606206894e-05, -3.390200436115265e-05, -3.254879266023636e-05, -3.119558095932007e-05, -2.9842369258403778e-05, -2.8489157557487488e-05, -2.7135945856571198e-05, -2.5782734155654907e-05, -2.4429522454738617e-05, -2.3076310753822327e-05, -2.1723099052906036e-05, -2.0369887351989746e-05, -1.9016675651073456e-05, -1.7663463950157166e-05, -1.6310252249240875e-05, -1.4957040548324585e-05, -1.3603828847408295e-05, -1.2250617146492004e-05, -1.0897405445575714e-05, -9.544193744659424e-06, -8.190982043743134e-06, -6.837770342826843e-06, -5.484558641910553e-06, -4.131346940994263e-06, -2.7781352400779724e-06, -1.4249235391616821e-06, -7.171183824539185e-08, 1.2814998626708984e-06, 2.6347115635871887e-06, 3.987923264503479e-06, 5.341134965419769e-06, 6.6943466663360596e-06, 8.04755836725235e-06, 9.40077006816864e-06, 1.075398176908493e-05, 1.210719347000122e-05, 1.3460405170917511e-05, 1.4813616871833801e-05, 1.616682857275009e-05, 1.7520040273666382e-05, 1.8873251974582672e-05, 2.0226463675498962e-05, 2.1579675376415253e-05, 2.2932887077331543e-05, 2.4286098778247833e-05, 2.5639310479164124e-05, 2.6992522180080414e-05, 2.8345733880996704e-05, 2.9698945581912994e-05, 3.1052157282829285e-05, 3.2405368983745575e-05, 3.3758580684661865e-05, 3.5111792385578156e-05, 3.6465004086494446e-05, 3.7818215787410736e-05, 3.9171427488327026e-05, 4.052463918924332e-05, 4.187785089015961e-05, 4.32310625910759e-05, 4.458427429199219e-05]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 7.0, 10.0, 9.0, 4.0, 10.0, 5.0, 10.0, 15.0, 23.0, 30.0, 18.0, 33.0, 30.0, 30.0, 35.0, 36.0, 31.0, 38.0, 50.0, 29.0, 44.0, 30.0, 53.0, 37.0, 43.0, 39.0, 44.0, 22.0, 31.0, 32.0, 19.0, 25.0, 22.0, 12.0, 20.0, 7.0, 15.0, 13.0, 7.0, 10.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-71.125, -68.962890625, -66.80078125, -64.638671875, -62.4765625, -60.314453125, -58.15234375, -55.990234375, -53.828125, -51.666015625, -49.50390625, -47.341796875, -45.1796875, -43.017578125, -40.85546875, -38.693359375, -36.53125, -34.369140625, -32.20703125, -30.044921875, -27.8828125, -25.720703125, -23.55859375, -21.396484375, -19.234375, -17.072265625, -14.91015625, -12.748046875, -10.5859375, -8.423828125, -6.26171875, -4.099609375, -1.9375, 0.224609375, 2.38671875, 4.548828125, 6.7109375, 8.873046875, 11.03515625, 13.197265625, 15.359375, 17.521484375, 19.68359375, 21.845703125, 24.0078125, 26.169921875, 28.33203125, 30.494140625, 32.65625, 34.818359375, 36.98046875, 39.142578125, 41.3046875, 43.466796875, 45.62890625, 47.791015625, 49.953125, 52.115234375, 54.27734375, 56.439453125, 58.6015625, 60.763671875, 62.92578125, 65.087890625, 67.25]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 7.0, 9.0, 8.0, 12.0, 20.0, 31.0, 45.0, 70.0, 60.0, 89.0, 120.0, 189.0, 231.0, 298.0, 401.0, 578.0, 789.0, 1198.0, 1670.0, 2524.0, 4132.0, 6749.0, 12457.0, 25729.0, 66023.0, 235868.0, 480805.0, 123767.0, 41666.0, 18003.0, 9303.0, 5341.0, 3282.0, 2044.0, 1462.0, 983.0, 665.0, 508.0, 380.0, 252.0, 231.0, 141.0, 123.0, 80.0, 50.0, 45.0, 36.0, 29.0, 13.0, 16.0, 6.0, 9.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-119.375, -115.67578125, -111.9765625, -108.27734375, -104.578125, -100.87890625, -97.1796875, -93.48046875, -89.78125, -86.08203125, -82.3828125, -78.68359375, -74.984375, -71.28515625, -67.5859375, -63.88671875, -60.1875, -56.48828125, -52.7890625, -49.08984375, -45.390625, -41.69140625, -37.9921875, -34.29296875, -30.59375, -26.89453125, -23.1953125, -19.49609375, -15.796875, -12.09765625, -8.3984375, -4.69921875, -1.0, 2.69921875, 6.3984375, 10.09765625, 13.796875, 17.49609375, 21.1953125, 24.89453125, 28.59375, 32.29296875, 35.9921875, 39.69140625, 43.390625, 47.08984375, 50.7890625, 54.48828125, 58.1875, 61.88671875, 65.5859375, 69.28515625, 72.984375, 76.68359375, 80.3828125, 84.08203125, 87.78125, 91.48046875, 95.1796875, 98.87890625, 102.578125, 106.27734375, 109.9765625, 113.67578125, 117.375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 4.0, 7.0, 14.0, 13.0, 14.0, 21.0, 30.0, 33.0, 32.0, 52.0, 42.0, 50.0, 79.0, 132.0, 446.0, 1505.0, 166.0, 81.0, 56.0, 55.0, 46.0, 32.0, 31.0, 18.0, 21.0, 13.0, 16.0, 7.0, 8.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.75, -192.3515625, -185.953125, -179.5546875, -173.15625, -166.7578125, -160.359375, -153.9609375, -147.5625, -141.1640625, -134.765625, -128.3671875, -121.96875, -115.5703125, -109.171875, -102.7734375, -96.375, -89.9765625, -83.578125, -77.1796875, -70.78125, -64.3828125, -57.984375, -51.5859375, -45.1875, -38.7890625, -32.390625, -25.9921875, -19.59375, -13.1953125, -6.796875, -0.3984375, 6.0, 12.3984375, 18.796875, 25.1953125, 31.59375, 37.9921875, 44.390625, 50.7890625, 57.1875, 63.5859375, 69.984375, 76.3828125, 82.78125, 89.1796875, 95.578125, 101.9765625, 108.375, 114.7734375, 121.171875, 127.5703125, 133.96875, 140.3671875, 146.765625, 153.1640625, 159.5625, 165.9609375, 172.359375, 178.7578125, 185.15625, 191.5546875, 197.953125, 204.3515625, 210.75]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 6.0, 10.0, 12.0, 8.0, 18.0, 35.0, 41.0, 56.0, 97.0, 192.0, 583.0, 4001.0, 3062483.0, 75944.0, 1434.0, 356.0, 153.0, 76.0, 48.0, 37.0, 27.0, 25.0, 16.0, 14.0, 8.0, 8.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-767.0, -741.2578125, -715.515625, -689.7734375, -664.03125, -638.2890625, -612.546875, -586.8046875, -561.0625, -535.3203125, -509.578125, -483.8359375, -458.09375, -432.3515625, -406.609375, -380.8671875, -355.125, -329.3828125, -303.640625, -277.8984375, -252.15625, -226.4140625, -200.671875, -174.9296875, -149.1875, -123.4453125, -97.703125, -71.9609375, -46.21875, -20.4765625, 5.265625, 31.0078125, 56.75, 82.4921875, 108.234375, 133.9765625, 159.71875, 185.4609375, 211.203125, 236.9453125, 262.6875, 288.4296875, 314.171875, 339.9140625, 365.65625, 391.3984375, 417.140625, 442.8828125, 468.625, 494.3671875, 520.109375, 545.8515625, 571.59375, 597.3359375, 623.078125, 648.8203125, 674.5625, 700.3046875, 726.046875, 751.7890625, 777.53125, 803.2734375, 829.015625, 854.7578125, 880.5]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 35.0, 178.0, 397.0, 270.0, 91.0, 24.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-430.9970397949219, -399.5403747558594, -368.0837097167969, -336.6270446777344, -305.1703796386719, -273.7137451171875, -242.25706481933594, -210.80039978027344, -179.34373474121094, -147.88706970214844, -116.43040466308594, -84.97374725341797, -53.51708221435547, -22.0604248046875, 9.396240234375, 40.8529052734375, 72.3095703125, 103.7662353515625, 135.222900390625, 166.6795654296875, 198.13623046875, 229.59288024902344, 261.049560546875, 292.5062255859375, 323.962890625, 355.4195556640625, 386.876220703125, 418.3328857421875, 449.78955078125, 481.2462158203125, 512.702880859375, 544.1595458984375, 575.6161499023438, 607.0728149414062, 638.5294799804688, 669.9861450195312, 701.4428100585938, 732.8994750976562, 764.3561401367188, 795.8128051757812, 827.2694702148438, 858.7261352539062, 890.1828002929688, 921.6394653320312, 953.0961303710938, 984.5527954101562, 1016.0094604492188, 1047.466064453125, 1078.9227294921875, 1110.37939453125, 1141.8360595703125, 1173.292724609375, 1204.7493896484375, 1236.2060546875, 1267.6627197265625, 1299.119384765625, 1330.5760498046875, 1362.03271484375, 1393.4893798828125, 1424.946044921875, 1456.4027099609375, 1487.859375, 1519.3160400390625, 1550.772705078125, 1582.2293701171875]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 10.0, 9.0, 10.0, 15.0, 13.0, 18.0, 25.0, 22.0, 19.0, 18.0, 30.0, 36.0, 29.0, 38.0, 36.0, 37.0, 39.0, 41.0, 39.0, 37.0, 44.0, 41.0, 48.0, 37.0, 37.0, 29.0, 30.0, 27.0, 31.0, 19.0, 16.0, 20.0, 20.0, 16.0, 15.0, 14.0, 2.0, 9.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-372.13116455078125, -359.1233215332031, -346.115478515625, -333.1076354980469, -320.09979248046875, -307.0919494628906, -294.0841064453125, -281.07623291015625, -268.06842041015625, -255.06057739257812, -242.052734375, -229.04489135742188, -216.03704833984375, -203.02920532226562, -190.02134704589844, -177.0135040283203, -164.00564575195312, -150.997802734375, -137.98995971679688, -124.98210906982422, -111.9742660522461, -98.96642303466797, -85.95857238769531, -72.95072937011719, -59.94288635253906, -46.93504333496094, -33.92719650268555, -20.919349670410156, -7.911506652832031, 5.096336364746094, 18.10418701171875, 31.112030029296875, 44.119873046875, 57.127716064453125, 70.13555908203125, 83.1434097290039, 96.15125274658203, 109.15909576416016, 122.16694641113281, 135.17478942871094, 148.18263244628906, 161.1904754638672, 174.1983184814453, 187.2061767578125, 200.21401977539062, 213.22186279296875, 226.22970581054688, 239.237548828125, 252.24539184570312, 265.25323486328125, 278.2610778808594, 291.2689208984375, 304.2767639160156, 317.28460693359375, 330.29248046875, 343.30029296875, 356.30816650390625, 369.3160095214844, 382.3238525390625, 395.3316955566406, 408.33953857421875, 421.3473815917969, 434.355224609375, 447.36309814453125, 460.37091064453125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 10.0, 5.0, 7.0, 8.0, 9.0, 15.0, 19.0, 23.0, 17.0, 25.0, 23.0, 35.0, 31.0, 30.0, 31.0, 43.0, 26.0, 50.0, 37.0, 43.0, 42.0, 39.0, 50.0, 31.0, 40.0, 38.0, 30.0, 29.0, 26.0, 37.0, 12.0, 22.0, 21.0, 15.0, 17.0, 9.0, 6.0, 15.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-65.5, -63.3134765625, -61.126953125, -58.9404296875, -56.75390625, -54.5673828125, -52.380859375, -50.1943359375, -48.0078125, -45.8212890625, -43.634765625, -41.4482421875, -39.26171875, -37.0751953125, -34.888671875, -32.7021484375, -30.515625, -28.3291015625, -26.142578125, -23.9560546875, -21.76953125, -19.5830078125, -17.396484375, -15.2099609375, -13.0234375, -10.8369140625, -8.650390625, -6.4638671875, -4.27734375, -2.0908203125, 0.095703125, 2.2822265625, 4.46875, 6.6552734375, 8.841796875, 11.0283203125, 13.21484375, 15.4013671875, 17.587890625, 19.7744140625, 21.9609375, 24.1474609375, 26.333984375, 28.5205078125, 30.70703125, 32.8935546875, 35.080078125, 37.2666015625, 39.453125, 41.6396484375, 43.826171875, 46.0126953125, 48.19921875, 50.3857421875, 52.572265625, 54.7587890625, 56.9453125, 59.1318359375, 61.318359375, 63.5048828125, 65.69140625, 67.8779296875, 70.064453125, 72.2509765625, 74.4375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 7.0, 8.0, 11.0, 16.0, 23.0, 28.0, 39.0, 52.0, 63.0, 79.0, 131.0, 179.0, 229.0, 350.0, 473.0, 688.0, 1046.0, 1619.0, 2479.0, 4252.0, 7562.0, 15800.0, 49289.0, 419670.0, 2876049.0, 697009.0, 76249.0, 18992.0, 8719.0, 4776.0, 2963.0, 1746.0, 1114.0, 754.0, 535.0, 344.0, 272.0, 170.0, 134.0, 87.0, 84.0, 42.0, 42.0, 37.0, 16.0, 10.0, 20.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-163.375, -158.513671875, -153.65234375, -148.791015625, -143.9296875, -139.068359375, -134.20703125, -129.345703125, -124.484375, -119.623046875, -114.76171875, -109.900390625, -105.0390625, -100.177734375, -95.31640625, -90.455078125, -85.59375, -80.732421875, -75.87109375, -71.009765625, -66.1484375, -61.287109375, -56.42578125, -51.564453125, -46.703125, -41.841796875, -36.98046875, -32.119140625, -27.2578125, -22.396484375, -17.53515625, -12.673828125, -7.8125, -2.951171875, 1.91015625, 6.771484375, 11.6328125, 16.494140625, 21.35546875, 26.216796875, 31.078125, 35.939453125, 40.80078125, 45.662109375, 50.5234375, 55.384765625, 60.24609375, 65.107421875, 69.96875, 74.830078125, 79.69140625, 84.552734375, 89.4140625, 94.275390625, 99.13671875, 103.998046875, 108.859375, 113.720703125, 118.58203125, 123.443359375, 128.3046875, 133.166015625, 138.02734375, 142.888671875, 147.75]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 10.0, 14.0, 9.0, 20.0, 21.0, 29.0, 52.0, 62.0, 82.0, 171.0, 258.0, 529.0, 899.0, 818.0, 424.0, 254.0, 125.0, 73.0, 47.0, 42.0, 39.0, 21.0, 20.0, 15.0, 8.0, 4.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.125, -126.416015625, -121.70703125, -116.998046875, -112.2890625, -107.580078125, -102.87109375, -98.162109375, -93.453125, -88.744140625, -84.03515625, -79.326171875, -74.6171875, -69.908203125, -65.19921875, -60.490234375, -55.78125, -51.072265625, -46.36328125, -41.654296875, -36.9453125, -32.236328125, -27.52734375, -22.818359375, -18.109375, -13.400390625, -8.69140625, -3.982421875, 0.7265625, 5.435546875, 10.14453125, 14.853515625, 19.5625, 24.271484375, 28.98046875, 33.689453125, 38.3984375, 43.107421875, 47.81640625, 52.525390625, 57.234375, 61.943359375, 66.65234375, 71.361328125, 76.0703125, 80.779296875, 85.48828125, 90.197265625, 94.90625, 99.615234375, 104.32421875, 109.033203125, 113.7421875, 118.451171875, 123.16015625, 127.869140625, 132.578125, 137.287109375, 141.99609375, 146.705078125, 151.4140625, 156.123046875, 160.83203125, 165.541015625, 170.25]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 7.0, 3.0, 5.0, 15.0, 15.0, 18.0, 36.0, 60.0, 115.0, 183.0, 330.0, 591.0, 1049.0, 1935.0, 4109.0, 9246.0, 25126.0, 93814.0, 1083417.0, 2784035.0, 135900.0, 32937.0, 11396.0, 4943.0, 2334.0, 1154.0, 626.0, 367.0, 225.0, 109.0, 76.0, 42.0, 25.0, 10.0, 13.0, 9.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-245.875, -239.06640625, -232.2578125, -225.44921875, -218.640625, -211.83203125, -205.0234375, -198.21484375, -191.40625, -184.59765625, -177.7890625, -170.98046875, -164.171875, -157.36328125, -150.5546875, -143.74609375, -136.9375, -130.12890625, -123.3203125, -116.51171875, -109.703125, -102.89453125, -96.0859375, -89.27734375, -82.46875, -75.66015625, -68.8515625, -62.04296875, -55.234375, -48.42578125, -41.6171875, -34.80859375, -28.0, -21.19140625, -14.3828125, -7.57421875, -0.765625, 6.04296875, 12.8515625, 19.66015625, 26.46875, 33.27734375, 40.0859375, 46.89453125, 53.703125, 60.51171875, 67.3203125, 74.12890625, 80.9375, 87.74609375, 94.5546875, 101.36328125, 108.171875, 114.98046875, 121.7890625, 128.59765625, 135.40625, 142.21484375, 149.0234375, 155.83203125, 162.640625, 169.44921875, 176.2578125, 183.06640625, 189.875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 9.0, 29.0, 94.0, 296.0, 381.0, 137.0, 49.0, 9.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1074.2515869140625, -1020.8753051757812, -967.4990234375, -914.1227416992188, -860.7464599609375, -807.3701782226562, -753.993896484375, -700.6176147460938, -647.2413330078125, -593.8650512695312, -540.48876953125, -487.11248779296875, -433.7362060546875, -380.35992431640625, -326.983642578125, -273.60736083984375, -220.2310791015625, -166.85479736328125, -113.478515625, -60.10223388671875, -6.7259521484375, 46.65032958984375, 100.026611328125, 153.40289306640625, 206.7791748046875, 260.15545654296875, 313.53173828125, 366.90802001953125, 420.2843017578125, 473.66058349609375, 527.036865234375, 580.4131469726562, 633.789306640625, 687.1655883789062, 740.5418701171875, 793.9181518554688, 847.29443359375, 900.6707153320312, 954.0469970703125, 1007.4232788085938, 1060.799560546875, 1114.17578125, 1167.5521240234375, 1220.928466796875, 1274.3046875, 1327.680908203125, 1381.0572509765625, 1434.43359375, 1487.809814453125, 1541.18603515625, 1594.5623779296875, 1647.938720703125, 1701.31494140625, 1754.691162109375, 1808.0675048828125, 1861.44384765625, 1914.820068359375, 1968.1962890625, 2021.5726318359375, 2074.948974609375, 2128.3251953125, 2181.701416015625, 2235.07763671875, 2288.4541015625, 2341.830322265625]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 7.0, 7.0, 10.0, 13.0, 15.0, 15.0, 20.0, 23.0, 20.0, 27.0, 36.0, 36.0, 32.0, 46.0, 37.0, 34.0, 48.0, 44.0, 31.0, 35.0, 28.0, 51.0, 31.0, 48.0, 23.0, 32.0, 28.0, 28.0, 21.0, 22.0, 29.0, 19.0, 19.0, 19.0, 11.0, 14.0, 8.0, 10.0, 7.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-393.8462219238281, -381.8681335449219, -369.8900451660156, -357.9119567871094, -345.9338684082031, -333.9557800292969, -321.9776611328125, -309.99957275390625, -298.021484375, -286.04339599609375, -274.0653076171875, -262.08721923828125, -250.109130859375, -238.13104248046875, -226.15293884277344, -214.1748504638672, -202.19677734375, -190.21868896484375, -178.2406005859375, -166.26251220703125, -154.284423828125, -142.30633544921875, -130.32823181152344, -118.35014343261719, -106.37205505371094, -94.39396667480469, -82.41587829589844, -70.43778228759766, -58.459693908691406, -46.481605529785156, -34.503509521484375, -22.525421142578125, -10.54730224609375, 1.4307880401611328, 13.408878326416016, 25.38697052001953, 37.36505889892578, 49.34314727783203, 61.32124328613281, 73.29933166503906, 85.27742004394531, 97.25550842285156, 109.23359680175781, 121.2116928100586, 133.18978881835938, 145.16787719726562, 157.14596557617188, 169.12405395507812, 181.10214233398438, 193.08023071289062, 205.05831909179688, 217.03640747070312, 229.01449584960938, 240.99258422851562, 252.97068786621094, 264.94879150390625, 276.9268798828125, 288.90496826171875, 300.883056640625, 312.86114501953125, 324.8392333984375, 336.81732177734375, 348.79541015625, 360.77349853515625, 372.7515869140625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 3.0, 9.0, 4.0, 4.0, 7.0, 14.0, 12.0, 14.0, 14.0, 23.0, 21.0, 26.0, 26.0, 25.0, 39.0, 35.0, 40.0, 46.0, 39.0, 38.0, 40.0, 40.0, 32.0, 36.0, 42.0, 45.0, 26.0, 34.0, 30.0, 23.0, 26.0, 26.0, 21.0, 25.0, 26.0, 21.0, 20.0, 14.0, 7.0, 5.0, 3.0, 2.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-58.90625, -56.91943359375, -54.9326171875, -52.94580078125, -50.958984375, -48.97216796875, -46.9853515625, -44.99853515625, -43.01171875, -41.02490234375, -39.0380859375, -37.05126953125, -35.064453125, -33.07763671875, -31.0908203125, -29.10400390625, -27.1171875, -25.13037109375, -23.1435546875, -21.15673828125, -19.169921875, -17.18310546875, -15.1962890625, -13.20947265625, -11.22265625, -9.23583984375, -7.2490234375, -5.26220703125, -3.275390625, -1.28857421875, 0.6982421875, 2.68505859375, 4.671875, 6.65869140625, 8.6455078125, 10.63232421875, 12.619140625, 14.60595703125, 16.5927734375, 18.57958984375, 20.56640625, 22.55322265625, 24.5400390625, 26.52685546875, 28.513671875, 30.50048828125, 32.4873046875, 34.47412109375, 36.4609375, 38.44775390625, 40.4345703125, 42.42138671875, 44.408203125, 46.39501953125, 48.3818359375, 50.36865234375, 52.35546875, 54.34228515625, 56.3291015625, 58.31591796875, 60.302734375, 62.28955078125, 64.2763671875, 66.26318359375, 68.25]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 10.0, 13.0, 17.0, 30.0, 29.0, 59.0, 95.0, 158.0, 240.0, 315.0, 435.0, 657.0, 1014.0, 1689.0, 2552.0, 3933.0, 6267.0, 10209.0, 15914.0, 26559.0, 43309.0, 75179.0, 141379.0, 327600.0, 172551.0, 89006.0, 49612.0, 30236.0, 18268.0, 11298.0, 7032.0, 4604.0, 2921.0, 1820.0, 1200.0, 792.0, 530.0, 342.0, 212.0, 165.0, 101.0, 69.0, 43.0, 32.0, 21.0, 14.0, 7.0, 8.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.47265625, -2.38922119140625, -2.3057861328125, -2.22235107421875, -2.138916015625, -2.05548095703125, -1.9720458984375, -1.88861083984375, -1.80517578125, -1.72174072265625, -1.6383056640625, -1.55487060546875, -1.471435546875, -1.38800048828125, -1.3045654296875, -1.22113037109375, -1.1376953125, -1.05426025390625, -0.9708251953125, -0.88739013671875, -0.803955078125, -0.72052001953125, -0.6370849609375, -0.55364990234375, -0.47021484375, -0.38677978515625, -0.3033447265625, -0.21990966796875, -0.136474609375, -0.05303955078125, 0.0303955078125, 0.11383056640625, 0.197265625, 0.28070068359375, 0.3641357421875, 0.44757080078125, 0.531005859375, 0.61444091796875, 0.6978759765625, 0.78131103515625, 0.86474609375, 0.94818115234375, 1.0316162109375, 1.11505126953125, 1.198486328125, 1.28192138671875, 1.3653564453125, 1.44879150390625, 1.5322265625, 1.61566162109375, 1.6990966796875, 1.78253173828125, 1.865966796875, 1.94940185546875, 2.0328369140625, 2.11627197265625, 2.19970703125, 2.28314208984375, 2.3665771484375, 2.45001220703125, 2.533447265625, 2.61688232421875, 2.7003173828125, 2.78375244140625, 2.8671875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 5.0, 4.0, 8.0, 7.0, 4.0, 9.0, 9.0, 9.0, 10.0, 7.0, 13.0, 12.0, 16.0, 26.0, 24.0, 20.0, 18.0, 30.0, 23.0, 35.0, 39.0, 32.0, 42.0, 28.0, 32.0, 1069.0, 39.0, 35.0, 32.0, 30.0, 28.0, 42.0, 21.0, 32.0, 22.0, 26.0, 30.0, 22.0, 17.0, 19.0, 14.0, 16.0, 14.0, 8.0, 5.0, 9.0, 5.0, 8.0, 9.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0], "bins": [-39.46875, -38.33544921875, -37.2021484375, -36.06884765625, -34.935546875, -33.80224609375, -32.6689453125, -31.53564453125, -30.40234375, -29.26904296875, -28.1357421875, -27.00244140625, -25.869140625, -24.73583984375, -23.6025390625, -22.46923828125, -21.3359375, -20.20263671875, -19.0693359375, -17.93603515625, -16.802734375, -15.66943359375, -14.5361328125, -13.40283203125, -12.26953125, -11.13623046875, -10.0029296875, -8.86962890625, -7.736328125, -6.60302734375, -5.4697265625, -4.33642578125, -3.203125, -2.06982421875, -0.9365234375, 0.19677734375, 1.330078125, 2.46337890625, 3.5966796875, 4.72998046875, 5.86328125, 6.99658203125, 8.1298828125, 9.26318359375, 10.396484375, 11.52978515625, 12.6630859375, 13.79638671875, 14.9296875, 16.06298828125, 17.1962890625, 18.32958984375, 19.462890625, 20.59619140625, 21.7294921875, 22.86279296875, 23.99609375, 25.12939453125, 26.2626953125, 27.39599609375, 28.529296875, 29.66259765625, 30.7958984375, 31.92919921875, 33.0625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 8.0, 12.0, 23.0, 29.0, 31.0, 52.0, 81.0, 133.0, 141.0, 192.0, 310.0, 423.0, 565.0, 816.0, 1158.0, 1645.0, 2339.0, 3191.0, 4647.0, 6492.0, 9524.0, 13792.0, 20438.0, 30012.0, 45952.0, 72958.0, 125294.0, 1349061.0, 158306.0, 86607.0, 53484.0, 34469.0, 23165.0, 15602.0, 10725.0, 7358.0, 5286.0, 3743.0, 2666.0, 1915.0, 1330.0, 989.0, 599.0, 460.0, 339.0, 218.0, 154.0, 122.0, 98.0, 58.0, 40.0, 31.0, 22.0, 21.0, 8.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.583984375, -1.533966064453125, -1.48394775390625, -1.433929443359375, -1.3839111328125, -1.333892822265625, -1.28387451171875, -1.233856201171875, -1.183837890625, -1.133819580078125, -1.08380126953125, -1.033782958984375, -0.9837646484375, -0.933746337890625, -0.88372802734375, -0.833709716796875, -0.78369140625, -0.733673095703125, -0.68365478515625, -0.633636474609375, -0.5836181640625, -0.533599853515625, -0.48358154296875, -0.433563232421875, -0.383544921875, -0.333526611328125, -0.28350830078125, -0.233489990234375, -0.1834716796875, -0.133453369140625, -0.08343505859375, -0.033416748046875, 0.0166015625, 0.066619873046875, 0.11663818359375, 0.166656494140625, 0.2166748046875, 0.266693115234375, 0.31671142578125, 0.366729736328125, 0.416748046875, 0.466766357421875, 0.51678466796875, 0.566802978515625, 0.6168212890625, 0.666839599609375, 0.71685791015625, 0.766876220703125, 0.81689453125, 0.866912841796875, 0.91693115234375, 0.966949462890625, 1.0169677734375, 1.066986083984375, 1.11700439453125, 1.167022705078125, 1.217041015625, 1.267059326171875, 1.31707763671875, 1.367095947265625, 1.4171142578125, 1.467132568359375, 1.51715087890625, 1.567169189453125, 1.6171875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 10.0, 4.0, 11.0, 5.0, 15.0, 11.0, 11.0, 26.0, 17.0, 29.0, 29.0, 41.0, 53.0, 63.0, 100.0, 125.0, 100.0, 72.0, 51.0, 50.0, 33.0, 33.0, 18.0, 18.0, 20.0, 10.0, 4.0, 7.0, 7.0, 4.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.655952453613281e-05, -9.328126907348633e-05, -9.000301361083984e-05, -8.672475814819336e-05, -8.344650268554688e-05, -8.016824722290039e-05, -7.68899917602539e-05, -7.361173629760742e-05, -7.033348083496094e-05, -6.705522537231445e-05, -6.377696990966797e-05, -6.0498714447021484e-05, -5.7220458984375e-05, -5.3942203521728516e-05, -5.066394805908203e-05, -4.738569259643555e-05, -4.410743713378906e-05, -4.082918167114258e-05, -3.7550926208496094e-05, -3.427267074584961e-05, -3.0994415283203125e-05, -2.771615982055664e-05, -2.4437904357910156e-05, -2.1159648895263672e-05, -1.7881393432617188e-05, -1.4603137969970703e-05, -1.1324882507324219e-05, -8.046627044677734e-06, -4.76837158203125e-06, -1.4901161193847656e-06, 1.7881393432617188e-06, 5.066394805908203e-06, 8.344650268554688e-06, 1.1622905731201172e-05, 1.4901161193847656e-05, 1.817941665649414e-05, 2.1457672119140625e-05, 2.473592758178711e-05, 2.8014183044433594e-05, 3.129243850708008e-05, 3.457069396972656e-05, 3.784894943237305e-05, 4.112720489501953e-05, 4.4405460357666016e-05, 4.76837158203125e-05, 5.0961971282958984e-05, 5.424022674560547e-05, 5.751848220825195e-05, 6.079673767089844e-05, 6.407499313354492e-05, 6.73532485961914e-05, 7.063150405883789e-05, 7.390975952148438e-05, 7.718801498413086e-05, 8.046627044677734e-05, 8.374452590942383e-05, 8.702278137207031e-05, 9.03010368347168e-05, 9.357929229736328e-05, 9.685754776000977e-05, 0.00010013580322265625, 0.00010341405868530273, 0.00010669231414794922, 0.0001099705696105957, 0.00011324882507324219]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 0.0, 7.0, 3.0, 9.0, 5.0, 9.0, 9.0, 7.0, 15.0, 15.0, 11.0, 24.0, 49.0, 37.0, 57.0, 94.0, 140.0, 242.0, 546.0, 5198.0, 789773.0, 247943.0, 3208.0, 499.0, 216.0, 113.0, 75.0, 50.0, 47.0, 24.0, 29.0, 25.0, 20.0, 18.0, 12.0, 7.0, 10.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.001983642578125, -0.0019268393516540527, -0.0018700361251831055, -0.0018132328987121582, -0.001756429672241211, -0.0016996264457702637, -0.0016428232192993164, -0.0015860199928283691, -0.0015292167663574219, -0.0014724135398864746, -0.0014156103134155273, -0.00135880708694458, -0.0013020038604736328, -0.0012452006340026855, -0.0011883974075317383, -0.001131594181060791, -0.0010747909545898438, -0.0010179877281188965, -0.0009611845016479492, -0.000904381275177002, -0.0008475780487060547, -0.0007907748222351074, -0.0007339715957641602, -0.0006771683692932129, -0.0006203651428222656, -0.0005635619163513184, -0.0005067586898803711, -0.00044995546340942383, -0.00039315223693847656, -0.0003363490104675293, -0.00027954578399658203, -0.00022274255752563477, -0.0001659393310546875, -0.00010913610458374023, -5.233287811279297e-05, 4.470348358154297e-06, 6.127357482910156e-05, 0.00011807680130004883, 0.0001748800277709961, 0.00023168325424194336, 0.0002884864807128906, 0.0003452897071838379, 0.00040209293365478516, 0.0004588961601257324, 0.0005156993865966797, 0.000572502613067627, 0.0006293058395385742, 0.0006861090660095215, 0.0007429122924804688, 0.000799715518951416, 0.0008565187454223633, 0.0009133219718933105, 0.0009701251983642578, 0.001026928424835205, 0.0010837316513061523, 0.0011405348777770996, 0.0011973381042480469, 0.0012541413307189941, 0.0013109445571899414, 0.0013677477836608887, 0.001424551010131836, 0.0014813542366027832, 0.0015381574630737305, 0.0015949606895446777, 0.001651763916015625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 19.0, 32.0, 90.0, 212.0, 318.0, 183.0, 83.0, 41.0, 16.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.824001608649269e-05, -9.366520680487156e-05, -8.909039752325043e-05, -8.45155882416293e-05, -7.994078623596579e-05, -7.536596967838705e-05, -7.079116767272353e-05, -6.62163583911024e-05, -6.164154910948128e-05, -5.706673982786015e-05, -5.249193054623902e-05, -4.79171249025967e-05, -4.334231562097557e-05, -3.876750633935444e-05, -3.419270069571212e-05, -2.961789141409099e-05, -2.5043082132469863e-05, -2.0468272850848734e-05, -1.589346538821701e-05, -1.1318657016090583e-05, -6.7438486439641565e-06, -2.169039362343028e-06, 2.4057681002886966e-06, 6.980575562920421e-06, 1.155538484454155e-05, 1.6130194126162678e-05, 2.0705001588794403e-05, 2.5279809051426128e-05, 2.9854618333047256e-05, 3.4429427614668384e-05, 3.9004233258310705e-05, 4.3579042539931834e-05, 4.815384454559535e-05, 5.2728653827216476e-05, 5.7303463108837605e-05, 6.187827239045873e-05, 6.645308167207986e-05, 7.102788367774338e-05, 7.56026929593645e-05, 8.017750224098563e-05, 8.475231152260676e-05, 8.932712080422789e-05, 9.390193008584902e-05, 9.847673936747015e-05, 0.00010305154137313366, 0.0001076263579307124, 0.00011220115993637592, 0.00011677596921799704, 0.00012135077849961817, 0.0001259255805052817, 0.00013050039706286043, 0.00013507519906852394, 0.00013965001562610269, 0.0001442248176317662, 0.00014879963418934494, 0.00015337443619500846, 0.0001579492527525872, 0.0001625240547582507, 0.00016709887131582946, 0.00017167367332149297, 0.0001762484898790717, 0.00018082329188473523, 0.00018539810844231397, 0.00018997291044797748, 0.000194547712453641]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 7.0, 7.0, 16.0, 11.0, 14.0, 21.0, 24.0, 20.0, 27.0, 20.0, 28.0, 27.0, 29.0, 37.0, 52.0, 49.0, 45.0, 44.0, 27.0, 43.0, 45.0, 45.0, 46.0, 40.0, 37.0, 33.0, 38.0, 26.0, 25.0, 18.0, 21.0, 16.0, 11.0, 13.0, 12.0, 8.0, 4.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.173683166503906e-05, -5.017593502998352e-05, -4.861503839492798e-05, -4.7054141759872437e-05, -4.5493245124816895e-05, -4.393234848976135e-05, -4.237145185470581e-05, -4.081055521965027e-05, -3.9249658584594727e-05, -3.7688761949539185e-05, -3.612786531448364e-05, -3.45669686794281e-05, -3.300607204437256e-05, -3.1445175409317017e-05, -2.9884278774261475e-05, -2.8323382139205933e-05, -2.676248550415039e-05, -2.520158886909485e-05, -2.3640692234039307e-05, -2.2079795598983765e-05, -2.0518898963928223e-05, -1.895800232887268e-05, -1.739710569381714e-05, -1.5836209058761597e-05, -1.4275312423706055e-05, -1.2714415788650513e-05, -1.115351915359497e-05, -9.592622518539429e-06, -8.031725883483887e-06, -6.470829248428345e-06, -4.909932613372803e-06, -3.3490359783172607e-06, -1.7881393432617188e-06, -2.2724270820617676e-07, 1.3336539268493652e-06, 2.8945505619049072e-06, 4.455447196960449e-06, 6.016343832015991e-06, 7.577240467071533e-06, 9.138137102127075e-06, 1.0699033737182617e-05, 1.225993037223816e-05, 1.3820827007293701e-05, 1.5381723642349243e-05, 1.6942620277404785e-05, 1.8503516912460327e-05, 2.006441354751587e-05, 2.162531018257141e-05, 2.3186206817626953e-05, 2.4747103452682495e-05, 2.6308000087738037e-05, 2.786889672279358e-05, 2.942979335784912e-05, 3.099068999290466e-05, 3.2551586627960205e-05, 3.411248326301575e-05, 3.567337989807129e-05, 3.723427653312683e-05, 3.879517316818237e-05, 4.0356069803237915e-05, 4.191696643829346e-05, 4.3477863073349e-05, 4.503875970840454e-05, 4.659965634346008e-05, 4.8160552978515625e-05]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 3.0, 9.0, 4.0, 4.0, 7.0, 14.0, 12.0, 14.0, 14.0, 23.0, 21.0, 26.0, 26.0, 25.0, 39.0, 35.0, 40.0, 46.0, 39.0, 38.0, 40.0, 40.0, 32.0, 36.0, 42.0, 45.0, 26.0, 34.0, 30.0, 23.0, 26.0, 26.0, 21.0, 25.0, 26.0, 21.0, 20.0, 14.0, 7.0, 5.0, 3.0, 2.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-58.90625, -56.91943359375, -54.9326171875, -52.94580078125, -50.958984375, -48.97216796875, -46.9853515625, -44.99853515625, -43.01171875, -41.02490234375, -39.0380859375, -37.05126953125, -35.064453125, -33.07763671875, -31.0908203125, -29.10400390625, -27.1171875, -25.13037109375, -23.1435546875, -21.15673828125, -19.169921875, -17.18310546875, -15.1962890625, -13.20947265625, -11.22265625, -9.23583984375, -7.2490234375, -5.26220703125, -3.275390625, -1.28857421875, 0.6982421875, 2.68505859375, 4.671875, 6.65869140625, 8.6455078125, 10.63232421875, 12.619140625, 14.60595703125, 16.5927734375, 18.57958984375, 20.56640625, 22.55322265625, 24.5400390625, 26.52685546875, 28.513671875, 30.50048828125, 32.4873046875, 34.47412109375, 36.4609375, 38.44775390625, 40.4345703125, 42.42138671875, 44.408203125, 46.39501953125, 48.3818359375, 50.36865234375, 52.35546875, 54.34228515625, 56.3291015625, 58.31591796875, 60.302734375, 62.28955078125, 64.2763671875, 66.26318359375, 68.25]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 14.0, 11.0, 17.0, 16.0, 29.0, 25.0, 38.0, 71.0, 99.0, 135.0, 192.0, 230.0, 361.0, 486.0, 763.0, 1082.0, 1626.0, 2470.0, 4106.0, 7104.0, 15564.0, 43428.0, 195790.0, 600056.0, 115080.0, 31167.0, 12109.0, 6112.0, 3640.0, 2109.0, 1452.0, 942.0, 658.0, 431.0, 322.0, 241.0, 175.0, 115.0, 94.0, 55.0, 37.0, 23.0, 20.0, 22.0, 10.0, 11.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0], "bins": [-138.75, -134.58984375, -130.4296875, -126.26953125, -122.109375, -117.94921875, -113.7890625, -109.62890625, -105.46875, -101.30859375, -97.1484375, -92.98828125, -88.828125, -84.66796875, -80.5078125, -76.34765625, -72.1875, -68.02734375, -63.8671875, -59.70703125, -55.546875, -51.38671875, -47.2265625, -43.06640625, -38.90625, -34.74609375, -30.5859375, -26.42578125, -22.265625, -18.10546875, -13.9453125, -9.78515625, -5.625, -1.46484375, 2.6953125, 6.85546875, 11.015625, 15.17578125, 19.3359375, 23.49609375, 27.65625, 31.81640625, 35.9765625, 40.13671875, 44.296875, 48.45703125, 52.6171875, 56.77734375, 60.9375, 65.09765625, 69.2578125, 73.41796875, 77.578125, 81.73828125, 85.8984375, 90.05859375, 94.21875, 98.37890625, 102.5390625, 106.69921875, 110.859375, 115.01953125, 119.1796875, 123.33984375, 127.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 6.0, 4.0, 11.0, 3.0, 12.0, 16.0, 17.0, 29.0, 17.0, 27.0, 23.0, 25.0, 43.0, 29.0, 46.0, 47.0, 71.0, 81.0, 93.0, 316.0, 1460.0, 142.0, 101.0, 59.0, 46.0, 43.0, 42.0, 29.0, 28.0, 24.0, 19.0, 20.0, 21.0, 13.0, 12.0, 8.0, 12.0, 8.0, 10.0, 12.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-124.5625, -120.5615234375, -116.560546875, -112.5595703125, -108.55859375, -104.5576171875, -100.556640625, -96.5556640625, -92.5546875, -88.5537109375, -84.552734375, -80.5517578125, -76.55078125, -72.5498046875, -68.548828125, -64.5478515625, -60.546875, -56.5458984375, -52.544921875, -48.5439453125, -44.54296875, -40.5419921875, -36.541015625, -32.5400390625, -28.5390625, -24.5380859375, -20.537109375, -16.5361328125, -12.53515625, -8.5341796875, -4.533203125, -0.5322265625, 3.46875, 7.4697265625, 11.470703125, 15.4716796875, 19.47265625, 23.4736328125, 27.474609375, 31.4755859375, 35.4765625, 39.4775390625, 43.478515625, 47.4794921875, 51.48046875, 55.4814453125, 59.482421875, 63.4833984375, 67.484375, 71.4853515625, 75.486328125, 79.4873046875, 83.48828125, 87.4892578125, 91.490234375, 95.4912109375, 99.4921875, 103.4931640625, 107.494140625, 111.4951171875, 115.49609375, 119.4970703125, 123.498046875, 127.4990234375, 131.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 2.0, 5.0, 6.0, 10.0, 16.0, 26.0, 26.0, 42.0, 61.0, 72.0, 132.0, 208.0, 393.0, 1207.0, 13280.0, 3082144.0, 44937.0, 1897.0, 517.0, 260.0, 143.0, 95.0, 58.0, 49.0, 38.0, 22.0, 16.0, 11.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-478.75, -462.59765625, -446.4453125, -430.29296875, -414.140625, -397.98828125, -381.8359375, -365.68359375, -349.53125, -333.37890625, -317.2265625, -301.07421875, -284.921875, -268.76953125, -252.6171875, -236.46484375, -220.3125, -204.16015625, -188.0078125, -171.85546875, -155.703125, -139.55078125, -123.3984375, -107.24609375, -91.09375, -74.94140625, -58.7890625, -42.63671875, -26.484375, -10.33203125, 5.8203125, 21.97265625, 38.125, 54.27734375, 70.4296875, 86.58203125, 102.734375, 118.88671875, 135.0390625, 151.19140625, 167.34375, 183.49609375, 199.6484375, 215.80078125, 231.953125, 248.10546875, 264.2578125, 280.41015625, 296.5625, 312.71484375, 328.8671875, 345.01953125, 361.171875, 377.32421875, 393.4765625, 409.62890625, 425.78125, 441.93359375, 458.0859375, 474.23828125, 490.390625, 506.54296875, 522.6953125, 538.84765625, 555.0]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 17.0, 157.0, 545.0, 229.0, 53.0, 10.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2238.07177734375, -2177.052734375, -2116.033935546875, -2055.014892578125, -1993.995849609375, -1932.9769287109375, -1871.9578857421875, -1810.93896484375, -1749.919921875, -1688.9010009765625, -1627.8819580078125, -1566.863037109375, -1505.843994140625, -1444.8250732421875, -1383.8060302734375, -1322.787109375, -1261.76806640625, -1200.7491455078125, -1139.7301025390625, -1078.711181640625, -1017.692138671875, -956.6732177734375, -895.6541748046875, -834.63525390625, -773.6163330078125, -712.5973510742188, -651.578369140625, -590.5593872070312, -529.5404052734375, -468.5214538574219, -407.5024719238281, -346.4834899902344, -285.4644775390625, -224.44549560546875, -163.426513671875, -102.40754699707031, -41.38856506347656, 19.630401611328125, 80.64938354492188, 141.66836547851562, 202.68734741210938, 263.7063293457031, 324.7253112792969, 385.7442626953125, 446.76324462890625, 507.7822265625, 568.8012084960938, 629.8201904296875, 690.8391723632812, 751.858154296875, 812.8771362304688, 873.8961181640625, 934.9151000976562, 995.93408203125, 1056.9530029296875, 1117.9720458984375, 1178.990966796875, 1240.0098876953125, 1301.0289306640625, 1362.0478515625, 1423.06689453125, 1484.0858154296875, 1545.1048583984375, 1606.123779296875, 1667.142822265625]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 1.0, 4.0, 3.0, 6.0, 2.0, 10.0, 10.0, 14.0, 13.0, 9.0, 14.0, 26.0, 27.0, 23.0, 25.0, 34.0, 28.0, 35.0, 41.0, 49.0, 36.0, 49.0, 44.0, 48.0, 42.0, 40.0, 43.0, 50.0, 40.0, 36.0, 36.0, 31.0, 23.0, 11.0, 17.0, 13.0, 12.0, 9.0, 15.0, 10.0, 7.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-495.6785583496094, -481.4095764160156, -467.1405944824219, -452.8716125488281, -438.6026611328125, -424.33367919921875, -410.064697265625, -395.79571533203125, -381.5267333984375, -367.25775146484375, -352.98876953125, -338.71978759765625, -324.4508056640625, -310.18182373046875, -295.9128723144531, -281.6438903808594, -267.3749084472656, -253.10592651367188, -238.83694458007812, -224.56797790527344, -210.2989959716797, -196.03001403808594, -181.76104736328125, -167.4920654296875, -153.22308349609375, -138.9541015625, -124.68512725830078, -110.41615295410156, -96.14717102050781, -81.87818908691406, -67.60921478271484, -53.340240478515625, -39.071258544921875, -24.80228042602539, -10.533302307128906, 3.735675811767578, 18.004653930664062, 32.27363586425781, 46.54261016845703, 60.81158447265625, 75.08056640625, 89.34954833984375, 103.61852264404297, 117.88749694824219, 132.15647888183594, 146.4254608154297, 160.69442749023438, 174.96340942382812, 189.23239135742188, 203.50137329101562, 217.77035522460938, 232.03932189941406, 246.3083038330078, 260.5772705078125, 274.84625244140625, 289.115234375, 303.38421630859375, 317.6531982421875, 331.92218017578125, 346.191162109375, 360.46014404296875, 374.7291259765625, 388.9980773925781, 403.2670593261719, 417.5360412597656]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 2.0, 6.0, 7.0, 7.0, 12.0, 7.0, 12.0, 14.0, 16.0, 21.0, 22.0, 33.0, 30.0, 52.0, 31.0, 28.0, 42.0, 45.0, 33.0, 42.0, 34.0, 42.0, 42.0, 36.0, 39.0, 44.0, 34.0, 29.0, 39.0, 26.0, 29.0, 26.0, 18.0, 21.0, 14.0, 12.0, 11.0, 10.0, 12.0, 4.0, 3.0, 3.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.0625, -60.888671875, -58.71484375, -56.541015625, -54.3671875, -52.193359375, -50.01953125, -47.845703125, -45.671875, -43.498046875, -41.32421875, -39.150390625, -36.9765625, -34.802734375, -32.62890625, -30.455078125, -28.28125, -26.107421875, -23.93359375, -21.759765625, -19.5859375, -17.412109375, -15.23828125, -13.064453125, -10.890625, -8.716796875, -6.54296875, -4.369140625, -2.1953125, -0.021484375, 2.15234375, 4.326171875, 6.5, 8.673828125, 10.84765625, 13.021484375, 15.1953125, 17.369140625, 19.54296875, 21.716796875, 23.890625, 26.064453125, 28.23828125, 30.412109375, 32.5859375, 34.759765625, 36.93359375, 39.107421875, 41.28125, 43.455078125, 45.62890625, 47.802734375, 49.9765625, 52.150390625, 54.32421875, 56.498046875, 58.671875, 60.845703125, 63.01953125, 65.193359375, 67.3671875, 69.541015625, 71.71484375, 73.888671875, 76.0625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 8.0, 9.0, 6.0, 17.0, 15.0, 31.0, 45.0, 53.0, 72.0, 112.0, 105.0, 193.0, 261.0, 361.0, 543.0, 836.0, 1362.0, 2377.0, 4494.0, 10679.0, 34702.0, 414038.0, 3352849.0, 319697.0, 30706.0, 10097.0, 4356.0, 2221.0, 1419.0, 847.0, 511.0, 323.0, 241.0, 169.0, 148.0, 110.0, 78.0, 68.0, 37.0, 35.0, 14.0, 14.0, 11.0, 5.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.25, -191.28515625, -184.3203125, -177.35546875, -170.390625, -163.42578125, -156.4609375, -149.49609375, -142.53125, -135.56640625, -128.6015625, -121.63671875, -114.671875, -107.70703125, -100.7421875, -93.77734375, -86.8125, -79.84765625, -72.8828125, -65.91796875, -58.953125, -51.98828125, -45.0234375, -38.05859375, -31.09375, -24.12890625, -17.1640625, -10.19921875, -3.234375, 3.73046875, 10.6953125, 17.66015625, 24.625, 31.58984375, 38.5546875, 45.51953125, 52.484375, 59.44921875, 66.4140625, 73.37890625, 80.34375, 87.30859375, 94.2734375, 101.23828125, 108.203125, 115.16796875, 122.1328125, 129.09765625, 136.0625, 143.02734375, 149.9921875, 156.95703125, 163.921875, 170.88671875, 177.8515625, 184.81640625, 191.78125, 198.74609375, 205.7109375, 212.67578125, 219.640625, 226.60546875, 233.5703125, 240.53515625, 247.5]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 5.0, 10.0, 4.0, 13.0, 8.0, 21.0, 19.0, 31.0, 46.0, 66.0, 92.0, 149.0, 253.0, 434.0, 739.0, 926.0, 498.0, 273.0, 159.0, 108.0, 68.0, 58.0, 25.0, 21.0, 12.0, 11.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-154.375, -149.724609375, -145.07421875, -140.423828125, -135.7734375, -131.123046875, -126.47265625, -121.822265625, -117.171875, -112.521484375, -107.87109375, -103.220703125, -98.5703125, -93.919921875, -89.26953125, -84.619140625, -79.96875, -75.318359375, -70.66796875, -66.017578125, -61.3671875, -56.716796875, -52.06640625, -47.416015625, -42.765625, -38.115234375, -33.46484375, -28.814453125, -24.1640625, -19.513671875, -14.86328125, -10.212890625, -5.5625, -0.912109375, 3.73828125, 8.388671875, 13.0390625, 17.689453125, 22.33984375, 26.990234375, 31.640625, 36.291015625, 40.94140625, 45.591796875, 50.2421875, 54.892578125, 59.54296875, 64.193359375, 68.84375, 73.494140625, 78.14453125, 82.794921875, 87.4453125, 92.095703125, 96.74609375, 101.396484375, 106.046875, 110.697265625, 115.34765625, 119.998046875, 124.6484375, 129.298828125, 133.94921875, 138.599609375, 143.25]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 12.0, 12.0, 19.0, 32.0, 56.0, 86.0, 147.0, 249.0, 527.0, 1145.0, 2999.0, 10481.0, 61206.0, 2193265.0, 1850114.0, 58523.0, 10029.0, 2999.0, 1172.0, 514.0, 284.0, 148.0, 80.0, 48.0, 40.0, 32.0, 17.0, 15.0, 7.0, 2.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-299.0, -289.3515625, -279.703125, -270.0546875, -260.40625, -250.7578125, -241.109375, -231.4609375, -221.8125, -212.1640625, -202.515625, -192.8671875, -183.21875, -173.5703125, -163.921875, -154.2734375, -144.625, -134.9765625, -125.328125, -115.6796875, -106.03125, -96.3828125, -86.734375, -77.0859375, -67.4375, -57.7890625, -48.140625, -38.4921875, -28.84375, -19.1953125, -9.546875, 0.1015625, 9.75, 19.3984375, 29.046875, 38.6953125, 48.34375, 57.9921875, 67.640625, 77.2890625, 86.9375, 96.5859375, 106.234375, 115.8828125, 125.53125, 135.1796875, 144.828125, 154.4765625, 164.125, 173.7734375, 183.421875, 193.0703125, 202.71875, 212.3671875, 222.015625, 231.6640625, 241.3125, 250.9609375, 260.609375, 270.2578125, 279.90625, 289.5546875, 299.203125, 308.8515625, 318.5]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 11.0, 64.0, 398.0, 448.0, 72.0, 17.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-684.424072265625, -588.0590209960938, -491.6939697265625, -395.32891845703125, -298.9638671875, -202.59881591796875, -106.2337646484375, -9.86871337890625, 86.496337890625, 182.86138916015625, 279.2264404296875, 375.59149169921875, 471.95654296875, 568.3215942382812, 664.6866455078125, 761.0516967773438, 857.416748046875, 953.7817993164062, 1050.1468505859375, 1146.511962890625, 1242.876953125, 1339.241943359375, 1435.6070556640625, 1531.97216796875, 1628.337158203125, 1724.7021484375, 1821.0672607421875, 1917.432373046875, 2013.79736328125, 2110.162353515625, 2206.52734375, 2302.892578125, 2399.25732421875, 2495.622314453125, 2591.9873046875, 2688.3525390625, 2784.717529296875, 2881.08251953125, 2977.44775390625, 3073.812744140625, 3170.177734375, 3266.542724609375, 3362.90771484375, 3459.27294921875, 3555.637939453125, 3652.0029296875, 3748.3681640625, 3844.733154296875, 3941.09814453125, 4037.463134765625, 4133.828125, 4230.193359375, 4326.55859375, 4422.92333984375, 4519.28857421875, 4615.6533203125, 4712.0185546875, 4808.3837890625, 4904.74853515625, 5001.11376953125, 5097.478515625, 5193.84375, 5290.208984375, 5386.57373046875, 5482.93896484375]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 4.0, 8.0, 14.0, 15.0, 17.0, 23.0, 26.0, 19.0, 40.0, 33.0, 35.0, 31.0, 33.0, 40.0, 46.0, 51.0, 49.0, 36.0, 29.0, 56.0, 37.0, 45.0, 48.0, 27.0, 36.0, 32.0, 18.0, 21.0, 16.0, 19.0, 17.0, 15.0, 7.0, 9.0, 10.0, 7.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-409.103759765625, -396.1347961425781, -383.16583251953125, -370.1968688964844, -357.2279052734375, -344.2589416503906, -331.28997802734375, -318.321044921875, -305.35205078125, -292.3830871582031, -279.41412353515625, -266.4451599121094, -253.4761962890625, -240.50723266601562, -227.5382843017578, -214.56932067871094, -201.60037231445312, -188.63140869140625, -175.66244506835938, -162.6934814453125, -149.72451782226562, -136.75555419921875, -123.78660583496094, -110.81764221191406, -97.84867858886719, -84.87971496582031, -71.91075134277344, -58.941795349121094, -45.97283172607422, -33.003868103027344, -20.034912109375, -7.065948486328125, 5.90301513671875, 18.871976852416992, 31.840938568115234, 44.809898376464844, 57.77886199951172, 70.7478256225586, 83.71678161621094, 96.68574523925781, 109.65470886230469, 122.62367248535156, 135.59263610839844, 148.56158447265625, 161.53054809570312, 174.49951171875, 187.46847534179688, 200.43743896484375, 213.40640258789062, 226.3753662109375, 239.34432983398438, 252.31329345703125, 265.2822570800781, 278.251220703125, 291.22015380859375, 304.18914794921875, 317.1580810546875, 330.1270446777344, 343.09600830078125, 356.0649719238281, 369.033935546875, 382.0028991699219, 394.97186279296875, 407.9407958984375, 420.9097900390625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 16.0, 15.0, 6.0, 19.0, 15.0, 15.0, 15.0, 28.0, 39.0, 27.0, 21.0, 33.0, 49.0, 37.0, 41.0, 35.0, 46.0, 44.0, 41.0, 43.0, 33.0, 42.0, 41.0, 29.0, 37.0, 29.0, 25.0, 30.0, 23.0, 18.0, 15.0, 16.0, 10.0, 6.0, 16.0, 7.0, 9.0, 4.0, 8.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-67.0625, -64.95703125, -62.8515625, -60.74609375, -58.640625, -56.53515625, -54.4296875, -52.32421875, -50.21875, -48.11328125, -46.0078125, -43.90234375, -41.796875, -39.69140625, -37.5859375, -35.48046875, -33.375, -31.26953125, -29.1640625, -27.05859375, -24.953125, -22.84765625, -20.7421875, -18.63671875, -16.53125, -14.42578125, -12.3203125, -10.21484375, -8.109375, -6.00390625, -3.8984375, -1.79296875, 0.3125, 2.41796875, 4.5234375, 6.62890625, 8.734375, 10.83984375, 12.9453125, 15.05078125, 17.15625, 19.26171875, 21.3671875, 23.47265625, 25.578125, 27.68359375, 29.7890625, 31.89453125, 34.0, 36.10546875, 38.2109375, 40.31640625, 42.421875, 44.52734375, 46.6328125, 48.73828125, 50.84375, 52.94921875, 55.0546875, 57.16015625, 59.265625, 61.37109375, 63.4765625, 65.58203125, 67.6875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 8.0, 6.0, 10.0, 15.0, 21.0, 21.0, 40.0, 56.0, 60.0, 101.0, 158.0, 234.0, 332.0, 471.0, 689.0, 969.0, 1452.0, 2092.0, 3253.0, 4791.0, 7091.0, 10755.0, 16382.0, 25364.0, 40396.0, 66863.0, 117122.0, 298566.0, 198723.0, 96647.0, 56241.0, 34524.0, 22358.0, 14071.0, 9444.0, 6329.0, 4155.0, 2875.0, 1752.0, 1304.0, 844.0, 623.0, 390.0, 281.0, 205.0, 151.0, 87.0, 76.0, 56.0, 33.0, 28.0, 12.0, 9.0, 11.0, 4.0, 4.0, 5.0, 1.0, 4.0, 1.0], "bins": [-2.494140625, -2.415802001953125, -2.33746337890625, -2.259124755859375, -2.1807861328125, -2.102447509765625, -2.02410888671875, -1.945770263671875, -1.867431640625, -1.789093017578125, -1.71075439453125, -1.632415771484375, -1.5540771484375, -1.475738525390625, -1.39739990234375, -1.319061279296875, -1.24072265625, -1.162384033203125, -1.08404541015625, -1.005706787109375, -0.9273681640625, -0.849029541015625, -0.77069091796875, -0.692352294921875, -0.614013671875, -0.535675048828125, -0.45733642578125, -0.378997802734375, -0.3006591796875, -0.222320556640625, -0.14398193359375, -0.065643310546875, 0.0126953125, 0.091033935546875, 0.16937255859375, 0.247711181640625, 0.3260498046875, 0.404388427734375, 0.48272705078125, 0.561065673828125, 0.639404296875, 0.717742919921875, 0.79608154296875, 0.874420166015625, 0.9527587890625, 1.031097412109375, 1.10943603515625, 1.187774658203125, 1.26611328125, 1.344451904296875, 1.42279052734375, 1.501129150390625, 1.5794677734375, 1.657806396484375, 1.73614501953125, 1.814483642578125, 1.892822265625, 1.971160888671875, 2.04949951171875, 2.127838134765625, 2.2061767578125, 2.284515380859375, 2.36285400390625, 2.441192626953125, 2.51953125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 7.0, 5.0, 8.0, 12.0, 17.0, 15.0, 11.0, 14.0, 25.0, 21.0, 31.0, 29.0, 35.0, 38.0, 25.0, 40.0, 36.0, 32.0, 33.0, 33.0, 1065.0, 29.0, 41.0, 36.0, 38.0, 34.0, 38.0, 27.0, 23.0, 34.0, 31.0, 29.0, 20.0, 12.0, 20.0, 14.0, 9.0, 6.0, 10.0, 7.0, 4.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.03125, -37.744140625, -36.45703125, -35.169921875, -33.8828125, -32.595703125, -31.30859375, -30.021484375, -28.734375, -27.447265625, -26.16015625, -24.873046875, -23.5859375, -22.298828125, -21.01171875, -19.724609375, -18.4375, -17.150390625, -15.86328125, -14.576171875, -13.2890625, -12.001953125, -10.71484375, -9.427734375, -8.140625, -6.853515625, -5.56640625, -4.279296875, -2.9921875, -1.705078125, -0.41796875, 0.869140625, 2.15625, 3.443359375, 4.73046875, 6.017578125, 7.3046875, 8.591796875, 9.87890625, 11.166015625, 12.453125, 13.740234375, 15.02734375, 16.314453125, 17.6015625, 18.888671875, 20.17578125, 21.462890625, 22.75, 24.037109375, 25.32421875, 26.611328125, 27.8984375, 29.185546875, 30.47265625, 31.759765625, 33.046875, 34.333984375, 35.62109375, 36.908203125, 38.1953125, 39.482421875, 40.76953125, 42.056640625, 43.34375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 9.0, 12.0, 12.0, 26.0, 26.0, 45.0, 66.0, 77.0, 143.0, 168.0, 267.0, 323.0, 497.0, 744.0, 992.0, 1457.0, 2142.0, 3037.0, 4494.0, 6501.0, 9906.0, 14798.0, 22825.0, 34852.0, 54573.0, 89333.0, 161605.0, 1344669.0, 130111.0, 75586.0, 47272.0, 30339.0, 19637.0, 12977.0, 8718.0, 5864.0, 4023.0, 2733.0, 1920.0, 1308.0, 940.0, 632.0, 443.0, 308.0, 224.0, 138.0, 98.0, 75.0, 71.0, 39.0, 27.0, 19.0, 12.0, 8.0, 9.0, 8.0, 2.0, 1.0, 1.0], "bins": [-1.775390625, -1.720489501953125, -1.66558837890625, -1.610687255859375, -1.5557861328125, -1.500885009765625, -1.44598388671875, -1.391082763671875, -1.336181640625, -1.281280517578125, -1.22637939453125, -1.171478271484375, -1.1165771484375, -1.061676025390625, -1.00677490234375, -0.951873779296875, -0.89697265625, -0.842071533203125, -0.78717041015625, -0.732269287109375, -0.6773681640625, -0.622467041015625, -0.56756591796875, -0.512664794921875, -0.457763671875, -0.402862548828125, -0.34796142578125, -0.293060302734375, -0.2381591796875, -0.183258056640625, -0.12835693359375, -0.073455810546875, -0.0185546875, 0.036346435546875, 0.09124755859375, 0.146148681640625, 0.2010498046875, 0.255950927734375, 0.31085205078125, 0.365753173828125, 0.420654296875, 0.475555419921875, 0.53045654296875, 0.585357666015625, 0.6402587890625, 0.695159912109375, 0.75006103515625, 0.804962158203125, 0.85986328125, 0.914764404296875, 0.96966552734375, 1.024566650390625, 1.0794677734375, 1.134368896484375, 1.18927001953125, 1.244171142578125, 1.299072265625, 1.353973388671875, 1.40887451171875, 1.463775634765625, 1.5186767578125, 1.573577880859375, 1.62847900390625, 1.683380126953125, 1.73828125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 8.0, 7.0, 9.0, 17.0, 11.0, 16.0, 19.0, 29.0, 26.0, 60.0, 90.0, 155.0, 171.0, 105.0, 62.0, 32.0, 20.0, 25.0, 24.0, 17.0, 9.0, 12.0, 13.0, 13.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014853477478027344, -0.0001437664031982422, -0.00013899803161621094, -0.0001342296600341797, -0.00012946128845214844, -0.0001246929168701172, -0.00011992454528808594, -0.00011515617370605469, -0.00011038780212402344, -0.00010561943054199219, -0.00010085105895996094, -9.608268737792969e-05, -9.131431579589844e-05, -8.654594421386719e-05, -8.177757263183594e-05, -7.700920104980469e-05, -7.224082946777344e-05, -6.747245788574219e-05, -6.270408630371094e-05, -5.793571472167969e-05, -5.316734313964844e-05, -4.839897155761719e-05, -4.363059997558594e-05, -3.886222839355469e-05, -3.409385681152344e-05, -2.9325485229492188e-05, -2.4557113647460938e-05, -1.9788742065429688e-05, -1.5020370483398438e-05, -1.0251998901367188e-05, -5.4836273193359375e-06, -7.152557373046875e-07, 4.0531158447265625e-06, 8.821487426757812e-06, 1.3589859008789062e-05, 1.8358230590820312e-05, 2.3126602172851562e-05, 2.7894973754882812e-05, 3.266334533691406e-05, 3.743171691894531e-05, 4.220008850097656e-05, 4.696846008300781e-05, 5.173683166503906e-05, 5.650520324707031e-05, 6.127357482910156e-05, 6.604194641113281e-05, 7.081031799316406e-05, 7.557868957519531e-05, 8.034706115722656e-05, 8.511543273925781e-05, 8.988380432128906e-05, 9.465217590332031e-05, 9.942054748535156e-05, 0.00010418891906738281, 0.00010895729064941406, 0.00011372566223144531, 0.00011849403381347656, 0.0001232624053955078, 0.00012803077697753906, 0.0001327991485595703, 0.00013756752014160156, 0.0001423358917236328, 0.00014710426330566406, 0.0001518726348876953, 0.00015664100646972656]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 6.0, 11.0, 6.0, 13.0, 12.0, 21.0, 20.0, 24.0, 32.0, 34.0, 47.0, 75.0, 83.0, 128.0, 247.0, 620.0, 6626.0, 842121.0, 193892.0, 3375.0, 483.0, 189.0, 130.0, 73.0, 63.0, 42.0, 35.0, 29.0, 15.0, 17.0, 16.0, 14.0, 4.0, 7.0, 6.0, 7.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00232696533203125, -0.0022562146186828613, -0.0021854639053344727, -0.002114713191986084, -0.0020439624786376953, -0.0019732117652893066, -0.001902461051940918, -0.0018317103385925293, -0.0017609596252441406, -0.001690208911895752, -0.0016194581985473633, -0.0015487074851989746, -0.001477956771850586, -0.0014072060585021973, -0.0013364553451538086, -0.00126570463180542, -0.0011949539184570312, -0.0011242032051086426, -0.001053452491760254, -0.0009827017784118652, -0.0009119510650634766, -0.0008412003517150879, -0.0007704496383666992, -0.0006996989250183105, -0.0006289482116699219, -0.0005581974983215332, -0.00048744678497314453, -0.00041669607162475586, -0.0003459453582763672, -0.0002751946449279785, -0.00020444393157958984, -0.00013369321823120117, -6.29425048828125e-05, 7.808208465576172e-06, 7.855892181396484e-05, 0.00014930963516235352, 0.0002200603485107422, 0.00029081106185913086, 0.00036156177520751953, 0.0004323124885559082, 0.0005030632019042969, 0.0005738139152526855, 0.0006445646286010742, 0.0007153153419494629, 0.0007860660552978516, 0.0008568167686462402, 0.0009275674819946289, 0.0009983181953430176, 0.0010690689086914062, 0.001139819622039795, 0.0012105703353881836, 0.0012813210487365723, 0.001352071762084961, 0.0014228224754333496, 0.0014935731887817383, 0.001564323902130127, 0.0016350746154785156, 0.0017058253288269043, 0.001776576042175293, 0.0018473267555236816, 0.0019180774688720703, 0.001988828182220459, 0.0020595788955688477, 0.0021303296089172363, 0.002201080322265625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 5.0, 10.0, 31.0, 109.0, 425.0, 333.0, 73.0, 21.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.037957352120429e-05, -8.015183266252279e-05, -6.992409180384129e-05, -5.969635822111741e-05, -4.946861736243591e-05, -3.924087650375441e-05, -2.901314292103052e-05, -1.878540206234902e-05, -8.557661203667521e-06, 1.670077836024575e-06, 1.1897816875716671e-05, 2.2125554096419364e-05, 3.2353294955100864e-05, 4.2581035813782364e-05, 5.280876939650625e-05, 6.303651025518775e-05, 7.326425111386925e-05, 8.349199197255075e-05, 9.371973283123225e-05, 0.00010394746641395614, 0.00011417520727263764, 0.00012440295540727675, 0.00013463068171404302, 0.00014485842257272452, 0.00015508616343140602, 0.00016531390429008752, 0.00017554164514876902, 0.0001857693714555353, 0.00019599712686613202, 0.0002062248531728983, 0.0002164525940315798, 0.0002266803348902613, 0.00023690809030085802, 0.0002471358166076243, 0.000257363572018221, 0.0002675912983249873, 0.000277819053735584, 0.0002880467800423503, 0.00029827450634911656, 0.0003085022617597133, 0.00031873001717031, 0.0003289577434770763, 0.000339185498887673, 0.0003494132251944393, 0.000359640980605036, 0.0003698687069118023, 0.00038009643321856856, 0.0003903241886291653, 0.00040055191493593156, 0.00041077964124269783, 0.00042100739665329456, 0.00043123512296006083, 0.00044146287837065756, 0.00045169060467742383, 0.00046191836008802056, 0.00047214608639478683, 0.0004823738127015531, 0.0004926015390083194, 0.0005028292653150856, 0.0005130570498295128, 0.0005232847761362791, 0.0005335125024430454, 0.0005437402287498116, 0.0005539680132642388, 0.0005641957395710051]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 4.0, 9.0, 2.0, 8.0, 7.0, 10.0, 11.0, 10.0, 13.0, 18.0, 12.0, 23.0, 21.0, 21.0, 33.0, 32.0, 28.0, 26.0, 46.0, 38.0, 34.0, 36.0, 41.0, 45.0, 28.0, 39.0, 39.0, 29.0, 27.0, 27.0, 30.0, 36.0, 37.0, 18.0, 28.0, 27.0, 17.0, 24.0, 14.0, 12.0, 7.0, 10.0, 5.0, 4.0, 2.0, 3.0, 6.0, 1.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.412101745605469e-05, -5.235057324171066e-05, -5.058012902736664e-05, -4.8809684813022614e-05, -4.703924059867859e-05, -4.5268796384334564e-05, -4.349835216999054e-05, -4.1727907955646515e-05, -3.995746374130249e-05, -3.8187019526958466e-05, -3.641657531261444e-05, -3.4646131098270416e-05, -3.287568688392639e-05, -3.110524266958237e-05, -2.9334798455238342e-05, -2.7564354240894318e-05, -2.5793910026550293e-05, -2.402346581220627e-05, -2.2253021597862244e-05, -2.048257738351822e-05, -1.8712133169174194e-05, -1.694168895483017e-05, -1.5171244740486145e-05, -1.340080052614212e-05, -1.1630356311798096e-05, -9.859912097454071e-06, -8.089467883110046e-06, -6.319023668766022e-06, -4.548579454421997e-06, -2.7781352400779724e-06, -1.0076910257339478e-06, 7.627531886100769e-07, 2.5331974029541016e-06, 4.303641617298126e-06, 6.074085831642151e-06, 7.844530045986176e-06, 9.6149742603302e-06, 1.1385418474674225e-05, 1.315586268901825e-05, 1.4926306903362274e-05, 1.66967511177063e-05, 1.8467195332050323e-05, 2.0237639546394348e-05, 2.2008083760738373e-05, 2.3778527975082397e-05, 2.5548972189426422e-05, 2.7319416403770447e-05, 2.908986061811447e-05, 3.0860304832458496e-05, 3.263074904680252e-05, 3.4401193261146545e-05, 3.617163747549057e-05, 3.7942081689834595e-05, 3.971252590417862e-05, 4.1482970118522644e-05, 4.325341433286667e-05, 4.502385854721069e-05, 4.679430276155472e-05, 4.856474697589874e-05, 5.033519119024277e-05, 5.210563540458679e-05, 5.387607961893082e-05, 5.564652383327484e-05, 5.7416968047618866e-05, 5.918741226196289e-05]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 16.0, 15.0, 6.0, 19.0, 15.0, 15.0, 15.0, 28.0, 39.0, 27.0, 21.0, 33.0, 49.0, 37.0, 41.0, 35.0, 46.0, 44.0, 41.0, 43.0, 33.0, 42.0, 41.0, 29.0, 37.0, 29.0, 25.0, 30.0, 23.0, 18.0, 15.0, 16.0, 10.0, 6.0, 16.0, 7.0, 9.0, 4.0, 8.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-67.0625, -64.95703125, -62.8515625, -60.74609375, -58.640625, -56.53515625, -54.4296875, -52.32421875, -50.21875, -48.11328125, -46.0078125, -43.90234375, -41.796875, -39.69140625, -37.5859375, -35.48046875, -33.375, -31.26953125, -29.1640625, -27.05859375, -24.953125, -22.84765625, -20.7421875, -18.63671875, -16.53125, -14.42578125, -12.3203125, -10.21484375, -8.109375, -6.00390625, -3.8984375, -1.79296875, 0.3125, 2.41796875, 4.5234375, 6.62890625, 8.734375, 10.83984375, 12.9453125, 15.05078125, 17.15625, 19.26171875, 21.3671875, 23.47265625, 25.578125, 27.68359375, 29.7890625, 31.89453125, 34.0, 36.10546875, 38.2109375, 40.31640625, 42.421875, 44.52734375, 46.6328125, 48.73828125, 50.84375, 52.94921875, 55.0546875, 57.16015625, 59.265625, 61.37109375, 63.4765625, 65.58203125, 67.6875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 10.0, 10.0, 9.0, 21.0, 33.0, 39.0, 72.0, 79.0, 119.0, 196.0, 213.0, 365.0, 496.0, 835.0, 1164.0, 1821.0, 2988.0, 5188.0, 9718.0, 21885.0, 58892.0, 222395.0, 514626.0, 131692.0, 40514.0, 16045.0, 7648.0, 4280.0, 2400.0, 1586.0, 1056.0, 661.0, 458.0, 300.0, 204.0, 151.0, 106.0, 81.0, 55.0, 40.0, 27.0, 23.0, 14.0, 12.0, 11.0, 2.0, 2.0, 3.0, 8.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-89.6875, -86.62890625, -83.5703125, -80.51171875, -77.453125, -74.39453125, -71.3359375, -68.27734375, -65.21875, -62.16015625, -59.1015625, -56.04296875, -52.984375, -49.92578125, -46.8671875, -43.80859375, -40.75, -37.69140625, -34.6328125, -31.57421875, -28.515625, -25.45703125, -22.3984375, -19.33984375, -16.28125, -13.22265625, -10.1640625, -7.10546875, -4.046875, -0.98828125, 2.0703125, 5.12890625, 8.1875, 11.24609375, 14.3046875, 17.36328125, 20.421875, 23.48046875, 26.5390625, 29.59765625, 32.65625, 35.71484375, 38.7734375, 41.83203125, 44.890625, 47.94921875, 51.0078125, 54.06640625, 57.125, 60.18359375, 63.2421875, 66.30078125, 69.359375, 72.41796875, 75.4765625, 78.53515625, 81.59375, 84.65234375, 87.7109375, 90.76953125, 93.828125, 96.88671875, 99.9453125, 103.00390625, 106.0625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 10.0, 14.0, 18.0, 7.0, 15.0, 22.0, 37.0, 34.0, 48.0, 44.0, 53.0, 69.0, 79.0, 141.0, 347.0, 1466.0, 165.0, 82.0, 45.0, 65.0, 45.0, 35.0, 32.0, 39.0, 31.0, 21.0, 13.0, 17.0, 13.0, 8.0, 8.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-160.0, -154.849609375, -149.69921875, -144.548828125, -139.3984375, -134.248046875, -129.09765625, -123.947265625, -118.796875, -113.646484375, -108.49609375, -103.345703125, -98.1953125, -93.044921875, -87.89453125, -82.744140625, -77.59375, -72.443359375, -67.29296875, -62.142578125, -56.9921875, -51.841796875, -46.69140625, -41.541015625, -36.390625, -31.240234375, -26.08984375, -20.939453125, -15.7890625, -10.638671875, -5.48828125, -0.337890625, 4.8125, 9.962890625, 15.11328125, 20.263671875, 25.4140625, 30.564453125, 35.71484375, 40.865234375, 46.015625, 51.166015625, 56.31640625, 61.466796875, 66.6171875, 71.767578125, 76.91796875, 82.068359375, 87.21875, 92.369140625, 97.51953125, 102.669921875, 107.8203125, 112.970703125, 118.12109375, 123.271484375, 128.421875, 133.572265625, 138.72265625, 143.873046875, 149.0234375, 154.173828125, 159.32421875, 164.474609375, 169.625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 13.0, 13.0, 25.0, 30.0, 40.0, 47.0, 66.0, 83.0, 164.0, 333.0, 698.0, 3265.0, 116082.0, 3009123.0, 13312.0, 1359.0, 415.0, 215.0, 132.0, 80.0, 57.0, 37.0, 25.0, 15.0, 10.0, 19.0, 5.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-428.75, -415.85546875, -402.9609375, -390.06640625, -377.171875, -364.27734375, -351.3828125, -338.48828125, -325.59375, -312.69921875, -299.8046875, -286.91015625, -274.015625, -261.12109375, -248.2265625, -235.33203125, -222.4375, -209.54296875, -196.6484375, -183.75390625, -170.859375, -157.96484375, -145.0703125, -132.17578125, -119.28125, -106.38671875, -93.4921875, -80.59765625, -67.703125, -54.80859375, -41.9140625, -29.01953125, -16.125, -3.23046875, 9.6640625, 22.55859375, 35.453125, 48.34765625, 61.2421875, 74.13671875, 87.03125, 99.92578125, 112.8203125, 125.71484375, 138.609375, 151.50390625, 164.3984375, 177.29296875, 190.1875, 203.08203125, 215.9765625, 228.87109375, 241.765625, 254.66015625, 267.5546875, 280.44921875, 293.34375, 306.23828125, 319.1328125, 332.02734375, 344.921875, 357.81640625, 370.7109375, 383.60546875, 396.5]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 10.0, 352.0, 631.0, 22.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3949.839599609375, -3846.263427734375, -3742.68701171875, -3639.11083984375, -3535.53466796875, -3431.95849609375, -3328.38232421875, -3224.805908203125, -3121.229736328125, -3017.653564453125, -2914.0771484375, -2810.5009765625, -2706.9248046875, -2603.3486328125, -2499.7724609375, -2396.196044921875, -2292.619873046875, -2189.043701171875, -2085.46728515625, -1981.89111328125, -1878.31494140625, -1774.73876953125, -1671.1624755859375, -1567.586181640625, -1464.010009765625, -1360.433837890625, -1256.8575439453125, -1153.28125, -1049.705078125, -946.1288452148438, -842.5526123046875, -738.9763793945312, -635.39990234375, -531.8236694335938, -428.2474365234375, -324.67120361328125, -221.094970703125, -117.51873779296875, -13.9425048828125, 89.63372802734375, 193.2099609375, 296.78619384765625, 400.3624267578125, 503.93865966796875, 607.514892578125, 711.0911254882812, 814.6673583984375, 918.2435913085938, 1021.81982421875, 1125.39599609375, 1228.9722900390625, 1332.548583984375, 1436.124755859375, 1539.700927734375, 1643.2772216796875, 1746.853515625, 1850.4296875, 1954.005859375, 2057.58203125, 2161.158447265625, 2264.734619140625, 2368.310791015625, 2471.88720703125, 2575.46337890625, 2679.03955078125]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 8.0, 8.0, 14.0, 8.0, 8.0, 20.0, 27.0, 21.0, 31.0, 36.0, 25.0, 31.0, 35.0, 30.0, 38.0, 38.0, 45.0, 33.0, 35.0, 48.0, 54.0, 37.0, 30.0, 29.0, 39.0, 38.0, 27.0, 21.0, 15.0, 16.0, 16.0, 28.0, 20.0, 21.0, 10.0, 15.0, 7.0, 4.0, 5.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-396.3738708496094, -385.3954162597656, -374.4169616699219, -363.4384765625, -352.46002197265625, -341.4815673828125, -330.50311279296875, -319.524658203125, -308.54620361328125, -297.5677490234375, -286.58929443359375, -275.61083984375, -264.6323547363281, -253.65390014648438, -242.67544555664062, -231.69699096679688, -220.718505859375, -209.74005126953125, -198.76158142089844, -187.7831268310547, -176.80465698242188, -165.82620239257812, -154.84774780273438, -143.86929321289062, -132.8908233642578, -121.91236114501953, -110.93389892578125, -99.9554443359375, -88.97698211669922, -77.99851989746094, -67.02006530761719, -56.041603088378906, -45.0631103515625, -34.08464813232422, -23.106189727783203, -12.127731323242188, -1.1492691040039062, 9.829193115234375, 20.807647705078125, 31.786109924316406, 42.76457214355469, 53.74303436279297, 64.72149658203125, 75.699951171875, 86.67841339111328, 97.65687561035156, 108.63533020019531, 119.6137924194336, 130.59225463867188, 141.57070922851562, 152.54917907714844, 163.5276336669922, 174.506103515625, 185.48455810546875, 196.4630126953125, 207.44146728515625, 218.41993713378906, 229.3983917236328, 240.37686157226562, 251.35531616210938, 262.3337707519531, 273.312255859375, 284.29071044921875, 295.2691650390625, 306.24761962890625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 3.0, 6.0, 11.0, 5.0, 11.0, 14.0, 4.0, 7.0, 23.0, 16.0, 27.0, 22.0, 25.0, 27.0, 40.0, 44.0, 46.0, 39.0, 40.0, 34.0, 44.0, 23.0, 45.0, 40.0, 38.0, 30.0, 43.0, 35.0, 33.0, 38.0, 27.0, 19.0, 27.0, 20.0, 20.0, 10.0, 8.0, 9.0, 10.0, 10.0, 10.0, 3.0, 9.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-74.75, -72.4638671875, -70.177734375, -67.8916015625, -65.60546875, -63.3193359375, -61.033203125, -58.7470703125, -56.4609375, -54.1748046875, -51.888671875, -49.6025390625, -47.31640625, -45.0302734375, -42.744140625, -40.4580078125, -38.171875, -35.8857421875, -33.599609375, -31.3134765625, -29.02734375, -26.7412109375, -24.455078125, -22.1689453125, -19.8828125, -17.5966796875, -15.310546875, -13.0244140625, -10.73828125, -8.4521484375, -6.166015625, -3.8798828125, -1.59375, 0.6923828125, 2.978515625, 5.2646484375, 7.55078125, 9.8369140625, 12.123046875, 14.4091796875, 16.6953125, 18.9814453125, 21.267578125, 23.5537109375, 25.83984375, 28.1259765625, 30.412109375, 32.6982421875, 34.984375, 37.2705078125, 39.556640625, 41.8427734375, 44.12890625, 46.4150390625, 48.701171875, 50.9873046875, 53.2734375, 55.5595703125, 57.845703125, 60.1318359375, 62.41796875, 64.7041015625, 66.990234375, 69.2763671875, 71.5625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 1.0, 8.0, 10.0, 12.0, 13.0, 10.0, 21.0, 18.0, 42.0, 43.0, 70.0, 97.0, 131.0, 193.0, 283.0, 484.0, 935.0, 1777.0, 3950.0, 9424.0, 27246.0, 137014.0, 3062775.0, 864917.0, 56348.0, 16562.0, 6066.0, 2626.0, 1282.0, 641.0, 401.0, 248.0, 191.0, 127.0, 78.0, 56.0, 40.0, 32.0, 19.0, 28.0, 20.0, 11.0, 10.0, 11.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-338.25, -327.6015625, -316.953125, -306.3046875, -295.65625, -285.0078125, -274.359375, -263.7109375, -253.0625, -242.4140625, -231.765625, -221.1171875, -210.46875, -199.8203125, -189.171875, -178.5234375, -167.875, -157.2265625, -146.578125, -135.9296875, -125.28125, -114.6328125, -103.984375, -93.3359375, -82.6875, -72.0390625, -61.390625, -50.7421875, -40.09375, -29.4453125, -18.796875, -8.1484375, 2.5, 13.1484375, 23.796875, 34.4453125, 45.09375, 55.7421875, 66.390625, 77.0390625, 87.6875, 98.3359375, 108.984375, 119.6328125, 130.28125, 140.9296875, 151.578125, 162.2265625, 172.875, 183.5234375, 194.171875, 204.8203125, 215.46875, 226.1171875, 236.765625, 247.4140625, 258.0625, 268.7109375, 279.359375, 290.0078125, 300.65625, 311.3046875, 321.953125, 332.6015625, 343.25]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 9.0, 19.0, 17.0, 18.0, 26.0, 23.0, 39.0, 51.0, 59.0, 72.0, 115.0, 152.0, 191.0, 307.0, 450.0, 646.0, 581.0, 382.0, 218.0, 152.0, 118.0, 74.0, 71.0, 56.0, 40.0, 32.0, 23.0, 18.0, 23.0, 13.0, 11.0, 8.0, 6.0, 6.0, 1.0, 4.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-183.625, -178.345703125, -173.06640625, -167.787109375, -162.5078125, -157.228515625, -151.94921875, -146.669921875, -141.390625, -136.111328125, -130.83203125, -125.552734375, -120.2734375, -114.994140625, -109.71484375, -104.435546875, -99.15625, -93.876953125, -88.59765625, -83.318359375, -78.0390625, -72.759765625, -67.48046875, -62.201171875, -56.921875, -51.642578125, -46.36328125, -41.083984375, -35.8046875, -30.525390625, -25.24609375, -19.966796875, -14.6875, -9.408203125, -4.12890625, 1.150390625, 6.4296875, 11.708984375, 16.98828125, 22.267578125, 27.546875, 32.826171875, 38.10546875, 43.384765625, 48.6640625, 53.943359375, 59.22265625, 64.501953125, 69.78125, 75.060546875, 80.33984375, 85.619140625, 90.8984375, 96.177734375, 101.45703125, 106.736328125, 112.015625, 117.294921875, 122.57421875, 127.853515625, 133.1328125, 138.412109375, 143.69140625, 148.970703125, 154.25]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [5.0, 3.0, 7.0, 5.0, 9.0, 8.0, 18.0, 30.0, 25.0, 55.0, 68.0, 91.0, 122.0, 221.0, 308.0, 413.0, 699.0, 1005.0, 1550.0, 2385.0, 3946.0, 6259.0, 10601.0, 18297.0, 34337.0, 70895.0, 171551.0, 618460.0, 2416205.0, 536548.0, 157323.0, 66326.0, 32393.0, 17702.0, 10020.0, 6052.0, 3589.0, 2345.0, 1490.0, 954.0, 642.0, 426.0, 279.0, 203.0, 138.0, 96.0, 63.0, 42.0, 24.0, 21.0, 13.0, 14.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.6875, -101.0087890625, -97.330078125, -93.6513671875, -89.97265625, -86.2939453125, -82.615234375, -78.9365234375, -75.2578125, -71.5791015625, -67.900390625, -64.2216796875, -60.54296875, -56.8642578125, -53.185546875, -49.5068359375, -45.828125, -42.1494140625, -38.470703125, -34.7919921875, -31.11328125, -27.4345703125, -23.755859375, -20.0771484375, -16.3984375, -12.7197265625, -9.041015625, -5.3623046875, -1.68359375, 1.9951171875, 5.673828125, 9.3525390625, 13.03125, 16.7099609375, 20.388671875, 24.0673828125, 27.74609375, 31.4248046875, 35.103515625, 38.7822265625, 42.4609375, 46.1396484375, 49.818359375, 53.4970703125, 57.17578125, 60.8544921875, 64.533203125, 68.2119140625, 71.890625, 75.5693359375, 79.248046875, 82.9267578125, 86.60546875, 90.2841796875, 93.962890625, 97.6416015625, 101.3203125, 104.9990234375, 108.677734375, 112.3564453125, 116.03515625, 119.7138671875, 123.392578125, 127.0712890625, 130.75]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 8.0, 7.0, 10.0, 11.0, 32.0, 29.0, 44.0, 55.0, 71.0, 123.0, 131.0, 133.0, 100.0, 70.0, 55.0, 26.0, 24.0, 22.0, 13.0, 7.0, 6.0, 7.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1723.2225341796875, -1669.1153564453125, -1615.0081787109375, -1560.9010009765625, -1506.7939453125, -1452.686767578125, -1398.57958984375, -1344.472412109375, -1290.365234375, -1236.258056640625, -1182.15087890625, -1128.043701171875, -1073.9365234375, -1019.8294067382812, -965.7222900390625, -911.6151123046875, -857.5079345703125, -803.4007568359375, -749.2935791015625, -695.1864624023438, -641.0792846679688, -586.9721069335938, -532.864990234375, -478.7578125, -424.650634765625, -370.54345703125, -316.4363098144531, -262.32916259765625, -208.22198486328125, -154.11480712890625, -100.00765991210938, -45.9005126953125, 8.20654296875, 62.31370544433594, 116.42086791992188, 170.5280303955078, 224.63519287109375, 278.74237060546875, 332.8495178222656, 386.9566650390625, 441.0638427734375, 495.1710205078125, 549.2781982421875, 603.3853149414062, 657.4924926757812, 711.5996704101562, 765.706787109375, 819.81396484375, 873.921142578125, 928.0283203125, 982.135498046875, 1036.24267578125, 1090.349853515625, 1144.45703125, 1198.5640869140625, 1252.6712646484375, 1306.7784423828125, 1360.8856201171875, 1414.9927978515625, 1469.0999755859375, 1523.20703125, 1577.314208984375, 1631.42138671875, 1685.528564453125, 1739.6357421875]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 1.0, 9.0, 5.0, 5.0, 10.0, 12.0, 16.0, 16.0, 11.0, 19.0, 20.0, 24.0, 33.0, 27.0, 24.0, 32.0, 48.0, 34.0, 44.0, 32.0, 41.0, 39.0, 40.0, 37.0, 35.0, 50.0, 40.0, 36.0, 45.0, 29.0, 31.0, 25.0, 19.0, 19.0, 18.0, 15.0, 13.0, 16.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-807.42333984375, -781.0552368164062, -754.6870727539062, -728.3189697265625, -701.9508056640625, -675.5827026367188, -649.214599609375, -622.846435546875, -596.4783325195312, -570.1102294921875, -543.7420654296875, -517.3739624023438, -491.0058288574219, -464.6376953125, -438.2695617675781, -411.90142822265625, -385.5332946777344, -359.1651611328125, -332.7970275878906, -306.42889404296875, -280.060791015625, -253.69265747070312, -227.32452392578125, -200.95640563964844, -174.58827209472656, -148.2201385498047, -121.85202026367188, -95.48388671875, -69.11576080322266, -42.74763488769531, -16.379501342773438, 9.988616943359375, 36.35675048828125, 62.724876403808594, 89.09300231933594, 115.46113586425781, 141.82925415039062, 168.1973876953125, 194.56552124023438, 220.9336395263672, 247.30177307128906, 273.6698913574219, 300.03802490234375, 326.4061584472656, 352.7742919921875, 379.14239501953125, 405.51055908203125, 431.878662109375, 458.2467956542969, 484.61492919921875, 510.9830627441406, 537.3511962890625, 563.7192993164062, 590.08740234375, 616.45556640625, 642.8236694335938, 669.1918334960938, 695.5599365234375, 721.9281005859375, 748.2962036132812, 774.6643676757812, 801.032470703125, 827.400634765625, 853.7687377929688, 880.1368408203125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 5.0, 8.0, 14.0, 16.0, 12.0, 16.0, 18.0, 23.0, 16.0, 27.0, 36.0, 32.0, 31.0, 46.0, 37.0, 44.0, 52.0, 38.0, 55.0, 37.0, 47.0, 43.0, 46.0, 45.0, 33.0, 30.0, 33.0, 24.0, 20.0, 20.0, 11.0, 23.0, 9.0, 15.0, 9.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1396.0, -1347.921875, -1299.84375, -1251.765625, -1203.6875, -1155.609375, -1107.53125, -1059.453125, -1011.375, -963.296875, -915.21875, -867.140625, -819.0625, -770.984375, -722.90625, -674.828125, -626.75, -578.671875, -530.59375, -482.515625, -434.4375, -386.359375, -338.28125, -290.203125, -242.125, -194.046875, -145.96875, -97.890625, -49.8125, -1.734375, 46.34375, 94.421875, 142.5, 190.578125, 238.65625, 286.734375, 334.8125, 382.890625, 430.96875, 479.046875, 527.125, 575.203125, 623.28125, 671.359375, 719.4375, 767.515625, 815.59375, 863.671875, 911.75, 959.828125, 1007.90625, 1055.984375, 1104.0625, 1152.140625, 1200.21875, 1248.296875, 1296.375, 1344.453125, 1392.53125, 1440.609375, 1488.6875, 1536.765625, 1584.84375, 1632.921875, 1681.0]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 5.0, 2.0, 12.0, 20.0, 14.0, 49.0, 46.0, 99.0, 114.0, 209.0, 268.0, 393.0, 578.0, 840.0, 1249.0, 1813.0, 2874.0, 4522.0, 7191.0, 11476.0, 19007.0, 32133.0, 56554.0, 106892.0, 252819.0, 291720.0, 112483.0, 58952.0, 33471.0, 19731.0, 11999.0, 7448.0, 4713.0, 3006.0, 2028.0, 1338.0, 852.0, 512.0, 353.0, 223.0, 157.0, 117.0, 73.0, 51.0, 45.0, 38.0, 21.0, 16.0, 14.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.0625, -68.615234375, -66.16796875, -63.720703125, -61.2734375, -58.826171875, -56.37890625, -53.931640625, -51.484375, -49.037109375, -46.58984375, -44.142578125, -41.6953125, -39.248046875, -36.80078125, -34.353515625, -31.90625, -29.458984375, -27.01171875, -24.564453125, -22.1171875, -19.669921875, -17.22265625, -14.775390625, -12.328125, -9.880859375, -7.43359375, -4.986328125, -2.5390625, -0.091796875, 2.35546875, 4.802734375, 7.25, 9.697265625, 12.14453125, 14.591796875, 17.0390625, 19.486328125, 21.93359375, 24.380859375, 26.828125, 29.275390625, 31.72265625, 34.169921875, 36.6171875, 39.064453125, 41.51171875, 43.958984375, 46.40625, 48.853515625, 51.30078125, 53.748046875, 56.1953125, 58.642578125, 61.08984375, 63.537109375, 65.984375, 68.431640625, 70.87890625, 73.326171875, 75.7734375, 78.220703125, 80.66796875, 83.115234375, 85.5625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 4.0, 7.0, 8.0, 7.0, 12.0, 11.0, 12.0, 22.0, 23.0, 18.0, 23.0, 24.0, 34.0, 30.0, 37.0, 33.0, 40.0, 47.0, 36.0, 36.0, 1056.0, 37.0, 46.0, 43.0, 29.0, 40.0, 25.0, 36.0, 31.0, 30.0, 33.0, 24.0, 30.0, 15.0, 12.0, 16.0, 9.0, 8.0, 5.0, 6.0, 5.0, 1.0, 10.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-969.0, -940.859375, -912.71875, -884.578125, -856.4375, -828.296875, -800.15625, -772.015625, -743.875, -715.734375, -687.59375, -659.453125, -631.3125, -603.171875, -575.03125, -546.890625, -518.75, -490.609375, -462.46875, -434.328125, -406.1875, -378.046875, -349.90625, -321.765625, -293.625, -265.484375, -237.34375, -209.203125, -181.0625, -152.921875, -124.78125, -96.640625, -68.5, -40.359375, -12.21875, 15.921875, 44.0625, 72.203125, 100.34375, 128.484375, 156.625, 184.765625, 212.90625, 241.046875, 269.1875, 297.328125, 325.46875, 353.609375, 381.75, 409.890625, 438.03125, 466.171875, 494.3125, 522.453125, 550.59375, 578.734375, 606.875, 635.015625, 663.15625, 691.296875, 719.4375, 747.578125, 775.71875, 803.859375, 832.0]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 4.0, 6.0, 23.0, 34.0, 37.0, 71.0, 76.0, 103.0, 170.0, 219.0, 333.0, 521.0, 733.0, 1060.0, 1641.0, 2302.0, 3386.0, 4906.0, 7667.0, 11711.0, 18227.0, 28462.0, 45206.0, 73490.0, 132971.0, 1357958.0, 169950.0, 88683.0, 52970.0, 32825.0, 20867.0, 13698.0, 8892.0, 5741.0, 3900.0, 2625.0, 1826.0, 1209.0, 801.0, 572.0, 347.0, 277.0, 199.0, 140.0, 88.0, 66.0, 48.0, 32.0, 22.0, 14.0, 5.0, 9.0, 7.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-38.8125, -37.5869140625, -36.361328125, -35.1357421875, -33.91015625, -32.6845703125, -31.458984375, -30.2333984375, -29.0078125, -27.7822265625, -26.556640625, -25.3310546875, -24.10546875, -22.8798828125, -21.654296875, -20.4287109375, -19.203125, -17.9775390625, -16.751953125, -15.5263671875, -14.30078125, -13.0751953125, -11.849609375, -10.6240234375, -9.3984375, -8.1728515625, -6.947265625, -5.7216796875, -4.49609375, -3.2705078125, -2.044921875, -0.8193359375, 0.40625, 1.6318359375, 2.857421875, 4.0830078125, 5.30859375, 6.5341796875, 7.759765625, 8.9853515625, 10.2109375, 11.4365234375, 12.662109375, 13.8876953125, 15.11328125, 16.3388671875, 17.564453125, 18.7900390625, 20.015625, 21.2412109375, 22.466796875, 23.6923828125, 24.91796875, 26.1435546875, 27.369140625, 28.5947265625, 29.8203125, 31.0458984375, 32.271484375, 33.4970703125, 34.72265625, 35.9482421875, 37.173828125, 38.3994140625, 39.625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 3.0, 5.0, 3.0, 7.0, 16.0, 11.0, 17.0, 22.0, 20.0, 27.0, 41.0, 25.0, 52.0, 86.0, 131.0, 140.0, 89.0, 57.0, 38.0, 43.0, 23.0, 27.0, 19.0, 13.0, 14.0, 11.0, 10.0, 5.0, 12.0, 9.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0052490234375, -0.005040526390075684, -0.004832029342651367, -0.004623532295227051, -0.004415035247802734, -0.004206538200378418, -0.0039980411529541016, -0.003789544105529785, -0.0035810470581054688, -0.0033725500106811523, -0.003164052963256836, -0.0029555559158325195, -0.002747058868408203, -0.0025385618209838867, -0.0023300647735595703, -0.002121567726135254, -0.0019130706787109375, -0.001704573631286621, -0.0014960765838623047, -0.0012875795364379883, -0.0010790824890136719, -0.0008705854415893555, -0.0006620883941650391, -0.00045359134674072266, -0.00024509429931640625, -3.6597251892089844e-05, 0.00017189979553222656, 0.00038039684295654297, 0.0005888938903808594, 0.0007973909378051758, 0.0010058879852294922, 0.0012143850326538086, 0.001422882080078125, 0.0016313791275024414, 0.0018398761749267578, 0.0020483732223510742, 0.0022568702697753906, 0.002465367317199707, 0.0026738643646240234, 0.00288236141204834, 0.0030908584594726562, 0.0032993555068969727, 0.003507852554321289, 0.0037163496017456055, 0.003924846649169922, 0.004133343696594238, 0.004341840744018555, 0.004550337791442871, 0.0047588348388671875, 0.004967331886291504, 0.00517582893371582, 0.005384325981140137, 0.005592823028564453, 0.0058013200759887695, 0.006009817123413086, 0.006218314170837402, 0.006426811218261719, 0.006635308265686035, 0.0068438053131103516, 0.007052302360534668, 0.007260799407958984, 0.007469296455383301, 0.007677793502807617, 0.007886290550231934, 0.00809478759765625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 11.0, 9.0, 12.0, 26.0, 39.0, 61.0, 95.0, 129.0, 210.0, 317.0, 489.0, 815.0, 1336.0, 2238.0, 3819.0, 7210.0, 14145.0, 29843.0, 72721.0, 300976.0, 463580.0, 83654.0, 33265.0, 15344.0, 7681.0, 4175.0, 2400.0, 1528.0, 878.0, 568.0, 325.0, 186.0, 139.0, 89.0, 61.0, 53.0, 29.0, 23.0, 20.0, 17.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0], "bins": [-0.03375244140625, -0.03286576271057129, -0.03197908401489258, -0.031092405319213867, -0.030205726623535156, -0.029319047927856445, -0.028432369232177734, -0.027545690536499023, -0.026659011840820312, -0.0257723331451416, -0.02488565444946289, -0.02399897575378418, -0.02311229705810547, -0.022225618362426758, -0.021338939666748047, -0.020452260971069336, -0.019565582275390625, -0.018678903579711914, -0.017792224884033203, -0.016905546188354492, -0.01601886749267578, -0.01513218879699707, -0.01424551010131836, -0.013358831405639648, -0.012472152709960938, -0.011585474014282227, -0.010698795318603516, -0.009812116622924805, -0.008925437927246094, -0.008038759231567383, -0.007152080535888672, -0.006265401840209961, -0.00537872314453125, -0.004492044448852539, -0.003605365753173828, -0.002718687057495117, -0.0018320083618164062, -0.0009453296661376953, -5.8650970458984375e-05, 0.0008280277252197266, 0.0017147064208984375, 0.0026013851165771484, 0.0034880638122558594, 0.00437474250793457, 0.005261421203613281, 0.006148099899291992, 0.007034778594970703, 0.007921457290649414, 0.008808135986328125, 0.009694814682006836, 0.010581493377685547, 0.011468172073364258, 0.012354850769042969, 0.01324152946472168, 0.01412820816040039, 0.015014886856079102, 0.015901565551757812, 0.016788244247436523, 0.017674922943115234, 0.018561601638793945, 0.019448280334472656, 0.020334959030151367, 0.021221637725830078, 0.02210831642150879, 0.0229949951171875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 6.0, 5.0, 6.0, 16.0, 12.0, 17.0, 17.0, 26.0, 25.0, 47.0, 61.0, 108.0, 202.0, 221.0, 102.0, 43.0, 33.0, 23.0, 13.0, 8.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.025583025068044662, -0.025102611631155014, -0.024622198194265366, -0.024141782894730568, -0.02366136945784092, -0.02318095602095127, -0.022700542584061623, -0.022220127284526825, -0.021739713847637177, -0.021259300410747528, -0.02077888697385788, -0.020298471674323082, -0.019818058237433434, -0.019337644800543785, -0.018857231363654137, -0.01837681606411934, -0.01789640262722969, -0.017415989190340042, -0.016935575753450394, -0.016455160453915596, -0.015974747017025948, -0.0154943335801363, -0.01501392014324665, -0.014533505775034428, -0.014053093269467354, -0.013572679832577705, -0.013092265464365482, -0.012611852027475834, -0.01213143765926361, -0.011651024222373962, -0.011170610785484314, -0.010690196417272091, -0.010209782049059868, -0.00972936861217022, -0.009248954243957996, -0.008768540807068348, -0.008288126438856125, -0.0078077130019664764, -0.007327299099415541, -0.006846885196864605, -0.0063664717599749565, -0.005886057857424021, -0.005405643954873085, -0.004925230517983437, -0.0044448161497712135, -0.003964402712881565, -0.0034839888103306293, -0.0030035749077796936, -0.002523161005228758, -0.002042747102677822, -0.0015623333165422082, -0.0010819195304065943, -0.0006015056278556585, -0.00012109172530472279, 0.0003593219444155693, 0.000839735846966505, 0.0013201497495174408, 0.0018005636520683765, 0.0022809775546193123, 0.0027613912243396044, 0.00324180512689054, 0.003722219029441476, 0.004202632699161768, 0.004683046601712704, 0.0051634605042636395]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 14.0, 9.0, 9.0, 11.0, 13.0, 14.0, 13.0, 19.0, 21.0, 18.0, 26.0, 28.0, 28.0, 41.0, 41.0, 31.0, 42.0, 31.0, 40.0, 51.0, 38.0, 47.0, 44.0, 43.0, 40.0, 39.0, 37.0, 24.0, 28.0, 19.0, 35.0, 17.0, 12.0, 19.0, 13.0, 7.0, 6.0, 3.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.005986213684082031, -0.005795221775770187, -0.0056042298674583435, -0.0054132379591465, -0.005222246050834656, -0.005031254142522812, -0.004840262234210968, -0.004649270325899124, -0.00445827841758728, -0.004267286509275436, -0.0040762946009635925, -0.0038853026926517487, -0.003694310784339905, -0.003503318876028061, -0.003312326967716217, -0.003121335059404373, -0.0029303431510925293, -0.0027393512427806854, -0.0025483593344688416, -0.0023573674261569977, -0.002166375517845154, -0.00197538360953331, -0.001784391701221466, -0.0015933997929096222, -0.0014024078845977783, -0.0012114159762859344, -0.0010204240679740906, -0.0008294321596622467, -0.0006384402513504028, -0.00044744834303855896, -0.0002564564347267151, -6.546452641487122e-05, 0.00012552738189697266, 0.00031651929020881653, 0.0005075111985206604, 0.0006985031068325043, 0.0008894950151443481, 0.001080486923456192, 0.0012714788317680359, 0.0014624707400798798, 0.0016534626483917236, 0.0018444545567035675, 0.0020354464650154114, 0.0022264383733272552, 0.002417430281639099, 0.002608422189950943, 0.002799414098262787, 0.0029904060065746307, 0.0031813979148864746, 0.0033723898231983185, 0.0035633817315101624, 0.0037543736398220062, 0.00394536554813385, 0.004136357456445694, 0.004327349364757538, 0.004518341273069382, 0.004709333181381226, 0.0049003250896930695, 0.005091316998004913, 0.005282308906316757, 0.005473300814628601, 0.005664292722940445, 0.005855284631252289, 0.006046276539564133, 0.0062372684478759766]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 5.0, 8.0, 14.0, 16.0, 12.0, 16.0, 18.0, 23.0, 16.0, 27.0, 36.0, 32.0, 31.0, 46.0, 37.0, 44.0, 52.0, 38.0, 55.0, 37.0, 47.0, 43.0, 46.0, 45.0, 33.0, 30.0, 33.0, 24.0, 20.0, 20.0, 11.0, 23.0, 9.0, 15.0, 9.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1396.0, -1347.921875, -1299.84375, -1251.765625, -1203.6875, -1155.609375, -1107.53125, -1059.453125, -1011.375, -963.296875, -915.21875, -867.140625, -819.0625, -770.984375, -722.90625, -674.828125, -626.75, -578.671875, -530.59375, -482.515625, -434.4375, -386.359375, -338.28125, -290.203125, -242.125, -194.046875, -145.96875, -97.890625, -49.8125, -1.734375, 46.34375, 94.421875, 142.5, 190.578125, 238.65625, 286.734375, 334.8125, 382.890625, 430.96875, 479.046875, 527.125, 575.203125, 623.28125, 671.359375, 719.4375, 767.515625, 815.59375, 863.671875, 911.75, 959.828125, 1007.90625, 1055.984375, 1104.0625, 1152.140625, 1200.21875, 1248.296875, 1296.375, 1344.453125, 1392.53125, 1440.609375, 1488.6875, 1536.765625, 1584.84375, 1632.921875, 1681.0]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 8.0, 5.0, 8.0, 13.0, 20.0, 24.0, 32.0, 42.0, 45.0, 88.0, 123.0, 163.0, 274.0, 465.0, 828.0, 1656.0, 3468.0, 8176.0, 21839.0, 70155.0, 336815.0, 465742.0, 92891.0, 27262.0, 10084.0, 4064.0, 1865.0, 976.0, 506.0, 328.0, 185.0, 133.0, 84.0, 47.0, 43.0, 28.0, 22.0, 12.0, 10.0, 7.0, 8.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-222.25, -214.61328125, -206.9765625, -199.33984375, -191.703125, -184.06640625, -176.4296875, -168.79296875, -161.15625, -153.51953125, -145.8828125, -138.24609375, -130.609375, -122.97265625, -115.3359375, -107.69921875, -100.0625, -92.42578125, -84.7890625, -77.15234375, -69.515625, -61.87890625, -54.2421875, -46.60546875, -38.96875, -31.33203125, -23.6953125, -16.05859375, -8.421875, -0.78515625, 6.8515625, 14.48828125, 22.125, 29.76171875, 37.3984375, 45.03515625, 52.671875, 60.30859375, 67.9453125, 75.58203125, 83.21875, 90.85546875, 98.4921875, 106.12890625, 113.765625, 121.40234375, 129.0390625, 136.67578125, 144.3125, 151.94921875, 159.5859375, 167.22265625, 174.859375, 182.49609375, 190.1328125, 197.76953125, 205.40625, 213.04296875, 220.6796875, 228.31640625, 235.953125, 243.58984375, 251.2265625, 258.86328125, 266.5]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 9.0, 6.0, 36.0, 20.0, 36.0, 48.0, 55.0, 49.0, 84.0, 81.0, 2096.0, 102.0, 72.0, 68.0, 68.0, 56.0, 45.0, 35.0, 18.0, 18.0, 18.0, 15.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3062.0, -2968.40625, -2874.8125, -2781.21875, -2687.625, -2594.03125, -2500.4375, -2406.84375, -2313.25, -2219.65625, -2126.0625, -2032.46875, -1938.875, -1845.28125, -1751.6875, -1658.09375, -1564.5, -1470.90625, -1377.3125, -1283.71875, -1190.125, -1096.53125, -1002.9375, -909.34375, -815.75, -722.15625, -628.5625, -534.96875, -441.375, -347.78125, -254.1875, -160.59375, -67.0, 26.59375, 120.1875, 213.78125, 307.375, 400.96875, 494.5625, 588.15625, 681.75, 775.34375, 868.9375, 962.53125, 1056.125, 1149.71875, 1243.3125, 1336.90625, 1430.5, 1524.09375, 1617.6875, 1711.28125, 1804.875, 1898.46875, 1992.0625, 2085.65625, 2179.25, 2272.84375, 2366.4375, 2460.03125, 2553.625, 2647.21875, 2740.8125, 2834.40625, 2928.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 7.0, 8.0, 13.0, 26.0, 33.0, 40.0, 63.0, 90.0, 139.0, 219.0, 337.0, 683.0, 1282.0, 3822.0, 19973.0, 241562.0, 2816872.0, 49588.0, 6943.0, 1990.0, 824.0, 482.0, 263.0, 137.0, 95.0, 74.0, 33.0, 23.0, 32.0, 14.0, 14.0, 2.0, 5.0, 7.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-391.75, -379.953125, -368.15625, -356.359375, -344.5625, -332.765625, -320.96875, -309.171875, -297.375, -285.578125, -273.78125, -261.984375, -250.1875, -238.390625, -226.59375, -214.796875, -203.0, -191.203125, -179.40625, -167.609375, -155.8125, -144.015625, -132.21875, -120.421875, -108.625, -96.828125, -85.03125, -73.234375, -61.4375, -49.640625, -37.84375, -26.046875, -14.25, -2.453125, 9.34375, 21.140625, 32.9375, 44.734375, 56.53125, 68.328125, 80.125, 91.921875, 103.71875, 115.515625, 127.3125, 139.109375, 150.90625, 162.703125, 174.5, 186.296875, 198.09375, 209.890625, 221.6875, 233.484375, 245.28125, 257.078125, 268.875, 280.671875, 292.46875, 304.265625, 316.0625, 327.859375, 339.65625, 351.453125, 363.25]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 9.0, 4.0, 20.0, 30.0, 50.0, 89.0, 201.0, 302.0, 183.0, 61.0, 26.0, 9.0, 9.0, 5.0, 8.0, 1.0, 2.0, 1.0], "bins": [-9103.0927734375, -8932.533203125, -8761.974609375, -8591.4150390625, -8420.85546875, -8250.2958984375, -8079.73681640625, -7909.177734375, -7738.6181640625, -7568.05859375, -7397.49951171875, -7226.9404296875, -7056.380859375, -6885.8212890625, -6715.26220703125, -6544.703125, -6374.1435546875, -6203.583984375, -6033.02490234375, -5862.4658203125, -5691.90625, -5521.3466796875, -5350.78759765625, -5180.228515625, -5009.6689453125, -4839.109375, -4668.55029296875, -4497.9912109375, -4327.431640625, -4156.8720703125, -3986.31298828125, -3815.753662109375, -3645.19482421875, -3474.635498046875, -3304.076171875, -3133.516845703125, -2962.95751953125, -2792.398193359375, -2621.8388671875, -2451.279541015625, -2280.72021484375, -2110.160888671875, -1939.6015625, -1769.042236328125, -1598.48291015625, -1427.923583984375, -1257.3642578125, -1086.804931640625, -916.2454833984375, -745.6861572265625, -575.1268310546875, -404.5675048828125, -234.0081787109375, -63.4488525390625, 107.1104736328125, 277.6697998046875, 448.2291259765625, 618.7884521484375, 789.3477783203125, 959.9071044921875, 1130.4664306640625, 1301.0257568359375, 1471.5850830078125, 1642.1444091796875, 1812.7037353515625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 5.0, 6.0, 12.0, 10.0, 10.0, 18.0, 17.0, 11.0, 24.0, 24.0, 27.0, 45.0, 47.0, 38.0, 33.0, 40.0, 45.0, 43.0, 50.0, 45.0, 38.0, 47.0, 57.0, 45.0, 43.0, 39.0, 32.0, 21.0, 23.0, 16.0, 17.0, 18.0, 15.0, 16.0, 12.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3429.6953125, -3339.20166015625, -3248.707763671875, -3158.2138671875, -3067.72021484375, -2977.2265625, -2886.732666015625, -2796.23876953125, -2705.7451171875, -2615.25146484375, -2524.757568359375, -2434.263671875, -2343.77001953125, -2253.2763671875, -2162.782470703125, -2072.28857421875, -1981.794921875, -1891.3011474609375, -1800.807373046875, -1710.3135986328125, -1619.81982421875, -1529.3260498046875, -1438.832275390625, -1348.3385009765625, -1257.8447265625, -1167.3509521484375, -1076.857177734375, -986.3634033203125, -895.86962890625, -805.3758544921875, -714.882080078125, -624.3883056640625, -533.89453125, -443.4007568359375, -352.906982421875, -262.4132080078125, -171.91943359375, -81.4256591796875, 9.068115234375, 99.5618896484375, 190.0556640625, 280.5494384765625, 371.043212890625, 461.5369873046875, 552.03076171875, 642.5245361328125, 733.018310546875, 823.5120849609375, 914.005859375, 1004.4996337890625, 1094.993408203125, 1185.4871826171875, 1275.98095703125, 1366.4747314453125, 1456.968505859375, 1547.4622802734375, 1637.9560546875, 1728.4498291015625, 1818.943603515625, 1909.4373779296875, 1999.93115234375, 2090.4248046875, 2180.918701171875, 2271.41259765625, 2361.90625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 9.0, 13.0, 10.0, 20.0, 18.0, 14.0, 16.0, 32.0, 52.0, 43.0, 44.0, 107.0, 199.0, 339.0, 545.0, 950.0, 1044146.0, 707.0, 510.0, 271.0, 140.0, 95.0, 60.0, 39.0, 40.0, 25.0, 24.0, 19.0, 12.0, 10.0, 7.0, 9.0, 8.0, 5.0, 0.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1432.5977783203125, -1383.76611328125, -1334.9344482421875, -1286.102783203125, -1237.2711181640625, -1188.439453125, -1139.60791015625, -1090.776123046875, -1041.944580078125, -993.1129150390625, -944.28125, -895.4495849609375, -846.617919921875, -797.7862548828125, -748.9546508789062, -700.1229858398438, -651.291259765625, -602.4595947265625, -553.6279296875, -504.7962951660156, -455.9646301269531, -407.1329650878906, -358.30133056640625, -309.46966552734375, -260.63800048828125, -211.80633544921875, -162.9746856689453, -114.14303588867188, -65.31137084960938, -16.479705810546875, 32.3519287109375, 81.18359375, 130.015380859375, 178.8470458984375, 227.67869567871094, 276.5103454589844, 325.3420104980469, 374.1736755371094, 423.00531005859375, 471.83697509765625, 520.6686401367188, 569.5003051757812, 618.3319702148438, 667.16357421875, 715.9952392578125, 764.826904296875, 813.6585693359375, 862.490234375, 911.3218994140625, 960.153564453125, 1008.9852294921875, 1057.81689453125, 1106.6485595703125, 1155.480224609375, 1204.311767578125, 1253.1435546875, 1301.97509765625, 1350.8067626953125, 1399.638427734375, 1448.4700927734375, 1497.3017578125, 1546.1334228515625, 1594.965087890625, 1643.796630859375, 1692.62841796875]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 13.0, 8.0, 21.0, 36.0, 47.0, 54.0, 98.0, 139.0, 377.0, 1467.0, 51457376.0, 2561.0, 468.0, 176.0, 94.0, 64.0, 40.0, 30.0, 22.0, 8.0, 15.0, 6.0, 10.0, 8.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3951.513916015625, -3849.203857421875, -3746.89404296875, -3644.583984375, -3542.27392578125, -3439.9638671875, -3337.65380859375, -3235.343994140625, -3133.033935546875, -3030.723876953125, -2928.4140625, -2826.10400390625, -2723.7939453125, -2621.48388671875, -2519.173828125, -2416.864013671875, -2314.553955078125, -2212.243896484375, -2109.93408203125, -2007.6240234375, -1905.31396484375, -1803.00390625, -1700.6939697265625, -1598.384033203125, -1496.073974609375, -1393.763916015625, -1291.4539794921875, -1189.14404296875, -1086.833984375, -984.5239868164062, -882.2139892578125, -779.9039916992188, -677.59375, -575.2837524414062, -472.9737548828125, -370.66375732421875, -268.353759765625, -166.04376220703125, -63.7337646484375, 38.57623291015625, 140.88623046875, 243.19622802734375, 345.5062255859375, 447.81622314453125, 550.126220703125, 652.4362182617188, 754.7462158203125, 857.0562133789062, 959.3662109375, 1061.67626953125, 1163.9862060546875, 1266.296142578125, 1368.606201171875, 1470.916259765625, 1573.2261962890625, 1675.5361328125, 1777.84619140625, 1880.15625, 1982.4661865234375, 2084.776123046875, 2187.086181640625, 2289.396240234375, 2391.7060546875, 2494.01611328125, 2596.326171875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 5.0, 5.0, 4.0, 11.0, 19.0, 35.0, 60.0, 62.0, 108.0, 170.0, 237.0, 349.0, 499.0, 763.0, 1140.0, 1665.0, 2487.0, 3814.0, 5758.0, 8176.0, 12453.0, 18950.0, 28759.0, 44160.0, 68936.0, 108437.0, 181774.0, 347086.0, 4070095.0, 669297.0, 286061.0, 158396.0, 94800.0, 60131.0, 39252.0, 25806.0, 17385.0, 11588.0, 7515.0, 5053.0, 3281.0, 2232.0, 1506.0, 1004.0, 729.0, 470.0, 305.0, 184.0, 148.0, 100.0, 71.0, 36.0, 24.0, 21.0, 19.0, 7.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-12.890625, -12.486083984375, -12.08154296875, -11.677001953125, -11.2724609375, -10.867919921875, -10.46337890625, -10.058837890625, -9.654296875, -9.249755859375, -8.84521484375, -8.440673828125, -8.0361328125, -7.631591796875, -7.22705078125, -6.822509765625, -6.41796875, -6.013427734375, -5.60888671875, -5.204345703125, -4.7998046875, -4.395263671875, -3.99072265625, -3.586181640625, -3.181640625, -2.777099609375, -2.37255859375, -1.968017578125, -1.5634765625, -1.158935546875, -0.75439453125, -0.349853515625, 0.0546875, 0.459228515625, 0.86376953125, 1.268310546875, 1.6728515625, 2.077392578125, 2.48193359375, 2.886474609375, 3.291015625, 3.695556640625, 4.10009765625, 4.504638671875, 4.9091796875, 5.313720703125, 5.71826171875, 6.122802734375, 6.52734375, 6.931884765625, 7.33642578125, 7.740966796875, 8.1455078125, 8.550048828125, 8.95458984375, 9.359130859375, 9.763671875, 10.168212890625, 10.57275390625, 10.977294921875, 11.3818359375, 11.786376953125, 12.19091796875, 12.595458984375, 13.0]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 2.0, 1.0, 6.0, 6.0, 9.0, 9.0, 5.0, 14.0, 17.0, 22.0, 20.0, 12.0, 20.0, 28.0, 23.0, 20.0, 25.0, 28.0, 35.0, 38.0, 43.0, 39.0, 37.0, 100.0, 1001.0, 43.0, 34.0, 44.0, 31.0, 35.0, 29.0, 25.0, 33.0, 26.0, 21.0, 26.0, 20.0, 16.0, 11.0, 10.0, 10.0, 11.0, 3.0, 8.0, 11.0, 5.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-312.5, -302.7734375, -293.046875, -283.3203125, -273.59375, -263.8671875, -254.140625, -244.4140625, -234.6875, -224.9609375, -215.234375, -205.5078125, -195.78125, -186.0546875, -176.328125, -166.6015625, -156.875, -147.1484375, -137.421875, -127.6953125, -117.96875, -108.2421875, -98.515625, -88.7890625, -79.0625, -69.3359375, -59.609375, -49.8828125, -40.15625, -30.4296875, -20.703125, -10.9765625, -1.25, 8.4765625, 18.203125, 27.9296875, 37.65625, 47.3828125, 57.109375, 66.8359375, 76.5625, 86.2890625, 96.015625, 105.7421875, 115.46875, 125.1953125, 134.921875, 144.6484375, 154.375, 164.1015625, 173.828125, 183.5546875, 193.28125, 203.0078125, 212.734375, 222.4609375, 232.1875, 241.9140625, 251.640625, 261.3671875, 271.09375, 280.8203125, 290.546875, 300.2734375, 310.0]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 3.0, 5.0, 12.0, 12.0, 13.0, 20.0, 33.0, 46.0, 54.0, 81.0, 109.0, 162.0, 226.0, 290.0, 454.0, 706.0, 1041.0, 1602.0, 2572.0, 4056.0, 6915.0, 12870.0, 25712.0, 60955.0, 189637.0, 4716862.0, 1000804.0, 159848.0, 54009.0, 23405.0, 11696.0, 6351.0, 3960.0, 2316.0, 1468.0, 993.0, 682.0, 440.0, 295.0, 219.0, 167.0, 106.0, 60.0, 62.0, 26.0, 26.0, 19.0, 11.0, 10.0, 6.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-26.265625, -25.38818359375, -24.5107421875, -23.63330078125, -22.755859375, -21.87841796875, -21.0009765625, -20.12353515625, -19.24609375, -18.36865234375, -17.4912109375, -16.61376953125, -15.736328125, -14.85888671875, -13.9814453125, -13.10400390625, -12.2265625, -11.34912109375, -10.4716796875, -9.59423828125, -8.716796875, -7.83935546875, -6.9619140625, -6.08447265625, -5.20703125, -4.32958984375, -3.4521484375, -2.57470703125, -1.697265625, -0.81982421875, 0.0576171875, 0.93505859375, 1.8125, 2.68994140625, 3.5673828125, 4.44482421875, 5.322265625, 6.19970703125, 7.0771484375, 7.95458984375, 8.83203125, 9.70947265625, 10.5869140625, 11.46435546875, 12.341796875, 13.21923828125, 14.0966796875, 14.97412109375, 15.8515625, 16.72900390625, 17.6064453125, 18.48388671875, 19.361328125, 20.23876953125, 21.1162109375, 21.99365234375, 22.87109375, 23.74853515625, 24.6259765625, 25.50341796875, 26.380859375, 27.25830078125, 28.1357421875, 29.01318359375, 29.890625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 10.0, 7.0, 10.0, 13.0, 11.0, 14.0, 20.0, 26.0, 25.0, 32.0, 32.0, 42.0, 34.0, 32.0, 51.0, 41.0, 41.0, 349.0, 766.0, 47.0, 39.0, 42.0, 51.0, 37.0, 34.0, 40.0, 28.0, 29.0, 19.0, 25.0, 11.0, 15.0, 11.0, 8.0, 8.0, 8.0, 7.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-376.5, -365.4296875, -354.359375, -343.2890625, -332.21875, -321.1484375, -310.078125, -299.0078125, -287.9375, -276.8671875, -265.796875, -254.7265625, -243.65625, -232.5859375, -221.515625, -210.4453125, -199.375, -188.3046875, -177.234375, -166.1640625, -155.09375, -144.0234375, -132.953125, -121.8828125, -110.8125, -99.7421875, -88.671875, -77.6015625, -66.53125, -55.4609375, -44.390625, -33.3203125, -22.25, -11.1796875, -0.109375, 10.9609375, 22.03125, 33.1015625, 44.171875, 55.2421875, 66.3125, 77.3828125, 88.453125, 99.5234375, 110.59375, 121.6640625, 132.734375, 143.8046875, 154.875, 165.9453125, 177.015625, 188.0859375, 199.15625, 210.2265625, 221.296875, 232.3671875, 243.4375, 254.5078125, 265.578125, 276.6484375, 287.71875, 298.7890625, 309.859375, 320.9296875, 332.0]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 7.0, 2.0, 16.0, 16.0, 13.0, 27.0, 39.0, 28.0, 49.0, 107.0, 129.0, 210.0, 285.0, 524.0, 771.0, 1559.0, 3212.0, 8410.0, 33381.0, 6034746.0, 177264.0, 19344.0, 5804.0, 2511.0, 1147.0, 676.0, 421.0, 217.0, 144.0, 104.0, 78.0, 39.0, 35.0, 40.0, 24.0, 11.0, 11.0, 11.0, 3.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-220.5, -213.783203125, -207.06640625, -200.349609375, -193.6328125, -186.916015625, -180.19921875, -173.482421875, -166.765625, -160.048828125, -153.33203125, -146.615234375, -139.8984375, -133.181640625, -126.46484375, -119.748046875, -113.03125, -106.314453125, -99.59765625, -92.880859375, -86.1640625, -79.447265625, -72.73046875, -66.013671875, -59.296875, -52.580078125, -45.86328125, -39.146484375, -32.4296875, -25.712890625, -18.99609375, -12.279296875, -5.5625, 1.154296875, 7.87109375, 14.587890625, 21.3046875, 28.021484375, 34.73828125, 41.455078125, 48.171875, 54.888671875, 61.60546875, 68.322265625, 75.0390625, 81.755859375, 88.47265625, 95.189453125, 101.90625, 108.623046875, 115.33984375, 122.056640625, 128.7734375, 135.490234375, 142.20703125, 148.923828125, 155.640625, 162.357421875, 169.07421875, 175.791015625, 182.5078125, 189.224609375, 195.94140625, 202.658203125, 209.375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 3.0, 6.0, 6.0, 7.0, 17.0, 22.0, 22.0, 27.0, 38.0, 53.0, 68.0, 97.0, 133.0, 877.0, 231.0, 98.0, 83.0, 53.0, 46.0, 36.0, 18.0, 19.0, 15.0, 12.0, 6.0, 6.0, 5.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-93.8125, -91.5458984375, -89.279296875, -87.0126953125, -84.74609375, -82.4794921875, -80.212890625, -77.9462890625, -75.6796875, -73.4130859375, -71.146484375, -68.8798828125, -66.61328125, -64.3466796875, -62.080078125, -59.8134765625, -57.546875, -55.2802734375, -53.013671875, -50.7470703125, -48.48046875, -46.2138671875, -43.947265625, -41.6806640625, -39.4140625, -37.1474609375, -34.880859375, -32.6142578125, -30.34765625, -28.0810546875, -25.814453125, -23.5478515625, -21.28125, -19.0146484375, -16.748046875, -14.4814453125, -12.21484375, -9.9482421875, -7.681640625, -5.4150390625, -3.1484375, -0.8818359375, 1.384765625, 3.6513671875, 5.91796875, 8.1845703125, 10.451171875, 12.7177734375, 14.984375, 17.2509765625, 19.517578125, 21.7841796875, 24.05078125, 26.3173828125, 28.583984375, 30.8505859375, 33.1171875, 35.3837890625, 37.650390625, 39.9169921875, 42.18359375, 44.4501953125, 46.716796875, 48.9833984375, 51.25]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 7.0, 2.0, 9.0, 8.0, 15.0, 15.0, 28.0, 55.0, 104.0, 360.0, 239.0, 64.0, 35.0, 19.0, 13.0, 8.0, 8.0, 6.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-679.916748046875, -663.2799072265625, -646.6430053710938, -630.0061645507812, -613.3692626953125, -596.732421875, -580.0955810546875, -563.4586791992188, -546.8218383789062, -530.1849975585938, -513.548095703125, -496.9112548828125, -480.2743835449219, -463.63751220703125, -447.0006408691406, -430.36376953125, -413.7268981933594, -397.09002685546875, -380.4531555175781, -363.8162841796875, -347.179443359375, -330.5425720214844, -313.90570068359375, -297.2688293457031, -280.6319580078125, -263.9950866699219, -247.3582305908203, -230.7213592529297, -214.08450317382812, -197.4476318359375, -180.81076049804688, -164.17388916015625, -147.53701782226562, -130.900146484375, -114.26329040527344, -97.62641906738281, -80.98955535888672, -64.35269165039062, -47.7158203125, -31.078956604003906, -14.442092895507812, 2.194772720336914, 18.83163833618164, 35.468505859375, 52.105369567871094, 68.74223327636719, 85.37910461425781, 102.0159683227539, 118.65283203125, 135.28970336914062, 151.9265594482422, 168.5634307861328, 185.20028686523438, 201.837158203125, 218.47402954101562, 235.11090087890625, 251.7477569580078, 268.3846130371094, 285.021484375, 301.6583557128906, 318.29522705078125, 334.93206787109375, 351.5689697265625, 368.205810546875, 384.8426818847656]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 4.0, 7.0, 6.0, 10.0, 4.0, 20.0, 16.0, 46.0, 98.0, 214.0, 238.0, 153.0, 51.0, 34.0, 21.0, 10.0, 16.0, 11.0, 9.0, 2.0, 2.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-748.8748168945312, -727.6260375976562, -706.3772583007812, -685.1284790039062, -663.8796997070312, -642.6309814453125, -621.3822021484375, -600.1334228515625, -578.8846435546875, -557.6358642578125, -536.3870849609375, -515.1383056640625, -493.8895568847656, -472.6407775878906, -451.3919982910156, -430.14324951171875, -408.8944396972656, -387.6456604003906, -366.3968811035156, -345.14813232421875, -323.89935302734375, -302.65057373046875, -281.40179443359375, -260.15301513671875, -238.9042510986328, -217.6554718017578, -196.40670776367188, -175.15792846679688, -153.90914916992188, -132.66038513183594, -111.41160583496094, -90.162841796875, -68.9140625, -47.66529083251953, -26.416515350341797, -5.1677398681640625, 16.081031799316406, 37.329803466796875, 58.578582763671875, 79.82734680175781, 101.07612609863281, 122.32489776611328, 143.57366943359375, 164.82244873046875, 186.07122802734375, 207.3199920654297, 228.5687713623047, 249.81753540039062, 271.0663146972656, 292.3150939941406, 313.5638732910156, 334.8126220703125, 356.0614013671875, 377.3101806640625, 398.5589599609375, 419.8077392578125, 441.0565185546875, 462.3052978515625, 483.5540771484375, 504.8028564453125, 526.0516357421875, 547.3004150390625, 568.5491943359375, 589.7979125976562, 611.0466918945312]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 8.0, 13.0, 18.0, 8.0, 18.0, 19.0, 42.0, 53.0, 65.0, 83.0, 126.0, 170.0, 238.0, 369.0, 553.0, 850.0, 1329.0, 2140.0, 3940.0, 8095.0, 24864.0, 4026051.0, 98095.0, 13004.0, 5812.0, 3111.0, 1841.0, 1069.0, 717.0, 458.0, 314.0, 228.0, 143.0, 105.0, 88.0, 48.0, 41.0, 33.0, 34.0, 21.0, 11.0, 9.0, 6.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.1392822265625, -0.13475608825683594, -0.13022994995117188, -0.1257038116455078, -0.12117767333984375, -0.11665153503417969, -0.11212539672851562, -0.10759925842285156, -0.1030731201171875, -0.09854698181152344, -0.09402084350585938, -0.08949470520019531, -0.08496856689453125, -0.08044242858886719, -0.07591629028320312, -0.07139015197753906, -0.066864013671875, -0.06233787536621094, -0.057811737060546875, -0.05328559875488281, -0.04875946044921875, -0.04423332214355469, -0.039707183837890625, -0.03518104553222656, -0.0306549072265625, -0.026128768920898438, -0.021602630615234375, -0.017076492309570312, -0.01255035400390625, -0.008024215698242188, -0.003498077392578125, 0.0010280609130859375, 0.00555419921875, 0.010080337524414062, 0.014606475830078125, 0.019132614135742188, 0.02365875244140625, 0.028184890747070312, 0.032711029052734375, 0.03723716735839844, 0.0417633056640625, 0.04628944396972656, 0.050815582275390625, 0.05534172058105469, 0.05986785888671875, 0.06439399719238281, 0.06892013549804688, 0.07344627380371094, 0.077972412109375, 0.08249855041503906, 0.08702468872070312, 0.09155082702636719, 0.09607696533203125, 0.10060310363769531, 0.10512924194335938, 0.10965538024902344, 0.1141815185546875, 0.11870765686035156, 0.12323379516601562, 0.1277599334716797, 0.13228607177734375, 0.1368122100830078, 0.14133834838867188, 0.14586448669433594, 0.150390625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 7.0, 3.0, 8.0, 10.0, 9.0, 12.0, 16.0, 59.0, 157.0, 257.0, 245.0, 101.0, 33.0, 15.0, 10.0, 5.0, 4.0, 3.0, 5.0, 8.0, 5.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0083770751953125, -0.008104920387268066, -0.007832765579223633, -0.007560610771179199, -0.007288455963134766, -0.007016301155090332, -0.0067441463470458984, -0.006471991539001465, -0.006199836730957031, -0.005927681922912598, -0.005655527114868164, -0.0053833723068237305, -0.005111217498779297, -0.004839062690734863, -0.00456690788269043, -0.004294753074645996, -0.0040225982666015625, -0.003750443458557129, -0.0034782886505126953, -0.0032061338424682617, -0.002933979034423828, -0.0026618242263793945, -0.002389669418334961, -0.0021175146102905273, -0.0018453598022460938, -0.0015732049942016602, -0.0013010501861572266, -0.001028895378112793, -0.0007567405700683594, -0.0004845857620239258, -0.0002124309539794922, 5.9723854064941406e-05, 0.000331878662109375, 0.0006040334701538086, 0.0008761882781982422, 0.0011483430862426758, 0.0014204978942871094, 0.001692652702331543, 0.0019648075103759766, 0.00223696231842041, 0.0025091171264648438, 0.0027812719345092773, 0.003053426742553711, 0.0033255815505981445, 0.003597736358642578, 0.0038698911666870117, 0.004142045974731445, 0.004414200782775879, 0.0046863555908203125, 0.004958510398864746, 0.00523066520690918, 0.005502820014953613, 0.005774974822998047, 0.0060471296310424805, 0.006319284439086914, 0.006591439247131348, 0.006863594055175781, 0.007135748863220215, 0.0074079036712646484, 0.007680058479309082, 0.007952213287353516, 0.00822436809539795, 0.008496522903442383, 0.008768677711486816, 0.00904083251953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 11.0, 4.0, 7.0, 16.0, 18.0, 27.0, 41.0, 78.0, 79.0, 108.0, 224.0, 288.0, 527.0, 961.0, 2241.0, 7147.0, 44810.0, 3932220.0, 179173.0, 18520.0, 4260.0, 1575.0, 836.0, 391.0, 229.0, 163.0, 107.0, 74.0, 44.0, 31.0, 21.0, 16.0, 11.0, 13.0, 9.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20361328125, -0.19739723205566406, -0.19118118286132812, -0.1849651336669922, -0.17874908447265625, -0.1725330352783203, -0.16631698608398438, -0.16010093688964844, -0.1538848876953125, -0.14766883850097656, -0.14145278930664062, -0.1352367401123047, -0.12902069091796875, -0.12280464172363281, -0.11658859252929688, -0.11037254333496094, -0.104156494140625, -0.09794044494628906, -0.09172439575195312, -0.08550834655761719, -0.07929229736328125, -0.07307624816894531, -0.06686019897460938, -0.06064414978027344, -0.0544281005859375, -0.04821205139160156, -0.041996002197265625, -0.03577995300292969, -0.02956390380859375, -0.023347854614257812, -0.017131805419921875, -0.010915756225585938, -0.00469970703125, 0.0015163421630859375, 0.007732391357421875, 0.013948440551757812, 0.02016448974609375, 0.026380538940429688, 0.032596588134765625, 0.03881263732910156, 0.0450286865234375, 0.05124473571777344, 0.057460784912109375, 0.06367683410644531, 0.06989288330078125, 0.07610893249511719, 0.08232498168945312, 0.08854103088378906, 0.094757080078125, 0.10097312927246094, 0.10718917846679688, 0.11340522766113281, 0.11962127685546875, 0.1258373260498047, 0.13205337524414062, 0.13826942443847656, 0.1444854736328125, 0.15070152282714844, 0.15691757202148438, 0.1631336212158203, 0.16934967041015625, 0.1755657196044922, 0.18178176879882812, 0.18799781799316406, 0.1942138671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 11.0, 8.0, 5.0, 8.0, 11.0, 22.0, 20.0, 29.0, 29.0, 33.0, 50.0, 73.0, 374.0, 2797.0, 181.0, 67.0, 39.0, 47.0, 44.0, 33.0, 37.0, 36.0, 25.0, 22.0, 23.0, 8.0, 10.0, 12.0, 5.0, 10.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0246734619140625, -0.02397298812866211, -0.02327251434326172, -0.022572040557861328, -0.021871566772460938, -0.021171092987060547, -0.020470619201660156, -0.019770145416259766, -0.019069671630859375, -0.018369197845458984, -0.017668724060058594, -0.016968250274658203, -0.016267776489257812, -0.015567302703857422, -0.014866828918457031, -0.01416635513305664, -0.01346588134765625, -0.01276540756225586, -0.012064933776855469, -0.011364459991455078, -0.010663986206054688, -0.009963512420654297, -0.009263038635253906, -0.008562564849853516, -0.007862091064453125, -0.007161617279052734, -0.006461143493652344, -0.005760669708251953, -0.0050601959228515625, -0.004359722137451172, -0.0036592483520507812, -0.0029587745666503906, -0.00225830078125, -0.0015578269958496094, -0.0008573532104492188, -0.00015687942504882812, 0.0005435943603515625, 0.0012440681457519531, 0.0019445419311523438, 0.0026450157165527344, 0.003345489501953125, 0.004045963287353516, 0.004746437072753906, 0.005446910858154297, 0.0061473846435546875, 0.006847858428955078, 0.007548332214355469, 0.00824880599975586, 0.00894927978515625, 0.00964975357055664, 0.010350227355957031, 0.011050701141357422, 0.011751174926757812, 0.012451648712158203, 0.013152122497558594, 0.013852596282958984, 0.014553070068359375, 0.015253543853759766, 0.015954017639160156, 0.016654491424560547, 0.017354965209960938, 0.018055438995361328, 0.01875591278076172, 0.01945638656616211, 0.0201568603515625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 4.0, 10.0, 35.0, 431.0, 431.0, 77.0, 13.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20509663224220276, -0.17570139467716217, -0.14630615711212158, -0.11691092699766159, -0.087515689432621, -0.05812045931816101, -0.028725221753120422, 0.000670015811920166, 0.030065253376960754, 0.05946049094200134, 0.08885572850704193, 0.11825095862150192, 0.14764618873596191, 0.1770414263010025, 0.2064366638660431, 0.23583190143108368, 0.26522713899612427, 0.29462236166000366, 0.32401761412620544, 0.35341283679008484, 0.3828080892562866, 0.412203311920166, 0.4415985345840454, 0.4709937870502472, 0.500389039516449, 0.5297842621803284, 0.5591794848442078, 0.5885747671127319, 0.6179699897766113, 0.6473652124404907, 0.6767604351043701, 0.7061556577682495, 0.7355509400367737, 0.7649461627006531, 0.7943413853645325, 0.8237366676330566, 0.853131890296936, 0.8825271129608154, 0.9119223356246948, 0.9413175582885742, 0.9707128405570984, 1.0001081228256226, 1.029503345489502, 1.0588985681533813, 1.0882937908172607, 1.1176890134811401, 1.1470842361450195, 1.176479458808899, 1.2058746814727783, 1.2352699041366577, 1.264665126800537, 1.2940603494644165, 1.323455572128296, 1.3528509140014648, 1.3822461366653442, 1.4116413593292236, 1.441036581993103, 1.4704318046569824, 1.4998270273208618, 1.5292222499847412, 1.5586174726486206, 1.5880126953125, 1.617408037185669, 1.6468032598495483, 1.6761984825134277]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 8.0, 8.0, 10.0, 19.0, 32.0, 27.0, 42.0, 47.0, 59.0, 51.0, 63.0, 68.0, 94.0, 67.0, 62.0, 61.0, 63.0, 56.0, 37.0, 32.0, 24.0, 17.0, 12.0, 13.0, 7.0, 7.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.16973507404327393, -0.1655745804309845, -0.16141408681869507, -0.15725359320640564, -0.1530930995941162, -0.14893262088298798, -0.14477212727069855, -0.14061163365840912, -0.1364511400461197, -0.13229064643383026, -0.12813015282154083, -0.123969666659832, -0.11980917304754257, -0.11564867943525314, -0.11148819327354431, -0.10732769966125488, -0.10316720604896545, -0.09900671243667603, -0.0948462188243866, -0.09068573266267776, -0.08652523905038834, -0.08236474543809891, -0.07820425927639008, -0.07404376566410065, -0.06988327205181122, -0.06572277843952179, -0.06156228855252266, -0.05740179866552353, -0.0532413050532341, -0.04908081144094467, -0.04492032155394554, -0.04075983166694641, -0.03659933805465698, -0.032438844442367554, -0.028278354555368423, -0.024117862805724144, -0.019957371056079865, -0.015796879306435585, -0.011636387556791306, -0.007475895807147026, -0.0033154040575027466, 0.0008450876921415329, 0.005005579441785812, 0.009166071191430092, 0.013326562941074371, 0.01748705469071865, 0.02164754644036293, 0.02580803819000721, 0.02996852993965149, 0.03412902355194092, 0.03828951343894005, 0.04245000332593918, 0.04661049693822861, 0.050770990550518036, 0.054931480437517166, 0.059091970324516296, 0.06325246393680573, 0.06741295754909515, 0.07157345116138458, 0.07573393732309341, 0.07989443093538284, 0.08405492454767227, 0.0882154107093811, 0.09237590432167053, 0.09653639793395996]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 7.0, 10.0, 10.0, 19.0, 15.0, 25.0, 35.0, 44.0, 51.0, 75.0, 106.0, 127.0, 161.0, 227.0, 318.0, 436.0, 599.0, 871.0, 1180.0, 1673.0, 2580.0, 3955.0, 6539.0, 12930.0, 41748.0, 779580.0, 149733.0, 20865.0, 8953.0, 5196.0, 3218.0, 2112.0, 1513.0, 967.0, 688.0, 516.0, 377.0, 268.0, 195.0, 152.0, 106.0, 77.0, 79.0, 54.0, 35.0, 24.0, 28.0, 15.0, 15.0, 11.0, 10.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0], "bins": [-0.10260009765625, -0.09946823120117188, -0.09633636474609375, -0.09320449829101562, -0.0900726318359375, -0.08694076538085938, -0.08380889892578125, -0.08067703247070312, -0.077545166015625, -0.07441329956054688, -0.07128143310546875, -0.06814956665039062, -0.0650177001953125, -0.061885833740234375, -0.05875396728515625, -0.055622100830078125, -0.052490234375, -0.049358367919921875, -0.04622650146484375, -0.043094635009765625, -0.0399627685546875, -0.036830902099609375, -0.03369903564453125, -0.030567169189453125, -0.027435302734375, -0.024303436279296875, -0.02117156982421875, -0.018039703369140625, -0.0149078369140625, -0.011775970458984375, -0.00864410400390625, -0.005512237548828125, -0.00238037109375, 0.000751495361328125, 0.00388336181640625, 0.007015228271484375, 0.0101470947265625, 0.013278961181640625, 0.01641082763671875, 0.019542694091796875, 0.022674560546875, 0.025806427001953125, 0.02893829345703125, 0.032070159912109375, 0.0352020263671875, 0.038333892822265625, 0.04146575927734375, 0.044597625732421875, 0.0477294921875, 0.050861358642578125, 0.05399322509765625, 0.057125091552734375, 0.0602569580078125, 0.06338882446289062, 0.06652069091796875, 0.06965255737304688, 0.072784423828125, 0.07591629028320312, 0.07904815673828125, 0.08218002319335938, 0.0853118896484375, 0.08844375610351562, 0.09157562255859375, 0.09470748901367188, 0.09783935546875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 7.0, 3.0, 8.0, 10.0, 11.0, 10.0, 16.0, 64.0, 171.0, 263.0, 230.0, 100.0, 24.0, 16.0, 9.0, 5.0, 4.0, 5.0, 3.0, 9.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00836181640625, -0.008089661598205566, -0.007817506790161133, -0.007545351982116699, -0.007273197174072266, -0.007001042366027832, -0.0067288875579833984, -0.006456732749938965, -0.006184577941894531, -0.005912423133850098, -0.005640268325805664, -0.0053681135177612305, -0.005095958709716797, -0.004823803901672363, -0.00455164909362793, -0.004279494285583496, -0.0040073394775390625, -0.003735184669494629, -0.0034630298614501953, -0.0031908750534057617, -0.002918720245361328, -0.0026465654373168945, -0.002374410629272461, -0.0021022558212280273, -0.0018301010131835938, -0.0015579462051391602, -0.0012857913970947266, -0.001013636589050293, -0.0007414817810058594, -0.0004693269729614258, -0.0001971721649169922, 7.49826431274414e-05, 0.000347137451171875, 0.0006192922592163086, 0.0008914470672607422, 0.0011636018753051758, 0.0014357566833496094, 0.001707911491394043, 0.0019800662994384766, 0.00225222110748291, 0.0025243759155273438, 0.0027965307235717773, 0.003068685531616211, 0.0033408403396606445, 0.003612995147705078, 0.0038851499557495117, 0.004157304763793945, 0.004429459571838379, 0.0047016143798828125, 0.004973769187927246, 0.00524592399597168, 0.005518078804016113, 0.005790233612060547, 0.0060623884201049805, 0.006334543228149414, 0.006606698036193848, 0.006878852844238281, 0.007151007652282715, 0.0074231624603271484, 0.007695317268371582, 0.007967472076416016, 0.00823962688446045, 0.008511781692504883, 0.008783936500549316, 0.00905609130859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 6.0, 5.0, 12.0, 16.0, 12.0, 25.0, 57.0, 46.0, 89.0, 100.0, 159.0, 262.0, 348.0, 534.0, 936.0, 1518.0, 3229.0, 7652.0, 32971.0, 598535.0, 360095.0, 27901.0, 7175.0, 2882.0, 1521.0, 815.0, 562.0, 354.0, 220.0, 139.0, 116.0, 88.0, 55.0, 33.0, 29.0, 16.0, 13.0, 9.0, 5.0, 8.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.17919921875, -0.17421531677246094, -0.16923141479492188, -0.1642475128173828, -0.15926361083984375, -0.1542797088623047, -0.14929580688476562, -0.14431190490722656, -0.1393280029296875, -0.13434410095214844, -0.12936019897460938, -0.12437629699707031, -0.11939239501953125, -0.11440849304199219, -0.10942459106445312, -0.10444068908691406, -0.099456787109375, -0.09447288513183594, -0.08948898315429688, -0.08450508117675781, -0.07952117919921875, -0.07453727722167969, -0.06955337524414062, -0.06456947326660156, -0.0595855712890625, -0.05460166931152344, -0.049617767333984375, -0.04463386535644531, -0.03964996337890625, -0.03466606140136719, -0.029682159423828125, -0.024698257446289062, -0.01971435546875, -0.014730453491210938, -0.009746551513671875, -0.0047626495361328125, 0.00022125244140625, 0.0052051544189453125, 0.010189056396484375, 0.015172958374023438, 0.0201568603515625, 0.025140762329101562, 0.030124664306640625, 0.03510856628417969, 0.04009246826171875, 0.04507637023925781, 0.050060272216796875, 0.05504417419433594, 0.060028076171875, 0.06501197814941406, 0.06999588012695312, 0.07497978210449219, 0.07996368408203125, 0.08494758605957031, 0.08993148803710938, 0.09491539001464844, 0.0998992919921875, 0.10488319396972656, 0.10986709594726562, 0.11485099792480469, 0.11983489990234375, 0.12481880187988281, 0.12980270385742188, 0.13478660583496094, 0.1397705078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 4.0, 10.0, 11.0, 6.0, 9.0, 20.0, 9.0, 24.0, 27.0, 23.0, 28.0, 30.0, 23.0, 42.0, 30.0, 41.0, 46.0, 56.0, 52.0, 54.0, 42.0, 42.0, 36.0, 41.0, 38.0, 45.0, 30.0, 29.0, 26.0, 26.0, 19.0, 19.0, 15.0, 17.0, 3.0, 6.0, 7.0, 3.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0421142578125, -0.040943145751953125, -0.03977203369140625, -0.038600921630859375, -0.0374298095703125, -0.036258697509765625, -0.03508758544921875, -0.033916473388671875, -0.032745361328125, -0.031574249267578125, -0.03040313720703125, -0.029232025146484375, -0.0280609130859375, -0.026889801025390625, -0.02571868896484375, -0.024547576904296875, -0.02337646484375, -0.022205352783203125, -0.02103424072265625, -0.019863128662109375, -0.0186920166015625, -0.017520904541015625, -0.01634979248046875, -0.015178680419921875, -0.014007568359375, -0.012836456298828125, -0.01166534423828125, -0.010494232177734375, -0.0093231201171875, -0.008152008056640625, -0.00698089599609375, -0.005809783935546875, -0.004638671875, -0.003467559814453125, -0.00229644775390625, -0.001125335693359375, 4.57763671875e-05, 0.001216888427734375, 0.00238800048828125, 0.003559112548828125, 0.004730224609375, 0.005901336669921875, 0.00707244873046875, 0.008243560791015625, 0.0094146728515625, 0.010585784912109375, 0.01175689697265625, 0.012928009033203125, 0.01409912109375, 0.015270233154296875, 0.01644134521484375, 0.017612457275390625, 0.0187835693359375, 0.019954681396484375, 0.02112579345703125, 0.022296905517578125, 0.023468017578125, 0.024639129638671875, 0.02581024169921875, 0.026981353759765625, 0.0281524658203125, 0.029323577880859375, 0.03049468994140625, 0.031665802001953125, 0.0328369140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 10.0, 2.0, 3.0, 9.0, 17.0, 15.0, 21.0, 27.0, 26.0, 59.0, 71.0, 94.0, 171.0, 268.0, 507.0, 1067.0, 2957.0, 13419.0, 657751.0, 354995.0, 11931.0, 2885.0, 966.0, 498.0, 261.0, 159.0, 111.0, 68.0, 52.0, 29.0, 23.0, 26.0, 15.0, 7.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.975629806518555e-05, -3.868062049150467e-05, -3.760494291782379e-05, -3.6529265344142914e-05, -3.5453587770462036e-05, -3.437791019678116e-05, -3.330223262310028e-05, -3.22265550494194e-05, -3.1150877475738525e-05, -3.0075199902057648e-05, -2.899952232837677e-05, -2.7923844754695892e-05, -2.6848167181015015e-05, -2.5772489607334137e-05, -2.469681203365326e-05, -2.362113445997238e-05, -2.2545456886291504e-05, -2.1469779312610626e-05, -2.039410173892975e-05, -1.931842416524887e-05, -1.8242746591567993e-05, -1.7167069017887115e-05, -1.6091391444206238e-05, -1.501571387052536e-05, -1.3940036296844482e-05, -1.2864358723163605e-05, -1.1788681149482727e-05, -1.071300357580185e-05, -9.637326002120972e-06, -8.561648428440094e-06, -7.485970854759216e-06, -6.410293281078339e-06, -5.334615707397461e-06, -4.258938133716583e-06, -3.1832605600357056e-06, -2.107582986354828e-06, -1.0319054126739502e-06, 4.377216100692749e-08, 1.1194497346878052e-06, 2.195127308368683e-06, 3.2708048820495605e-06, 4.346482455730438e-06, 5.422160029411316e-06, 6.497837603092194e-06, 7.573515176773071e-06, 8.649192750453949e-06, 9.724870324134827e-06, 1.0800547897815704e-05, 1.1876225471496582e-05, 1.295190304517746e-05, 1.4027580618858337e-05, 1.5103258192539215e-05, 1.6178935766220093e-05, 1.725461333990097e-05, 1.8330290913581848e-05, 1.9405968487262726e-05, 2.0481646060943604e-05, 2.155732363462448e-05, 2.263300120830536e-05, 2.3708678781986237e-05, 2.4784356355667114e-05, 2.5860033929347992e-05, 2.693571150302887e-05, 2.8011389076709747e-05, 2.9087066650390625e-05]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 1.0, 2.0, 4.0, 9.0, 8.0, 9.0, 15.0, 14.0, 16.0, 54.0, 49.0, 74.0, 105.0, 160.0, 129.0, 104.0, 51.0, 43.0, 43.0, 25.0, 24.0, 11.0, 14.0, 10.0, 6.0, 2.0, 2.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.417533874511719e-06, -9.181909263134003e-06, -8.946284651756287e-06, -8.71066004037857e-06, -8.475035429000854e-06, -8.239410817623138e-06, -8.003786206245422e-06, -7.768161594867706e-06, -7.53253698348999e-06, -7.296912372112274e-06, -7.061287760734558e-06, -6.825663149356842e-06, -6.590038537979126e-06, -6.35441392660141e-06, -6.118789315223694e-06, -5.883164703845978e-06, -5.647540092468262e-06, -5.411915481090546e-06, -5.17629086971283e-06, -4.9406662583351135e-06, -4.7050416469573975e-06, -4.469417035579681e-06, -4.233792424201965e-06, -3.998167812824249e-06, -3.762543201446533e-06, -3.526918590068817e-06, -3.291293978691101e-06, -3.055669367313385e-06, -2.820044755935669e-06, -2.584420144557953e-06, -2.348795533180237e-06, -2.1131709218025208e-06, -1.8775463104248047e-06, -1.6419216990470886e-06, -1.4062970876693726e-06, -1.1706724762916565e-06, -9.350478649139404e-07, -6.994232535362244e-07, -4.637986421585083e-07, -2.2817403078079224e-07, 7.450580596923828e-09, 2.430751919746399e-07, 4.78699803352356e-07, 7.14324414730072e-07, 9.499490261077881e-07, 1.1855736374855042e-06, 1.4211982488632202e-06, 1.6568228602409363e-06, 1.8924474716186523e-06, 2.1280720829963684e-06, 2.3636966943740845e-06, 2.5993213057518005e-06, 2.8349459171295166e-06, 3.0705705285072327e-06, 3.3061951398849487e-06, 3.541819751262665e-06, 3.777444362640381e-06, 4.013068974018097e-06, 4.248693585395813e-06, 4.484318196773529e-06, 4.719942808151245e-06, 4.955567419528961e-06, 5.191192030906677e-06, 5.426816642284393e-06, 5.662441253662109e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 2.0, 6.0, 9.0, 11.0, 14.0, 34.0, 33.0, 62.0, 67.0, 118.0, 214.0, 402.0, 837.0, 2571.0, 11907.0, 973414.0, 51541.0, 4674.0, 1338.0, 565.0, 255.0, 157.0, 104.0, 66.0, 40.0, 23.0, 18.0, 22.0, 3.0, 6.0, 5.0, 7.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16312026977539e-05, -5.9689395129680634e-05, -5.774758756160736e-05, -5.580577999353409e-05, -5.3863972425460815e-05, -5.192216485738754e-05, -4.998035728931427e-05, -4.8038549721241e-05, -4.6096742153167725e-05, -4.415493458509445e-05, -4.221312701702118e-05, -4.0271319448947906e-05, -3.8329511880874634e-05, -3.638770431280136e-05, -3.444589674472809e-05, -3.2504089176654816e-05, -3.056228160858154e-05, -2.862047404050827e-05, -2.6678666472434998e-05, -2.4736858904361725e-05, -2.2795051336288452e-05, -2.085324376821518e-05, -1.8911436200141907e-05, -1.6969628632068634e-05, -1.5027821063995361e-05, -1.3086013495922089e-05, -1.1144205927848816e-05, -9.202398359775543e-06, -7.2605907917022705e-06, -5.318783223628998e-06, -3.376975655555725e-06, -1.4351680874824524e-06, 5.066394805908203e-07, 2.448447048664093e-06, 4.390254616737366e-06, 6.3320621848106384e-06, 8.273869752883911e-06, 1.0215677320957184e-05, 1.2157484889030457e-05, 1.409929245710373e-05, 1.6041100025177002e-05, 1.7982907593250275e-05, 1.9924715161323547e-05, 2.186652272939682e-05, 2.3808330297470093e-05, 2.5750137865543365e-05, 2.7691945433616638e-05, 2.963375300168991e-05, 3.1575560569763184e-05, 3.3517368137836456e-05, 3.545917570590973e-05, 3.7400983273983e-05, 3.9342790842056274e-05, 4.128459841012955e-05, 4.322640597820282e-05, 4.516821354627609e-05, 4.7110021114349365e-05, 4.905182868242264e-05, 5.099363625049591e-05, 5.293544381856918e-05, 5.4877251386642456e-05, 5.681905895471573e-05, 5.8760866522789e-05, 6.0702674090862274e-05, 6.264448165893555e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 8.0, 5.0, 6.0, 17.0, 14.0, 23.0, 37.0, 50.0, 89.0, 362.0, 173.0, 68.0, 33.0, 43.0, 20.0, 13.0, 9.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4483928680419922e-05, -1.4027580618858337e-05, -1.3571232557296753e-05, -1.3114884495735168e-05, -1.2658536434173584e-05, -1.2202188372612e-05, -1.1745840311050415e-05, -1.128949224948883e-05, -1.0833144187927246e-05, -1.0376796126365662e-05, -9.920448064804077e-06, -9.464100003242493e-06, -9.007751941680908e-06, -8.551403880119324e-06, -8.09505581855774e-06, -7.638707756996155e-06, -7.18235969543457e-06, -6.726011633872986e-06, -6.269663572311401e-06, -5.813315510749817e-06, -5.356967449188232e-06, -4.900619387626648e-06, -4.4442713260650635e-06, -3.987923264503479e-06, -3.5315752029418945e-06, -3.07522714138031e-06, -2.6188790798187256e-06, -2.162531018257141e-06, -1.7061829566955566e-06, -1.2498348951339722e-06, -7.934868335723877e-07, -3.371387720108032e-07, 1.1920928955078125e-07, 5.755573511123657e-07, 1.0319054126739502e-06, 1.4882534742355347e-06, 1.944601535797119e-06, 2.4009495973587036e-06, 2.857297658920288e-06, 3.3136457204818726e-06, 3.769993782043457e-06, 4.2263418436050415e-06, 4.682689905166626e-06, 5.1390379667282104e-06, 5.595386028289795e-06, 6.051734089851379e-06, 6.508082151412964e-06, 6.964430212974548e-06, 7.420778274536133e-06, 7.877126336097717e-06, 8.333474397659302e-06, 8.789822459220886e-06, 9.24617052078247e-06, 9.702518582344055e-06, 1.015886664390564e-05, 1.0615214705467224e-05, 1.1071562767028809e-05, 1.1527910828590393e-05, 1.1984258890151978e-05, 1.2440606951713562e-05, 1.2896955013275146e-05, 1.3353303074836731e-05, 1.3809651136398315e-05, 1.42659991979599e-05, 1.4722347259521484e-05]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 9.0, 9.0, 14.0, 23.0, 99.0, 508.0, 229.0, 47.0, 18.0, 16.0, 7.0, 3.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.525599718093872, -1.4792274236679077, -1.4328551292419434, -1.3864829540252686, -1.3401106595993042, -1.2937383651733398, -1.247366189956665, -1.2009938955307007, -1.1546216011047363, -1.108249306678772, -1.0618770122528076, -1.0155048370361328, -0.9691325426101685, -0.9227602481842041, -0.8763880133628845, -0.8300157785415649, -0.7836434841156006, -0.7372711896896362, -0.6908989548683167, -0.6445267200469971, -0.5981544256210327, -0.5517821311950684, -0.5054098963737488, -0.4590376317501068, -0.41266536712646484, -0.3662931025028229, -0.3199208378791809, -0.27354857325553894, -0.22717630863189697, -0.180804044008255, -0.13443177938461304, -0.08805951476097107, -0.0416872501373291, 0.004685014486312866, 0.051057279109954834, 0.0974295437335968, 0.14380180835723877, 0.19017407298088074, 0.2365463376045227, 0.2829186022281647, 0.32929086685180664, 0.3756631314754486, 0.4220353960990906, 0.46840766072273254, 0.5147799253463745, 0.5611522197723389, 0.6075244545936584, 0.653896689414978, 0.7002689838409424, 0.7466412782669067, 0.7930135130882263, 0.8393857479095459, 0.8857580423355103, 0.9321303367614746, 0.9785025715827942, 1.0248748064041138, 1.0712471008300781, 1.1176193952560425, 1.1639916896820068, 1.2103638648986816, 1.256736159324646, 1.3031084537506104, 1.3494806289672852, 1.3958529233932495, 1.4422252178192139]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 4.0, 7.0, 3.0, 3.0, 11.0, 6.0, 8.0, 9.0, 18.0, 23.0, 36.0, 61.0, 67.0, 116.0, 123.0, 113.0, 103.0, 85.0, 54.0, 44.0, 18.0, 16.0, 9.0, 14.0, 9.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5926666855812073, -0.5752219557762146, -0.5577771663665771, -0.5403324365615845, -0.522887647151947, -0.5054429173469543, -0.4879981577396393, -0.4705533981323242, -0.45310863852500916, -0.4356638789176941, -0.41821911931037903, -0.40077435970306396, -0.3833296298980713, -0.36588484048843384, -0.34844011068344116, -0.3309953510761261, -0.31355059146881104, -0.29610583186149597, -0.2786610722541809, -0.26121631264686584, -0.24377156794071198, -0.2263268083333969, -0.20888206362724304, -0.19143730401992798, -0.17399254441261292, -0.15654778480529785, -0.1391030251979828, -0.12165828049182892, -0.10421352088451385, -0.08676876127719879, -0.06932400912046432, -0.05187925696372986, -0.03443443775177002, -0.016989681869745255, 0.0004550740122795105, 0.017899829894304276, 0.03534458577632904, 0.052789345383644104, 0.07023409754037857, 0.08767884969711304, 0.1051236093044281, 0.12256836891174316, 0.14001312851905823, 0.1574578732252121, 0.17490263283252716, 0.19234739243984222, 0.2097921371459961, 0.22723689675331116, 0.24468165636062622, 0.2621264159679413, 0.27957117557525635, 0.2970159351825714, 0.3144606947898865, 0.33190542459487915, 0.3493501842021942, 0.3667949438095093, 0.38423970341682434, 0.4016844630241394, 0.41912922263145447, 0.43657398223876953, 0.4540187120437622, 0.47146350145339966, 0.48890823125839233, 0.5063530206680298, 0.5237977504730225]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 6.0, 8.0, 3.0, 11.0, 8.0, 19.0, 17.0, 25.0, 32.0, 67.0, 267.0, 3679.0, 4148563.0, 40270.0, 996.0, 124.0, 50.0, 26.0, 24.0, 16.0, 7.0, 11.0, 10.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.59375, -16.0546875, -15.515625, -14.9765625, -14.4375, -13.8984375, -13.359375, -12.8203125, -12.28125, -11.7421875, -11.203125, -10.6640625, -10.125, -9.5859375, -9.046875, -8.5078125, -7.96875, -7.4296875, -6.890625, -6.3515625, -5.8125, -5.2734375, -4.734375, -4.1953125, -3.65625, -3.1171875, -2.578125, -2.0390625, -1.5, -0.9609375, -0.421875, 0.1171875, 0.65625, 1.1953125, 1.734375, 2.2734375, 2.8125, 3.3515625, 3.890625, 4.4296875, 4.96875, 5.5078125, 6.046875, 6.5859375, 7.125, 7.6640625, 8.203125, 8.7421875, 9.28125, 9.8203125, 10.359375, 10.8984375, 11.4375, 11.9765625, 12.515625, 13.0546875, 13.59375, 14.1328125, 14.671875, 15.2109375, 15.75, 16.2890625, 16.828125, 17.3671875, 17.90625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 7.0, 3.0, 10.0, 9.0, 10.0, 8.0, 17.0, 57.0, 155.0, 255.0, 247.0, 105.0, 34.0, 15.0, 10.0, 4.0, 4.0, 5.0, 4.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00823974609375, -0.007972240447998047, -0.007704734802246094, -0.007437229156494141, -0.0071697235107421875, -0.006902217864990234, -0.006634712219238281, -0.006367206573486328, -0.006099700927734375, -0.005832195281982422, -0.005564689636230469, -0.005297183990478516, -0.0050296783447265625, -0.004762172698974609, -0.004494667053222656, -0.004227161407470703, -0.00395965576171875, -0.003692150115966797, -0.0034246444702148438, -0.0031571388244628906, -0.0028896331787109375, -0.0026221275329589844, -0.0023546218872070312, -0.002087116241455078, -0.001819610595703125, -0.0015521049499511719, -0.0012845993041992188, -0.0010170936584472656, -0.0007495880126953125, -0.0004820823669433594, -0.00021457672119140625, 5.2928924560546875e-05, 0.0003204345703125, 0.0005879402160644531, 0.0008554458618164062, 0.0011229515075683594, 0.0013904571533203125, 0.0016579627990722656, 0.0019254684448242188, 0.002192974090576172, 0.002460479736328125, 0.002727985382080078, 0.0029954910278320312, 0.0032629966735839844, 0.0035305023193359375, 0.0037980079650878906, 0.004065513610839844, 0.004333019256591797, 0.00460052490234375, 0.004868030548095703, 0.005135536193847656, 0.005403041839599609, 0.0056705474853515625, 0.005938053131103516, 0.006205558776855469, 0.006473064422607422, 0.006740570068359375, 0.007008075714111328, 0.007275581359863281, 0.007543087005615234, 0.0078105926513671875, 0.00807809829711914, 0.008345603942871094, 0.008613109588623047, 0.008880615234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 8.0, 5.0, 3.0, 6.0, 5.0, 6.0, 14.0, 12.0, 18.0, 12.0, 20.0, 18.0, 29.0, 36.0, 44.0, 43.0, 57.0, 58.0, 64.0, 102.0, 298.0, 7418.0, 4157579.0, 26331.0, 976.0, 182.0, 134.0, 89.0, 85.0, 85.0, 75.0, 68.0, 58.0, 56.0, 56.0, 43.0, 36.0, 30.0, 19.0, 22.0, 15.0, 15.0, 7.0, 10.0, 8.0, 12.0, 5.0, 7.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.310546875, -2.235107421875, -2.15966796875, -2.084228515625, -2.0087890625, -1.933349609375, -1.85791015625, -1.782470703125, -1.70703125, -1.631591796875, -1.55615234375, -1.480712890625, -1.4052734375, -1.329833984375, -1.25439453125, -1.178955078125, -1.103515625, -1.028076171875, -0.95263671875, -0.877197265625, -0.8017578125, -0.726318359375, -0.65087890625, -0.575439453125, -0.5, -0.424560546875, -0.34912109375, -0.273681640625, -0.1982421875, -0.122802734375, -0.04736328125, 0.028076171875, 0.103515625, 0.178955078125, 0.25439453125, 0.329833984375, 0.4052734375, 0.480712890625, 0.55615234375, 0.631591796875, 0.70703125, 0.782470703125, 0.85791015625, 0.933349609375, 1.0087890625, 1.084228515625, 1.15966796875, 1.235107421875, 1.310546875, 1.385986328125, 1.46142578125, 1.536865234375, 1.6123046875, 1.687744140625, 1.76318359375, 1.838623046875, 1.9140625, 1.989501953125, 2.06494140625, 2.140380859375, 2.2158203125, 2.291259765625, 2.36669921875, 2.442138671875, 2.517578125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 8.0, 5.0, 5.0, 4.0, 5.0, 6.0, 14.0, 12.0, 18.0, 12.0, 20.0, 19.0, 29.0, 35.0, 44.0, 44.0, 57.0, 58.0, 61.0, 77.0, 103.0, 139.0, 1948.0, 199.0, 134.0, 100.0, 116.0, 87.0, 87.0, 83.0, 75.0, 70.0, 57.0, 55.0, 56.0, 43.0, 36.0, 30.0, 19.0, 22.0, 15.0, 15.0, 7.0, 10.0, 8.0, 12.0, 5.0, 7.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0181732177734375, -0.01757979393005371, -0.016986370086669922, -0.016392946243286133, -0.015799522399902344, -0.015206098556518555, -0.014612674713134766, -0.014019250869750977, -0.013425827026367188, -0.012832403182983398, -0.01223897933959961, -0.01164555549621582, -0.011052131652832031, -0.010458707809448242, -0.009865283966064453, -0.009271860122680664, -0.008678436279296875, -0.008085012435913086, -0.007491588592529297, -0.006898164749145508, -0.006304740905761719, -0.00571131706237793, -0.005117893218994141, -0.0045244693756103516, -0.0039310455322265625, -0.0033376216888427734, -0.0027441978454589844, -0.0021507740020751953, -0.0015573501586914062, -0.0009639263153076172, -0.0003705024719238281, 0.00022292137145996094, 0.00081634521484375, 0.001409769058227539, 0.002003192901611328, 0.002596616744995117, 0.0031900405883789062, 0.0037834644317626953, 0.004376888275146484, 0.0049703121185302734, 0.0055637359619140625, 0.0061571598052978516, 0.006750583648681641, 0.00734400749206543, 0.007937431335449219, 0.008530855178833008, 0.009124279022216797, 0.009717702865600586, 0.010311126708984375, 0.010904550552368164, 0.011497974395751953, 0.012091398239135742, 0.012684822082519531, 0.01327824592590332, 0.01387166976928711, 0.014465093612670898, 0.015058517456054688, 0.015651941299438477, 0.016245365142822266, 0.016838788986206055, 0.017432212829589844, 0.018025636672973633, 0.018619060516357422, 0.01921248435974121, 0.019805908203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 14.0, 20.0, 117.0, 522.0, 161.0, 77.0, 35.0, 27.0, 11.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8999651670455933, -0.8597136735916138, -0.8194621205329895, -0.77921062707901, -0.7389590740203857, -0.6987075805664062, -0.6584560871124268, -0.6182045936584473, -0.577953040599823, -0.5377015471458435, -0.49744999408721924, -0.45719850063323975, -0.41694697737693787, -0.376695454120636, -0.3364439606666565, -0.2961924374103546, -0.25594091415405273, -0.21568939089775085, -0.17543788254261017, -0.13518637418746948, -0.0949348509311676, -0.05468332767486572, -0.014431819319725037, 0.02581968903541565, 0.06607121229171753, 0.10632272809743881, 0.1465742439031601, 0.18682575225830078, 0.22707727551460266, 0.26732879877090454, 0.30758029222488403, 0.3478318154811859, 0.38808345794677734, 0.4283349812030792, 0.4685865044593811, 0.5088379979133606, 0.5490895509719849, 0.5893410444259644, 0.6295925378799438, 0.6698440313339233, 0.7100955843925476, 0.7503470778465271, 0.7905986309051514, 0.8308501243591309, 0.8711016178131104, 0.9113531708717346, 0.9516046643257141, 0.9918562173843384, 1.0321077108383179, 1.0723592042922974, 1.1126106977462769, 1.152862310409546, 1.1931138038635254, 1.2333652973175049, 1.2736167907714844, 1.3138682842254639, 1.3541197776794434, 1.3943712711334229, 1.4346227645874023, 1.4748743772506714, 1.5151258707046509, 1.5553773641586304, 1.5956288576126099, 1.6358803510665894, 1.6761319637298584]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 9.0, 8.0, 13.0, 8.0, 16.0, 16.0, 36.0, 38.0, 25.0, 35.0, 61.0, 70.0, 63.0, 61.0, 74.0, 74.0, 54.0, 57.0, 47.0, 43.0, 34.0, 40.0, 30.0, 15.0, 15.0, 11.0, 7.0, 7.0, 4.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4819045066833496, -0.46891212463378906, -0.4559197425842285, -0.4429273307323456, -0.42993494868278503, -0.4169425666332245, -0.40395015478134155, -0.390957772731781, -0.37796539068222046, -0.3649730086326599, -0.35198062658309937, -0.33898821473121643, -0.3259958326816559, -0.31300345063209534, -0.3000110387802124, -0.28701865673065186, -0.2740262746810913, -0.26103389263153076, -0.24804149568080902, -0.23504909873008728, -0.22205671668052673, -0.2090643346309662, -0.19607193768024445, -0.1830795407295227, -0.17008715867996216, -0.1570947766304016, -0.14410237967967987, -0.13110998272895813, -0.11811760067939758, -0.10512521117925644, -0.0921328216791153, -0.07914043217897415, -0.06614804267883301, -0.053155653178691864, -0.04016326367855072, -0.027170874178409576, -0.014178484678268433, -0.0011860951781272888, 0.011806294322013855, 0.024798683822155, 0.03779107332229614, 0.050783462822437286, 0.06377585232257843, 0.07676824182271957, 0.08976063132286072, 0.10275302082300186, 0.115745410323143, 0.12873780727386475, 0.1417301893234253, 0.15472257137298584, 0.16771496832370758, 0.18070736527442932, 0.19369974732398987, 0.20669212937355042, 0.21968452632427216, 0.2326769232749939, 0.24566930532455444, 0.258661687374115, 0.27165406942367554, 0.28464648127555847, 0.297638863325119, 0.31063124537467957, 0.3236236572265625, 0.33661603927612305, 0.3496084213256836]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 10.0, 8.0, 9.0, 17.0, 17.0, 16.0, 30.0, 43.0, 60.0, 71.0, 117.0, 159.0, 189.0, 265.0, 363.0, 492.0, 732.0, 995.0, 1401.0, 2005.0, 3269.0, 4983.0, 8418.0, 17614.0, 88312.0, 804837.0, 74639.0, 16594.0, 8169.0, 4784.0, 3109.0, 1984.0, 1356.0, 971.0, 669.0, 506.0, 346.0, 248.0, 215.0, 137.0, 106.0, 86.0, 63.0, 25.0, 34.0, 17.0, 19.0, 16.0, 9.0, 12.0, 4.0, 3.0, 6.0, 2.0, 0.0, 2.0], "bins": [-0.182861328125, -0.1773967742919922, -0.17193222045898438, -0.16646766662597656, -0.16100311279296875, -0.15553855895996094, -0.15007400512695312, -0.1446094512939453, -0.1391448974609375, -0.1336803436279297, -0.12821578979492188, -0.12275123596191406, -0.11728668212890625, -0.11182212829589844, -0.10635757446289062, -0.10089302062988281, -0.095428466796875, -0.08996391296386719, -0.08449935913085938, -0.07903480529785156, -0.07357025146484375, -0.06810569763183594, -0.06264114379882812, -0.05717658996582031, -0.0517120361328125, -0.04624748229980469, -0.040782928466796875, -0.03531837463378906, -0.02985382080078125, -0.024389266967773438, -0.018924713134765625, -0.013460159301757812, -0.00799560546875, -0.0025310516357421875, 0.002933502197265625, 0.008398056030273438, 0.01386260986328125, 0.019327163696289062, 0.024791717529296875, 0.030256271362304688, 0.0357208251953125, 0.04118537902832031, 0.046649932861328125, 0.05211448669433594, 0.05757904052734375, 0.06304359436035156, 0.06850814819335938, 0.07397270202636719, 0.079437255859375, 0.08490180969238281, 0.09036636352539062, 0.09583091735839844, 0.10129547119140625, 0.10676002502441406, 0.11222457885742188, 0.11768913269042969, 0.1231536865234375, 0.1286182403564453, 0.13408279418945312, 0.13954734802246094, 0.14501190185546875, 0.15047645568847656, 0.15594100952148438, 0.1614055633544922, 0.1668701171875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 2.0, 2.0, 5.0, 6.0, 10.0, 7.0, 12.0, 10.0, 21.0, 98.0, 172.0, 265.0, 200.0, 82.0, 31.0, 15.0, 7.0, 3.0, 6.0, 4.0, 3.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00798797607421875, -0.007726311683654785, -0.00746464729309082, -0.0072029829025268555, -0.006941318511962891, -0.006679654121398926, -0.006417989730834961, -0.006156325340270996, -0.005894660949707031, -0.005632996559143066, -0.0053713321685791016, -0.005109667778015137, -0.004848003387451172, -0.004586338996887207, -0.004324674606323242, -0.004063010215759277, -0.0038013458251953125, -0.0035396814346313477, -0.003278017044067383, -0.003016352653503418, -0.002754688262939453, -0.0024930238723754883, -0.0022313594818115234, -0.0019696950912475586, -0.0017080307006835938, -0.001446366310119629, -0.001184701919555664, -0.0009230375289916992, -0.0006613731384277344, -0.00039970874786376953, -0.0001380443572998047, 0.00012362003326416016, 0.000385284423828125, 0.0006469488143920898, 0.0009086132049560547, 0.0011702775955200195, 0.0014319419860839844, 0.0016936063766479492, 0.001955270767211914, 0.002216935157775879, 0.0024785995483398438, 0.0027402639389038086, 0.0030019283294677734, 0.0032635927200317383, 0.003525257110595703, 0.003786921501159668, 0.004048585891723633, 0.004310250282287598, 0.0045719146728515625, 0.004833579063415527, 0.005095243453979492, 0.005356907844543457, 0.005618572235107422, 0.005880236625671387, 0.0061419010162353516, 0.006403565406799316, 0.006665229797363281, 0.006926894187927246, 0.007188558578491211, 0.007450222969055176, 0.007711887359619141, 0.007973551750183105, 0.00823521614074707, 0.008496880531311035, 0.008758544921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 8.0, 3.0, 3.0, 5.0, 1.0, 7.0, 8.0, 7.0, 14.0, 13.0, 9.0, 16.0, 12.0, 19.0, 19.0, 23.0, 27.0, 31.0, 41.0, 43.0, 74.0, 239.0, 1543.0, 17898.0, 1000128.0, 25642.0, 2021.0, 261.0, 81.0, 54.0, 30.0, 32.0, 35.0, 26.0, 28.0, 26.0, 23.0, 12.0, 16.0, 15.0, 19.0, 7.0, 10.0, 3.0, 7.0, 8.0, 2.0, 7.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48583984375, -0.4704399108886719, -0.45503997802734375, -0.4396400451660156, -0.4242401123046875, -0.4088401794433594, -0.39344024658203125, -0.3780403137207031, -0.362640380859375, -0.3472404479980469, -0.33184051513671875, -0.3164405822753906, -0.3010406494140625, -0.2856407165527344, -0.27024078369140625, -0.2548408508300781, -0.23944091796875, -0.22404098510742188, -0.20864105224609375, -0.19324111938476562, -0.1778411865234375, -0.16244125366210938, -0.14704132080078125, -0.13164138793945312, -0.116241455078125, -0.10084152221679688, -0.08544158935546875, -0.07004165649414062, -0.0546417236328125, -0.039241790771484375, -0.02384185791015625, -0.008441925048828125, 0.0069580078125, 0.022357940673828125, 0.03775787353515625, 0.053157806396484375, 0.0685577392578125, 0.08395767211914062, 0.09935760498046875, 0.11475753784179688, 0.130157470703125, 0.14555740356445312, 0.16095733642578125, 0.17635726928710938, 0.1917572021484375, 0.20715713500976562, 0.22255706787109375, 0.23795700073242188, 0.25335693359375, 0.2687568664550781, 0.28415679931640625, 0.2995567321777344, 0.3149566650390625, 0.3303565979003906, 0.34575653076171875, 0.3611564636230469, 0.376556396484375, 0.3919563293457031, 0.40735626220703125, 0.4227561950683594, 0.4381561279296875, 0.4535560607910156, 0.46895599365234375, 0.4843559265136719, 0.499755859375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 8.0, 3.0, 3.0, 5.0, 1.0, 7.0, 8.0, 7.0, 14.0, 13.0, 9.0, 16.0, 12.0, 19.0, 19.0, 23.0, 27.0, 31.0, 40.0, 29.0, 42.0, 36.0, 41.0, 33.0, 51.0, 38.0, 42.0, 33.0, 44.0, 45.0, 29.0, 32.0, 35.0, 26.0, 28.0, 26.0, 23.0, 12.0, 16.0, 15.0, 19.0, 7.0, 10.0, 3.0, 7.0, 8.0, 2.0, 7.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0242156982421875, -0.02344822883605957, -0.02268075942993164, -0.02191329002380371, -0.02114582061767578, -0.02037835121154785, -0.019610881805419922, -0.018843412399291992, -0.018075942993164062, -0.017308473587036133, -0.016541004180908203, -0.015773534774780273, -0.015006065368652344, -0.014238595962524414, -0.013471126556396484, -0.012703657150268555, -0.011936187744140625, -0.011168718338012695, -0.010401248931884766, -0.009633779525756836, -0.008866310119628906, -0.008098840713500977, -0.007331371307373047, -0.006563901901245117, -0.0057964324951171875, -0.005028963088989258, -0.004261493682861328, -0.0034940242767333984, -0.0027265548706054688, -0.001959085464477539, -0.0011916160583496094, -0.0004241466522216797, 0.00034332275390625, 0.0011107921600341797, 0.0018782615661621094, 0.002645730972290039, 0.0034132003784179688, 0.0041806697845458984, 0.004948139190673828, 0.005715608596801758, 0.0064830780029296875, 0.007250547409057617, 0.008018016815185547, 0.008785486221313477, 0.009552955627441406, 0.010320425033569336, 0.011087894439697266, 0.011855363845825195, 0.012622833251953125, 0.013390302658081055, 0.014157772064208984, 0.014925241470336914, 0.015692710876464844, 0.016460180282592773, 0.017227649688720703, 0.017995119094848633, 0.018762588500976562, 0.019530057907104492, 0.020297527313232422, 0.02106499671936035, 0.02183246612548828, 0.02259993553161621, 0.02336740493774414, 0.02413487434387207, 0.02490234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 9.0, 13.0, 20.0, 43.0, 106.0, 356.0, 7916.0, 1038186.0, 1521.0, 194.0, 75.0, 37.0, 31.0, 16.0, 12.0, 3.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006136894226074219, -0.0005934387445449829, -0.0005731880664825439, -0.000552937388420105, -0.000532686710357666, -0.000512436032295227, -0.0004921853542327881, -0.0004719346761703491, -0.00045168399810791016, -0.0004314333200454712, -0.0004111826419830322, -0.00039093196392059326, -0.0003706812858581543, -0.00035043060779571533, -0.00033017992973327637, -0.0003099292516708374, -0.00028967857360839844, -0.00026942789554595947, -0.0002491772174835205, -0.00022892653942108154, -0.00020867586135864258, -0.0001884251832962036, -0.00016817450523376465, -0.00014792382717132568, -0.00012767314910888672, -0.00010742247104644775, -8.717179298400879e-05, -6.692111492156982e-05, -4.667043685913086e-05, -2.6419758796691895e-05, -6.16908073425293e-06, 1.4081597328186035e-05, 3.4332275390625e-05, 5.4582953453063965e-05, 7.483363151550293e-05, 9.50843095779419e-05, 0.00011533498764038086, 0.00013558566570281982, 0.0001558363437652588, 0.00017608702182769775, 0.00019633769989013672, 0.00021658837795257568, 0.00023683905601501465, 0.0002570897340774536, 0.0002773404121398926, 0.00029759109020233154, 0.0003178417682647705, 0.00033809244632720947, 0.00035834312438964844, 0.0003785938024520874, 0.00039884448051452637, 0.00041909515857696533, 0.0004393458366394043, 0.00045959651470184326, 0.0004798471927642822, 0.0005000978708267212, 0.0005203485488891602, 0.0005405992269515991, 0.0005608499050140381, 0.000581100583076477, 0.000601351261138916, 0.000621601939201355, 0.0006418526172637939, 0.0006621032953262329, 0.0006823539733886719]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 9.0, 11.0, 20.0, 34.0, 65.0, 98.0, 184.0, 202.0, 149.0, 69.0, 52.0, 33.0, 26.0, 18.0, 12.0, 3.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.039836883544922e-05, -2.939533442258835e-05, -2.8392300009727478e-05, -2.7389265596866608e-05, -2.6386231184005737e-05, -2.5383196771144867e-05, -2.4380162358283997e-05, -2.3377127945423126e-05, -2.2374093532562256e-05, -2.1371059119701385e-05, -2.0368024706840515e-05, -1.9364990293979645e-05, -1.8361955881118774e-05, -1.7358921468257904e-05, -1.6355887055397034e-05, -1.5352852642536163e-05, -1.4349818229675293e-05, -1.3346783816814423e-05, -1.2343749403953552e-05, -1.1340714991092682e-05, -1.0337680578231812e-05, -9.334646165370941e-06, -8.33161175251007e-06, -7.3285773396492004e-06, -6.32554292678833e-06, -5.32250851392746e-06, -4.319474101066589e-06, -3.316439688205719e-06, -2.3134052753448486e-06, -1.3103708624839783e-06, -3.073364496231079e-07, 6.956979632377625e-07, 1.6987323760986328e-06, 2.701766788959503e-06, 3.7048012018203735e-06, 4.707835614681244e-06, 5.710870027542114e-06, 6.713904440402985e-06, 7.716938853263855e-06, 8.719973266124725e-06, 9.723007678985596e-06, 1.0726042091846466e-05, 1.1729076504707336e-05, 1.2732110917568207e-05, 1.3735145330429077e-05, 1.4738179743289948e-05, 1.5741214156150818e-05, 1.6744248569011688e-05, 1.774728298187256e-05, 1.875031739473343e-05, 1.97533518075943e-05, 2.075638622045517e-05, 2.175942063331604e-05, 2.276245504617691e-05, 2.376548945903778e-05, 2.476852387189865e-05, 2.577155828475952e-05, 2.6774592697620392e-05, 2.7777627110481262e-05, 2.8780661523342133e-05, 2.9783695936203003e-05, 3.078673034906387e-05, 3.1789764761924744e-05, 3.2792799174785614e-05, 3.3795833587646484e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 16.0, 17.0, 25.0, 48.0, 127.0, 685.0, 379675.0, 666836.0, 806.0, 132.0, 63.0, 26.0, 22.0, 19.0, 7.0, 7.0, 2.0, 8.0, 2.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006337165832519531, -0.0006139129400253296, -0.0005941092967987061, -0.0005743056535720825, -0.000554502010345459, -0.0005346983671188354, -0.0005148947238922119, -0.0004950910806655884, -0.00047528743743896484, -0.0004554837942123413, -0.0004356801509857178, -0.00041587650775909424, -0.0003960728645324707, -0.00037626922130584717, -0.00035646557807922363, -0.0003366619348526001, -0.00031685829162597656, -0.00029705464839935303, -0.0002772510051727295, -0.00025744736194610596, -0.00023764371871948242, -0.0002178400754928589, -0.00019803643226623535, -0.00017823278903961182, -0.00015842914581298828, -0.00013862550258636475, -0.00011882185935974121, -9.901821613311768e-05, -7.921457290649414e-05, -5.9410929679870605e-05, -3.960728645324707e-05, -1.9803643226623535e-05, 0.0, 1.9803643226623535e-05, 3.960728645324707e-05, 5.9410929679870605e-05, 7.921457290649414e-05, 9.901821613311768e-05, 0.00011882185935974121, 0.00013862550258636475, 0.00015842914581298828, 0.00017823278903961182, 0.00019803643226623535, 0.0002178400754928589, 0.00023764371871948242, 0.00025744736194610596, 0.0002772510051727295, 0.00029705464839935303, 0.00031685829162597656, 0.0003366619348526001, 0.00035646557807922363, 0.00037626922130584717, 0.0003960728645324707, 0.00041587650775909424, 0.0004356801509857178, 0.0004554837942123413, 0.00047528743743896484, 0.0004950910806655884, 0.0005148947238922119, 0.0005346983671188354, 0.000554502010345459, 0.0005743056535720825, 0.0005941092967987061, 0.0006139129400253296, 0.0006337165832519531]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 15.0, 17.0, 22.0, 35.0, 55.0, 66.0, 168.0, 331.0, 73.0, 53.0, 46.0, 25.0, 21.0, 18.0, 7.0, 7.0, 2.0, 8.0, 2.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.159046173095703e-05, -3.0603259801864624e-05, -2.9616057872772217e-05, -2.862885594367981e-05, -2.7641654014587402e-05, -2.6654452085494995e-05, -2.5667250156402588e-05, -2.468004822731018e-05, -2.3692846298217773e-05, -2.2705644369125366e-05, -2.171844244003296e-05, -2.0731240510940552e-05, -1.9744038581848145e-05, -1.8756836652755737e-05, -1.776963472366333e-05, -1.6782432794570923e-05, -1.5795230865478516e-05, -1.4808028936386108e-05, -1.3820827007293701e-05, -1.2833625078201294e-05, -1.1846423149108887e-05, -1.085922122001648e-05, -9.872019290924072e-06, -8.884817361831665e-06, -7.897615432739258e-06, -6.910413503646851e-06, -5.923211574554443e-06, -4.936009645462036e-06, -3.948807716369629e-06, -2.9616057872772217e-06, -1.9744038581848145e-06, -9.872019290924072e-07, 0.0, 9.872019290924072e-07, 1.9744038581848145e-06, 2.9616057872772217e-06, 3.948807716369629e-06, 4.936009645462036e-06, 5.923211574554443e-06, 6.910413503646851e-06, 7.897615432739258e-06, 8.884817361831665e-06, 9.872019290924072e-06, 1.085922122001648e-05, 1.1846423149108887e-05, 1.2833625078201294e-05, 1.3820827007293701e-05, 1.4808028936386108e-05, 1.5795230865478516e-05, 1.6782432794570923e-05, 1.776963472366333e-05, 1.8756836652755737e-05, 1.9744038581848145e-05, 2.0731240510940552e-05, 2.171844244003296e-05, 2.2705644369125366e-05, 2.3692846298217773e-05, 2.468004822731018e-05, 2.5667250156402588e-05, 2.6654452085494995e-05, 2.7641654014587402e-05, 2.862885594367981e-05, 2.9616057872772217e-05, 3.0603259801864624e-05, 3.159046173095703e-05]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 11.0, 18.0, 43.0, 158.0, 620.0, 92.0, 19.0, 14.0, 9.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8127468824386597, -0.7807133197784424, -0.7486797571182251, -0.7166461944580078, -0.6846126317977905, -0.6525790691375732, -0.620545506477356, -0.5885119438171387, -0.5564783811569214, -0.5244448184967041, -0.4924112558364868, -0.46037769317626953, -0.42834413051605225, -0.39631056785583496, -0.3642770051956177, -0.3322434425354004, -0.3002098798751831, -0.2681763172149658, -0.23614275455474854, -0.20410919189453125, -0.17207562923431396, -0.14004206657409668, -0.1080085039138794, -0.07597494125366211, -0.043941378593444824, -0.011907815933227539, 0.020125746726989746, 0.05215930938720703, 0.08419287204742432, 0.1162264347076416, 0.1482599973678589, 0.18029356002807617, 0.2123270034790039, 0.2443605661392212, 0.2763941287994385, 0.30842769145965576, 0.34046125411987305, 0.37249481678009033, 0.4045283794403076, 0.4365619421005249, 0.4685955047607422, 0.5006290674209595, 0.5326626300811768, 0.564696192741394, 0.5967297554016113, 0.6287633180618286, 0.6607968807220459, 0.6928304433822632, 0.7248640060424805, 0.7568975687026978, 0.788931131362915, 0.8209646940231323, 0.8529982566833496, 0.8850318193435669, 0.9170653820037842, 0.9490989446640015, 0.9811325073242188, 1.013166069984436, 1.0451996326446533, 1.0772331953048706, 1.109266757965088, 1.1413003206253052, 1.1733338832855225, 1.2053674459457397, 1.237401008605957]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 6.0, 5.0, 6.0, 5.0, 16.0, 11.0, 21.0, 41.0, 57.0, 66.0, 71.0, 74.0, 68.0, 107.0, 82.0, 58.0, 65.0, 63.0, 36.0, 35.0, 17.0, 21.0, 14.0, 13.0, 6.0, 9.0, 2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2577208876609802, -0.2492363303899765, -0.24075177311897278, -0.23226720094680786, -0.22378264367580414, -0.21529808640480042, -0.2068135291337967, -0.19832897186279297, -0.18984439969062805, -0.18135984241962433, -0.1728752851486206, -0.1643907129764557, -0.15590615570545197, -0.14742159843444824, -0.13893704116344452, -0.1304524838924408, -0.12196792662143707, -0.11348336935043335, -0.10499880462884903, -0.0965142473578453, -0.08802968263626099, -0.07954512536525726, -0.07106056809425354, -0.06257601082324982, -0.0540914461016655, -0.045606885105371475, -0.037122324109077454, -0.02863776683807373, -0.02015320584177971, -0.011668644845485687, -0.003184087574481964, 0.0053004734218120575, 0.013785034418106079, 0.0222695954144001, 0.030754154548048973, 0.039238713681697845, 0.04772327467799187, 0.05620783567428589, 0.06469239294528961, 0.07317695021629333, 0.08166151493787766, 0.09014607220888138, 0.0986306369304657, 0.10711519420146942, 0.11559975147247314, 0.12408431619405746, 0.1325688660144806, 0.1410534381866455, 0.14953799545764923, 0.15802255272865295, 0.16650710999965668, 0.1749916672706604, 0.18347623944282532, 0.19196079671382904, 0.20044535398483276, 0.2089299112558365, 0.2174144685268402, 0.22589902579784393, 0.23438358306884766, 0.24286815524101257, 0.2513526976108551, 0.25983726978302, 0.26832181215286255, 0.27680638432502747, 0.2852909564971924]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 8.0, 4.0, 10.0, 4.0, 4.0, 12.0, 12.0, 16.0, 22.0, 22.0, 14.0, 56.0, 200.0, 378.0, 4192723.0, 417.0, 162.0, 58.0, 32.0, 12.0, 10.0, 10.0, 6.0, 8.0, 16.0, 14.0, 6.0, 4.0, 2.0, 4.0, 4.0, 6.0, 2.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.5234375, -11.1453857421875, -10.767333984375, -10.3892822265625, -10.01123046875, -9.6331787109375, -9.255126953125, -8.8770751953125, -8.4990234375, -8.1209716796875, -7.742919921875, -7.3648681640625, -6.98681640625, -6.6087646484375, -6.230712890625, -5.8526611328125, -5.474609375, -5.0965576171875, -4.718505859375, -4.3404541015625, -3.96240234375, -3.5843505859375, -3.206298828125, -2.8282470703125, -2.4501953125, -2.0721435546875, -1.694091796875, -1.3160400390625, -0.93798828125, -0.5599365234375, -0.181884765625, 0.1961669921875, 0.57421875, 0.9522705078125, 1.330322265625, 1.7083740234375, 2.08642578125, 2.4644775390625, 2.842529296875, 3.2205810546875, 3.5986328125, 3.9766845703125, 4.354736328125, 4.7327880859375, 5.11083984375, 5.4888916015625, 5.866943359375, 6.2449951171875, 6.623046875, 7.0010986328125, 7.379150390625, 7.7572021484375, 8.13525390625, 8.5133056640625, 8.891357421875, 9.2694091796875, 9.6474609375, 10.0255126953125, 10.403564453125, 10.7816162109375, 11.15966796875, 11.5377197265625, 11.915771484375, 12.2938232421875, 12.671875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 2.0, 2.0, 6.0, 6.0, 8.0, 11.0, 11.0, 7.0, 28.0, 101.0, 175.0, 262.0, 194.0, 80.0, 29.0, 16.0, 6.0, 5.0, 5.0, 3.0, 4.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007808685302734375, -0.007552444934844971, -0.007296204566955566, -0.007039964199066162, -0.006783723831176758, -0.0065274834632873535, -0.006271243095397949, -0.006015002727508545, -0.005758762359619141, -0.005502521991729736, -0.005246281623840332, -0.004990041255950928, -0.0047338008880615234, -0.004477560520172119, -0.004221320152282715, -0.0039650797843933105, -0.0037088394165039062, -0.003452599048614502, -0.0031963586807250977, -0.0029401183128356934, -0.002683877944946289, -0.0024276375770568848, -0.0021713972091674805, -0.0019151568412780762, -0.0016589164733886719, -0.0014026761054992676, -0.0011464357376098633, -0.000890195369720459, -0.0006339550018310547, -0.0003777146339416504, -0.0001214742660522461, 0.0001347661018371582, 0.0003910064697265625, 0.0006472468376159668, 0.0009034872055053711, 0.0011597275733947754, 0.0014159679412841797, 0.001672208309173584, 0.0019284486770629883, 0.0021846890449523926, 0.002440929412841797, 0.002697169780731201, 0.0029534101486206055, 0.0032096505165100098, 0.003465890884399414, 0.0037221312522888184, 0.003978371620178223, 0.004234611988067627, 0.004490852355957031, 0.0047470927238464355, 0.00500333309173584, 0.005259573459625244, 0.0055158138275146484, 0.005772054195404053, 0.006028294563293457, 0.006284534931182861, 0.006540775299072266, 0.00679701566696167, 0.007053256034851074, 0.0073094964027404785, 0.007565736770629883, 0.007821977138519287, 0.008078217506408691, 0.008334457874298096, 0.0085906982421875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 9.0, 10.0, 16.0, 14.0, 22.0, 36.0, 47.0, 60.0, 82.0, 79.0, 91.0, 133.0, 163.0, 109575.0, 4083120.0, 174.0, 132.0, 100.0, 105.0, 60.0, 68.0, 54.0, 29.0, 17.0, 23.0, 16.0, 6.0, 10.0, 2.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.171875, -4.062286376953125, -3.95269775390625, -3.843109130859375, -3.7335205078125, -3.623931884765625, -3.51434326171875, -3.404754638671875, -3.295166015625, -3.185577392578125, -3.07598876953125, -2.966400146484375, -2.8568115234375, -2.747222900390625, -2.63763427734375, -2.528045654296875, -2.41845703125, -2.308868408203125, -2.19927978515625, -2.089691162109375, -1.9801025390625, -1.870513916015625, -1.76092529296875, -1.651336669921875, -1.541748046875, -1.432159423828125, -1.32257080078125, -1.212982177734375, -1.1033935546875, -0.993804931640625, -0.88421630859375, -0.774627685546875, -0.6650390625, -0.555450439453125, -0.44586181640625, -0.336273193359375, -0.2266845703125, -0.117095947265625, -0.00750732421875, 0.102081298828125, 0.211669921875, 0.321258544921875, 0.43084716796875, 0.540435791015625, 0.6500244140625, 0.759613037109375, 0.86920166015625, 0.978790283203125, 1.08837890625, 1.197967529296875, 1.30755615234375, 1.417144775390625, 1.5267333984375, 1.636322021484375, 1.74591064453125, 1.855499267578125, 1.965087890625, 2.074676513671875, 2.18426513671875, 2.293853759765625, 2.4034423828125, 2.513031005859375, 2.62261962890625, 2.732208251953125, 2.841796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 9.0, 10.0, 16.0, 14.0, 22.0, 36.0, 47.0, 60.0, 82.0, 79.0, 91.0, 133.0, 163.0, 400.0, 2091.0, 170.0, 132.0, 102.0, 103.0, 59.0, 69.0, 54.0, 29.0, 17.0, 23.0, 16.0, 6.0, 10.0, 2.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.029632568359375, -0.0288541316986084, -0.028075695037841797, -0.027297258377075195, -0.026518821716308594, -0.025740385055541992, -0.02496194839477539, -0.02418351173400879, -0.023405075073242188, -0.022626638412475586, -0.021848201751708984, -0.021069765090942383, -0.02029132843017578, -0.01951289176940918, -0.018734455108642578, -0.017956018447875977, -0.017177581787109375, -0.016399145126342773, -0.015620708465576172, -0.01484227180480957, -0.014063835144042969, -0.013285398483276367, -0.012506961822509766, -0.011728525161743164, -0.010950088500976562, -0.010171651840209961, -0.00939321517944336, -0.008614778518676758, -0.007836341857910156, -0.007057905197143555, -0.006279468536376953, -0.0055010318756103516, -0.00472259521484375, -0.0039441585540771484, -0.003165721893310547, -0.0023872852325439453, -0.0016088485717773438, -0.0008304119110107422, -5.1975250244140625e-05, 0.0007264614105224609, 0.0015048980712890625, 0.002283334732055664, 0.0030617713928222656, 0.003840208053588867, 0.004618644714355469, 0.00539708137512207, 0.006175518035888672, 0.0069539546966552734, 0.007732391357421875, 0.008510828018188477, 0.009289264678955078, 0.01006770133972168, 0.010846138000488281, 0.011624574661254883, 0.012403011322021484, 0.013181447982788086, 0.013959884643554688, 0.014738321304321289, 0.01551675796508789, 0.016295194625854492, 0.017073631286621094, 0.017852067947387695, 0.018630504608154297, 0.0194089412689209, 0.0201873779296875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 174.0, 841.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8255228996276855, -6.7060160636901855, -6.5865092277526855, -6.467002868652344, -6.347496032714844, -6.227989196777344, -6.108482360839844, -5.988975524902344, -5.869469165802002, -5.749962329864502, -5.630455493927002, -5.51094913482666, -5.39144229888916, -5.27193546295166, -5.15242862701416, -5.03292179107666, -4.91341495513916, -4.79390811920166, -4.67440128326416, -4.554894924163818, -4.435388088226318, -4.315881252288818, -4.196374416351318, -4.076867580413818, -3.9573612213134766, -3.8378543853759766, -3.7183477878570557, -3.5988409519195557, -3.4793343544006348, -3.3598275184631348, -3.2403206825256348, -3.120814085006714, -3.001307249069214, -2.881800413131714, -2.762293815612793, -2.642786979675293, -2.523280382156372, -2.403773546218872, -2.284266948699951, -2.164760112762451, -2.045253276824951, -1.9257465600967407, -1.8062398433685303, -1.6867330074310303, -1.5672262907028198, -1.4477195739746094, -1.328212857246399, -1.2087061405181885, -1.0891993045806885, -0.969692587852478, -0.8501858115196228, -0.7306790947914124, -0.6111723184585571, -0.4916656017303467, -0.37215888500213623, -0.252652108669281, -0.13314545154571533, -0.013638712465763092, 0.10586802661418915, 0.2253747582435608, 0.34488150477409363, 0.46438825130462646, 0.5838949680328369, 0.7034017443656921, 0.8229084610939026]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 3.0, 18.0, 27.0, 38.0, 78.0, 77.0, 124.0, 107.0, 134.0, 124.0, 91.0, 62.0, 45.0, 33.0, 8.0, 12.0, 4.0, 4.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.4184265732765198, -0.40945902466773987, -0.4004914462566376, -0.39152389764785767, -0.38255631923675537, -0.37358877062797546, -0.36462122201919556, -0.35565364360809326, -0.34668609499931335, -0.33771854639053345, -0.32875096797943115, -0.31978341937065125, -0.31081584095954895, -0.30184829235076904, -0.29288071393966675, -0.28391316533088684, -0.27494561672210693, -0.265978068113327, -0.25701048970222473, -0.24804294109344482, -0.23907537758350372, -0.23010781407356262, -0.22114025056362152, -0.21217268705368042, -0.20320510864257812, -0.19423754513263702, -0.18526998162269592, -0.17630243301391602, -0.16733486950397491, -0.1583673059940338, -0.1493997424840927, -0.1404321789741516, -0.1314646303653717, -0.1224970668554306, -0.1135295107960701, -0.104561947286129, -0.0955943912267685, -0.08662682771682739, -0.07765926420688629, -0.06869170814752579, -0.059724144637584686, -0.050756584852933884, -0.04178902506828308, -0.03282146155834198, -0.023853901773691177, -0.014886341989040375, -0.005918778479099274, 0.0030487775802612305, 0.012016341090202332, 0.020983900874853134, 0.029951462522149086, 0.03891902416944504, 0.04788658395409584, 0.05685414373874664, 0.06582170724868774, 0.07478926330804825, 0.08375682681798935, 0.09272439032793045, 0.10169194638729095, 0.11065950989723206, 0.11962707340717316, 0.12859463691711426, 0.13756218552589417, 0.14652974903583527, 0.15549731254577637]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 12.0, 9.0, 18.0, 25.0, 39.0, 59.0, 93.0, 161.0, 348.0, 931.0, 3544.0, 25354.0, 947420.0, 62840.0, 5413.0, 1352.0, 445.0, 191.0, 101.0, 56.0, 33.0, 23.0, 22.0, 13.0, 11.0, 3.0, 6.0, 7.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.265625, -0.25817108154296875, -0.2507171630859375, -0.24326324462890625, -0.235809326171875, -0.22835540771484375, -0.2209014892578125, -0.21344757080078125, -0.20599365234375, -0.19853973388671875, -0.1910858154296875, -0.18363189697265625, -0.176177978515625, -0.16872406005859375, -0.1612701416015625, -0.15381622314453125, -0.1463623046875, -0.13890838623046875, -0.1314544677734375, -0.12400054931640625, -0.116546630859375, -0.10909271240234375, -0.1016387939453125, -0.09418487548828125, -0.08673095703125, -0.07927703857421875, -0.0718231201171875, -0.06436920166015625, -0.056915283203125, -0.04946136474609375, -0.0420074462890625, -0.03455352783203125, -0.027099609375, -0.01964569091796875, -0.0121917724609375, -0.00473785400390625, 0.002716064453125, 0.01016998291015625, 0.0176239013671875, 0.02507781982421875, 0.03253173828125, 0.03998565673828125, 0.0474395751953125, 0.05489349365234375, 0.062347412109375, 0.06980133056640625, 0.0772552490234375, 0.08470916748046875, 0.0921630859375, 0.09961700439453125, 0.1070709228515625, 0.11452484130859375, 0.121978759765625, 0.12943267822265625, 0.1368865966796875, 0.14434051513671875, 0.15179443359375, 0.15924835205078125, 0.1667022705078125, 0.17415618896484375, 0.181610107421875, 0.18906402587890625, 0.1965179443359375, 0.20397186279296875, 0.21142578125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 7.0, 7.0, 13.0, 50.0, 100.0, 172.0, 243.0, 203.0, 105.0, 54.0, 15.0, 12.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.0198516845703125, -0.019433975219726562, -0.019016265869140625, -0.018598556518554688, -0.01818084716796875, -0.017763137817382812, -0.017345428466796875, -0.016927719116210938, -0.016510009765625, -0.016092300415039062, -0.015674591064453125, -0.015256881713867188, -0.01483917236328125, -0.014421463012695312, -0.014003753662109375, -0.013586044311523438, -0.0131683349609375, -0.012750625610351562, -0.012332916259765625, -0.011915206909179688, -0.01149749755859375, -0.011079788208007812, -0.010662078857421875, -0.010244369506835938, -0.00982666015625, -0.009408950805664062, -0.008991241455078125, -0.008573532104492188, -0.00815582275390625, -0.0077381134033203125, -0.007320404052734375, -0.0069026947021484375, -0.0064849853515625, -0.0060672760009765625, -0.005649566650390625, -0.0052318572998046875, -0.00481414794921875, -0.0043964385986328125, -0.003978729248046875, -0.0035610198974609375, -0.003143310546875, -0.0027256011962890625, -0.002307891845703125, -0.0018901824951171875, -0.00147247314453125, -0.0010547637939453125, -0.000637054443359375, -0.0002193450927734375, 0.0001983642578125, 0.0006160736083984375, 0.001033782958984375, 0.0014514923095703125, 0.00186920166015625, 0.0022869110107421875, 0.002704620361328125, 0.0031223297119140625, 0.0035400390625, 0.0039577484130859375, 0.004375457763671875, 0.0047931671142578125, 0.00521087646484375, 0.0056285858154296875, 0.006046295166015625, 0.0064640045166015625, 0.0068817138671875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 5.0, 4.0, 3.0, 6.0, 6.0, 2.0, 8.0, 12.0, 12.0, 15.0, 25.0, 10.0, 24.0, 35.0, 59.0, 88.0, 146.0, 298.0, 697.0, 1495.0, 3783.0, 9890.0, 29452.0, 103396.0, 604003.0, 217674.0, 51499.0, 15951.0, 5685.0, 2264.0, 900.0, 470.0, 247.0, 128.0, 62.0, 41.0, 37.0, 33.0, 19.0, 12.0, 11.0, 8.0, 7.0, 10.0, 5.0, 8.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.07879638671875, -0.07631301879882812, -0.07382965087890625, -0.07134628295898438, -0.0688629150390625, -0.06637954711914062, -0.06389617919921875, -0.061412811279296875, -0.058929443359375, -0.056446075439453125, -0.05396270751953125, -0.051479339599609375, -0.0489959716796875, -0.046512603759765625, -0.04402923583984375, -0.041545867919921875, -0.0390625, -0.036579132080078125, -0.03409576416015625, -0.031612396240234375, -0.0291290283203125, -0.026645660400390625, -0.02416229248046875, -0.021678924560546875, -0.019195556640625, -0.016712188720703125, -0.01422882080078125, -0.011745452880859375, -0.0092620849609375, -0.006778717041015625, -0.00429534912109375, -0.001811981201171875, 0.00067138671875, 0.003154754638671875, 0.00563812255859375, 0.008121490478515625, 0.0106048583984375, 0.013088226318359375, 0.01557159423828125, 0.018054962158203125, 0.020538330078125, 0.023021697998046875, 0.02550506591796875, 0.027988433837890625, 0.0304718017578125, 0.032955169677734375, 0.03543853759765625, 0.037921905517578125, 0.0404052734375, 0.042888641357421875, 0.04537200927734375, 0.047855377197265625, 0.0503387451171875, 0.052822113037109375, 0.05530548095703125, 0.057788848876953125, 0.060272216796875, 0.06275558471679688, 0.06523895263671875, 0.06772232055664062, 0.0702056884765625, 0.07268905639648438, 0.07517242431640625, 0.07765579223632812, 0.08013916015625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 5.0, 4.0, 3.0, 6.0, 6.0, 2.0, 8.0, 12.0, 12.0, 13.0, 22.0, 10.0, 17.0, 25.0, 22.0, 22.0, 24.0, 25.0, 30.0, 23.0, 37.0, 38.0, 37.0, 38.0, 42.0, 40.0, 45.0, 38.0, 35.0, 46.0, 33.0, 24.0, 37.0, 39.0, 24.0, 24.0, 22.0, 25.0, 18.0, 11.0, 11.0, 8.0, 7.0, 10.0, 5.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.022247314453125, -0.021546125411987305, -0.02084493637084961, -0.020143747329711914, -0.01944255828857422, -0.018741369247436523, -0.018040180206298828, -0.017338991165161133, -0.016637802124023438, -0.015936613082885742, -0.015235424041748047, -0.014534235000610352, -0.013833045959472656, -0.013131856918334961, -0.012430667877197266, -0.01172947883605957, -0.011028289794921875, -0.01032710075378418, -0.009625911712646484, -0.008924722671508789, -0.008223533630371094, -0.0075223445892333984, -0.006821155548095703, -0.006119966506958008, -0.0054187774658203125, -0.004717588424682617, -0.004016399383544922, -0.0033152103424072266, -0.0026140213012695312, -0.001912832260131836, -0.0012116432189941406, -0.0005104541778564453, 0.00019073486328125, 0.0008919239044189453, 0.0015931129455566406, 0.002294301986694336, 0.0029954910278320312, 0.0036966800689697266, 0.004397869110107422, 0.005099058151245117, 0.0058002471923828125, 0.006501436233520508, 0.007202625274658203, 0.007903814315795898, 0.008605003356933594, 0.009306192398071289, 0.010007381439208984, 0.01070857048034668, 0.011409759521484375, 0.01211094856262207, 0.012812137603759766, 0.013513326644897461, 0.014214515686035156, 0.014915704727172852, 0.015616893768310547, 0.016318082809448242, 0.017019271850585938, 0.017720460891723633, 0.018421649932861328, 0.019122838973999023, 0.01982402801513672, 0.020525217056274414, 0.02122640609741211, 0.021927595138549805, 0.0226287841796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 4.0, 5.0, 20.0, 13.0, 16.0, 24.0, 28.0, 32.0, 50.0, 103.0, 170.0, 270.0, 545.0, 1216.0, 3301.0, 11413.0, 69054.0, 889960.0, 56734.0, 10213.0, 3010.0, 1143.0, 483.0, 244.0, 157.0, 95.0, 72.0, 36.0, 29.0, 28.0, 16.0, 21.0, 12.0, 8.0, 6.0, 4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010280609130859375, -0.0009943097829818726, -0.0009605586528778076, -0.0009268075227737427, -0.0008930563926696777, -0.0008593052625656128, -0.0008255541324615479, -0.0007918030023574829, -0.000758051872253418, -0.000724300742149353, -0.0006905496120452881, -0.0006567984819412231, -0.0006230473518371582, -0.0005892962217330933, -0.0005555450916290283, -0.0005217939615249634, -0.00048804283142089844, -0.0004542917013168335, -0.00042054057121276855, -0.0003867894411087036, -0.00035303831100463867, -0.00031928718090057373, -0.0002855360507965088, -0.00025178492069244385, -0.0002180337905883789, -0.00018428266048431396, -0.00015053153038024902, -0.00011678040027618408, -8.302927017211914e-05, -4.92781400680542e-05, -1.5527009963989258e-05, 1.8224120140075684e-05, 5.1975250244140625e-05, 8.572638034820557e-05, 0.00011947751045227051, 0.00015322864055633545, 0.0001869797706604004, 0.00022073090076446533, 0.0002544820308685303, 0.0002882331609725952, 0.00032198429107666016, 0.0003557354211807251, 0.00038948655128479004, 0.000423237681388855, 0.0004569888114929199, 0.0004907399415969849, 0.0005244910717010498, 0.0005582422018051147, 0.0005919933319091797, 0.0006257444620132446, 0.0006594955921173096, 0.0006932467222213745, 0.0007269978523254395, 0.0007607489824295044, 0.0007945001125335693, 0.0008282512426376343, 0.0008620023727416992, 0.0008957535028457642, 0.0009295046329498291, 0.000963255763053894, 0.000997006893157959, 0.001030758023262024, 0.0010645091533660889, 0.0010982602834701538, 0.0011320114135742188]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 7.0, 3.0, 7.0, 6.0, 9.0, 5.0, 10.0, 13.0, 14.0, 18.0, 28.0, 35.0, 53.0, 76.0, 136.0, 165.0, 120.0, 81.0, 47.0, 32.0, 28.0, 22.0, 15.0, 14.0, 13.0, 10.0, 9.0, 2.0, 7.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.1278858184814453e-05, -2.0643696188926697e-05, -2.000853419303894e-05, -1.9373372197151184e-05, -1.8738210201263428e-05, -1.810304820537567e-05, -1.7467886209487915e-05, -1.683272421360016e-05, -1.6197562217712402e-05, -1.5562400221824646e-05, -1.492723822593689e-05, -1.4292076230049133e-05, -1.3656914234161377e-05, -1.302175223827362e-05, -1.2386590242385864e-05, -1.1751428246498108e-05, -1.1116266250610352e-05, -1.0481104254722595e-05, -9.845942258834839e-06, -9.210780262947083e-06, -8.575618267059326e-06, -7.94045627117157e-06, -7.3052942752838135e-06, -6.670132279396057e-06, -6.034970283508301e-06, -5.3998082876205444e-06, -4.764646291732788e-06, -4.129484295845032e-06, -3.4943222999572754e-06, -2.859160304069519e-06, -2.2239983081817627e-06, -1.5888363122940063e-06, -9.5367431640625e-07, -3.1851232051849365e-07, 3.166496753692627e-07, 9.51811671257019e-07, 1.5869736671447754e-06, 2.2221356630325317e-06, 2.857297658920288e-06, 3.4924596548080444e-06, 4.127621650695801e-06, 4.762783646583557e-06, 5.3979456424713135e-06, 6.03310763835907e-06, 6.668269634246826e-06, 7.3034316301345825e-06, 7.938593626022339e-06, 8.573755621910095e-06, 9.208917617797852e-06, 9.844079613685608e-06, 1.0479241609573364e-05, 1.111440360546112e-05, 1.1749565601348877e-05, 1.2384727597236633e-05, 1.301988959312439e-05, 1.3655051589012146e-05, 1.4290213584899902e-05, 1.4925375580787659e-05, 1.5560537576675415e-05, 1.619569957256317e-05, 1.6830861568450928e-05, 1.7466023564338684e-05, 1.810118556022644e-05, 1.8736347556114197e-05, 1.9371509552001953e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 7.0, 6.0, 5.0, 16.0, 21.0, 36.0, 77.0, 134.0, 314.0, 823.0, 2428.0, 9851.0, 71284.0, 886228.0, 64191.0, 9436.0, 2345.0, 749.0, 299.0, 134.0, 61.0, 27.0, 24.0, 15.0, 15.0, 7.0, 8.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010442733764648438, -0.0010164082050323486, -0.0009885430335998535, -0.0009606778621673584, -0.0009328126907348633, -0.0009049475193023682, -0.000877082347869873, -0.0008492171764373779, -0.0008213520050048828, -0.0007934868335723877, -0.0007656216621398926, -0.0007377564907073975, -0.0007098913192749023, -0.0006820261478424072, -0.0006541609764099121, -0.000626295804977417, -0.0005984306335449219, -0.0005705654621124268, -0.0005427002906799316, -0.0005148351192474365, -0.0004869699478149414, -0.0004591047763824463, -0.00043123960494995117, -0.00040337443351745605, -0.00037550926208496094, -0.0003476440906524658, -0.0003197789192199707, -0.0002919137477874756, -0.00026404857635498047, -0.00023618340492248535, -0.00020831823348999023, -0.00018045306205749512, -0.000152587890625, -0.00012472271919250488, -9.685754776000977e-05, -6.899237632751465e-05, -4.112720489501953e-05, -1.3262033462524414e-05, 1.4603137969970703e-05, 4.246830940246582e-05, 7.033348083496094e-05, 9.819865226745605e-05, 0.00012606382369995117, 0.0001539289951324463, 0.0001817941665649414, 0.00020965933799743652, 0.00023752450942993164, 0.00026538968086242676, 0.0002932548522949219, 0.000321120023727417, 0.0003489851951599121, 0.0003768503665924072, 0.00040471553802490234, 0.00043258070945739746, 0.0004604458808898926, 0.0004883110523223877, 0.0005161762237548828, 0.0005440413951873779, 0.000571906566619873, 0.0005997717380523682, 0.0006276369094848633, 0.0006555020809173584, 0.0006833672523498535, 0.0007112324237823486, 0.0007390975952148438]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 5.0, 5.0, 5.0, 4.0, 6.0, 7.0, 13.0, 18.0, 14.0, 39.0, 36.0, 51.0, 109.0, 114.0, 120.0, 108.0, 97.0, 72.0, 50.0, 27.0, 30.0, 15.0, 12.0, 11.0, 9.0, 10.0, 3.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002949237823486328, -0.000287054106593132, -0.0002791844308376312, -0.00027131475508213043, -0.00026344507932662964, -0.00025557540357112885, -0.00024770572781562805, -0.00023983605206012726, -0.00023196637630462646, -0.00022409670054912567, -0.00021622702479362488, -0.00020835734903812408, -0.0002004876732826233, -0.0001926179975271225, -0.0001847483217716217, -0.0001768786460161209, -0.00016900897026062012, -0.00016113929450511932, -0.00015326961874961853, -0.00014539994299411774, -0.00013753026723861694, -0.00012966059148311615, -0.00012179091572761536, -0.00011392123997211456, -0.00010605156421661377, -9.818188846111298e-05, -9.031221270561218e-05, -8.244253695011139e-05, -7.45728611946106e-05, -6.67031854391098e-05, -5.883350968360901e-05, -5.0963833928108215e-05, -4.309415817260742e-05, -3.522448241710663e-05, -2.7354806661605835e-05, -1.948513090610504e-05, -1.1615455150604248e-05, -3.7457793951034546e-06, 4.123896360397339e-06, 1.1993572115898132e-05, 1.9863247871398926e-05, 2.773292362689972e-05, 3.560259938240051e-05, 4.3472275137901306e-05, 5.13419508934021e-05, 5.921162664890289e-05, 6.708130240440369e-05, 7.495097815990448e-05, 8.282065391540527e-05, 9.069032967090607e-05, 9.856000542640686e-05, 0.00010642968118190765, 0.00011429935693740845, 0.00012216903269290924, 0.00013003870844841003, 0.00013790838420391083, 0.00014577805995941162, 0.00015364773571491241, 0.0001615174114704132, 0.000169387087225914, 0.0001772567629814148, 0.0001851264387369156, 0.00019299611449241638, 0.00020086579024791718, 0.00020873546600341797]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 118.0, 705.0, 127.0, 34.0, 16.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6601436138153076, -1.6071665287017822, -1.5541894435882568, -1.5012123584747314, -1.4482353925704956, -1.3952583074569702, -1.3422812223434448, -1.2893041372299194, -1.236327052116394, -1.1833499670028687, -1.1303728818893433, -1.0773959159851074, -1.024418830871582, -0.9714417457580566, -0.9184646606445312, -0.8654875755310059, -0.8125105500221252, -0.7595334649085999, -0.7065564393997192, -0.6535793542861938, -0.6006022691726685, -0.5476251840591431, -0.49464815855026245, -0.44167107343673706, -0.38869401812553406, -0.33571696281433105, -0.28273987770080566, -0.22976282238960266, -0.17678575217723846, -0.12380868196487427, -0.07083162665367126, -0.017854541540145874, 0.03512251377105713, 0.08809958398342133, 0.14107665419578552, 0.19405370950698853, 0.24703077971935272, 0.3000078499317169, 0.3529849052429199, 0.4059619903564453, 0.4589390456676483, 0.5119161009788513, 0.5648931860923767, 0.6178702116012573, 0.6708472967147827, 0.7238243818283081, 0.7768014669418335, 0.8297785520553589, 0.8827555775642395, 0.9357326626777649, 0.9887096881866455, 1.041686773300171, 1.0946638584136963, 1.1476409435272217, 1.200618028640747, 1.2535951137542725, 1.3065720796585083, 1.3595491647720337, 1.412526249885559, 1.465503215789795, 1.5184803009033203, 1.5714573860168457, 1.624434471130371, 1.6774115562438965, 1.7303886413574219]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 8.0, 4.0, 15.0, 21.0, 10.0, 22.0, 23.0, 22.0, 34.0, 35.0, 36.0, 45.0, 54.0, 44.0, 37.0, 55.0, 54.0, 72.0, 49.0, 41.0, 50.0, 38.0, 46.0, 36.0, 33.0, 17.0, 25.0, 21.0, 12.0, 13.0, 10.0, 10.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2528589963912964, -0.2457127422094345, -0.23856650292873383, -0.23142024874687195, -0.22427399456501007, -0.2171277403831482, -0.2099815011024475, -0.20283524692058563, -0.19568899273872375, -0.18854273855686188, -0.1813964992761612, -0.17425024509429932, -0.16710399091243744, -0.15995773673057556, -0.15281149744987488, -0.145665243268013, -0.13851900398731232, -0.13137274980545044, -0.12422650307416916, -0.11708025634288788, -0.109934002161026, -0.10278775542974472, -0.09564150869846344, -0.08849525451660156, -0.08134900778532028, -0.074202761054039, -0.06705650687217712, -0.059910260140895844, -0.052764009684324265, -0.045617759227752686, -0.038471512496471405, -0.031325262039899826, -0.024179011583328247, -0.017032761126756668, -0.009886512532830238, -0.0027402639389038086, 0.00440598651766777, 0.01155223697423935, 0.01869848370552063, 0.02584473416209221, 0.03299098461866379, 0.04013723507523537, 0.047283485531806946, 0.054429732263088226, 0.061575982719659805, 0.06872223317623138, 0.07586847990751266, 0.08301472663879395, 0.09016098082065582, 0.0973072275519371, 0.10445348173379898, 0.11159972846508026, 0.11874598264694214, 0.12589222192764282, 0.1330384761095047, 0.14018473029136658, 0.14733096957206726, 0.15447722375392914, 0.16162346303462982, 0.1687697172164917, 0.17591597139835358, 0.18306222558021545, 0.19020846486091614, 0.19735471904277802, 0.2045009732246399]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 11.0, 9.0, 14.0, 24.0, 38.0, 92.0, 217.0, 546.0, 4835.0, 4181364.0, 6393.0, 490.0, 130.0, 53.0, 27.0, 12.0, 8.0, 6.0, 3.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-1.583984375, -1.5513458251953125, -1.518707275390625, -1.4860687255859375, -1.45343017578125, -1.4207916259765625, -1.388153076171875, -1.3555145263671875, -1.3228759765625, -1.2902374267578125, -1.257598876953125, -1.2249603271484375, -1.19232177734375, -1.1596832275390625, -1.127044677734375, -1.0944061279296875, -1.061767578125, -1.0291290283203125, -0.996490478515625, -0.9638519287109375, -0.93121337890625, -0.8985748291015625, -0.865936279296875, -0.8332977294921875, -0.8006591796875, -0.7680206298828125, -0.735382080078125, -0.7027435302734375, -0.67010498046875, -0.6374664306640625, -0.604827880859375, -0.5721893310546875, -0.53955078125, -0.5069122314453125, -0.474273681640625, -0.4416351318359375, -0.40899658203125, -0.3763580322265625, -0.343719482421875, -0.3110809326171875, -0.2784423828125, -0.2458038330078125, -0.213165283203125, -0.1805267333984375, -0.14788818359375, -0.1152496337890625, -0.082611083984375, -0.0499725341796875, -0.017333984375, 0.0153045654296875, 0.047943115234375, 0.0805816650390625, 0.11322021484375, 0.1458587646484375, 0.178497314453125, 0.2111358642578125, 0.2437744140625, 0.2764129638671875, 0.309051513671875, 0.3416900634765625, 0.37432861328125, 0.4069671630859375, 0.439605712890625, 0.4722442626953125, 0.5048828125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 9.0, 4.0, 21.0, 45.0, 100.0, 173.0, 241.0, 202.0, 111.0, 48.0, 18.0, 13.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0208587646484375, -0.020429015159606934, -0.019999265670776367, -0.0195695161819458, -0.019139766693115234, -0.018710017204284668, -0.0182802677154541, -0.017850518226623535, -0.01742076873779297, -0.016991019248962402, -0.016561269760131836, -0.01613152027130127, -0.015701770782470703, -0.015272021293640137, -0.01484227180480957, -0.014412522315979004, -0.013982772827148438, -0.013553023338317871, -0.013123273849487305, -0.012693524360656738, -0.012263774871826172, -0.011834025382995605, -0.011404275894165039, -0.010974526405334473, -0.010544776916503906, -0.01011502742767334, -0.009685277938842773, -0.009255528450012207, -0.00882577896118164, -0.008396029472351074, -0.007966279983520508, -0.007536530494689941, -0.007106781005859375, -0.006677031517028809, -0.006247282028198242, -0.005817532539367676, -0.005387783050537109, -0.004958033561706543, -0.0045282840728759766, -0.00409853458404541, -0.0036687850952148438, -0.0032390356063842773, -0.002809286117553711, -0.0023795366287231445, -0.0019497871398925781, -0.0015200376510620117, -0.0010902881622314453, -0.0006605386734008789, -0.0002307891845703125, 0.0001989603042602539, 0.0006287097930908203, 0.0010584592819213867, 0.0014882087707519531, 0.0019179582595825195, 0.002347707748413086, 0.0027774572372436523, 0.0032072067260742188, 0.003636956214904785, 0.0040667057037353516, 0.004496455192565918, 0.004926204681396484, 0.005355954170227051, 0.005785703659057617, 0.006215453147888184, 0.00664520263671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 6.0, 13.0, 25.0, 43.0, 79.0, 127.0, 168.0, 279.0, 753.0, 112165.0, 4079000.0, 992.0, 261.0, 136.0, 92.0, 66.0, 34.0, 23.0, 13.0, 6.0, 3.0, 0.0, 2.0, 2.0], "bins": [-1.6279296875, -1.5954322814941406, -1.5629348754882812, -1.5304374694824219, -1.4979400634765625, -1.4654426574707031, -1.4329452514648438, -1.4004478454589844, -1.367950439453125, -1.3354530334472656, -1.3029556274414062, -1.2704582214355469, -1.2379608154296875, -1.2054634094238281, -1.1729660034179688, -1.1404685974121094, -1.10797119140625, -1.0754737854003906, -1.0429763793945312, -1.0104789733886719, -0.9779815673828125, -0.9454841613769531, -0.9129867553710938, -0.8804893493652344, -0.847991943359375, -0.8154945373535156, -0.7829971313476562, -0.7504997253417969, -0.7180023193359375, -0.6855049133300781, -0.6530075073242188, -0.6205101013183594, -0.5880126953125, -0.5555152893066406, -0.5230178833007812, -0.4905204772949219, -0.4580230712890625, -0.4255256652832031, -0.39302825927734375, -0.3605308532714844, -0.328033447265625, -0.2955360412597656, -0.26303863525390625, -0.23054122924804688, -0.1980438232421875, -0.16554641723632812, -0.13304901123046875, -0.10055160522460938, -0.06805419921875, -0.035556793212890625, -0.00305938720703125, 0.029438018798828125, 0.0619354248046875, 0.09443283081054688, 0.12693023681640625, 0.15942764282226562, 0.191925048828125, 0.22442245483398438, 0.25691986083984375, 0.2894172668457031, 0.3219146728515625, 0.3544120788574219, 0.38690948486328125, 0.4194068908691406, 0.451904296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 13.0, 24.0, 29.0, 73.0, 126.0, 3367.0, 288.0, 87.0, 50.0, 15.0, 7.0, 4.0, 3.0, 2.0], "bins": [-0.111572265625, -0.10957574844360352, -0.10757923126220703, -0.10558271408081055, -0.10358619689941406, -0.10158967971801758, -0.0995931625366211, -0.09759664535522461, -0.09560012817382812, -0.09360361099243164, -0.09160709381103516, -0.08961057662963867, -0.08761405944824219, -0.0856175422668457, -0.08362102508544922, -0.08162450790405273, -0.07962799072265625, -0.07763147354125977, -0.07563495635986328, -0.0736384391784668, -0.07164192199707031, -0.06964540481567383, -0.06764888763427734, -0.06565237045288086, -0.06365585327148438, -0.06165933609008789, -0.059662818908691406, -0.05766630172729492, -0.05566978454589844, -0.05367326736450195, -0.05167675018310547, -0.049680233001708984, -0.0476837158203125, -0.045687198638916016, -0.04369068145751953, -0.04169416427612305, -0.03969764709472656, -0.03770112991333008, -0.035704612731933594, -0.03370809555053711, -0.031711578369140625, -0.02971506118774414, -0.027718544006347656, -0.025722026824951172, -0.023725509643554688, -0.021728992462158203, -0.01973247528076172, -0.017735958099365234, -0.01573944091796875, -0.013742923736572266, -0.011746406555175781, -0.009749889373779297, -0.0077533721923828125, -0.005756855010986328, -0.0037603378295898438, -0.0017638206481933594, 0.000232696533203125, 0.0022292137145996094, 0.004225730895996094, 0.006222248077392578, 0.008218765258789062, 0.010215282440185547, 0.012211799621582031, 0.014208316802978516, 0.016204833984375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 31.0, 68.0, 417.0, 461.0, 19.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4453599452972412, -1.405264139175415, -1.3651682138442993, -1.3250724077224731, -1.2849764823913574, -1.2448806762695312, -1.204784870147705, -1.1646889448165894, -1.1245931386947632, -1.084497332572937, -1.0444014072418213, -1.0043056011199951, -0.9642097353935242, -0.9241138696670532, -0.8840180039405823, -0.8439221382141113, -0.8038262724876404, -0.7637304067611694, -0.7236345410346985, -0.6835386753082275, -0.6434428691864014, -0.6033470034599304, -0.5632511377334595, -0.5231553316116333, -0.48305943608283997, -0.442963570356369, -0.40286773443222046, -0.3627718687057495, -0.32267600297927856, -0.28258016705513, -0.24248430132865906, -0.2023884654045105, -0.16229259967803955, -0.1221967488527298, -0.08210089057683945, -0.0420050323009491, -0.0019091814756393433, 0.03818666934967041, 0.07828253507614136, 0.11837837100028992, 0.15847423672676086, 0.19857008755207062, 0.23866593837738037, 0.2787618041038513, 0.31885766983032227, 0.3589535057544708, 0.3990493714809418, 0.43914520740509033, 0.4792410731315613, 0.5193369388580322, 0.5594328045845032, 0.5995286703109741, 0.6396244764328003, 0.6797203421592712, 0.7198162078857422, 0.7599120140075684, 0.8000079393386841, 0.840103805065155, 0.880199670791626, 0.9202954769134521, 0.9603913426399231, 1.000487208366394, 1.0405831336975098, 1.080678939819336, 1.120774745941162]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 13.0, 25.0, 34.0, 58.0, 100.0, 115.0, 135.0, 149.0, 124.0, 95.0, 65.0, 37.0, 28.0, 13.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374489963054657, -0.36227187514305115, -0.3500537872314453, -0.3378356993198395, -0.32561761140823364, -0.3133995532989502, -0.301181435585022, -0.2889633774757385, -0.2767452895641327, -0.26452720165252686, -0.252309113740921, -0.24009102582931519, -0.22787295281887054, -0.2156548649072647, -0.20343677699565887, -0.19121870398521423, -0.1790006011724472, -0.16678251326084137, -0.15456442534923553, -0.1423463523387909, -0.13012826442718506, -0.11791017651557922, -0.10569208860397339, -0.09347400814294815, -0.08125592023134232, -0.06903783231973648, -0.05681975185871124, -0.04460166394710541, -0.03238357976078987, -0.020165495574474335, -0.0079474076628685, 0.004270672798156738, 0.016488760709762573, 0.02870684489607811, 0.040924929082393646, 0.05314301699399948, 0.06536109745502472, 0.07757918536663055, 0.08979727327823639, 0.10201535373926163, 0.11423344165086746, 0.1264515221118927, 0.13866961002349854, 0.15088769793510437, 0.1631057858467102, 0.17532387375831604, 0.18754196166992188, 0.19976003468036652, 0.21197812259197235, 0.22419621050357819, 0.23641429841518402, 0.24863237142562866, 0.2608504593372345, 0.27306854724884033, 0.28528663516044617, 0.297504723072052, 0.30972281098365784, 0.32194089889526367, 0.3341589868068695, 0.34637707471847534, 0.3585951626300812, 0.370813250541687, 0.38303130865097046, 0.3952493965625763, 0.40746748447418213]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 7.0, 3.0, 7.0, 10.0, 11.0, 20.0, 22.0, 31.0, 49.0, 68.0, 134.0, 290.0, 763.0, 3234.0, 28523.0, 947709.0, 61214.0, 4706.0, 1009.0, 341.0, 145.0, 91.0, 52.0, 40.0, 16.0, 23.0, 6.0, 8.0, 5.0, 6.0, 0.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.271484375, -0.26340675354003906, -0.2553291320800781, -0.2472515106201172, -0.23917388916015625, -0.2310962677001953, -0.22301864624023438, -0.21494102478027344, -0.2068634033203125, -0.19878578186035156, -0.19070816040039062, -0.1826305389404297, -0.17455291748046875, -0.1664752960205078, -0.15839767456054688, -0.15032005310058594, -0.142242431640625, -0.13416481018066406, -0.12608718872070312, -0.11800956726074219, -0.10993194580078125, -0.10185432434082031, -0.09377670288085938, -0.08569908142089844, -0.0776214599609375, -0.06954383850097656, -0.061466217041015625, -0.05338859558105469, -0.04531097412109375, -0.03723335266113281, -0.029155731201171875, -0.021078109741210938, -0.01300048828125, -0.0049228668212890625, 0.003154754638671875, 0.011232376098632812, 0.01930999755859375, 0.027387619018554688, 0.035465240478515625, 0.04354286193847656, 0.0516204833984375, 0.05969810485839844, 0.06777572631835938, 0.07585334777832031, 0.08393096923828125, 0.09200859069824219, 0.10008621215820312, 0.10816383361816406, 0.116241455078125, 0.12431907653808594, 0.13239669799804688, 0.1404743194580078, 0.14855194091796875, 0.1566295623779297, 0.16470718383789062, 0.17278480529785156, 0.1808624267578125, 0.18894004821777344, 0.19701766967773438, 0.2050952911376953, 0.21317291259765625, 0.2212505340576172, 0.22932815551757812, 0.23740577697753906, 0.2454833984375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 4.0, 8.0, 12.0, 21.0, 44.0, 112.0, 190.0, 231.0, 169.0, 106.0, 66.0, 22.0, 9.0, 4.0, 4.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.020721435546875, -0.020275235176086426, -0.01982903480529785, -0.019382834434509277, -0.018936634063720703, -0.01849043369293213, -0.018044233322143555, -0.01759803295135498, -0.017151832580566406, -0.016705632209777832, -0.016259431838989258, -0.015813231468200684, -0.01536703109741211, -0.014920830726623535, -0.014474630355834961, -0.014028429985046387, -0.013582229614257812, -0.013136029243469238, -0.012689828872680664, -0.01224362850189209, -0.011797428131103516, -0.011351227760314941, -0.010905027389526367, -0.010458827018737793, -0.010012626647949219, -0.009566426277160645, -0.00912022590637207, -0.008674025535583496, -0.008227825164794922, -0.007781624794006348, -0.0073354244232177734, -0.006889224052429199, -0.006443023681640625, -0.005996823310852051, -0.0055506229400634766, -0.005104422569274902, -0.004658222198486328, -0.004212021827697754, -0.0037658214569091797, -0.0033196210861206055, -0.0028734207153320312, -0.002427220344543457, -0.001981019973754883, -0.0015348196029663086, -0.0010886192321777344, -0.0006424188613891602, -0.00019621849060058594, 0.0002499818801879883, 0.0006961822509765625, 0.0011423826217651367, 0.001588582992553711, 0.002034783363342285, 0.0024809837341308594, 0.0029271841049194336, 0.003373384475708008, 0.003819584846496582, 0.004265785217285156, 0.0047119855880737305, 0.005158185958862305, 0.005604386329650879, 0.006050586700439453, 0.006496787071228027, 0.0069429874420166016, 0.007389187812805176, 0.00783538818359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 1.0, 3.0, 8.0, 4.0, 7.0, 11.0, 12.0, 24.0, 15.0, 45.0, 40.0, 80.0, 108.0, 207.0, 386.0, 759.0, 1653.0, 3976.0, 9955.0, 28078.0, 94414.0, 559444.0, 258111.0, 59372.0, 19168.0, 7130.0, 2918.0, 1228.0, 644.0, 293.0, 149.0, 77.0, 61.0, 34.0, 24.0, 31.0, 18.0, 17.0, 11.0, 5.0, 6.0, 5.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08184814453125, -0.07935428619384766, -0.07686042785644531, -0.07436656951904297, -0.07187271118164062, -0.06937885284423828, -0.06688499450683594, -0.0643911361694336, -0.06189727783203125, -0.059403419494628906, -0.05690956115722656, -0.05441570281982422, -0.051921844482421875, -0.04942798614501953, -0.04693412780761719, -0.044440269470214844, -0.0419464111328125, -0.039452552795410156, -0.03695869445800781, -0.03446483612060547, -0.031970977783203125, -0.02947711944580078, -0.026983261108398438, -0.024489402770996094, -0.02199554443359375, -0.019501686096191406, -0.017007827758789062, -0.014513969421386719, -0.012020111083984375, -0.009526252746582031, -0.0070323944091796875, -0.004538536071777344, -0.002044677734375, 0.00044918060302734375, 0.0029430389404296875, 0.005436897277832031, 0.007930755615234375, 0.010424613952636719, 0.012918472290039062, 0.015412330627441406, 0.01790618896484375, 0.020400047302246094, 0.022893905639648438, 0.02538776397705078, 0.027881622314453125, 0.03037548065185547, 0.03286933898925781, 0.035363197326660156, 0.0378570556640625, 0.040350914001464844, 0.04284477233886719, 0.04533863067626953, 0.047832489013671875, 0.05032634735107422, 0.05282020568847656, 0.055314064025878906, 0.05780792236328125, 0.060301780700683594, 0.06279563903808594, 0.06528949737548828, 0.06778335571289062, 0.07027721405029297, 0.07277107238769531, 0.07526493072509766, 0.0777587890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 1.0, 3.0, 8.0, 4.0, 6.0, 9.0, 7.0, 20.0, 10.0, 27.0, 19.0, 26.0, 22.0, 31.0, 32.0, 36.0, 44.0, 42.0, 33.0, 34.0, 31.0, 51.0, 49.0, 33.0, 37.0, 36.0, 44.0, 40.0, 41.0, 30.0, 25.0, 21.0, 22.0, 13.0, 17.0, 25.0, 13.0, 16.0, 8.0, 3.0, 6.0, 5.0, 7.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0263214111328125, -0.025519371032714844, -0.024717330932617188, -0.02391529083251953, -0.023113250732421875, -0.02231121063232422, -0.021509170532226562, -0.020707130432128906, -0.01990509033203125, -0.019103050231933594, -0.018301010131835938, -0.01749897003173828, -0.016696929931640625, -0.01589488983154297, -0.015092849731445312, -0.014290809631347656, -0.01348876953125, -0.012686729431152344, -0.011884689331054688, -0.011082649230957031, -0.010280609130859375, -0.009478569030761719, -0.008676528930664062, -0.007874488830566406, -0.00707244873046875, -0.006270408630371094, -0.0054683685302734375, -0.004666328430175781, -0.003864288330078125, -0.0030622482299804688, -0.0022602081298828125, -0.0014581680297851562, -0.0006561279296875, 0.00014591217041015625, 0.0009479522705078125, 0.0017499923706054688, 0.002552032470703125, 0.0033540725708007812, 0.0041561126708984375, 0.004958152770996094, 0.00576019287109375, 0.006562232971191406, 0.0073642730712890625, 0.008166313171386719, 0.008968353271484375, 0.009770393371582031, 0.010572433471679688, 0.011374473571777344, 0.012176513671875, 0.012978553771972656, 0.013780593872070312, 0.014582633972167969, 0.015384674072265625, 0.01618671417236328, 0.016988754272460938, 0.017790794372558594, 0.01859283447265625, 0.019394874572753906, 0.020196914672851562, 0.02099895477294922, 0.021800994873046875, 0.02260303497314453, 0.023405075073242188, 0.024207115173339844, 0.0250091552734375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 3.0, 9.0, 11.0, 5.0, 9.0, 12.0, 19.0, 27.0, 29.0, 44.0, 64.0, 93.0, 106.0, 205.0, 357.0, 580.0, 1312.0, 3229.0, 8514.0, 31899.0, 773018.0, 196006.0, 21579.0, 6485.0, 2514.0, 1069.0, 555.0, 287.0, 167.0, 110.0, 66.0, 42.0, 26.0, 23.0, 22.0, 13.0, 8.0, 10.0, 4.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.0015649795532226562, -0.0015213489532470703, -0.0014777183532714844, -0.0014340877532958984, -0.0013904571533203125, -0.0013468265533447266, -0.0013031959533691406, -0.0012595653533935547, -0.0012159347534179688, -0.0011723041534423828, -0.0011286735534667969, -0.001085042953491211, -0.001041412353515625, -0.000997781753540039, -0.0009541511535644531, -0.0009105205535888672, -0.0008668899536132812, -0.0008232593536376953, -0.0007796287536621094, -0.0007359981536865234, -0.0006923675537109375, -0.0006487369537353516, -0.0006051063537597656, -0.0005614757537841797, -0.0005178451538085938, -0.0004742145538330078, -0.0004305839538574219, -0.00038695335388183594, -0.00034332275390625, -0.00029969215393066406, -0.0002560615539550781, -0.0002124309539794922, -0.00016880035400390625, -0.0001251697540283203, -8.153915405273438e-05, -3.790855407714844e-05, 5.7220458984375e-06, 4.935264587402344e-05, 9.298324584960938e-05, 0.0001366138458251953, 0.00018024444580078125, 0.0002238750457763672, 0.0002675056457519531, 0.00031113624572753906, 0.000354766845703125, 0.00039839744567871094, 0.0004420280456542969, 0.0004856586456298828, 0.0005292892456054688, 0.0005729198455810547, 0.0006165504455566406, 0.0006601810455322266, 0.0007038116455078125, 0.0007474422454833984, 0.0007910728454589844, 0.0008347034454345703, 0.0008783340454101562, 0.0009219646453857422, 0.0009655952453613281, 0.001009225845336914, 0.0010528564453125, 0.001096487045288086, 0.0011401176452636719, 0.0011837482452392578, 0.0012273788452148438]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 5.0, 9.0, 11.0, 13.0, 13.0, 33.0, 26.0, 51.0, 78.0, 148.0, 208.0, 136.0, 56.0, 50.0, 49.0, 20.0, 17.0, 16.0, 13.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9087066650390625e-05, -2.8135254979133606e-05, -2.7183443307876587e-05, -2.6231631636619568e-05, -2.527981996536255e-05, -2.432800829410553e-05, -2.337619662284851e-05, -2.2424384951591492e-05, -2.1472573280334473e-05, -2.0520761609077454e-05, -1.9568949937820435e-05, -1.8617138266563416e-05, -1.7665326595306396e-05, -1.6713514924049377e-05, -1.576170325279236e-05, -1.480989158153534e-05, -1.385807991027832e-05, -1.2906268239021301e-05, -1.1954456567764282e-05, -1.1002644896507263e-05, -1.0050833225250244e-05, -9.099021553993225e-06, -8.147209882736206e-06, -7.195398211479187e-06, -6.243586540222168e-06, -5.291774868965149e-06, -4.33996319770813e-06, -3.388151526451111e-06, -2.436339855194092e-06, -1.4845281839370728e-06, -5.327165126800537e-07, 4.1909515857696533e-07, 1.3709068298339844e-06, 2.3227185010910034e-06, 3.2745301723480225e-06, 4.2263418436050415e-06, 5.1781535148620605e-06, 6.12996518611908e-06, 7.081776857376099e-06, 8.033588528633118e-06, 8.985400199890137e-06, 9.937211871147156e-06, 1.0889023542404175e-05, 1.1840835213661194e-05, 1.2792646884918213e-05, 1.3744458556175232e-05, 1.4696270227432251e-05, 1.564808189868927e-05, 1.659989356994629e-05, 1.7551705241203308e-05, 1.8503516912460327e-05, 1.9455328583717346e-05, 2.0407140254974365e-05, 2.1358951926231384e-05, 2.2310763597488403e-05, 2.3262575268745422e-05, 2.421438694000244e-05, 2.516619861125946e-05, 2.611801028251648e-05, 2.70698219537735e-05, 2.8021633625030518e-05, 2.8973445296287537e-05, 2.9925256967544556e-05, 3.0877068638801575e-05, 3.1828880310058594e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 12.0, 16.0, 16.0, 35.0, 33.0, 69.0, 93.0, 196.0, 355.0, 784.0, 2371.0, 10225.0, 161442.0, 851314.0, 16424.0, 3262.0, 962.0, 418.0, 210.0, 123.0, 76.0, 43.0, 26.0, 20.0, 12.0, 5.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.002716064453125, -0.002650022506713867, -0.0025839805603027344, -0.0025179386138916016, -0.0024518966674804688, -0.002385854721069336, -0.002319812774658203, -0.0022537708282470703, -0.0021877288818359375, -0.0021216869354248047, -0.002055644989013672, -0.001989603042602539, -0.0019235610961914062, -0.0018575191497802734, -0.0017914772033691406, -0.0017254352569580078, -0.001659393310546875, -0.0015933513641357422, -0.0015273094177246094, -0.0014612674713134766, -0.0013952255249023438, -0.001329183578491211, -0.0012631416320800781, -0.0011970996856689453, -0.0011310577392578125, -0.0010650157928466797, -0.0009989738464355469, -0.0009329319000244141, -0.0008668899536132812, -0.0008008480072021484, -0.0007348060607910156, -0.0006687641143798828, -0.00060272216796875, -0.0005366802215576172, -0.0004706382751464844, -0.00040459632873535156, -0.00033855438232421875, -0.00027251243591308594, -0.00020647048950195312, -0.0001404285430908203, -7.43865966796875e-05, -8.344650268554688e-06, 5.7697296142578125e-05, 0.00012373924255371094, 0.00018978118896484375, 0.00025582313537597656, 0.0003218650817871094, 0.0003879070281982422, 0.000453948974609375, 0.0005199909210205078, 0.0005860328674316406, 0.0006520748138427734, 0.0007181167602539062, 0.0007841587066650391, 0.0008502006530761719, 0.0009162425994873047, 0.0009822845458984375, 0.0010483264923095703, 0.0011143684387207031, 0.001180410385131836, 0.0012464523315429688, 0.0013124942779541016, 0.0013785362243652344, 0.0014445781707763672, 0.0015106201171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 5.0, 5.0, 10.0, 10.0, 14.0, 30.0, 54.0, 104.0, 223.0, 249.0, 127.0, 55.0, 34.0, 20.0, 14.0, 11.0, 7.0, 12.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0008740425109863281, -0.0008527897298336029, -0.0008315369486808777, -0.0008102841675281525, -0.0007890313863754272, -0.000767778605222702, -0.0007465258240699768, -0.0007252730429172516, -0.0007040202617645264, -0.0006827674806118011, -0.0006615146994590759, -0.0006402619183063507, -0.0006190091371536255, -0.0005977563560009003, -0.000576503574848175, -0.0005552507936954498, -0.0005339980125427246, -0.0005127452313899994, -0.0004914924502372742, -0.00047023966908454895, -0.00044898688793182373, -0.0004277341067790985, -0.0004064813256263733, -0.00038522854447364807, -0.00036397576332092285, -0.00034272298216819763, -0.0003214702010154724, -0.0003002174198627472, -0.00027896463871002197, -0.00025771185755729675, -0.00023645907640457153, -0.0002152062952518463, -0.0001939535140991211, -0.00017270073294639587, -0.00015144795179367065, -0.00013019517064094543, -0.00010894238948822021, -8.7689608335495e-05, -6.643682718276978e-05, -4.5184046030044556e-05, -2.3931264877319336e-05, -2.678483724594116e-06, 1.8574297428131104e-05, 3.982707858085632e-05, 6.107985973358154e-05, 8.233264088630676e-05, 0.00010358542203903198, 0.0001248382031917572, 0.00014609098434448242, 0.00016734376549720764, 0.00018859654664993286, 0.00020984932780265808, 0.0002311021089553833, 0.0002523548901081085, 0.00027360767126083374, 0.00029486045241355896, 0.0003161132335662842, 0.0003373660147190094, 0.0003586187958717346, 0.00037987157702445984, 0.00040112435817718506, 0.0004223771393299103, 0.0004436299204826355, 0.0004648827016353607, 0.00048613548278808594]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 20.0, 166.0, 661.0, 111.0, 35.0, 13.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40777289867401123, -0.3510960042476654, -0.2944191098213196, -0.23774221539497375, -0.18106532096862793, -0.1243884265422821, -0.06771153211593628, -0.011034637689590454, 0.04564225673675537, 0.1023191511631012, 0.15899604558944702, 0.21567294001579285, 0.27234983444213867, 0.3290267288684845, 0.3857036232948303, 0.44238051772117615, 0.499057412147522, 0.5557342767715454, 0.6124112010002136, 0.6690881252288818, 0.7257649898529053, 0.7824418544769287, 0.8391187787055969, 0.8957957029342651, 0.9524725675582886, 1.009149432182312, 1.065826416015625, 1.1225032806396484, 1.1791801452636719, 1.2358570098876953, 1.2925338745117188, 1.3492108583450317, 1.4058876037597656, 1.462564468383789, 1.5192413330078125, 1.5759183168411255, 1.632595181465149, 1.6892720460891724, 1.7459490299224854, 1.8026258945465088, 1.8593027591705322, 1.9159796237945557, 1.972656488418579, 2.0293333530426025, 2.086010456085205, 2.1426873207092285, 2.199364185333252, 2.2560410499572754, 2.312717914581299, 2.3693947792053223, 2.4260716438293457, 2.482748508453369, 2.5394253730773926, 2.596102476119995, 2.6527793407440186, 2.709456205368042, 2.7661330699920654, 2.822809934616089, 2.8794867992401123, 2.9361636638641357, 2.9928407669067383, 3.0495176315307617, 3.106194496154785, 3.1628713607788086, 3.219548225402832]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 4.0, 10.0, 9.0, 9.0, 16.0, 21.0, 32.0, 37.0, 46.0, 34.0, 32.0, 51.0, 50.0, 54.0, 46.0, 57.0, 50.0, 61.0, 60.0, 46.0, 45.0, 36.0, 45.0, 19.0, 15.0, 17.0, 21.0, 17.0, 13.0, 8.0, 11.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2274121642112732, -0.2198096662759781, -0.21220716834068298, -0.20460467040538788, -0.19700217247009277, -0.18939965963363647, -0.18179716169834137, -0.17419466376304626, -0.16659216582775116, -0.15898966789245605, -0.15138716995716095, -0.14378467202186584, -0.13618215918540955, -0.12857967615127563, -0.12097716331481934, -0.11337466537952423, -0.10577216744422913, -0.09816966950893402, -0.09056717157363892, -0.08296466618776321, -0.07536216825246811, -0.067759670317173, -0.0601571686565876, -0.0525546669960022, -0.04495216906070709, -0.03734967112541199, -0.029747169464826584, -0.02214466966688633, -0.014542169868946075, -0.0069396719336509705, 0.000662829726934433, 0.008265331387519836, 0.01586782932281494, 0.023470329120755196, 0.03107282891869545, 0.03867533057928085, 0.04627782851457596, 0.05388032644987106, 0.06148282811045647, 0.06908532977104187, 0.07668782770633698, 0.08429032564163208, 0.09189282357692719, 0.09949532896280289, 0.10709782689809799, 0.1147003248333931, 0.1223028302192688, 0.1299053281545639, 0.137507826089859, 0.1451103240251541, 0.15271282196044922, 0.16031531989574432, 0.16791781783103943, 0.17552033066749573, 0.18312282860279083, 0.19072532653808594, 0.19832782447338104, 0.20593032240867615, 0.21353282034397125, 0.22113531827926636, 0.22873783111572266, 0.23634031414985657, 0.24394282698631287, 0.2515453100204468, 0.2591478228569031]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 4.0, 8.0, 11.0, 9.0, 24.0, 24.0, 39.0, 80.0, 129.0, 259.0, 713.0, 3036.0, 60119.0, 4122958.0, 5300.0, 1048.0, 288.0, 108.0, 48.0, 24.0, 19.0, 14.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.59716796875, -0.5847625732421875, -0.572357177734375, -0.5599517822265625, -0.54754638671875, -0.5351409912109375, -0.522735595703125, -0.5103302001953125, -0.4979248046875, -0.4855194091796875, -0.473114013671875, -0.4607086181640625, -0.44830322265625, -0.4358978271484375, -0.423492431640625, -0.4110870361328125, -0.398681640625, -0.3862762451171875, -0.373870849609375, -0.3614654541015625, -0.34906005859375, -0.3366546630859375, -0.324249267578125, -0.3118438720703125, -0.2994384765625, -0.2870330810546875, -0.274627685546875, -0.2622222900390625, -0.24981689453125, -0.2374114990234375, -0.225006103515625, -0.2126007080078125, -0.2001953125, -0.1877899169921875, -0.175384521484375, -0.1629791259765625, -0.15057373046875, -0.1381683349609375, -0.125762939453125, -0.1133575439453125, -0.1009521484375, -0.0885467529296875, -0.076141357421875, -0.0637359619140625, -0.05133056640625, -0.0389251708984375, -0.026519775390625, -0.0141143798828125, -0.001708984375, 0.0106964111328125, 0.023101806640625, 0.0355072021484375, 0.04791259765625, 0.0603179931640625, 0.072723388671875, 0.0851287841796875, 0.0975341796875, 0.1099395751953125, 0.122344970703125, 0.1347503662109375, 0.14715576171875, 0.1595611572265625, 0.171966552734375, 0.1843719482421875, 0.19677734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 9.0, 17.0, 29.0, 64.0, 125.0, 217.0, 204.0, 157.0, 95.0, 49.0, 18.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.02166748046875, -0.02121734619140625, -0.0207672119140625, -0.02031707763671875, -0.019866943359375, -0.01941680908203125, -0.0189666748046875, -0.01851654052734375, -0.01806640625, -0.01761627197265625, -0.0171661376953125, -0.01671600341796875, -0.016265869140625, -0.01581573486328125, -0.0153656005859375, -0.01491546630859375, -0.01446533203125, -0.01401519775390625, -0.0135650634765625, -0.01311492919921875, -0.012664794921875, -0.01221466064453125, -0.0117645263671875, -0.01131439208984375, -0.0108642578125, -0.01041412353515625, -0.0099639892578125, -0.00951385498046875, -0.009063720703125, -0.00861358642578125, -0.0081634521484375, -0.00771331787109375, -0.00726318359375, -0.00681304931640625, -0.0063629150390625, -0.00591278076171875, -0.005462646484375, -0.00501251220703125, -0.0045623779296875, -0.00411224365234375, -0.003662109375, -0.00321197509765625, -0.0027618408203125, -0.00231170654296875, -0.001861572265625, -0.00141143798828125, -0.0009613037109375, -0.00051116943359375, -6.103515625e-05, 0.00038909912109375, 0.0008392333984375, 0.00128936767578125, 0.001739501953125, 0.00218963623046875, 0.0026397705078125, 0.00308990478515625, 0.0035400390625, 0.00399017333984375, 0.0044403076171875, 0.00489044189453125, 0.005340576171875, 0.00579071044921875, 0.0062408447265625, 0.00669097900390625, 0.00714111328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 14.0, 11.0, 38.0, 65.0, 151.0, 341.0, 1562.0, 25243.0, 4156941.0, 8725.0, 800.0, 198.0, 89.0, 52.0, 14.0, 23.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.783203125, -0.7655448913574219, -0.7478866577148438, -0.7302284240722656, -0.7125701904296875, -0.6949119567871094, -0.6772537231445312, -0.6595954895019531, -0.641937255859375, -0.6242790222167969, -0.6066207885742188, -0.5889625549316406, -0.5713043212890625, -0.5536460876464844, -0.5359878540039062, -0.5183296203613281, -0.50067138671875, -0.4830131530761719, -0.46535491943359375, -0.4476966857910156, -0.4300384521484375, -0.4123802185058594, -0.39472198486328125, -0.3770637512207031, -0.359405517578125, -0.3417472839355469, -0.32408905029296875, -0.3064308166503906, -0.2887725830078125, -0.2711143493652344, -0.25345611572265625, -0.23579788208007812, -0.2181396484375, -0.20048141479492188, -0.18282318115234375, -0.16516494750976562, -0.1475067138671875, -0.12984848022460938, -0.11219024658203125, -0.09453201293945312, -0.076873779296875, -0.059215545654296875, -0.04155731201171875, -0.023899078369140625, -0.0062408447265625, 0.011417388916015625, 0.02907562255859375, 0.046733856201171875, 0.06439208984375, 0.08205032348632812, 0.09970855712890625, 0.11736679077148438, 0.1350250244140625, 0.15268325805664062, 0.17034149169921875, 0.18799972534179688, 0.205657958984375, 0.22331619262695312, 0.24097442626953125, 0.2586326599121094, 0.2762908935546875, 0.2939491271972656, 0.31160736083984375, 0.3292655944824219, 0.346923828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 12.0, 10.0, 23.0, 28.0, 49.0, 114.0, 3627.0, 61.0, 51.0, 22.0, 25.0, 14.0, 5.0, 18.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.057220458984375, -0.055930376052856445, -0.05464029312133789, -0.053350210189819336, -0.05206012725830078, -0.05077004432678223, -0.04947996139526367, -0.04818987846374512, -0.04689979553222656, -0.04560971260070801, -0.04431962966918945, -0.0430295467376709, -0.041739463806152344, -0.04044938087463379, -0.039159297943115234, -0.03786921501159668, -0.036579132080078125, -0.03528904914855957, -0.033998966217041016, -0.03270888328552246, -0.031418800354003906, -0.03012871742248535, -0.028838634490966797, -0.027548551559448242, -0.026258468627929688, -0.024968385696411133, -0.023678302764892578, -0.022388219833374023, -0.02109813690185547, -0.019808053970336914, -0.01851797103881836, -0.017227888107299805, -0.01593780517578125, -0.014647722244262695, -0.01335763931274414, -0.012067556381225586, -0.010777473449707031, -0.009487390518188477, -0.008197307586669922, -0.006907224655151367, -0.0056171417236328125, -0.004327058792114258, -0.003036975860595703, -0.0017468929290771484, -0.00045680999755859375, 0.0008332729339599609, 0.0021233558654785156, 0.0034134387969970703, 0.004703521728515625, 0.00599360466003418, 0.007283687591552734, 0.008573770523071289, 0.009863853454589844, 0.011153936386108398, 0.012444019317626953, 0.013734102249145508, 0.015024185180664062, 0.016314268112182617, 0.017604351043701172, 0.018894433975219727, 0.02018451690673828, 0.021474599838256836, 0.02276468276977539, 0.024054765701293945, 0.0253448486328125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 10.0, 11.0, 20.0, 27.0, 50.0, 76.0, 207.0, 383.0, 103.0, 54.0, 29.0, 14.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3843596279621124, -0.3758871853351593, -0.3674147129058838, -0.35894227027893066, -0.35046982765197754, -0.3419973850250244, -0.3335249125957489, -0.3250524699687958, -0.31657999753952026, -0.30810755491256714, -0.2996350824832916, -0.2911626398563385, -0.2826901972293854, -0.27421772480010986, -0.26574528217315674, -0.2572728395462036, -0.2488003969192505, -0.24032793939113617, -0.23185549676418304, -0.22338303923606873, -0.2149105966091156, -0.20643813908100128, -0.19796568155288696, -0.18949323892593384, -0.18102078139781952, -0.1725483238697052, -0.16407588124275208, -0.15560342371463776, -0.14713096618652344, -0.1386585235595703, -0.130186066031456, -0.12171361595392227, -0.11324116587638855, -0.10476871579885483, -0.0962962657213211, -0.08782380819320679, -0.07935135811567307, -0.07087890803813934, -0.06240645423531532, -0.0539340004324913, -0.04546155035495758, -0.03698910027742386, -0.028516646474599838, -0.020044194534420967, -0.011571742594242096, -0.003099292516708374, 0.005373161286115646, 0.013845615088939667, 0.02231806516647339, 0.03079051710665226, 0.03926296904683113, 0.04773542284965515, 0.05620787292718887, 0.0646803230047226, 0.07315278053283691, 0.08162523061037064, 0.09009768068790436, 0.09857013076543808, 0.1070425808429718, 0.11551503837108612, 0.12398748844861984, 0.13245993852615356, 0.14093239605426788, 0.1494048535823822, 0.15787729620933533]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 4.0, 10.0, 16.0, 35.0, 36.0, 64.0, 73.0, 89.0, 78.0, 116.0, 96.0, 109.0, 79.0, 67.0, 53.0, 28.0, 24.0, 14.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18515360355377197, -0.1793646365404129, -0.17357566952705383, -0.16778670251369476, -0.1619977355003357, -0.15620876848697662, -0.15041980147361755, -0.14463083446025848, -0.13884186744689941, -0.13305290043354034, -0.12726393342018127, -0.1214749664068222, -0.11568599939346313, -0.10989703238010406, -0.104108065366745, -0.09831909835338593, -0.09253013134002686, -0.08674116432666779, -0.08095219731330872, -0.07516323029994965, -0.06937426328659058, -0.0635852962732315, -0.057796329259872437, -0.05200736224651337, -0.0462183952331543, -0.04042942821979523, -0.03464046120643616, -0.028851494193077087, -0.023062527179718018, -0.017273560166358948, -0.011484593152999878, -0.005695626139640808, 9.334087371826172e-05, 0.0058823078870773315, 0.011671274900436401, 0.01746024191379547, 0.02324920892715454, 0.02903817594051361, 0.03482714295387268, 0.04061610996723175, 0.04640507698059082, 0.05219404399394989, 0.05798301100730896, 0.06377197802066803, 0.0695609450340271, 0.07534991204738617, 0.08113887906074524, 0.08692784607410431, 0.09271681308746338, 0.09850578010082245, 0.10429474711418152, 0.11008371412754059, 0.11587268114089966, 0.12166164815425873, 0.1274506151676178, 0.13323958218097687, 0.13902854919433594, 0.144817516207695, 0.15060648322105408, 0.15639545023441315, 0.16218441724777222, 0.1679733842611313, 0.17376235127449036, 0.17955131828784943, 0.1853402853012085]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 8.0, 10.0, 10.0, 10.0, 19.0, 20.0, 29.0, 36.0, 53.0, 59.0, 115.0, 229.0, 537.0, 1519.0, 6412.0, 51413.0, 868462.0, 106172.0, 9896.0, 2109.0, 705.0, 284.0, 128.0, 83.0, 42.0, 36.0, 26.0, 19.0, 18.0, 16.0, 13.0, 10.0, 6.0, 5.0, 5.0, 4.0, 6.0, 7.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.134765625, -0.13050460815429688, -0.12624359130859375, -0.12198257446289062, -0.1177215576171875, -0.11346054077148438, -0.10919952392578125, -0.10493850708007812, -0.100677490234375, -0.09641647338867188, -0.09215545654296875, -0.08789443969726562, -0.0836334228515625, -0.07937240600585938, -0.07511138916015625, -0.07085037231445312, -0.06658935546875, -0.062328338623046875, -0.05806732177734375, -0.053806304931640625, -0.0495452880859375, -0.045284271240234375, -0.04102325439453125, -0.036762237548828125, -0.032501220703125, -0.028240203857421875, -0.02397918701171875, -0.019718170166015625, -0.0154571533203125, -0.011196136474609375, -0.00693511962890625, -0.002674102783203125, 0.0015869140625, 0.005847930908203125, 0.01010894775390625, 0.014369964599609375, 0.0186309814453125, 0.022891998291015625, 0.02715301513671875, 0.031414031982421875, 0.035675048828125, 0.039936065673828125, 0.04419708251953125, 0.048458099365234375, 0.0527191162109375, 0.056980133056640625, 0.06124114990234375, 0.06550216674804688, 0.06976318359375, 0.07402420043945312, 0.07828521728515625, 0.08254623413085938, 0.0868072509765625, 0.09106826782226562, 0.09532928466796875, 0.09959030151367188, 0.103851318359375, 0.10811233520507812, 0.11237335205078125, 0.11663436889648438, 0.1208953857421875, 0.12515640258789062, 0.12941741943359375, 0.13367843627929688, 0.137939453125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 0.0, 8.0, 14.0, 21.0, 53.0, 100.0, 152.0, 210.0, 188.0, 122.0, 65.0, 44.0, 13.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0209197998046875, -0.020471692085266113, -0.020023584365844727, -0.01957547664642334, -0.019127368927001953, -0.018679261207580566, -0.01823115348815918, -0.017783045768737793, -0.017334938049316406, -0.01688683032989502, -0.016438722610473633, -0.015990614891052246, -0.01554250717163086, -0.015094399452209473, -0.014646291732788086, -0.0141981840133667, -0.013750076293945312, -0.013301968574523926, -0.012853860855102539, -0.012405753135681152, -0.011957645416259766, -0.011509537696838379, -0.011061429977416992, -0.010613322257995605, -0.010165214538574219, -0.009717106819152832, -0.009268999099731445, -0.008820891380310059, -0.008372783660888672, -0.007924675941467285, -0.0074765682220458984, -0.007028460502624512, -0.006580352783203125, -0.006132245063781738, -0.0056841373443603516, -0.005236029624938965, -0.004787921905517578, -0.004339814186096191, -0.0038917064666748047, -0.003443598747253418, -0.0029954910278320312, -0.0025473833084106445, -0.002099275588989258, -0.001651167869567871, -0.0012030601501464844, -0.0007549524307250977, -0.00030684471130371094, 0.00014126300811767578, 0.0005893707275390625, 0.0010374784469604492, 0.001485586166381836, 0.0019336938858032227, 0.0023818016052246094, 0.002829909324645996, 0.003278017044067383, 0.0037261247634887695, 0.004174232482910156, 0.004622340202331543, 0.00507044792175293, 0.005518555641174316, 0.005966663360595703, 0.00641477108001709, 0.0068628787994384766, 0.007310986518859863, 0.00775909423828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 7.0, 11.0, 17.0, 22.0, 27.0, 49.0, 50.0, 93.0, 141.0, 239.0, 343.0, 660.0, 1120.0, 1937.0, 3654.0, 7006.0, 14020.0, 30534.0, 73964.0, 230030.0, 481056.0, 118338.0, 44746.0, 19899.0, 9566.0, 4897.0, 2627.0, 1455.0, 782.0, 458.0, 277.0, 167.0, 124.0, 67.0, 51.0, 43.0, 19.0, 14.0, 6.0, 6.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04144287109375, -0.0401158332824707, -0.038788795471191406, -0.03746175765991211, -0.03613471984863281, -0.034807682037353516, -0.03348064422607422, -0.03215360641479492, -0.030826568603515625, -0.029499530792236328, -0.02817249298095703, -0.026845455169677734, -0.025518417358398438, -0.02419137954711914, -0.022864341735839844, -0.021537303924560547, -0.02021026611328125, -0.018883228302001953, -0.017556190490722656, -0.01622915267944336, -0.014902114868164062, -0.013575077056884766, -0.012248039245605469, -0.010921001434326172, -0.009593963623046875, -0.008266925811767578, -0.006939888000488281, -0.005612850189208984, -0.0042858123779296875, -0.0029587745666503906, -0.0016317367553710938, -0.0003046989440917969, 0.0010223388671875, 0.002349376678466797, 0.0036764144897460938, 0.005003452301025391, 0.0063304901123046875, 0.007657527923583984, 0.008984565734863281, 0.010311603546142578, 0.011638641357421875, 0.012965679168701172, 0.014292716979980469, 0.015619754791259766, 0.016946792602539062, 0.01827383041381836, 0.019600868225097656, 0.020927906036376953, 0.02225494384765625, 0.023581981658935547, 0.024909019470214844, 0.02623605728149414, 0.027563095092773438, 0.028890132904052734, 0.03021717071533203, 0.03154420852661133, 0.032871246337890625, 0.03419828414916992, 0.03552532196044922, 0.036852359771728516, 0.03817939758300781, 0.03950643539428711, 0.040833473205566406, 0.0421605110168457, 0.043487548828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 12.0, 9.0, 12.0, 11.0, 14.0, 16.0, 20.0, 28.0, 38.0, 35.0, 28.0, 39.0, 30.0, 51.0, 48.0, 37.0, 48.0, 45.0, 51.0, 33.0, 52.0, 34.0, 41.0, 34.0, 35.0, 23.0, 35.0, 15.0, 17.0, 23.0, 18.0, 15.0, 9.0, 8.0, 7.0, 4.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0235137939453125, -0.022761106491088867, -0.022008419036865234, -0.0212557315826416, -0.02050304412841797, -0.019750356674194336, -0.018997669219970703, -0.01824498176574707, -0.017492294311523438, -0.016739606857299805, -0.015986919403076172, -0.015234231948852539, -0.014481544494628906, -0.013728857040405273, -0.01297616958618164, -0.012223482131958008, -0.011470794677734375, -0.010718107223510742, -0.00996541976928711, -0.009212732315063477, -0.008460044860839844, -0.007707357406616211, -0.006954669952392578, -0.006201982498168945, -0.0054492950439453125, -0.00469660758972168, -0.003943920135498047, -0.003191232681274414, -0.0024385452270507812, -0.0016858577728271484, -0.0009331703186035156, -0.0001804828643798828, 0.00057220458984375, 0.0013248920440673828, 0.0020775794982910156, 0.0028302669525146484, 0.0035829544067382812, 0.004335641860961914, 0.005088329315185547, 0.00584101676940918, 0.0065937042236328125, 0.007346391677856445, 0.008099079132080078, 0.008851766586303711, 0.009604454040527344, 0.010357141494750977, 0.01110982894897461, 0.011862516403198242, 0.012615203857421875, 0.013367891311645508, 0.01412057876586914, 0.014873266220092773, 0.015625953674316406, 0.01637864112854004, 0.017131328582763672, 0.017884016036987305, 0.018636703491210938, 0.01938939094543457, 0.020142078399658203, 0.020894765853881836, 0.02164745330810547, 0.0224001407623291, 0.023152828216552734, 0.023905515670776367, 0.024658203125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 10.0, 19.0, 18.0, 28.0, 47.0, 100.0, 190.0, 345.0, 750.0, 1576.0, 3852.0, 12165.0, 79908.0, 873450.0, 59385.0, 10332.0, 3564.0, 1414.0, 637.0, 343.0, 168.0, 84.0, 40.0, 26.0, 24.0, 18.0, 11.0, 7.0, 7.0, 9.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0010423660278320312, -0.0010121017694473267, -0.000981837511062622, -0.0009515732526779175, -0.0009213089942932129, -0.0008910447359085083, -0.0008607804775238037, -0.0008305162191390991, -0.0008002519607543945, -0.0007699877023696899, -0.0007397234439849854, -0.0007094591856002808, -0.0006791949272155762, -0.0006489306688308716, -0.000618666410446167, -0.0005884021520614624, -0.0005581378936767578, -0.0005278736352920532, -0.0004976093769073486, -0.00046734511852264404, -0.00043708086013793945, -0.00040681660175323486, -0.0003765523433685303, -0.0003462880849838257, -0.0003160238265991211, -0.0002857595682144165, -0.0002554953098297119, -0.00022523105144500732, -0.00019496679306030273, -0.00016470253467559814, -0.00013443827629089355, -0.00010417401790618896, -7.390975952148438e-05, -4.3645501136779785e-05, -1.3381242752075195e-05, 1.6883015632629395e-05, 4.7147274017333984e-05, 7.741153240203857e-05, 0.00010767579078674316, 0.00013794004917144775, 0.00016820430755615234, 0.00019846856594085693, 0.00022873282432556152, 0.0002589970827102661, 0.0002892613410949707, 0.0003195255994796753, 0.0003497898578643799, 0.00038005411624908447, 0.00041031837463378906, 0.00044058263301849365, 0.00047084689140319824, 0.0005011111497879028, 0.0005313754081726074, 0.000561639666557312, 0.0005919039249420166, 0.0006221681833267212, 0.0006524324417114258, 0.0006826967000961304, 0.000712960958480835, 0.0007432252168655396, 0.0007734894752502441, 0.0008037537336349487, 0.0008340179920196533, 0.0008642822504043579, 0.0008945465087890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 9.0, 12.0, 10.0, 13.0, 23.0, 32.0, 66.0, 167.0, 337.0, 136.0, 62.0, 37.0, 25.0, 17.0, 11.0, 8.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.273653030395508e-05, -4.1330233216285706e-05, -3.992393612861633e-05, -3.851763904094696e-05, -3.711134195327759e-05, -3.5705044865608215e-05, -3.429874777793884e-05, -3.289245069026947e-05, -3.14861536026001e-05, -3.0079856514930725e-05, -2.8673559427261353e-05, -2.726726233959198e-05, -2.5860965251922607e-05, -2.4454668164253235e-05, -2.3048371076583862e-05, -2.164207398891449e-05, -2.0235776901245117e-05, -1.8829479813575745e-05, -1.7423182725906372e-05, -1.6016885638237e-05, -1.4610588550567627e-05, -1.3204291462898254e-05, -1.1797994375228882e-05, -1.039169728755951e-05, -8.985400199890137e-06, -7.579103112220764e-06, -6.172806024551392e-06, -4.766508936882019e-06, -3.3602118492126465e-06, -1.953914761543274e-06, -5.476176738739014e-07, 8.586794137954712e-07, 2.2649765014648438e-06, 3.6712735891342163e-06, 5.077570676803589e-06, 6.4838677644729614e-06, 7.890164852142334e-06, 9.296461939811707e-06, 1.0702759027481079e-05, 1.2109056115150452e-05, 1.3515353202819824e-05, 1.4921650290489197e-05, 1.632794737815857e-05, 1.7734244465827942e-05, 1.9140541553497314e-05, 2.0546838641166687e-05, 2.195313572883606e-05, 2.3359432816505432e-05, 2.4765729904174805e-05, 2.6172026991844177e-05, 2.757832407951355e-05, 2.8984621167182922e-05, 3.0390918254852295e-05, 3.179721534252167e-05, 3.320351243019104e-05, 3.460980951786041e-05, 3.6016106605529785e-05, 3.742240369319916e-05, 3.882870078086853e-05, 4.02349978685379e-05, 4.1641294956207275e-05, 4.304759204387665e-05, 4.445388913154602e-05, 4.586018621921539e-05, 4.7266483306884766e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 2.0, 4.0, 9.0, 13.0, 19.0, 25.0, 35.0, 58.0, 121.0, 210.0, 433.0, 986.0, 2499.0, 8343.0, 51888.0, 891901.0, 76472.0, 10352.0, 3020.0, 1134.0, 487.0, 233.0, 122.0, 66.0, 42.0, 25.0, 17.0, 14.0, 12.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010385513305664062, -0.0010076165199279785, -0.0009766817092895508, -0.000945746898651123, -0.0009148120880126953, -0.0008838772773742676, -0.0008529424667358398, -0.0008220076560974121, -0.0007910728454589844, -0.0007601380348205566, -0.0007292032241821289, -0.0006982684135437012, -0.0006673336029052734, -0.0006363987922668457, -0.000605463981628418, -0.0005745291709899902, -0.0005435943603515625, -0.0005126595497131348, -0.00048172473907470703, -0.0004507899284362793, -0.00041985511779785156, -0.00038892030715942383, -0.0003579854965209961, -0.00032705068588256836, -0.0002961158752441406, -0.0002651810646057129, -0.00023424625396728516, -0.00020331144332885742, -0.0001723766326904297, -0.00014144182205200195, -0.00011050701141357422, -7.957220077514648e-05, -4.863739013671875e-05, -1.7702579498291016e-05, 1.3232231140136719e-05, 4.416704177856445e-05, 7.510185241699219e-05, 0.00010603666305541992, 0.00013697147369384766, 0.0001679062843322754, 0.00019884109497070312, 0.00022977590560913086, 0.0002607107162475586, 0.00029164552688598633, 0.00032258033752441406, 0.0003535151481628418, 0.00038444995880126953, 0.00041538476943969727, 0.000446319580078125, 0.00047725439071655273, 0.0005081892013549805, 0.0005391240119934082, 0.0005700588226318359, 0.0006009936332702637, 0.0006319284439086914, 0.0006628632545471191, 0.0006937980651855469, 0.0007247328758239746, 0.0007556676864624023, 0.0007866024971008301, 0.0008175373077392578, 0.0008484721183776855, 0.0008794069290161133, 0.000910341739654541, 0.0009412765502929688]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 1.0, 5.0, 5.0, 7.0, 10.0, 12.0, 25.0, 32.0, 39.0, 64.0, 124.0, 183.0, 179.0, 122.0, 76.0, 47.0, 30.0, 6.0, 11.0, 8.0, 3.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005903244018554688, -0.0005762539803981781, -0.0005621835589408875, -0.0005481131374835968, -0.0005340427160263062, -0.0005199722945690155, -0.0005059018731117249, -0.0004918314516544342, -0.00047776103019714355, -0.0004636906087398529, -0.00044962018728256226, -0.0004355497658252716, -0.00042147934436798096, -0.0004074089229106903, -0.00039333850145339966, -0.000379268079996109, -0.00036519765853881836, -0.0003511272370815277, -0.00033705681562423706, -0.0003229863941669464, -0.00030891597270965576, -0.0002948455512523651, -0.00028077512979507446, -0.0002667047083377838, -0.00025263428688049316, -0.00023856386542320251, -0.00022449344396591187, -0.00021042302250862122, -0.00019635260105133057, -0.00018228217959403992, -0.00016821175813674927, -0.00015414133667945862, -0.00014007091522216797, -0.00012600049376487732, -0.00011193007230758667, -9.785965085029602e-05, -8.378922939300537e-05, -6.971880793571472e-05, -5.564838647842407e-05, -4.157796502113342e-05, -2.7507543563842773e-05, -1.3437122106552124e-05, 6.332993507385254e-07, 1.4703720808029175e-05, 2.8774142265319824e-05, 4.2844563722610474e-05, 5.691498517990112e-05, 7.098540663719177e-05, 8.505582809448242e-05, 9.912624955177307e-05, 0.00011319667100906372, 0.00012726709246635437, 0.00014133751392364502, 0.00015540793538093567, 0.00016947835683822632, 0.00018354877829551697, 0.00019761919975280762, 0.00021168962121009827, 0.00022576004266738892, 0.00023983046412467957, 0.0002539008855819702, 0.00026797130703926086, 0.0002820417284965515, 0.00029611214995384216, 0.0003101825714111328]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 9.0, 67.0, 302.0, 445.0, 102.0, 43.0, 24.0, 13.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7805824279785156, -0.7527408599853516, -0.7248993515968323, -0.697057843208313, -0.6692162752151489, -0.6413747072219849, -0.6135331988334656, -0.5856916904449463, -0.5578501224517822, -0.5300085544586182, -0.5021670460700989, -0.4743255078792572, -0.4464839696884155, -0.41864243149757385, -0.3908008933067322, -0.3629593551158905, -0.33511781692504883, -0.30727627873420715, -0.2794347405433655, -0.2515932023525238, -0.22375166416168213, -0.19591012597084045, -0.16806858777999878, -0.1402270495891571, -0.11238551139831543, -0.08454397320747375, -0.05670243501663208, -0.028860896825790405, -0.0010193586349487305, 0.026822179555892944, 0.05466371774673462, 0.0825052559375763, 0.11034679412841797, 0.13818833231925964, 0.16602987051010132, 0.193871408700943, 0.22171294689178467, 0.24955448508262634, 0.277396023273468, 0.3052375614643097, 0.33307909965515137, 0.36092063784599304, 0.3887621760368347, 0.4166037142276764, 0.44444525241851807, 0.47228679060935974, 0.5001283288002014, 0.5279698371887207, 0.5558114051818848, 0.5836529731750488, 0.6114944815635681, 0.6393359899520874, 0.6671775579452515, 0.6950191259384155, 0.7228606343269348, 0.7507021427154541, 0.7785437107086182, 0.8063852787017822, 0.8342267870903015, 0.8620682954788208, 0.8899098634719849, 0.9177514314651489, 0.9455929398536682, 0.9734344482421875, 1.0012760162353516]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 13.0, 8.0, 16.0, 21.0, 19.0, 19.0, 40.0, 31.0, 43.0, 44.0, 49.0, 61.0, 69.0, 60.0, 66.0, 63.0, 52.0, 42.0, 44.0, 32.0, 33.0, 35.0, 24.0, 24.0, 19.0, 18.0, 14.0, 9.0, 5.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18730640411376953, -0.18169750273227692, -0.1760886013507843, -0.1704796999692917, -0.16487079858779907, -0.15926188230514526, -0.15365298092365265, -0.14804407954216003, -0.14243517816066742, -0.1368262767791748, -0.1312173753976822, -0.12560847401618958, -0.11999956518411636, -0.11439066380262375, -0.10878175497055054, -0.10317285358905792, -0.09756395220756531, -0.09195505082607269, -0.08634614944458008, -0.08073724061250687, -0.07512833923101425, -0.06951943784952164, -0.06391052901744843, -0.05830162763595581, -0.052692726254463196, -0.04708382487297058, -0.04147491976618767, -0.035866014659404755, -0.03025711327791214, -0.024648210033774376, -0.019039306789636612, -0.013430401682853699, -0.007821500301361084, -0.00221259705722332, 0.003396306186914444, 0.009005209431052208, 0.014614112675189972, 0.020223015919327736, 0.0258319191634655, 0.03144082427024841, 0.03704972565174103, 0.04265862703323364, 0.048267532140016556, 0.05387643724679947, 0.059485338628292084, 0.0650942400097847, 0.07070314884185791, 0.07631205022335052, 0.08192095160484314, 0.08752985298633575, 0.09313875436782837, 0.09874766319990158, 0.1043565645813942, 0.10996546596288681, 0.11557437479496002, 0.12118327617645264, 0.12679217755794525, 0.13240107893943787, 0.13800998032093048, 0.1436188817024231, 0.1492277979850769, 0.15483669936656952, 0.16044560074806213, 0.16605450212955475, 0.17166340351104736]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 7.0, 4.0, 10.0, 15.0, 20.0, 44.0, 58.0, 135.0, 338.0, 1274.0, 11045.0, 4167738.0, 11750.0, 1281.0, 329.0, 125.0, 51.0, 22.0, 7.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.529296875, -0.5181541442871094, -0.5070114135742188, -0.4958686828613281, -0.4847259521484375, -0.4735832214355469, -0.46244049072265625, -0.4512977600097656, -0.440155029296875, -0.4290122985839844, -0.41786956787109375, -0.4067268371582031, -0.3955841064453125, -0.3844413757324219, -0.37329864501953125, -0.3621559143066406, -0.35101318359375, -0.3398704528808594, -0.32872772216796875, -0.3175849914550781, -0.3064422607421875, -0.2952995300292969, -0.28415679931640625, -0.2730140686035156, -0.261871337890625, -0.2507286071777344, -0.23958587646484375, -0.22844314575195312, -0.2173004150390625, -0.20615768432617188, -0.19501495361328125, -0.18387222290039062, -0.1727294921875, -0.16158676147460938, -0.15044403076171875, -0.13930130004882812, -0.1281585693359375, -0.11701583862304688, -0.10587310791015625, -0.09473037719726562, -0.083587646484375, -0.07244491577148438, -0.06130218505859375, -0.050159454345703125, -0.0390167236328125, -0.027873992919921875, -0.01673126220703125, -0.005588531494140625, 0.00555419921875, 0.016696929931640625, 0.02783966064453125, 0.038982391357421875, 0.0501251220703125, 0.061267852783203125, 0.07241058349609375, 0.08355331420898438, 0.094696044921875, 0.10583877563476562, 0.11698150634765625, 0.12812423706054688, 0.1392669677734375, 0.15040969848632812, 0.16155242919921875, 0.17269515991210938, 0.183837890625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 14.0, 21.0, 60.0, 109.0, 172.0, 206.0, 176.0, 114.0, 61.0, 35.0, 15.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0214385986328125, -0.020987331867218018, -0.020536065101623535, -0.020084798336029053, -0.01963353157043457, -0.019182264804840088, -0.018730998039245605, -0.018279731273651123, -0.01782846450805664, -0.017377197742462158, -0.016925930976867676, -0.016474664211273193, -0.01602339744567871, -0.015572130680084229, -0.015120863914489746, -0.014669597148895264, -0.014218330383300781, -0.013767063617706299, -0.013315796852111816, -0.012864530086517334, -0.012413263320922852, -0.01196199655532837, -0.011510729789733887, -0.011059463024139404, -0.010608196258544922, -0.01015692949295044, -0.009705662727355957, -0.009254395961761475, -0.008803129196166992, -0.00835186243057251, -0.007900595664978027, -0.007449328899383545, -0.0069980621337890625, -0.00654679536819458, -0.006095528602600098, -0.005644261837005615, -0.005192995071411133, -0.00474172830581665, -0.004290461540222168, -0.0038391947746276855, -0.003387928009033203, -0.0029366612434387207, -0.0024853944778442383, -0.002034127712249756, -0.0015828609466552734, -0.001131594181060791, -0.0006803274154663086, -0.00022906064987182617, 0.00022220611572265625, 0.0006734728813171387, 0.001124739646911621, 0.0015760064125061035, 0.002027273178100586, 0.0024785399436950684, 0.0029298067092895508, 0.003381073474884033, 0.0038323402404785156, 0.004283607006072998, 0.0047348737716674805, 0.005186140537261963, 0.005637407302856445, 0.006088674068450928, 0.00653994083404541, 0.006991207599639893, 0.007442474365234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 15.0, 18.0, 28.0, 46.0, 80.0, 152.0, 361.0, 1719.0, 43167.0, 4142542.0, 5084.0, 549.0, 198.0, 108.0, 68.0, 36.0, 34.0, 27.0, 10.0, 15.0, 5.0, 6.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27685546875, -0.2643890380859375, -0.251922607421875, -0.2394561767578125, -0.22698974609375, -0.2145233154296875, -0.202056884765625, -0.1895904541015625, -0.1771240234375, -0.1646575927734375, -0.152191162109375, -0.1397247314453125, -0.12725830078125, -0.1147918701171875, -0.102325439453125, -0.0898590087890625, -0.077392578125, -0.0649261474609375, -0.052459716796875, -0.0399932861328125, -0.02752685546875, -0.0150604248046875, -0.002593994140625, 0.0098724365234375, 0.0223388671875, 0.0348052978515625, 0.047271728515625, 0.0597381591796875, 0.07220458984375, 0.0846710205078125, 0.097137451171875, 0.1096038818359375, 0.1220703125, 0.1345367431640625, 0.147003173828125, 0.1594696044921875, 0.17193603515625, 0.1844024658203125, 0.196868896484375, 0.2093353271484375, 0.2218017578125, 0.2342681884765625, 0.246734619140625, 0.2592010498046875, 0.27166748046875, 0.2841339111328125, 0.296600341796875, 0.3090667724609375, 0.321533203125, 0.3339996337890625, 0.346466064453125, 0.3589324951171875, 0.37139892578125, 0.3838653564453125, 0.396331787109375, 0.4087982177734375, 0.4212646484375, 0.4337310791015625, 0.446197509765625, 0.4586639404296875, 0.47113037109375, 0.4835968017578125, 0.496063232421875, 0.5085296630859375, 0.52099609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 9.0, 14.0, 17.0, 29.0, 87.0, 3783.0, 57.0, 36.0, 23.0, 12.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0271759033203125, -0.02561354637145996, -0.024051189422607422, -0.022488832473754883, -0.020926475524902344, -0.019364118576049805, -0.017801761627197266, -0.016239404678344727, -0.014677047729492188, -0.013114690780639648, -0.01155233383178711, -0.00998997688293457, -0.008427619934082031, -0.006865262985229492, -0.005302906036376953, -0.003740549087524414, -0.002178192138671875, -0.0006158351898193359, 0.0009465217590332031, 0.002508878707885742, 0.004071235656738281, 0.00563359260559082, 0.007195949554443359, 0.008758306503295898, 0.010320663452148438, 0.011883020401000977, 0.013445377349853516, 0.015007734298706055, 0.016570091247558594, 0.018132448196411133, 0.019694805145263672, 0.02125716209411621, 0.02281951904296875, 0.02438187599182129, 0.025944232940673828, 0.027506589889526367, 0.029068946838378906, 0.030631303787231445, 0.032193660736083984, 0.03375601768493652, 0.03531837463378906, 0.0368807315826416, 0.03844308853149414, 0.04000544548034668, 0.04156780242919922, 0.04313015937805176, 0.0446925163269043, 0.046254873275756836, 0.047817230224609375, 0.049379587173461914, 0.05094194412231445, 0.05250430107116699, 0.05406665802001953, 0.05562901496887207, 0.05719137191772461, 0.05875372886657715, 0.06031608581542969, 0.06187844276428223, 0.06344079971313477, 0.0650031566619873, 0.06656551361083984, 0.06812787055969238, 0.06969022750854492, 0.07125258445739746, 0.07281494140625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 13.0, 170.0, 774.0, 49.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9727463722229004, -0.9497187733650208, -0.9266911745071411, -0.9036635756492615, -0.8806359767913818, -0.8576083779335022, -0.8345807790756226, -0.8115531802177429, -0.7885255813598633, -0.7654979825019836, -0.742470383644104, -0.7194427847862244, -0.6964151859283447, -0.6733875870704651, -0.6503599882125854, -0.6273323893547058, -0.6043047904968262, -0.5812771916389465, -0.5582495927810669, -0.5352219939231873, -0.5121943950653076, -0.489166796207428, -0.46613919734954834, -0.4431115984916687, -0.42008399963378906, -0.3970564007759094, -0.3740288019180298, -0.35100120306015015, -0.3279736042022705, -0.30494600534439087, -0.28191840648651123, -0.2588908076286316, -0.23586320877075195, -0.21283560991287231, -0.18980801105499268, -0.16678041219711304, -0.1437528133392334, -0.12072521448135376, -0.09769761562347412, -0.07467001676559448, -0.051642417907714844, -0.028614819049835205, -0.005587220191955566, 0.017440378665924072, 0.04046797752380371, 0.06349557638168335, 0.08652317523956299, 0.10955077409744263, 0.13257837295532227, 0.1556059718132019, 0.17863357067108154, 0.20166116952896118, 0.22468876838684082, 0.24771636724472046, 0.2707439661026001, 0.29377156496047974, 0.3167991638183594, 0.339826762676239, 0.36285436153411865, 0.3858819603919983, 0.40890955924987793, 0.43193715810775757, 0.4549647569656372, 0.47799235582351685, 0.5010199546813965]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 18.0, 31.0, 26.0, 50.0, 56.0, 79.0, 69.0, 89.0, 101.0, 97.0, 80.0, 86.0, 62.0, 51.0, 35.0, 30.0, 12.0, 15.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10517275333404541, -0.1022692397236824, -0.0993657261133194, -0.09646221250295639, -0.09355869889259338, -0.09065519273281097, -0.08775167912244797, -0.08484816551208496, -0.08194465190172195, -0.07904113829135895, -0.07613762468099594, -0.07323411107063293, -0.07033060491085052, -0.06742709130048752, -0.06452357769012451, -0.061620064079761505, -0.0587165504693985, -0.05581303685903549, -0.052909523248672485, -0.05000601336359978, -0.04710249975323677, -0.044198986142873764, -0.041295476257801056, -0.03839196264743805, -0.03548844903707504, -0.032584935426712036, -0.02968142367899418, -0.02677791193127632, -0.023874398320913315, -0.020970884710550308, -0.01806737296283245, -0.015163861215114594, -0.012260347604751587, -0.009356834925711155, -0.006453322246670723, -0.003549809567630291, -0.000646296888589859, 0.002257215790450573, 0.005160728469491005, 0.008064240217208862, 0.010967753827571869, 0.013871266506612301, 0.016774779185652733, 0.01967829093337059, 0.022581804543733597, 0.025485318154096603, 0.02838882990181446, 0.03129234164953232, 0.034195855259895325, 0.03709936887025833, 0.04000288248062134, 0.042906392365694046, 0.04580990597605705, 0.04871341958642006, 0.05161692947149277, 0.054520443081855774, 0.05742395669221878, 0.06032747030258179, 0.0632309839129448, 0.0661344975233078, 0.06903800368309021, 0.07194151729345322, 0.07484503090381622, 0.07774854451417923, 0.08065205812454224]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 7.0, 10.0, 8.0, 8.0, 17.0, 19.0, 18.0, 25.0, 34.0, 31.0, 48.0, 75.0, 120.0, 250.0, 592.0, 2091.0, 9668.0, 106344.0, 872347.0, 48434.0, 5864.0, 1486.0, 489.0, 212.0, 115.0, 57.0, 39.0, 34.0, 25.0, 19.0, 12.0, 10.0, 10.0, 5.0, 6.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.1236572265625, -0.11971473693847656, -0.11577224731445312, -0.11182975769042969, -0.10788726806640625, -0.10394477844238281, -0.10000228881835938, -0.09605979919433594, -0.0921173095703125, -0.08817481994628906, -0.08423233032226562, -0.08028984069824219, -0.07634735107421875, -0.07240486145019531, -0.06846237182617188, -0.06451988220214844, -0.060577392578125, -0.05663490295410156, -0.052692413330078125, -0.04874992370605469, -0.04480743408203125, -0.04086494445800781, -0.036922454833984375, -0.03297996520996094, -0.0290374755859375, -0.025094985961914062, -0.021152496337890625, -0.017210006713867188, -0.01326751708984375, -0.009325027465820312, -0.005382537841796875, -0.0014400482177734375, 0.00250244140625, 0.0064449310302734375, 0.010387420654296875, 0.014329910278320312, 0.01827239990234375, 0.022214889526367188, 0.026157379150390625, 0.030099868774414062, 0.0340423583984375, 0.03798484802246094, 0.041927337646484375, 0.04586982727050781, 0.04981231689453125, 0.05375480651855469, 0.057697296142578125, 0.06163978576660156, 0.065582275390625, 0.06952476501464844, 0.07346725463867188, 0.07740974426269531, 0.08135223388671875, 0.08529472351074219, 0.08923721313476562, 0.09317970275878906, 0.0971221923828125, 0.10106468200683594, 0.10500717163085938, 0.10894966125488281, 0.11289215087890625, 0.11683464050292969, 0.12077713012695312, 0.12471961975097656, 0.128662109375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 23.0, 15.0, 62.0, 117.0, 161.0, 196.0, 175.0, 119.0, 58.0, 38.0, 17.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.020660400390625, -0.020225465297698975, -0.01979053020477295, -0.019355595111846924, -0.0189206600189209, -0.018485724925994873, -0.018050789833068848, -0.017615854740142822, -0.017180919647216797, -0.01674598455429077, -0.016311049461364746, -0.01587611436843872, -0.015441179275512695, -0.01500624418258667, -0.014571309089660645, -0.01413637399673462, -0.013701438903808594, -0.013266503810882568, -0.012831568717956543, -0.012396633625030518, -0.011961698532104492, -0.011526763439178467, -0.011091828346252441, -0.010656893253326416, -0.01022195816040039, -0.009787023067474365, -0.00935208797454834, -0.008917152881622314, -0.008482217788696289, -0.008047282695770264, -0.007612347602844238, -0.007177412509918213, -0.0067424774169921875, -0.006307542324066162, -0.005872607231140137, -0.005437672138214111, -0.005002737045288086, -0.0045678019523620605, -0.004132866859436035, -0.0036979317665100098, -0.0032629966735839844, -0.002828061580657959, -0.0023931264877319336, -0.001958191394805908, -0.0015232563018798828, -0.0010883212089538574, -0.000653386116027832, -0.00021845102310180664, 0.00021648406982421875, 0.0006514191627502441, 0.0010863542556762695, 0.001521289348602295, 0.0019562244415283203, 0.0023911595344543457, 0.002826094627380371, 0.0032610297203063965, 0.003695964813232422, 0.004130899906158447, 0.004565834999084473, 0.005000770092010498, 0.0054357051849365234, 0.005870640277862549, 0.006305575370788574, 0.0067405104637146, 0.007175445556640625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 9.0, 11.0, 16.0, 32.0, 41.0, 65.0, 102.0, 139.0, 258.0, 445.0, 835.0, 1632.0, 3451.0, 7389.0, 17549.0, 48306.0, 167559.0, 578338.0, 148535.0, 44223.0, 16190.0, 6752.0, 3182.0, 1572.0, 818.0, 426.0, 259.0, 136.0, 95.0, 62.0, 43.0, 25.0, 20.0, 10.0, 9.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0469970703125, -0.04545402526855469, -0.043910980224609375, -0.04236793518066406, -0.04082489013671875, -0.03928184509277344, -0.037738800048828125, -0.03619575500488281, -0.0346527099609375, -0.03310966491699219, -0.031566619873046875, -0.030023574829101562, -0.02848052978515625, -0.026937484741210938, -0.025394439697265625, -0.023851394653320312, -0.022308349609375, -0.020765304565429688, -0.019222259521484375, -0.017679214477539062, -0.01613616943359375, -0.014593124389648438, -0.013050079345703125, -0.011507034301757812, -0.0099639892578125, -0.008420944213867188, -0.006877899169921875, -0.0053348541259765625, -0.00379180908203125, -0.0022487640380859375, -0.000705718994140625, 0.0008373260498046875, 0.00238037109375, 0.0039234161376953125, 0.005466461181640625, 0.0070095062255859375, 0.00855255126953125, 0.010095596313476562, 0.011638641357421875, 0.013181686401367188, 0.0147247314453125, 0.016267776489257812, 0.017810821533203125, 0.019353866577148438, 0.02089691162109375, 0.022439956665039062, 0.023983001708984375, 0.025526046752929688, 0.027069091796875, 0.028612136840820312, 0.030155181884765625, 0.03169822692871094, 0.03324127197265625, 0.03478431701660156, 0.036327362060546875, 0.03787040710449219, 0.0394134521484375, 0.04095649719238281, 0.042499542236328125, 0.04404258728027344, 0.04558563232421875, 0.04712867736816406, 0.048671722412109375, 0.05021476745605469, 0.0517578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 1.0, 9.0, 11.0, 8.0, 11.0, 9.0, 17.0, 22.0, 32.0, 33.0, 45.0, 34.0, 41.0, 60.0, 53.0, 53.0, 48.0, 61.0, 46.0, 38.0, 46.0, 50.0, 35.0, 40.0, 37.0, 26.0, 25.0, 19.0, 26.0, 19.0, 10.0, 10.0, 8.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03204345703125, -0.031200885772705078, -0.030358314514160156, -0.029515743255615234, -0.028673171997070312, -0.02783060073852539, -0.02698802947998047, -0.026145458221435547, -0.025302886962890625, -0.024460315704345703, -0.02361774444580078, -0.02277517318725586, -0.021932601928710938, -0.021090030670166016, -0.020247459411621094, -0.019404888153076172, -0.01856231689453125, -0.017719745635986328, -0.016877174377441406, -0.016034603118896484, -0.015192031860351562, -0.01434946060180664, -0.013506889343261719, -0.012664318084716797, -0.011821746826171875, -0.010979175567626953, -0.010136604309082031, -0.00929403305053711, -0.008451461791992188, -0.007608890533447266, -0.006766319274902344, -0.005923748016357422, -0.0050811767578125, -0.004238605499267578, -0.0033960342407226562, -0.0025534629821777344, -0.0017108917236328125, -0.0008683204650878906, -2.574920654296875e-05, 0.0008168220520019531, 0.001659393310546875, 0.002501964569091797, 0.0033445358276367188, 0.004187107086181641, 0.0050296783447265625, 0.005872249603271484, 0.006714820861816406, 0.007557392120361328, 0.00839996337890625, 0.009242534637451172, 0.010085105895996094, 0.010927677154541016, 0.011770248413085938, 0.01261281967163086, 0.013455390930175781, 0.014297962188720703, 0.015140533447265625, 0.015983104705810547, 0.01682567596435547, 0.01766824722290039, 0.018510818481445312, 0.019353389739990234, 0.020195960998535156, 0.021038532257080078, 0.021881103515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 4.0, 17.0, 22.0, 23.0, 27.0, 61.0, 97.0, 137.0, 208.0, 388.0, 754.0, 1554.0, 3561.0, 10290.0, 44229.0, 713450.0, 233285.0, 27357.0, 7463.0, 2860.0, 1256.0, 621.0, 349.0, 177.0, 118.0, 75.0, 57.0, 27.0, 23.0, 16.0, 8.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006628036499023438, -0.0006413236260414124, -0.000619843602180481, -0.0005983635783195496, -0.0005768835544586182, -0.0005554035305976868, -0.0005339235067367554, -0.000512443482875824, -0.0004909634590148926, -0.0004694834351539612, -0.0004480034112930298, -0.0004265233874320984, -0.000405043363571167, -0.0003835633397102356, -0.0003620833158493042, -0.0003406032919883728, -0.0003191232681274414, -0.00029764324426651, -0.0002761632204055786, -0.0002546831965446472, -0.00023320317268371582, -0.00021172314882278442, -0.00019024312496185303, -0.00016876310110092163, -0.00014728307723999023, -0.00012580305337905884, -0.00010432302951812744, -8.284300565719604e-05, -6.136298179626465e-05, -3.988295793533325e-05, -1.8402934074401855e-05, 3.077089786529541e-06, 2.4557113647460938e-05, 4.6037137508392334e-05, 6.751716136932373e-05, 8.899718523025513e-05, 0.00011047720909118652, 0.00013195723295211792, 0.00015343725681304932, 0.0001749172806739807, 0.0001963973045349121, 0.0002178773283958435, 0.0002393573522567749, 0.0002608373761177063, 0.0002823173999786377, 0.0003037974238395691, 0.0003252774477005005, 0.0003467574715614319, 0.0003682374954223633, 0.0003897175192832947, 0.0004111975431442261, 0.00043267756700515747, 0.00045415759086608887, 0.00047563761472702026, 0.0004971176385879517, 0.0005185976624488831, 0.0005400776863098145, 0.0005615577101707458, 0.0005830377340316772, 0.0006045177578926086, 0.00062599778175354, 0.0006474778056144714, 0.0006689578294754028, 0.0006904378533363342, 0.0007119178771972656]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 11.0, 10.0, 16.0, 13.0, 20.0, 29.0, 38.0, 51.0, 71.0, 160.0, 164.0, 129.0, 80.0, 55.0, 34.0, 30.0, 17.0, 12.0, 9.0, 9.0, 9.0, 3.0, 6.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.141164779663086e-05, -3.0411407351493835e-05, -2.941116690635681e-05, -2.8410926461219788e-05, -2.7410686016082764e-05, -2.641044557094574e-05, -2.5410205125808716e-05, -2.4409964680671692e-05, -2.3409724235534668e-05, -2.2409483790397644e-05, -2.140924334526062e-05, -2.0409002900123596e-05, -1.9408762454986572e-05, -1.840852200984955e-05, -1.7408281564712524e-05, -1.64080411195755e-05, -1.5407800674438477e-05, -1.4407560229301453e-05, -1.3407319784164429e-05, -1.2407079339027405e-05, -1.1406838893890381e-05, -1.0406598448753357e-05, -9.406358003616333e-06, -8.406117558479309e-06, -7.405877113342285e-06, -6.405636668205261e-06, -5.405396223068237e-06, -4.405155777931213e-06, -3.4049153327941895e-06, -2.4046748876571655e-06, -1.4044344425201416e-06, -4.041939973831177e-07, 5.960464477539062e-07, 1.5962868928909302e-06, 2.596527338027954e-06, 3.596767783164978e-06, 4.597008228302002e-06, 5.597248673439026e-06, 6.59748911857605e-06, 7.597729563713074e-06, 8.597970008850098e-06, 9.598210453987122e-06, 1.0598450899124146e-05, 1.159869134426117e-05, 1.2598931789398193e-05, 1.3599172234535217e-05, 1.4599412679672241e-05, 1.5599653124809265e-05, 1.659989356994629e-05, 1.7600134015083313e-05, 1.8600374460220337e-05, 1.960061490535736e-05, 2.0600855350494385e-05, 2.160109579563141e-05, 2.2601336240768433e-05, 2.3601576685905457e-05, 2.460181713104248e-05, 2.5602057576179504e-05, 2.660229802131653e-05, 2.7602538466453552e-05, 2.8602778911590576e-05, 2.96030193567276e-05, 3.0603259801864624e-05, 3.160350024700165e-05, 3.260374069213867e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 5.0, 8.0, 17.0, 17.0, 32.0, 38.0, 57.0, 93.0, 172.0, 265.0, 513.0, 1108.0, 3263.0, 14200.0, 141803.0, 836419.0, 40320.0, 6685.0, 1838.0, 755.0, 362.0, 206.0, 128.0, 74.0, 53.0, 39.0, 27.0, 15.0, 14.0, 7.0, 7.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007157325744628906, -0.0006920844316482544, -0.0006684362888336182, -0.0006447881460189819, -0.0006211400032043457, -0.0005974918603897095, -0.0005738437175750732, -0.000550195574760437, -0.0005265474319458008, -0.0005028992891311646, -0.0004792511463165283, -0.0004556030035018921, -0.00043195486068725586, -0.00040830671787261963, -0.0003846585750579834, -0.00036101043224334717, -0.00033736228942871094, -0.0003137141466140747, -0.0002900660037994385, -0.00026641786098480225, -0.00024276971817016602, -0.00021912157535552979, -0.00019547343254089355, -0.00017182528972625732, -0.0001481771469116211, -0.00012452900409698486, -0.00010088086128234863, -7.72327184677124e-05, -5.358457565307617e-05, -2.993643283843994e-05, -6.288290023803711e-06, 1.735985279083252e-05, 4.100799560546875e-05, 6.465613842010498e-05, 8.830428123474121e-05, 0.00011195242404937744, 0.00013560056686401367, 0.0001592487096786499, 0.00018289685249328613, 0.00020654499530792236, 0.0002301931381225586, 0.0002538412809371948, 0.00027748942375183105, 0.0003011375665664673, 0.0003247857093811035, 0.00034843385219573975, 0.000372081995010376, 0.0003957301378250122, 0.00041937828063964844, 0.00044302642345428467, 0.0004666745662689209, 0.0004903227090835571, 0.0005139708518981934, 0.0005376189947128296, 0.0005612671375274658, 0.000584915280342102, 0.0006085634231567383, 0.0006322115659713745, 0.0006558597087860107, 0.000679507851600647, 0.0007031559944152832, 0.0007268041372299194, 0.0007504522800445557, 0.0007741004228591919, 0.0007977485656738281]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 14.0, 17.0, 24.0, 40.0, 54.0, 96.0, 144.0, 184.0, 160.0, 83.0, 57.0, 51.0, 25.0, 18.0, 12.0, 10.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004892349243164062, -0.00047710537910461426, -0.00046497583389282227, -0.0004528462886810303, -0.0004407167434692383, -0.0004285871982574463, -0.0004164576530456543, -0.0004043281078338623, -0.0003921985626220703, -0.0003800690174102783, -0.00036793947219848633, -0.00035580992698669434, -0.00034368038177490234, -0.00033155083656311035, -0.00031942129135131836, -0.00030729174613952637, -0.0002951622009277344, -0.0002830326557159424, -0.0002709031105041504, -0.0002587735652923584, -0.0002466440200805664, -0.00023451447486877441, -0.00022238492965698242, -0.00021025538444519043, -0.00019812583923339844, -0.00018599629402160645, -0.00017386674880981445, -0.00016173720359802246, -0.00014960765838623047, -0.00013747811317443848, -0.00012534856796264648, -0.00011321902275085449, -0.0001010894775390625, -8.895993232727051e-05, -7.683038711547852e-05, -6.470084190368652e-05, -5.257129669189453e-05, -4.044175148010254e-05, -2.8312206268310547e-05, -1.6182661056518555e-05, -4.0531158447265625e-06, 8.07642936706543e-06, 2.0205974578857422e-05, 3.2335519790649414e-05, 4.4465065002441406e-05, 5.65946102142334e-05, 6.872415542602539e-05, 8.085370063781738e-05, 9.298324584960938e-05, 0.00010511279106140137, 0.00011724233627319336, 0.00012937188148498535, 0.00014150142669677734, 0.00015363097190856934, 0.00016576051712036133, 0.00017789006233215332, 0.0001900196075439453, 0.0002021491527557373, 0.0002142786979675293, 0.0002264082431793213, 0.00023853778839111328, 0.0002506673336029053, 0.00026279687881469727, 0.00027492642402648926, 0.00028705596923828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 12.0, 22.0, 52.0, 113.0, 399.0, 197.0, 83.0, 48.0, 25.0, 15.0, 15.0, 10.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47009068727493286, -0.45615702867507935, -0.44222334027290344, -0.42828965187072754, -0.414355993270874, -0.4004223346710205, -0.3864886462688446, -0.3725549578666687, -0.3586212992668152, -0.34468764066696167, -0.33075395226478577, -0.31682026386260986, -0.30288660526275635, -0.28895294666290283, -0.27501925826072693, -0.261085569858551, -0.2471519112586975, -0.2332182377576828, -0.2192845642566681, -0.20535089075565338, -0.19141721725463867, -0.17748354375362396, -0.16354987025260925, -0.14961619675159454, -0.13568252325057983, -0.12174884974956512, -0.10781517624855042, -0.0938815027475357, -0.079947829246521, -0.06601415574550629, -0.05208048224449158, -0.03814680874347687, -0.024213165044784546, -0.010279491543769836, 0.003654181957244873, 0.017587855458259583, 0.03152152895927429, 0.045455202460289, 0.05938887596130371, 0.07332254946231842, 0.08725622296333313, 0.10118989646434784, 0.11512356996536255, 0.12905724346637726, 0.14299091696739197, 0.15692459046840668, 0.1708582639694214, 0.1847919374704361, 0.1987256109714508, 0.21265928447246552, 0.22659295797348022, 0.24052663147449493, 0.25446030497550964, 0.26839399337768555, 0.28232765197753906, 0.2962613105773926, 0.3101949989795685, 0.3241286873817444, 0.3380623459815979, 0.3519960045814514, 0.3659296929836273, 0.3798633813858032, 0.39379703998565674, 0.40773069858551025, 0.42166438698768616]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 5.0, 12.0, 12.0, 10.0, 18.0, 13.0, 21.0, 24.0, 36.0, 46.0, 45.0, 54.0, 54.0, 63.0, 66.0, 59.0, 62.0, 52.0, 50.0, 52.0, 52.0, 38.0, 33.0, 36.0, 26.0, 17.0, 14.0, 6.0, 9.0, 8.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18377745151519775, -0.17875464260578156, -0.17373183369636536, -0.16870903968811035, -0.16368623077869415, -0.15866342186927795, -0.15364061295986176, -0.14861780405044556, -0.14359501004219055, -0.13857220113277435, -0.13354939222335815, -0.12852659821510315, -0.12350378930568695, -0.11848098039627075, -0.11345817148685455, -0.10843536257743835, -0.10341255366802216, -0.09838974475860596, -0.09336694329977036, -0.08834413439035416, -0.08332133293151855, -0.07829852402210236, -0.07327571511268616, -0.06825290620326996, -0.06323010474443436, -0.058207299560308456, -0.053184494376182556, -0.04816168546676636, -0.04313888028264046, -0.03811607509851456, -0.03309326618909836, -0.028070461004972458, -0.023047655820846558, -0.018024850636720657, -0.013002043589949608, -0.007979237474501133, -0.002956431359052658, 0.002066373825073242, 0.007089180871844292, 0.012111987918615341, 0.01713479310274124, 0.02215759828686714, 0.02718040533363819, 0.03220321238040924, 0.03722601756453514, 0.04224882274866104, 0.04727163165807724, 0.05229443684220314, 0.05731724202632904, 0.06234004721045494, 0.06736285239458084, 0.07238566130399704, 0.07740846276283264, 0.08243127167224884, 0.08745408058166504, 0.09247688949108124, 0.09749969094991684, 0.10252249985933304, 0.10754530131816864, 0.11256811022758484, 0.11759091913700104, 0.12261372059583664, 0.12763652205467224, 0.13265933096408844, 0.13768213987350464]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 11.0, 5.0, 5.0, 6.0, 8.0, 7.0, 6.0, 7.0, 10.0, 11.0, 12.0, 15.0, 26.0, 19.0, 34.0, 51.0, 96.0, 176.0, 435.0, 972.0, 3148.0, 13576.0, 3647162.0, 509823.0, 13845.0, 3049.0, 963.0, 378.0, 187.0, 92.0, 61.0, 24.0, 20.0, 14.0, 5.0, 6.0, 4.0, 1.0, 2.0], "bins": [-0.2239990234375, -0.2193317413330078, -0.21466445922851562, -0.20999717712402344, -0.20532989501953125, -0.20066261291503906, -0.19599533081054688, -0.1913280487060547, -0.1866607666015625, -0.1819934844970703, -0.17732620239257812, -0.17265892028808594, -0.16799163818359375, -0.16332435607910156, -0.15865707397460938, -0.1539897918701172, -0.149322509765625, -0.1446552276611328, -0.13998794555664062, -0.13532066345214844, -0.13065338134765625, -0.12598609924316406, -0.12131881713867188, -0.11665153503417969, -0.1119842529296875, -0.10731697082519531, -0.10264968872070312, -0.09798240661621094, -0.09331512451171875, -0.08864784240722656, -0.08398056030273438, -0.07931327819824219, -0.07464599609375, -0.06997871398925781, -0.06531143188476562, -0.06064414978027344, -0.05597686767578125, -0.05130958557128906, -0.046642303466796875, -0.04197502136230469, -0.0373077392578125, -0.03264045715332031, -0.027973175048828125, -0.023305892944335938, -0.01863861083984375, -0.013971328735351562, -0.009304046630859375, -0.0046367645263671875, 3.0517578125e-05, 0.0046977996826171875, 0.009365081787109375, 0.014032363891601562, 0.01869964599609375, 0.023366928100585938, 0.028034210205078125, 0.03270149230957031, 0.0373687744140625, 0.04203605651855469, 0.046703338623046875, 0.05137062072753906, 0.05603790283203125, 0.06070518493652344, 0.06537246704101562, 0.07003974914550781, 0.07470703125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 11.0, 22.0, 35.0, 86.0, 146.0, 197.0, 177.0, 158.0, 84.0, 49.0, 16.0, 11.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0209197998046875, -0.020483970642089844, -0.020048141479492188, -0.01961231231689453, -0.019176483154296875, -0.01874065399169922, -0.018304824829101562, -0.017868995666503906, -0.01743316650390625, -0.016997337341308594, -0.016561508178710938, -0.01612567901611328, -0.015689849853515625, -0.015254020690917969, -0.014818191528320312, -0.014382362365722656, -0.013946533203125, -0.013510704040527344, -0.013074874877929688, -0.012639045715332031, -0.012203216552734375, -0.011767387390136719, -0.011331558227539062, -0.010895729064941406, -0.01045989990234375, -0.010024070739746094, -0.009588241577148438, -0.009152412414550781, -0.008716583251953125, -0.008280754089355469, -0.007844924926757812, -0.007409095764160156, -0.0069732666015625, -0.006537437438964844, -0.0061016082763671875, -0.005665779113769531, -0.005229949951171875, -0.004794120788574219, -0.0043582916259765625, -0.003922462463378906, -0.00348663330078125, -0.0030508041381835938, -0.0026149749755859375, -0.0021791458129882812, -0.001743316650390625, -0.0013074874877929688, -0.0008716583251953125, -0.00043582916259765625, 0.0, 0.00043582916259765625, 0.0008716583251953125, 0.0013074874877929688, 0.001743316650390625, 0.0021791458129882812, 0.0026149749755859375, 0.0030508041381835938, 0.00348663330078125, 0.003922462463378906, 0.0043582916259765625, 0.004794120788574219, 0.005229949951171875, 0.005665779113769531, 0.0061016082763671875, 0.006537437438964844, 0.0069732666015625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 12.0, 6.0, 7.0, 9.0, 16.0, 22.0, 29.0, 74.0, 101.0, 164.0, 250.0, 517.0, 944.0, 2029.0, 5988.0, 28885.0, 4015062.0, 120767.0, 13358.0, 3451.0, 1228.0, 599.0, 307.0, 156.0, 106.0, 66.0, 51.0, 33.0, 17.0, 12.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.141845703125, -0.13788318634033203, -0.13392066955566406, -0.1299581527709961, -0.12599563598632812, -0.12203311920166016, -0.11807060241699219, -0.11410808563232422, -0.11014556884765625, -0.10618305206298828, -0.10222053527832031, -0.09825801849365234, -0.09429550170898438, -0.0903329849243164, -0.08637046813964844, -0.08240795135498047, -0.0784454345703125, -0.07448291778564453, -0.07052040100097656, -0.0665578842163086, -0.06259536743164062, -0.058632850646972656, -0.05467033386230469, -0.05070781707763672, -0.04674530029296875, -0.04278278350830078, -0.03882026672363281, -0.034857749938964844, -0.030895233154296875, -0.026932716369628906, -0.022970199584960938, -0.01900768280029297, -0.015045166015625, -0.011082649230957031, -0.0071201324462890625, -0.0031576156616210938, 0.000804901123046875, 0.004767417907714844, 0.008729934692382812, 0.012692451477050781, 0.01665496826171875, 0.02061748504638672, 0.024580001831054688, 0.028542518615722656, 0.032505035400390625, 0.036467552185058594, 0.04043006896972656, 0.04439258575439453, 0.0483551025390625, 0.05231761932373047, 0.05628013610839844, 0.060242652893066406, 0.06420516967773438, 0.06816768646240234, 0.07213020324707031, 0.07609272003173828, 0.08005523681640625, 0.08401775360107422, 0.08798027038574219, 0.09194278717041016, 0.09590530395507812, 0.0998678207397461, 0.10383033752441406, 0.10779285430908203, 0.11175537109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 11.0, 12.0, 24.0, 26.0, 29.0, 42.0, 70.0, 3283.0, 385.0, 55.0, 41.0, 29.0, 17.0, 14.0, 8.0, 7.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.036346435546875, -0.035331010818481445, -0.03431558609008789, -0.033300161361694336, -0.03228473663330078, -0.03126931190490723, -0.030253887176513672, -0.029238462448120117, -0.028223037719726562, -0.027207612991333008, -0.026192188262939453, -0.0251767635345459, -0.024161338806152344, -0.02314591407775879, -0.022130489349365234, -0.02111506462097168, -0.020099639892578125, -0.01908421516418457, -0.018068790435791016, -0.01705336570739746, -0.016037940979003906, -0.015022516250610352, -0.014007091522216797, -0.012991666793823242, -0.011976242065429688, -0.010960817337036133, -0.009945392608642578, -0.008929967880249023, -0.007914543151855469, -0.006899118423461914, -0.005883693695068359, -0.004868268966674805, -0.00385284423828125, -0.0028374195098876953, -0.0018219947814941406, -0.0008065700531005859, 0.00020885467529296875, 0.0012242794036865234, 0.002239704132080078, 0.003255128860473633, 0.0042705535888671875, 0.005285978317260742, 0.006301403045654297, 0.0073168277740478516, 0.008332252502441406, 0.009347677230834961, 0.010363101959228516, 0.01137852668762207, 0.012393951416015625, 0.01340937614440918, 0.014424800872802734, 0.015440225601196289, 0.016455650329589844, 0.0174710750579834, 0.018486499786376953, 0.019501924514770508, 0.020517349243164062, 0.021532773971557617, 0.022548198699951172, 0.023563623428344727, 0.02457904815673828, 0.025594472885131836, 0.02660989761352539, 0.027625322341918945, 0.0286407470703125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 9.0, 5.0, 43.0, 226.0, 633.0, 67.0, 20.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8044624328613281, -0.7858608961105347, -0.7672593593597412, -0.7486578226089478, -0.7300562858581543, -0.7114547491073608, -0.6928532123565674, -0.6742516756057739, -0.6556501388549805, -0.637048602104187, -0.6184470653533936, -0.5998455286026001, -0.5812439918518066, -0.5626424551010132, -0.5440409183502197, -0.5254393815994263, -0.5068378448486328, -0.48823630809783936, -0.4696347713470459, -0.45103323459625244, -0.432431697845459, -0.4138301610946655, -0.39522862434387207, -0.3766270875930786, -0.3580254912376404, -0.3394239544868469, -0.32082241773605347, -0.30222088098526, -0.28361934423446655, -0.2650178074836731, -0.24641625583171844, -0.227814719080925, -0.20921319723129272, -0.19061166048049927, -0.1720101237297058, -0.15340858697891235, -0.1348070502281189, -0.11620550602674484, -0.09760396182537079, -0.07900242507457733, -0.060400888323783875, -0.04179935157299042, -0.023197811096906662, -0.0045962706208229065, 0.01400526612997055, 0.03260680288076401, 0.05120834708213806, 0.06980988383293152, 0.08841142058372498, 0.10701295733451843, 0.1256144940853119, 0.14421603083610535, 0.1628175675868988, 0.18141910433769226, 0.2000206559896469, 0.21862219274044037, 0.23722372949123383, 0.2558252811431885, 0.27442681789398193, 0.2930283546447754, 0.31162989139556885, 0.3302314281463623, 0.34883296489715576, 0.3674345016479492, 0.3860360383987427]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 13.0, 15.0, 21.0, 31.0, 47.0, 100.0, 103.0, 101.0, 93.0, 101.0, 104.0, 98.0, 56.0, 40.0, 30.0, 16.0, 12.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15818160772323608, -0.1537822037935257, -0.1493828147649765, -0.1449834108352661, -0.14058400690555573, -0.13618460297584534, -0.13178521394729614, -0.12738581001758575, -0.12298641353845596, -0.11858701705932617, -0.11418761312961578, -0.10978821665048599, -0.1053888201713562, -0.10098941624164581, -0.09659001976251602, -0.09219062328338623, -0.08779121935367584, -0.08339182287454605, -0.07899241894483566, -0.07459302246570587, -0.07019361853599548, -0.06579422205686569, -0.0613948255777359, -0.05699542537331581, -0.05259602516889572, -0.04819662496447563, -0.04379722476005554, -0.03939782828092575, -0.03499842807650566, -0.03059902787208557, -0.02619962953031063, -0.02180023118853569, -0.0174008309841156, -0.013001431711018085, -0.00860203243792057, -0.004202633164823055, 0.00019676610827445984, 0.0045961663126945496, 0.00899556465446949, 0.01339496299624443, 0.01779436320066452, 0.02219376340508461, 0.02659316174685955, 0.03099256008863449, 0.03539196029305458, 0.03979136049747467, 0.04419075697660446, 0.04859015718102455, 0.05298955738544464, 0.05738895758986473, 0.06178835779428482, 0.06618775427341461, 0.070587158203125, 0.07498655468225479, 0.07938595116138458, 0.08378535509109497, 0.08818475157022476, 0.09258414804935455, 0.09698355197906494, 0.10138294845819473, 0.10578234493732452, 0.11018174886703491, 0.1145811453461647, 0.1189805418252945, 0.12337994575500488]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 8.0, 6.0, 8.0, 8.0, 8.0, 8.0, 14.0, 15.0, 17.0, 20.0, 29.0, 31.0, 30.0, 58.0, 95.0, 182.0, 401.0, 1111.0, 3604.0, 18781.0, 191196.0, 772612.0, 49517.0, 7563.0, 1871.0, 611.0, 279.0, 131.0, 70.0, 43.0, 28.0, 32.0, 30.0, 13.0, 21.0, 16.0, 18.0, 12.0, 8.0, 13.0, 9.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.09942626953125, -0.09634208679199219, -0.09325790405273438, -0.09017372131347656, -0.08708953857421875, -0.08400535583496094, -0.08092117309570312, -0.07783699035644531, -0.0747528076171875, -0.07166862487792969, -0.06858444213867188, -0.06550025939941406, -0.06241607666015625, -0.05933189392089844, -0.056247711181640625, -0.05316352844238281, -0.050079345703125, -0.04699516296386719, -0.043910980224609375, -0.04082679748535156, -0.03774261474609375, -0.03465843200683594, -0.031574249267578125, -0.028490066528320312, -0.0254058837890625, -0.022321701049804688, -0.019237518310546875, -0.016153335571289062, -0.01306915283203125, -0.009984970092773438, -0.006900787353515625, -0.0038166046142578125, -0.000732421875, 0.0023517608642578125, 0.005435943603515625, 0.008520126342773438, 0.01160430908203125, 0.014688491821289062, 0.017772674560546875, 0.020856857299804688, 0.0239410400390625, 0.027025222778320312, 0.030109405517578125, 0.03319358825683594, 0.03627777099609375, 0.03936195373535156, 0.042446136474609375, 0.04553031921386719, 0.048614501953125, 0.05169868469238281, 0.054782867431640625, 0.05786705017089844, 0.06095123291015625, 0.06403541564941406, 0.06711959838867188, 0.07020378112792969, 0.0732879638671875, 0.07637214660644531, 0.07945632934570312, 0.08254051208496094, 0.08562469482421875, 0.08870887756347656, 0.09179306030273438, 0.09487724304199219, 0.09796142578125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 7.0, 22.0, 27.0, 78.0, 120.0, 179.0, 188.0, 161.0, 101.0, 63.0, 25.0, 18.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01995849609375, -0.019536495208740234, -0.01911449432373047, -0.018692493438720703, -0.018270492553710938, -0.017848491668701172, -0.017426490783691406, -0.01700448989868164, -0.016582489013671875, -0.01616048812866211, -0.015738487243652344, -0.015316486358642578, -0.014894485473632812, -0.014472484588623047, -0.014050483703613281, -0.013628482818603516, -0.01320648193359375, -0.012784481048583984, -0.012362480163574219, -0.011940479278564453, -0.011518478393554688, -0.011096477508544922, -0.010674476623535156, -0.01025247573852539, -0.009830474853515625, -0.00940847396850586, -0.008986473083496094, -0.008564472198486328, -0.008142471313476562, -0.007720470428466797, -0.007298469543457031, -0.006876468658447266, -0.0064544677734375, -0.006032466888427734, -0.005610466003417969, -0.005188465118408203, -0.0047664642333984375, -0.004344463348388672, -0.003922462463378906, -0.0035004615783691406, -0.003078460693359375, -0.0026564598083496094, -0.0022344589233398438, -0.0018124580383300781, -0.0013904571533203125, -0.0009684562683105469, -0.0005464553833007812, -0.00012445449829101562, 0.00029754638671875, 0.0007195472717285156, 0.0011415481567382812, 0.0015635490417480469, 0.0019855499267578125, 0.002407550811767578, 0.0028295516967773438, 0.0032515525817871094, 0.003673553466796875, 0.004095554351806641, 0.004517555236816406, 0.004939556121826172, 0.0053615570068359375, 0.005783557891845703, 0.006205558776855469, 0.006627559661865234, 0.007049560546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 13.0, 17.0, 26.0, 34.0, 49.0, 78.0, 124.0, 176.0, 316.0, 565.0, 903.0, 1489.0, 2551.0, 4677.0, 8808.0, 16884.0, 33702.0, 72401.0, 176101.0, 449428.0, 151829.0, 64655.0, 30520.0, 15069.0, 7986.0, 4299.0, 2411.0, 1381.0, 780.0, 466.0, 305.0, 188.0, 110.0, 67.0, 38.0, 30.0, 17.0, 14.0, 6.0, 9.0, 7.0, 5.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02862548828125, -0.027652740478515625, -0.02667999267578125, -0.025707244873046875, -0.0247344970703125, -0.023761749267578125, -0.02278900146484375, -0.021816253662109375, -0.020843505859375, -0.019870758056640625, -0.01889801025390625, -0.017925262451171875, -0.0169525146484375, -0.015979766845703125, -0.01500701904296875, -0.014034271240234375, -0.0130615234375, -0.012088775634765625, -0.01111602783203125, -0.010143280029296875, -0.0091705322265625, -0.008197784423828125, -0.00722503662109375, -0.006252288818359375, -0.005279541015625, -0.004306793212890625, -0.00333404541015625, -0.002361297607421875, -0.0013885498046875, -0.000415802001953125, 0.00055694580078125, 0.001529693603515625, 0.00250244140625, 0.003475189208984375, 0.00444793701171875, 0.005420684814453125, 0.0063934326171875, 0.007366180419921875, 0.00833892822265625, 0.009311676025390625, 0.010284423828125, 0.011257171630859375, 0.01222991943359375, 0.013202667236328125, 0.0141754150390625, 0.015148162841796875, 0.01612091064453125, 0.017093658447265625, 0.01806640625, 0.019039154052734375, 0.02001190185546875, 0.020984649658203125, 0.0219573974609375, 0.022930145263671875, 0.02390289306640625, 0.024875640869140625, 0.025848388671875, 0.026821136474609375, 0.02779388427734375, 0.028766632080078125, 0.0297393798828125, 0.030712127685546875, 0.03168487548828125, 0.032657623291015625, 0.03363037109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 9.0, 8.0, 14.0, 8.0, 12.0, 23.0, 25.0, 23.0, 28.0, 24.0, 32.0, 34.0, 27.0, 49.0, 36.0, 39.0, 30.0, 37.0, 44.0, 49.0, 40.0, 34.0, 41.0, 29.0, 37.0, 36.0, 26.0, 29.0, 29.0, 16.0, 27.0, 17.0, 19.0, 7.0, 13.0, 7.0, 5.0, 5.0, 5.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0186920166015625, -0.018056392669677734, -0.01742076873779297, -0.016785144805908203, -0.016149520874023438, -0.015513896942138672, -0.014878273010253906, -0.01424264907836914, -0.013607025146484375, -0.01297140121459961, -0.012335777282714844, -0.011700153350830078, -0.011064529418945312, -0.010428905487060547, -0.009793281555175781, -0.009157657623291016, -0.00852203369140625, -0.007886409759521484, -0.007250785827636719, -0.006615161895751953, -0.0059795379638671875, -0.005343914031982422, -0.004708290100097656, -0.004072666168212891, -0.003437042236328125, -0.0028014183044433594, -0.0021657943725585938, -0.0015301704406738281, -0.0008945465087890625, -0.0002589225769042969, 0.00037670135498046875, 0.0010123252868652344, 0.00164794921875, 0.0022835731506347656, 0.0029191970825195312, 0.003554821014404297, 0.0041904449462890625, 0.004826068878173828, 0.005461692810058594, 0.006097316741943359, 0.006732940673828125, 0.007368564605712891, 0.008004188537597656, 0.008639812469482422, 0.009275436401367188, 0.009911060333251953, 0.010546684265136719, 0.011182308197021484, 0.01181793212890625, 0.012453556060791016, 0.013089179992675781, 0.013724803924560547, 0.014360427856445312, 0.014996051788330078, 0.015631675720214844, 0.01626729965209961, 0.016902923583984375, 0.01753854751586914, 0.018174171447753906, 0.018809795379638672, 0.019445419311523438, 0.020081043243408203, 0.02071666717529297, 0.021352291107177734, 0.0219879150390625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 2.0, 5.0, 2.0, 10.0, 17.0, 25.0, 35.0, 60.0, 99.0, 179.0, 331.0, 632.0, 1284.0, 2787.0, 6795.0, 20071.0, 96606.0, 770329.0, 113529.0, 22623.0, 7361.0, 2926.0, 1364.0, 666.0, 359.0, 171.0, 102.0, 58.0, 29.0, 28.0, 19.0, 8.0, 7.0, 7.0, 5.0, 2.0, 2.0, 4.0, 5.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005059242248535156, -0.0004898831248283386, -0.0004738420248031616, -0.0004578009247779846, -0.0004417598247528076, -0.0004257187247276306, -0.0004096776247024536, -0.0003936365246772766, -0.0003775954246520996, -0.0003615543246269226, -0.0003455132246017456, -0.0003294721245765686, -0.0003134310245513916, -0.0002973899245262146, -0.0002813488245010376, -0.0002653077244758606, -0.0002492666244506836, -0.0002332255244255066, -0.0002171844244003296, -0.0002011433243751526, -0.00018510222434997559, -0.00016906112432479858, -0.00015302002429962158, -0.00013697892427444458, -0.00012093782424926758, -0.00010489672422409058, -8.885562419891357e-05, -7.281452417373657e-05, -5.677342414855957e-05, -4.073232412338257e-05, -2.4691224098205566e-05, -8.650124073028564e-06, 7.3909759521484375e-06, 2.343207597732544e-05, 3.947317600250244e-05, 5.551427602767944e-05, 7.155537605285645e-05, 8.759647607803345e-05, 0.00010363757610321045, 0.00011967867612838745, 0.00013571977615356445, 0.00015176087617874146, 0.00016780197620391846, 0.00018384307622909546, 0.00019988417625427246, 0.00021592527627944946, 0.00023196637630462646, 0.00024800747632980347, 0.00026404857635498047, 0.00028008967638015747, 0.00029613077640533447, 0.0003121718764305115, 0.0003282129764556885, 0.0003442540764808655, 0.0003602951765060425, 0.0003763362765312195, 0.0003923773765563965, 0.0004084184765815735, 0.0004244595766067505, 0.0004405006766319275, 0.0004565417766571045, 0.0004725828766822815, 0.0004886239767074585, 0.0005046650767326355, 0.0005207061767578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 12.0, 10.0, 15.0, 12.0, 31.0, 35.0, 69.0, 111.0, 221.0, 197.0, 97.0, 76.0, 45.0, 32.0, 8.0, 10.0, 11.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.67572021484375e-05, -6.513018161058426e-05, -6.350316107273102e-05, -6.187614053487778e-05, -6.0249119997024536e-05, -5.8622099459171295e-05, -5.6995078921318054e-05, -5.536805838346481e-05, -5.374103784561157e-05, -5.211401730775833e-05, -5.048699676990509e-05, -4.885997623205185e-05, -4.723295569419861e-05, -4.560593515634537e-05, -4.3978914618492126e-05, -4.2351894080638885e-05, -4.0724873542785645e-05, -3.9097853004932404e-05, -3.747083246707916e-05, -3.584381192922592e-05, -3.421679139137268e-05, -3.258977085351944e-05, -3.09627503156662e-05, -2.9335729777812958e-05, -2.7708709239959717e-05, -2.6081688702106476e-05, -2.4454668164253235e-05, -2.2827647626399994e-05, -2.1200627088546753e-05, -1.9573606550693512e-05, -1.794658601284027e-05, -1.631956547498703e-05, -1.4692544937133789e-05, -1.3065524399280548e-05, -1.1438503861427307e-05, -9.811483323574066e-06, -8.184462785720825e-06, -6.557442247867584e-06, -4.930421710014343e-06, -3.3034011721611023e-06, -1.6763806343078613e-06, -4.936009645462036e-08, 1.5776604413986206e-06, 3.2046809792518616e-06, 4.8317015171051025e-06, 6.4587220549583435e-06, 8.085742592811584e-06, 9.712763130664825e-06, 1.1339783668518066e-05, 1.2966804206371307e-05, 1.4593824744224548e-05, 1.622084528207779e-05, 1.784786581993103e-05, 1.947488635778427e-05, 2.1101906895637512e-05, 2.2728927433490753e-05, 2.4355947971343994e-05, 2.5982968509197235e-05, 2.7609989047050476e-05, 2.9237009584903717e-05, 3.086403012275696e-05, 3.24910506606102e-05, 3.411807119846344e-05, 3.574509173631668e-05, 3.737211227416992e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 10.0, 15.0, 9.0, 8.0, 22.0, 37.0, 64.0, 86.0, 146.0, 314.0, 570.0, 1255.0, 3260.0, 9901.0, 40275.0, 489860.0, 447760.0, 39417.0, 9807.0, 3232.0, 1271.0, 531.0, 288.0, 151.0, 115.0, 43.0, 36.0, 17.0, 18.0, 12.0, 9.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043654441833496094, -0.00042037293314933777, -0.0004042014479637146, -0.00038802996277809143, -0.00037185847759246826, -0.0003556869924068451, -0.0003395155072212219, -0.00032334402203559875, -0.0003071725368499756, -0.0002910010516643524, -0.00027482956647872925, -0.0002586580812931061, -0.0002424865961074829, -0.00022631511092185974, -0.00021014362573623657, -0.0001939721405506134, -0.00017780065536499023, -0.00016162917017936707, -0.0001454576849937439, -0.00012928619980812073, -0.00011311471462249756, -9.694322943687439e-05, -8.077174425125122e-05, -6.460025906562805e-05, -4.842877388000488e-05, -3.2257288694381714e-05, -1.6085803508758545e-05, 8.568167686462402e-08, 1.6257166862487793e-05, 3.242865204811096e-05, 4.860013723373413e-05, 6.47716224193573e-05, 8.094310760498047e-05, 9.711459279060364e-05, 0.0001132860779762268, 0.00012945756316184998, 0.00014562904834747314, 0.0001618005335330963, 0.00017797201871871948, 0.00019414350390434265, 0.00021031498908996582, 0.000226486474275589, 0.00024265795946121216, 0.00025882944464683533, 0.0002750009298324585, 0.00029117241501808167, 0.00030734390020370483, 0.000323515385389328, 0.00033968687057495117, 0.00035585835576057434, 0.0003720298409461975, 0.0003882013261318207, 0.00040437281131744385, 0.000420544296503067, 0.0004367157816886902, 0.00045288726687431335, 0.0004690587520599365, 0.0004852302372455597, 0.0005014017224311829, 0.000517573207616806, 0.0005337446928024292, 0.0005499161779880524, 0.0005660876631736755, 0.0005822591483592987, 0.0005984306335449219]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 9.0, 7.0, 20.0, 20.0, 27.0, 32.0, 34.0, 72.0, 115.0, 142.0, 145.0, 101.0, 82.0, 66.0, 40.0, 21.0, 21.0, 12.0, 6.0, 12.0, 5.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022268295288085938, -0.00021306052803993225, -0.00020343810319900513, -0.000193815678358078, -0.00018419325351715088, -0.00017457082867622375, -0.00016494840383529663, -0.0001553259789943695, -0.00014570355415344238, -0.00013608112931251526, -0.00012645870447158813, -0.00011683627963066101, -0.00010721385478973389, -9.759142994880676e-05, -8.796900510787964e-05, -7.834658026695251e-05, -6.872415542602539e-05, -5.9101730585098267e-05, -4.947930574417114e-05, -3.985688090324402e-05, -3.0234456062316895e-05, -2.061203122138977e-05, -1.0989606380462646e-05, -1.3671815395355225e-06, 8.255243301391602e-06, 1.7877668142318726e-05, 2.750009298324585e-05, 3.7122517824172974e-05, 4.67449426651001e-05, 5.636736750602722e-05, 6.598979234695435e-05, 7.561221718788147e-05, 8.52346420288086e-05, 9.485706686973572e-05, 0.00010447949171066284, 0.00011410191655158997, 0.0001237243413925171, 0.00013334676623344421, 0.00014296919107437134, 0.00015259161591529846, 0.00016221404075622559, 0.0001718364655971527, 0.00018145889043807983, 0.00019108131527900696, 0.00020070374011993408, 0.0002103261649608612, 0.00021994858980178833, 0.00022957101464271545, 0.00023919343948364258, 0.0002488158643245697, 0.0002584382891654968, 0.00026806071400642395, 0.0002776831388473511, 0.0002873055636882782, 0.0002969279885292053, 0.00030655041337013245, 0.00031617283821105957, 0.0003257952630519867, 0.0003354176878929138, 0.00034504011273384094, 0.00035466253757476807, 0.0003642849624156952, 0.0003739073872566223, 0.00038352981209754944, 0.00039315223693847656]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 24.0, 90.0, 562.0, 202.0, 70.0, 35.0, 17.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5318701267242432, -0.5061094760894775, -0.4803488254547119, -0.4545882046222687, -0.42882755398750305, -0.4030669033527374, -0.3773062825202942, -0.35154563188552856, -0.32578498125076294, -0.3000243306159973, -0.2742636799812317, -0.24850305914878845, -0.22274240851402283, -0.1969817578792572, -0.17122112214565277, -0.14546048641204834, -0.11969983577728271, -0.09393919259309769, -0.06817854940891266, -0.04241790622472763, -0.016657263040542603, 0.009103387594223022, 0.034864023327827454, 0.060624659061431885, 0.08638530969619751, 0.11214595288038254, 0.13790659606456757, 0.163667231798172, 0.18942788243293762, 0.21518853306770325, 0.24094916880130768, 0.2667098045349121, 0.29247045516967773, 0.31823110580444336, 0.343991756439209, 0.3697523772716522, 0.39551302790641785, 0.42127367854118347, 0.4470342993736267, 0.47279495000839233, 0.49855560064315796, 0.5243162512779236, 0.5500769019126892, 0.5758375525474548, 0.6015981435775757, 0.6273587942123413, 0.6531194448471069, 0.6788800954818726, 0.7046407461166382, 0.7304013967514038, 0.7561620473861694, 0.7819226980209351, 0.8076833486557007, 0.8334439992904663, 0.8592045903205872, 0.8849652409553528, 0.9107258915901184, 0.936486542224884, 0.9622471928596497, 0.9880078434944153, 1.0137684345245361, 1.0395290851593018, 1.0652897357940674, 1.091050386428833, 1.1168110370635986]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 13.0, 21.0, 24.0, 33.0, 37.0, 51.0, 51.0, 62.0, 53.0, 74.0, 81.0, 66.0, 70.0, 70.0, 58.0, 48.0, 43.0, 38.0, 38.0, 17.0, 12.0, 16.0, 8.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1306578516960144, -0.12466008216142654, -0.11866230517625809, -0.11266453564167023, -0.10666675865650177, -0.10066898912191391, -0.09467121958732605, -0.08867344260215759, -0.08267567306756973, -0.07667790353298187, -0.07068012654781342, -0.06468235701322556, -0.0586845837533474, -0.05268681049346924, -0.04668904095888138, -0.04069126769900322, -0.03469349443912506, -0.028695721179246902, -0.022697949782013893, -0.016700178384780884, -0.010702405124902725, -0.004704631865024567, 0.0012931376695632935, 0.007290910929441452, 0.01328868418931961, 0.01928645744919777, 0.02528422884643078, 0.03128200024366379, 0.037279773503541946, 0.043277546763420105, 0.049275316298007965, 0.055273089557886124, 0.06127086281776428, 0.06726863235235214, 0.0732664093375206, 0.07926417887210846, 0.08526195585727692, 0.09125972539186478, 0.09725749492645264, 0.1032552719116211, 0.10925304144620895, 0.11525081098079681, 0.12124858796596527, 0.12724635004997253, 0.133244127035141, 0.13924190402030945, 0.1452396810054779, 0.15123744308948517, 0.15723522007465363, 0.16323299705982208, 0.16923075914382935, 0.1752285361289978, 0.18122631311416626, 0.18722409009933472, 0.19322185218334198, 0.19921962916851044, 0.2052173912525177, 0.21121516823768616, 0.21721293032169342, 0.22321070730686188, 0.22920848429203033, 0.2352062463760376, 0.24120402336120605, 0.2472018003463745, 0.25319957733154297]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 2.0, 4.0, 7.0, 3.0, 19.0, 17.0, 29.0, 55.0, 99.0, 270.0, 561.0, 1694.0, 5927.0, 46566.0, 4123963.0, 11067.0, 2600.0, 730.0, 300.0, 161.0, 72.0, 43.0, 23.0, 15.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.1563720703125, -0.15305709838867188, -0.14974212646484375, -0.14642715454101562, -0.1431121826171875, -0.13979721069335938, -0.13648223876953125, -0.13316726684570312, -0.129852294921875, -0.12653732299804688, -0.12322235107421875, -0.11990737915039062, -0.1165924072265625, -0.11327743530273438, -0.10996246337890625, -0.10664749145507812, -0.10333251953125, -0.10001754760742188, -0.09670257568359375, -0.09338760375976562, -0.0900726318359375, -0.08675765991210938, -0.08344268798828125, -0.08012771606445312, -0.076812744140625, -0.07349777221679688, -0.07018280029296875, -0.06686782836914062, -0.0635528564453125, -0.060237884521484375, -0.05692291259765625, -0.053607940673828125, -0.05029296875, -0.046977996826171875, -0.04366302490234375, -0.040348052978515625, -0.0370330810546875, -0.033718109130859375, -0.03040313720703125, -0.027088165283203125, -0.023773193359375, -0.020458221435546875, -0.01714324951171875, -0.013828277587890625, -0.0105133056640625, -0.007198333740234375, -0.00388336181640625, -0.000568389892578125, 0.00274658203125, 0.006061553955078125, 0.00937652587890625, 0.012691497802734375, 0.0160064697265625, 0.019321441650390625, 0.02263641357421875, 0.025951385498046875, 0.029266357421875, 0.032581329345703125, 0.03589630126953125, 0.039211273193359375, 0.0425262451171875, 0.045841217041015625, 0.04915618896484375, 0.052471160888671875, 0.0557861328125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 12.0, 26.0, 33.0, 78.0, 130.0, 177.0, 166.0, 155.0, 101.0, 59.0, 29.0, 20.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.018798828125, -0.01840066909790039, -0.01800251007080078, -0.017604351043701172, -0.017206192016601562, -0.016808032989501953, -0.016409873962402344, -0.016011714935302734, -0.015613555908203125, -0.015215396881103516, -0.014817237854003906, -0.014419078826904297, -0.014020919799804688, -0.013622760772705078, -0.013224601745605469, -0.01282644271850586, -0.01242828369140625, -0.01203012466430664, -0.011631965637207031, -0.011233806610107422, -0.010835647583007812, -0.010437488555908203, -0.010039329528808594, -0.009641170501708984, -0.009243011474609375, -0.008844852447509766, -0.008446693420410156, -0.008048534393310547, -0.0076503753662109375, -0.007252216339111328, -0.006854057312011719, -0.006455898284912109, -0.0060577392578125, -0.005659580230712891, -0.005261421203613281, -0.004863262176513672, -0.0044651031494140625, -0.004066944122314453, -0.0036687850952148438, -0.0032706260681152344, -0.002872467041015625, -0.0024743080139160156, -0.0020761489868164062, -0.0016779899597167969, -0.0012798309326171875, -0.0008816719055175781, -0.00048351287841796875, -8.535385131835938e-05, 0.00031280517578125, 0.0007109642028808594, 0.0011091232299804688, 0.0015072822570800781, 0.0019054412841796875, 0.002303600311279297, 0.0027017593383789062, 0.0030999183654785156, 0.003498077392578125, 0.0038962364196777344, 0.004294395446777344, 0.004692554473876953, 0.0050907135009765625, 0.005488872528076172, 0.005887031555175781, 0.006285190582275391, 0.006683349609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 10.0, 4.0, 11.0, 15.0, 18.0, 22.0, 41.0, 54.0, 73.0, 89.0, 171.0, 271.0, 552.0, 1215.0, 3280.0, 11191.0, 67549.0, 4071508.0, 27511.0, 6513.0, 2133.0, 887.0, 422.0, 240.0, 149.0, 86.0, 87.0, 63.0, 26.0, 22.0, 25.0, 11.0, 14.0, 7.0, 8.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0611572265625, -0.05873870849609375, -0.0563201904296875, -0.05390167236328125, -0.051483154296875, -0.04906463623046875, -0.0466461181640625, -0.04422760009765625, -0.04180908203125, -0.03939056396484375, -0.0369720458984375, -0.03455352783203125, -0.032135009765625, -0.02971649169921875, -0.0272979736328125, -0.02487945556640625, -0.0224609375, -0.02004241943359375, -0.0176239013671875, -0.01520538330078125, -0.012786865234375, -0.01036834716796875, -0.0079498291015625, -0.00553131103515625, -0.00311279296875, -0.00069427490234375, 0.0017242431640625, 0.00414276123046875, 0.006561279296875, 0.00897979736328125, 0.0113983154296875, 0.01381683349609375, 0.0162353515625, 0.01865386962890625, 0.0210723876953125, 0.02349090576171875, 0.025909423828125, 0.02832794189453125, 0.0307464599609375, 0.03316497802734375, 0.03558349609375, 0.03800201416015625, 0.0404205322265625, 0.04283905029296875, 0.045257568359375, 0.04767608642578125, 0.0500946044921875, 0.05251312255859375, 0.054931640625, 0.05735015869140625, 0.0597686767578125, 0.06218719482421875, 0.064605712890625, 0.06702423095703125, 0.0694427490234375, 0.07186126708984375, 0.07427978515625, 0.07669830322265625, 0.0791168212890625, 0.08153533935546875, 0.083953857421875, 0.08637237548828125, 0.0887908935546875, 0.09120941162109375, 0.0936279296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 5.0, 16.0, 12.0, 11.0, 20.0, 37.0, 292.0, 3465.0, 96.0, 26.0, 25.0, 15.0, 14.0, 9.0, 4.0, 6.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01042938232421875, -0.009822249412536621, -0.009215116500854492, -0.008607983589172363, -0.008000850677490234, -0.0073937177658081055, -0.0067865848541259766, -0.006179451942443848, -0.005572319030761719, -0.00496518611907959, -0.004358053207397461, -0.003750920295715332, -0.003143787384033203, -0.0025366544723510742, -0.0019295215606689453, -0.0013223886489868164, -0.0007152557373046875, -0.0001081228256225586, 0.0004990100860595703, 0.0011061429977416992, 0.0017132759094238281, 0.002320408821105957, 0.002927541732788086, 0.003534674644470215, 0.004141807556152344, 0.004748940467834473, 0.0053560733795166016, 0.0059632062911987305, 0.006570339202880859, 0.007177472114562988, 0.007784605026245117, 0.008391737937927246, 0.008998870849609375, 0.009606003761291504, 0.010213136672973633, 0.010820269584655762, 0.01142740249633789, 0.01203453540802002, 0.012641668319702148, 0.013248801231384277, 0.013855934143066406, 0.014463067054748535, 0.015070199966430664, 0.015677332878112793, 0.016284465789794922, 0.01689159870147705, 0.01749873161315918, 0.01810586452484131, 0.018712997436523438, 0.019320130348205566, 0.019927263259887695, 0.020534396171569824, 0.021141529083251953, 0.021748661994934082, 0.02235579490661621, 0.02296292781829834, 0.02357006072998047, 0.024177193641662598, 0.024784326553344727, 0.025391459465026855, 0.025998592376708984, 0.026605725288391113, 0.027212858200073242, 0.02781999111175537, 0.0284271240234375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 14.0, 54.0, 349.0, 499.0, 70.0, 15.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3638467788696289, -0.3534621596336365, -0.34307754039764404, -0.332692950963974, -0.32230833172798157, -0.31192371249198914, -0.3015391230583191, -0.29115450382232666, -0.28076988458633423, -0.2703852653503418, -0.26000064611434937, -0.24961605668067932, -0.2392314374446869, -0.22884681820869446, -0.21846221387386322, -0.20807760953903198, -0.19769299030303955, -0.18730837106704712, -0.17692376673221588, -0.16653916239738464, -0.1561545431613922, -0.14576992392539978, -0.13538531959056854, -0.1250007152557373, -0.11461609601974487, -0.10423148423433304, -0.0938468724489212, -0.08346226066350937, -0.07307764887809753, -0.0626930370926857, -0.052308425307273865, -0.04192381352186203, -0.03153923153877258, -0.02115461975336075, -0.010770007967948914, -0.00038539618253707886, 0.009999215602874756, 0.02038382738828659, 0.030768439173698425, 0.04115305095911026, 0.051537662744522095, 0.06192227452993393, 0.07230688631534576, 0.0826914981007576, 0.09307610988616943, 0.10346072167158127, 0.1138453334569931, 0.12422994524240494, 0.13461455702781677, 0.1449991762638092, 0.15538378059864044, 0.16576838493347168, 0.1761530041694641, 0.18653762340545654, 0.19692222774028778, 0.20730683207511902, 0.21769145131111145, 0.22807607054710388, 0.23846067488193512, 0.24884527921676636, 0.2592298984527588, 0.2696145176887512, 0.27999913692474365, 0.2903837263584137, 0.30076834559440613]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 11.0, 17.0, 35.0, 52.0, 57.0, 69.0, 89.0, 111.0, 93.0, 105.0, 86.0, 86.0, 67.0, 45.0, 23.0, 20.0, 17.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07523179054260254, -0.07285727560520172, -0.0704827532172203, -0.06810823827981949, -0.06573371589183807, -0.06335920095443726, -0.06098468601703644, -0.05861016735434532, -0.056235648691654205, -0.05386113002896309, -0.05148661136627197, -0.049112096428871155, -0.04673757776618004, -0.04436305910348892, -0.041988544166088104, -0.03961402550339699, -0.03723950684070587, -0.034864988178014755, -0.03249046951532364, -0.03011595457792282, -0.027741435915231705, -0.02536691725254059, -0.02299240045249462, -0.020617883652448654, -0.018243364989757538, -0.01586884632706642, -0.013494329527020454, -0.011119811795651913, -0.008745294064283371, -0.006370776332914829, -0.0039962586015462875, -0.0016217418015003204, 0.0007527768611907959, 0.0031272945925593376, 0.005501812323927879, 0.007876330055296421, 0.010250847786664963, 0.012625365518033504, 0.014999883249402046, 0.017374400049448013, 0.01974891871213913, 0.022123437374830246, 0.024497954174876213, 0.02687247097492218, 0.029246989637613297, 0.03162150830030441, 0.03399602323770523, 0.03637054190039635, 0.03874506056308746, 0.04111957922577858, 0.043494097888469696, 0.045868612825870514, 0.04824313148856163, 0.05061765015125275, 0.052992165088653564, 0.05536668375134468, 0.0577412024140358, 0.06011572107672691, 0.06249023973941803, 0.06486475467681885, 0.06723926961421967, 0.06961379200220108, 0.0719883069396019, 0.07436282932758331, 0.07673734426498413]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 7.0, 9.0, 9.0, 13.0, 19.0, 23.0, 25.0, 36.0, 45.0, 75.0, 101.0, 267.0, 914.0, 4492.0, 47941.0, 900360.0, 85828.0, 6500.0, 1144.0, 356.0, 136.0, 66.0, 41.0, 29.0, 34.0, 23.0, 17.0, 14.0, 14.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1392822265625, -0.1352558135986328, -0.13122940063476562, -0.12720298767089844, -0.12317657470703125, -0.11915016174316406, -0.11512374877929688, -0.11109733581542969, -0.1070709228515625, -0.10304450988769531, -0.09901809692382812, -0.09499168395996094, -0.09096527099609375, -0.08693885803222656, -0.08291244506835938, -0.07888603210449219, -0.074859619140625, -0.07083320617675781, -0.06680679321289062, -0.06278038024902344, -0.05875396728515625, -0.05472755432128906, -0.050701141357421875, -0.04667472839355469, -0.0426483154296875, -0.03862190246582031, -0.034595489501953125, -0.030569076538085938, -0.02654266357421875, -0.022516250610351562, -0.018489837646484375, -0.014463424682617188, -0.01043701171875, -0.0064105987548828125, -0.002384185791015625, 0.0016422271728515625, 0.00566864013671875, 0.009695053100585938, 0.013721466064453125, 0.017747879028320312, 0.0217742919921875, 0.025800704956054688, 0.029827117919921875, 0.03385353088378906, 0.03787994384765625, 0.04190635681152344, 0.045932769775390625, 0.04995918273925781, 0.053985595703125, 0.05801200866699219, 0.062038421630859375, 0.06606483459472656, 0.07009124755859375, 0.07411766052246094, 0.07814407348632812, 0.08217048645019531, 0.0861968994140625, 0.09022331237792969, 0.09424972534179688, 0.09827613830566406, 0.10230255126953125, 0.10632896423339844, 0.11035537719726562, 0.11438179016113281, 0.118408203125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 5.0, 16.0, 20.0, 33.0, 81.0, 110.0, 185.0, 171.0, 157.0, 93.0, 68.0, 30.0, 19.0, 10.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.018524169921875, -0.018132269382476807, -0.017740368843078613, -0.01734846830368042, -0.016956567764282227, -0.016564667224884033, -0.01617276668548584, -0.015780866146087646, -0.015388965606689453, -0.01499706506729126, -0.014605164527893066, -0.014213263988494873, -0.01382136344909668, -0.013429462909698486, -0.013037562370300293, -0.0126456618309021, -0.012253761291503906, -0.011861860752105713, -0.01146996021270752, -0.011078059673309326, -0.010686159133911133, -0.01029425859451294, -0.009902358055114746, -0.009510457515716553, -0.00911855697631836, -0.008726656436920166, -0.008334755897521973, -0.00794285535812378, -0.007550954818725586, -0.007159054279327393, -0.006767153739929199, -0.006375253200531006, -0.0059833526611328125, -0.005591452121734619, -0.005199551582336426, -0.004807651042938232, -0.004415750503540039, -0.004023849964141846, -0.0036319494247436523, -0.003240048885345459, -0.0028481483459472656, -0.0024562478065490723, -0.002064347267150879, -0.0016724467277526855, -0.0012805461883544922, -0.0008886456489562988, -0.0004967451095581055, -0.00010484457015991211, 0.00028705596923828125, 0.0006789565086364746, 0.001070857048034668, 0.0014627575874328613, 0.0018546581268310547, 0.002246558666229248, 0.0026384592056274414, 0.0030303597450256348, 0.003422260284423828, 0.0038141608238220215, 0.004206061363220215, 0.004597961902618408, 0.0049898624420166016, 0.005381762981414795, 0.005773663520812988, 0.006165564060211182, 0.006557464599609375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 15.0, 6.0, 25.0, 29.0, 44.0, 58.0, 96.0, 165.0, 235.0, 394.0, 628.0, 1059.0, 1857.0, 3219.0, 5924.0, 10923.0, 21362.0, 43779.0, 96783.0, 268809.0, 380221.0, 111627.0, 49878.0, 23954.0, 12303.0, 6486.0, 3593.0, 2013.0, 1190.0, 707.0, 426.0, 253.0, 172.0, 103.0, 73.0, 48.0, 24.0, 29.0, 13.0, 8.0, 5.0, 11.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0251617431640625, -0.02432537078857422, -0.023488998413085938, -0.022652626037597656, -0.021816253662109375, -0.020979881286621094, -0.020143508911132812, -0.01930713653564453, -0.01847076416015625, -0.01763439178466797, -0.016798019409179688, -0.015961647033691406, -0.015125274658203125, -0.014288902282714844, -0.013452529907226562, -0.012616157531738281, -0.01177978515625, -0.010943412780761719, -0.010107040405273438, -0.009270668029785156, -0.008434295654296875, -0.007597923278808594, -0.0067615509033203125, -0.005925178527832031, -0.00508880615234375, -0.004252433776855469, -0.0034160614013671875, -0.0025796890258789062, -0.001743316650390625, -0.0009069442749023438, -7.05718994140625e-05, 0.0007658004760742188, 0.0016021728515625, 0.0024385452270507812, 0.0032749176025390625, 0.004111289978027344, 0.004947662353515625, 0.005784034729003906, 0.0066204071044921875, 0.007456779479980469, 0.00829315185546875, 0.009129524230957031, 0.009965896606445312, 0.010802268981933594, 0.011638641357421875, 0.012475013732910156, 0.013311386108398438, 0.014147758483886719, 0.014984130859375, 0.01582050323486328, 0.016656875610351562, 0.017493247985839844, 0.018329620361328125, 0.019165992736816406, 0.020002365112304688, 0.02083873748779297, 0.02167510986328125, 0.02251148223876953, 0.023347854614257812, 0.024184226989746094, 0.025020599365234375, 0.025856971740722656, 0.026693344116210938, 0.02752971649169922, 0.0283660888671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 8.0, 7.0, 8.0, 13.0, 19.0, 18.0, 20.0, 22.0, 21.0, 34.0, 35.0, 31.0, 37.0, 42.0, 49.0, 45.0, 33.0, 40.0, 50.0, 49.0, 36.0, 36.0, 39.0, 46.0, 42.0, 35.0, 31.0, 25.0, 28.0, 13.0, 19.0, 13.0, 13.0, 9.0, 8.0, 8.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019073486328125, -0.018439531326293945, -0.01780557632446289, -0.017171621322631836, -0.01653766632080078, -0.015903711318969727, -0.015269756317138672, -0.014635801315307617, -0.014001846313476562, -0.013367891311645508, -0.012733936309814453, -0.012099981307983398, -0.011466026306152344, -0.010832071304321289, -0.010198116302490234, -0.00956416130065918, -0.008930206298828125, -0.00829625129699707, -0.007662296295166016, -0.007028341293334961, -0.006394386291503906, -0.0057604312896728516, -0.005126476287841797, -0.004492521286010742, -0.0038585662841796875, -0.003224611282348633, -0.002590656280517578, -0.0019567012786865234, -0.0013227462768554688, -0.0006887912750244141, -5.4836273193359375e-05, 0.0005791187286376953, 0.00121307373046875, 0.0018470287322998047, 0.0024809837341308594, 0.003114938735961914, 0.0037488937377929688, 0.0043828487396240234, 0.005016803741455078, 0.005650758743286133, 0.0062847137451171875, 0.006918668746948242, 0.007552623748779297, 0.008186578750610352, 0.008820533752441406, 0.009454488754272461, 0.010088443756103516, 0.01072239875793457, 0.011356353759765625, 0.01199030876159668, 0.012624263763427734, 0.013258218765258789, 0.013892173767089844, 0.014526128768920898, 0.015160083770751953, 0.015794038772583008, 0.016427993774414062, 0.017061948776245117, 0.017695903778076172, 0.018329858779907227, 0.01896381378173828, 0.019597768783569336, 0.02023172378540039, 0.020865678787231445, 0.0214996337890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 14.0, 20.0, 31.0, 50.0, 98.0, 137.0, 249.0, 448.0, 827.0, 1722.0, 3827.0, 10276.0, 38301.0, 501310.0, 436740.0, 37111.0, 9967.0, 3810.0, 1708.0, 859.0, 414.0, 249.0, 142.0, 78.0, 58.0, 27.0, 20.0, 12.0, 13.0, 6.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004763603210449219, -0.0004619210958480835, -0.0004474818706512451, -0.00043304264545440674, -0.00041860342025756836, -0.00040416419506073, -0.0003897249698638916, -0.0003752857446670532, -0.00036084651947021484, -0.00034640729427337646, -0.0003319680690765381, -0.0003175288438796997, -0.00030308961868286133, -0.00028865039348602295, -0.00027421116828918457, -0.0002597719430923462, -0.0002453327178955078, -0.00023089349269866943, -0.00021645426750183105, -0.00020201504230499268, -0.0001875758171081543, -0.00017313659191131592, -0.00015869736671447754, -0.00014425814151763916, -0.00012981891632080078, -0.0001153796911239624, -0.00010094046592712402, -8.650124073028564e-05, -7.206201553344727e-05, -5.762279033660889e-05, -4.318356513977051e-05, -2.874433994293213e-05, -1.430511474609375e-05, 1.341104507446289e-07, 1.4573335647583008e-05, 2.9012560844421387e-05, 4.3451786041259766e-05, 5.7891011238098145e-05, 7.233023643493652e-05, 8.67694616317749e-05, 0.00010120868682861328, 0.00011564791202545166, 0.00013008713722229004, 0.00014452636241912842, 0.0001589655876159668, 0.00017340481281280518, 0.00018784403800964355, 0.00020228326320648193, 0.0002167224884033203, 0.0002311617136001587, 0.00024560093879699707, 0.00026004016399383545, 0.00027447938919067383, 0.0002889186143875122, 0.0003033578395843506, 0.00031779706478118896, 0.00033223628997802734, 0.0003466755151748657, 0.0003611147403717041, 0.0003755539655685425, 0.00038999319076538086, 0.00040443241596221924, 0.0004188716411590576, 0.000433310866355896, 0.0004477500915527344]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 7.0, 5.0, 15.0, 12.0, 16.0, 16.0, 16.0, 32.0, 49.0, 116.0, 156.0, 191.0, 147.0, 75.0, 51.0, 35.0, 10.0, 16.0, 6.0, 6.0, 4.0, 6.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5822391510009766e-05, -3.4681521356105804e-05, -3.354065120220184e-05, -3.239978104829788e-05, -3.125891089439392e-05, -3.011804074048996e-05, -2.8977170586586e-05, -2.7836300432682037e-05, -2.6695430278778076e-05, -2.5554560124874115e-05, -2.4413689970970154e-05, -2.3272819817066193e-05, -2.213194966316223e-05, -2.099107950925827e-05, -1.985020935535431e-05, -1.8709339201450348e-05, -1.7568469047546387e-05, -1.6427598893642426e-05, -1.5286728739738464e-05, -1.4145858585834503e-05, -1.3004988431930542e-05, -1.186411827802658e-05, -1.072324812412262e-05, -9.582377970218658e-06, -8.441507816314697e-06, -7.300637662410736e-06, -6.159767508506775e-06, -5.018897354602814e-06, -3.8780272006988525e-06, -2.7371570467948914e-06, -1.5962868928909302e-06, -4.55416738986969e-07, 6.854534149169922e-07, 1.8263235688209534e-06, 2.9671937227249146e-06, 4.108063876628876e-06, 5.248934030532837e-06, 6.389804184436798e-06, 7.530674338340759e-06, 8.67154449224472e-06, 9.812414646148682e-06, 1.0953284800052643e-05, 1.2094154953956604e-05, 1.3235025107860565e-05, 1.4375895261764526e-05, 1.5516765415668488e-05, 1.665763556957245e-05, 1.779850572347641e-05, 1.893937587738037e-05, 2.0080246031284332e-05, 2.1221116185188293e-05, 2.2361986339092255e-05, 2.3502856492996216e-05, 2.4643726646900177e-05, 2.5784596800804138e-05, 2.69254669547081e-05, 2.806633710861206e-05, 2.9207207262516022e-05, 3.0348077416419983e-05, 3.1488947570323944e-05, 3.2629817724227905e-05, 3.3770687878131866e-05, 3.491155803203583e-05, 3.605242818593979e-05, 3.719329833984375e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 7.0, 12.0, 12.0, 16.0, 17.0, 38.0, 53.0, 74.0, 145.0, 281.0, 708.0, 1841.0, 5756.0, 21897.0, 142248.0, 791841.0, 64253.0, 13286.0, 3750.0, 1243.0, 500.0, 251.0, 121.0, 62.0, 33.0, 23.0, 25.0, 16.0, 13.0, 7.0, 6.0, 5.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0005502700805664062, -0.0005346909165382385, -0.0005191117525100708, -0.0005035325884819031, -0.00048795342445373535, -0.0004723742604255676, -0.0004567950963973999, -0.0004412159323692322, -0.00042563676834106445, -0.00041005760431289673, -0.000394478440284729, -0.0003788992762565613, -0.00036332011222839355, -0.00034774094820022583, -0.0003321617841720581, -0.0003165826201438904, -0.00030100345611572266, -0.00028542429208755493, -0.0002698451280593872, -0.0002542659640312195, -0.00023868680000305176, -0.00022310763597488403, -0.0002075284719467163, -0.00019194930791854858, -0.00017637014389038086, -0.00016079097986221313, -0.0001452118158340454, -0.00012963265180587769, -0.00011405348777770996, -9.847432374954224e-05, -8.289515972137451e-05, -6.731599569320679e-05, -5.173683166503906e-05, -3.615766763687134e-05, -2.0578503608703613e-05, -4.999339580535889e-06, 1.0579824447631836e-05, 2.615898847579956e-05, 4.1738152503967285e-05, 5.731731653213501e-05, 7.289648056030273e-05, 8.847564458847046e-05, 0.00010405480861663818, 0.00011963397264480591, 0.00013521313667297363, 0.00015079230070114136, 0.00016637146472930908, 0.0001819506287574768, 0.00019752979278564453, 0.00021310895681381226, 0.00022868812084197998, 0.0002442672848701477, 0.00025984644889831543, 0.00027542561292648315, 0.0002910047769546509, 0.0003065839409828186, 0.00032216310501098633, 0.00033774226903915405, 0.0003533214330673218, 0.0003689005970954895, 0.0003844797611236572, 0.00040005892515182495, 0.0004156380891799927, 0.0004312172532081604, 0.0004467964172363281]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 5.0, 22.0, 17.0, 23.0, 33.0, 51.0, 74.0, 92.0, 144.0, 174.0, 123.0, 77.0, 41.0, 35.0, 16.0, 18.0, 19.0, 14.0, 7.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00041866302490234375, -0.0004091579467058182, -0.0003996528685092926, -0.00039014779031276703, -0.00038064271211624146, -0.0003711376339197159, -0.0003616325557231903, -0.00035212747752666473, -0.00034262239933013916, -0.0003331173211336136, -0.000323612242937088, -0.00031410716474056244, -0.00030460208654403687, -0.0002950970083475113, -0.0002855919301509857, -0.00027608685195446014, -0.00026658177375793457, -0.000257076695561409, -0.0002475716173648834, -0.00023806653916835785, -0.00022856146097183228, -0.0002190563827753067, -0.00020955130457878113, -0.00020004622638225555, -0.00019054114818572998, -0.0001810360699892044, -0.00017153099179267883, -0.00016202591359615326, -0.00015252083539962769, -0.0001430157572031021, -0.00013351067900657654, -0.00012400560081005096, -0.00011450052261352539, -0.00010499544441699982, -9.549036622047424e-05, -8.598528802394867e-05, -7.64802098274231e-05, -6.697513163089752e-05, -5.747005343437195e-05, -4.7964975237846375e-05, -3.84598970413208e-05, -2.8954818844795227e-05, -1.9449740648269653e-05, -9.94466245174408e-06, -4.3958425521850586e-07, 9.065493941307068e-06, 1.857057213783264e-05, 2.8075650334358215e-05, 3.758072853088379e-05, 4.708580672740936e-05, 5.6590884923934937e-05, 6.609596312046051e-05, 7.560104131698608e-05, 8.510611951351166e-05, 9.461119771003723e-05, 0.0001041162759065628, 0.00011362135410308838, 0.00012312643229961395, 0.00013263151049613953, 0.0001421365886926651, 0.00015164166688919067, 0.00016114674508571625, 0.00017065182328224182, 0.0001801569014787674, 0.00018966197967529297]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 5.0, 10.0, 11.0, 22.0, 62.0, 142.0, 379.0, 147.0, 80.0, 50.0, 33.0, 19.0, 15.0, 11.0, 10.0, 6.0, 2.0, 1.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10913528501987457, -0.09747326374053955, -0.08581123501062393, -0.07414921373128891, -0.06248718872666359, -0.05082516372203827, -0.03916314244270325, -0.027501113712787628, -0.015839092433452606, -0.00417706836014986, 0.0074849557131528854, 0.019146978855133057, 0.030809003859758377, 0.0424710288643837, 0.05413305014371872, 0.06579507887363434, 0.07745710015296936, 0.08911912143230438, 0.10078115016222, 0.11244317144155502, 0.12410520017147064, 0.13576722145080566, 0.14742924273014069, 0.1590912640094757, 0.17075330018997192, 0.18241532146930695, 0.19407734274864197, 0.20573937892913818, 0.2174014002084732, 0.22906342148780823, 0.24072544276714325, 0.25238746404647827, 0.2640495002269745, 0.2757115364074707, 0.28737354278564453, 0.29903557896614075, 0.3106975853443146, 0.3223596215248108, 0.3340216279029846, 0.34568366408348083, 0.35734570026397705, 0.36900773644447327, 0.3806697428226471, 0.3923317790031433, 0.40399378538131714, 0.41565582156181335, 0.42731785774230957, 0.4389798641204834, 0.4506418704986572, 0.46230390667915344, 0.47396591305732727, 0.4856279492378235, 0.4972899556159973, 0.5089520215988159, 0.5206140279769897, 0.5322760343551636, 0.5439381003379822, 0.555600106716156, 0.5672621726989746, 0.5789241790771484, 0.5905861854553223, 0.6022481918334961, 0.6139102578163147, 0.6255722641944885, 0.6372342705726624]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 7.0, 11.0, 19.0, 16.0, 16.0, 23.0, 18.0, 38.0, 37.0, 40.0, 53.0, 43.0, 62.0, 61.0, 67.0, 63.0, 57.0, 44.0, 65.0, 56.0, 32.0, 32.0, 32.0, 26.0, 17.0, 21.0, 9.0, 10.0, 6.0, 9.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11584603786468506, -0.11133427172899246, -0.10682250559329987, -0.10231074690818787, -0.09779898077249527, -0.09328721463680267, -0.08877545595169067, -0.08426368981599808, -0.07975192368030548, -0.07524015754461288, -0.07072839140892029, -0.06621663272380829, -0.06170486658811569, -0.057193100452423096, -0.0526813380420208, -0.0481695756316185, -0.0436578094959259, -0.03914604336023331, -0.03463428094983101, -0.03012251667678356, -0.025610752403736115, -0.021098988130688667, -0.01658722385764122, -0.012075461447238922, -0.007563695311546326, -0.0030519310384988785, 0.0014598332345485687, 0.005971597507596016, 0.010483361780643463, 0.01499512605369091, 0.019506890326738358, 0.024018652737140656, 0.028530418872833252, 0.03304218500852585, 0.037553947418928146, 0.042065709829330444, 0.04657747596502304, 0.05108924210071564, 0.055601004511117935, 0.06011276692152023, 0.06462453305721283, 0.06913629919290543, 0.07364806532859802, 0.07815982401371002, 0.08267159014940262, 0.08718335628509521, 0.09169511497020721, 0.09620688110589981, 0.10071864724159241, 0.105230413377285, 0.1097421795129776, 0.1142539381980896, 0.1187657043337822, 0.12327747046947479, 0.1277892291545868, 0.13230100274085999, 0.13681276142597198, 0.14132452011108398, 0.14583629369735718, 0.15034805238246918, 0.15485981106758118, 0.15937158465385437, 0.16388334333896637, 0.16839510202407837, 0.17290687561035156]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 7.0, 9.0, 11.0, 11.0, 18.0, 21.0, 39.0, 70.0, 166.0, 535.0, 2294.0, 20844.0, 4158936.0, 9361.0, 1301.0, 400.0, 133.0, 55.0, 33.0, 17.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.20068359375, -0.19644451141357422, -0.19220542907714844, -0.18796634674072266, -0.18372726440429688, -0.1794881820678711, -0.1752490997314453, -0.17101001739501953, -0.16677093505859375, -0.16253185272216797, -0.1582927703857422, -0.1540536880493164, -0.14981460571289062, -0.14557552337646484, -0.14133644104003906, -0.13709735870361328, -0.1328582763671875, -0.12861919403076172, -0.12438011169433594, -0.12014102935791016, -0.11590194702148438, -0.1116628646850586, -0.10742378234863281, -0.10318470001220703, -0.09894561767578125, -0.09470653533935547, -0.09046745300292969, -0.0862283706665039, -0.08198928833007812, -0.07775020599365234, -0.07351112365722656, -0.06927204132080078, -0.065032958984375, -0.06079387664794922, -0.05655479431152344, -0.052315711975097656, -0.048076629638671875, -0.043837547302246094, -0.03959846496582031, -0.03535938262939453, -0.03112030029296875, -0.02688121795654297, -0.022642135620117188, -0.018403053283691406, -0.014163970947265625, -0.009924888610839844, -0.0056858062744140625, -0.0014467239379882812, 0.0027923583984375, 0.007031440734863281, 0.011270523071289062, 0.015509605407714844, 0.019748687744140625, 0.023987770080566406, 0.028226852416992188, 0.03246593475341797, 0.03670501708984375, 0.04094409942626953, 0.04518318176269531, 0.049422264099121094, 0.053661346435546875, 0.057900428771972656, 0.06213951110839844, 0.06637859344482422, 0.07061767578125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 5.0, 16.0, 18.0, 41.0, 77.0, 108.0, 162.0, 184.0, 152.0, 94.0, 71.0, 36.0, 19.0, 12.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0176849365234375, -0.017311394214630127, -0.016937851905822754, -0.01656430959701538, -0.016190767288208008, -0.015817224979400635, -0.015443682670593262, -0.015070140361785889, -0.014696598052978516, -0.014323055744171143, -0.01394951343536377, -0.013575971126556396, -0.013202428817749023, -0.01282888650894165, -0.012455344200134277, -0.012081801891326904, -0.011708259582519531, -0.011334717273712158, -0.010961174964904785, -0.010587632656097412, -0.010214090347290039, -0.009840548038482666, -0.009467005729675293, -0.00909346342086792, -0.008719921112060547, -0.008346378803253174, -0.0079728364944458, -0.007599294185638428, -0.007225751876831055, -0.006852209568023682, -0.006478667259216309, -0.0061051249504089355, -0.0057315826416015625, -0.0053580403327941895, -0.004984498023986816, -0.004610955715179443, -0.00423741340637207, -0.0038638710975646973, -0.0034903287887573242, -0.003116786479949951, -0.002743244171142578, -0.002369701862335205, -0.001996159553527832, -0.001622617244720459, -0.001249074935913086, -0.0008755326271057129, -0.0005019903182983398, -0.0001284480094909668, 0.00024509429931640625, 0.0006186366081237793, 0.0009921789169311523, 0.0013657212257385254, 0.0017392635345458984, 0.0021128058433532715, 0.0024863481521606445, 0.0028598904609680176, 0.0032334327697753906, 0.0036069750785827637, 0.003980517387390137, 0.00435405969619751, 0.004727602005004883, 0.005101144313812256, 0.005474686622619629, 0.005848228931427002, 0.006221771240234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 6.0, 3.0, 3.0, 4.0, 8.0, 15.0, 16.0, 15.0, 20.0, 25.0, 30.0, 64.0, 84.0, 143.0, 163.0, 225.0, 354.0, 566.0, 865.0, 1270.0, 2008.0, 3471.0, 5856.0, 11110.0, 23079.0, 97705.0, 3953120.0, 53347.0, 18316.0, 9122.0, 4975.0, 2947.0, 1820.0, 1198.0, 758.0, 468.0, 307.0, 242.0, 164.0, 108.0, 76.0, 65.0, 33.0, 28.0, 30.0, 20.0, 12.0, 11.0, 5.0, 7.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0253143310546875, -0.024389028549194336, -0.023463726043701172, -0.022538423538208008, -0.021613121032714844, -0.02068781852722168, -0.019762516021728516, -0.01883721351623535, -0.017911911010742188, -0.016986608505249023, -0.01606130599975586, -0.015136003494262695, -0.014210700988769531, -0.013285398483276367, -0.012360095977783203, -0.011434793472290039, -0.010509490966796875, -0.009584188461303711, -0.008658885955810547, -0.007733583450317383, -0.006808280944824219, -0.005882978439331055, -0.004957675933837891, -0.0040323734283447266, -0.0031070709228515625, -0.0021817684173583984, -0.0012564659118652344, -0.0003311634063720703, 0.0005941390991210938, 0.0015194416046142578, 0.002444744110107422, 0.003370046615600586, 0.00429534912109375, 0.005220651626586914, 0.006145954132080078, 0.007071256637573242, 0.007996559143066406, 0.00892186164855957, 0.009847164154052734, 0.010772466659545898, 0.011697769165039062, 0.012623071670532227, 0.01354837417602539, 0.014473676681518555, 0.015398979187011719, 0.016324281692504883, 0.017249584197998047, 0.01817488670349121, 0.019100189208984375, 0.02002549171447754, 0.020950794219970703, 0.021876096725463867, 0.02280139923095703, 0.023726701736450195, 0.02465200424194336, 0.025577306747436523, 0.026502609252929688, 0.02742791175842285, 0.028353214263916016, 0.02927851676940918, 0.030203819274902344, 0.031129121780395508, 0.03205442428588867, 0.032979726791381836, 0.033905029296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 8.0, 9.0, 9.0, 6.0, 5.0, 16.0, 15.0, 20.0, 34.0, 117.0, 3214.0, 389.0, 98.0, 20.0, 20.0, 19.0, 14.0, 7.0, 9.0, 6.0, 1.0, 3.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01140594482421875, -0.010980725288391113, -0.010555505752563477, -0.01013028621673584, -0.009705066680908203, -0.009279847145080566, -0.00885462760925293, -0.008429408073425293, -0.008004188537597656, -0.0075789690017700195, -0.007153749465942383, -0.006728529930114746, -0.006303310394287109, -0.005878090858459473, -0.005452871322631836, -0.005027651786804199, -0.0046024322509765625, -0.004177212715148926, -0.003751993179321289, -0.0033267736434936523, -0.0029015541076660156, -0.002476334571838379, -0.002051115036010742, -0.0016258955001831055, -0.0012006759643554688, -0.000775456428527832, -0.0003502368927001953, 7.49826431274414e-05, 0.0005002021789550781, 0.0009254217147827148, 0.0013506412506103516, 0.0017758607864379883, 0.002201080322265625, 0.0026262998580932617, 0.0030515193939208984, 0.003476738929748535, 0.003901958465576172, 0.004327178001403809, 0.004752397537231445, 0.005177617073059082, 0.005602836608886719, 0.0060280561447143555, 0.006453275680541992, 0.006878495216369629, 0.007303714752197266, 0.007728934288024902, 0.008154153823852539, 0.008579373359680176, 0.009004592895507812, 0.00942981243133545, 0.009855031967163086, 0.010280251502990723, 0.01070547103881836, 0.011130690574645996, 0.011555910110473633, 0.01198112964630127, 0.012406349182128906, 0.012831568717956543, 0.01325678825378418, 0.013682007789611816, 0.014107227325439453, 0.01453244686126709, 0.014957666397094727, 0.015382885932922363, 0.01580810546875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 13.0, 27.0, 37.0, 86.0, 230.0, 357.0, 124.0, 64.0, 29.0, 13.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07526051253080368, -0.07132313400506973, -0.06738575547933578, -0.06344837695360184, -0.05951100215315819, -0.05557362362742424, -0.05163624882698059, -0.04769887030124664, -0.043761491775512695, -0.03982411324977875, -0.0358867347240448, -0.03194935992360115, -0.028011981397867203, -0.024074602872133255, -0.020137226209044456, -0.016199849545955658, -0.01226247102022171, -0.008325093425810337, -0.004387715831398964, -0.0004503382369875908, 0.0034870393574237823, 0.00742441788315773, 0.011361794546246529, 0.015299171209335327, 0.019236549735069275, 0.023173928260803223, 0.02711130492389202, 0.03104868158698082, 0.03498606011271477, 0.038923438638448715, 0.042860813438892365, 0.04679819196462631, 0.05073556303977966, 0.05467294156551361, 0.05861032009124756, 0.0625476986169815, 0.06648507714271545, 0.0704224556684494, 0.07435982674360275, 0.0782972052693367, 0.08223458379507065, 0.0861719623208046, 0.09010934084653854, 0.09404671937227249, 0.09798409044742584, 0.10192146897315979, 0.10585884749889374, 0.10979622602462769, 0.11373360455036163, 0.11767098307609558, 0.12160836160182953, 0.12554574012756348, 0.12948311865329742, 0.13342049717903137, 0.13735787570476532, 0.14129525423049927, 0.14523261785507202, 0.14916999638080597, 0.15310737490653992, 0.15704475343227386, 0.1609821319580078, 0.16491951048374176, 0.1688568890094757, 0.17279425263404846, 0.1767316460609436]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 13.0, 8.0, 18.0, 16.0, 19.0, 27.0, 43.0, 52.0, 40.0, 57.0, 66.0, 65.0, 54.0, 73.0, 72.0, 54.0, 59.0, 49.0, 41.0, 40.0, 49.0, 16.0, 27.0, 13.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04995453357696533, -0.04853484407067299, -0.047115154564380646, -0.0456954650580883, -0.04427577555179596, -0.042856086045503616, -0.04143639653921127, -0.04001670703291893, -0.03859701752662659, -0.037177328020334244, -0.0357576385140419, -0.03433794900774956, -0.032918259501457214, -0.03149856999516487, -0.030078880488872528, -0.028659190982580185, -0.027239501476287842, -0.0258198119699955, -0.024400122463703156, -0.022980432957410812, -0.02156074345111847, -0.020141053944826126, -0.018721364438533783, -0.01730167493224144, -0.015881985425949097, -0.014462295919656754, -0.01304260641336441, -0.011622916907072067, -0.010203227400779724, -0.008783537894487381, -0.007363848388195038, -0.005944158881902695, -0.0045244693756103516, -0.0031047798693180084, -0.0016850903630256653, -0.00026540085673332214, 0.001154288649559021, 0.002573978155851364, 0.003993667662143707, 0.00541335716843605, 0.0068330466747283936, 0.008252736181020737, 0.00967242568731308, 0.011092115193605423, 0.012511804699897766, 0.01393149420619011, 0.015351183712482452, 0.016770873218774796, 0.01819056272506714, 0.019610252231359482, 0.021029941737651825, 0.022449631243944168, 0.02386932075023651, 0.025289010256528854, 0.026708699762821198, 0.02812838926911354, 0.029548078775405884, 0.030967768281698227, 0.03238745778799057, 0.03380714729428291, 0.035226836800575256, 0.0366465263068676, 0.03806621581315994, 0.039485905319452286, 0.04090559482574463]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 10.0, 3.0, 11.0, 9.0, 9.0, 14.0, 19.0, 19.0, 26.0, 29.0, 33.0, 55.0, 76.0, 164.0, 368.0, 1095.0, 3883.0, 21029.0, 249599.0, 722679.0, 40600.0, 6211.0, 1487.0, 524.0, 211.0, 113.0, 68.0, 41.0, 29.0, 25.0, 28.0, 11.0, 10.0, 16.0, 10.0, 9.0, 8.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0819091796875, -0.0793619155883789, -0.07681465148925781, -0.07426738739013672, -0.07172012329101562, -0.06917285919189453, -0.06662559509277344, -0.06407833099365234, -0.06153106689453125, -0.058983802795410156, -0.05643653869628906, -0.05388927459716797, -0.051342010498046875, -0.04879474639892578, -0.04624748229980469, -0.043700218200683594, -0.0411529541015625, -0.038605690002441406, -0.03605842590332031, -0.03351116180419922, -0.030963897705078125, -0.02841663360595703, -0.025869369506835938, -0.023322105407714844, -0.02077484130859375, -0.018227577209472656, -0.015680313110351562, -0.013133049011230469, -0.010585784912109375, -0.008038520812988281, -0.0054912567138671875, -0.0029439926147460938, -0.000396728515625, 0.0021505355834960938, 0.0046977996826171875, 0.007245063781738281, 0.009792327880859375, 0.012339591979980469, 0.014886856079101562, 0.017434120178222656, 0.01998138427734375, 0.022528648376464844, 0.025075912475585938, 0.02762317657470703, 0.030170440673828125, 0.03271770477294922, 0.03526496887207031, 0.037812232971191406, 0.0403594970703125, 0.042906761169433594, 0.04545402526855469, 0.04800128936767578, 0.050548553466796875, 0.05309581756591797, 0.05564308166503906, 0.058190345764160156, 0.06073760986328125, 0.06328487396240234, 0.06583213806152344, 0.06837940216064453, 0.07092666625976562, 0.07347393035888672, 0.07602119445800781, 0.0785684585571289, 0.08111572265625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 14.0, 19.0, 47.0, 73.0, 110.0, 171.0, 172.0, 155.0, 92.0, 69.0, 38.0, 14.0, 13.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0174407958984375, -0.017072081565856934, -0.016703367233276367, -0.0163346529006958, -0.015965938568115234, -0.015597224235534668, -0.015228509902954102, -0.014859795570373535, -0.014491081237792969, -0.014122366905212402, -0.013753652572631836, -0.01338493824005127, -0.013016223907470703, -0.012647509574890137, -0.01227879524230957, -0.011910080909729004, -0.011541366577148438, -0.011172652244567871, -0.010803937911987305, -0.010435223579406738, -0.010066509246826172, -0.009697794914245605, -0.009329080581665039, -0.008960366249084473, -0.008591651916503906, -0.00822293758392334, -0.007854223251342773, -0.007485508918762207, -0.007116794586181641, -0.006748080253601074, -0.006379365921020508, -0.006010651588439941, -0.005641937255859375, -0.005273222923278809, -0.004904508590698242, -0.004535794258117676, -0.004167079925537109, -0.003798365592956543, -0.0034296512603759766, -0.00306093692779541, -0.0026922225952148438, -0.0023235082626342773, -0.001954793930053711, -0.0015860795974731445, -0.0012173652648925781, -0.0008486509323120117, -0.0004799365997314453, -0.0001112222671508789, 0.0002574920654296875, 0.0006262063980102539, 0.0009949207305908203, 0.0013636350631713867, 0.0017323493957519531, 0.0021010637283325195, 0.002469778060913086, 0.0028384923934936523, 0.0032072067260742188, 0.003575921058654785, 0.0039446353912353516, 0.004313349723815918, 0.004682064056396484, 0.005050778388977051, 0.005419492721557617, 0.005788207054138184, 0.00615692138671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 8.0, 13.0, 18.0, 26.0, 34.0, 46.0, 83.0, 109.0, 157.0, 188.0, 282.0, 441.0, 663.0, 961.0, 1420.0, 2181.0, 3327.0, 5211.0, 8522.0, 13461.0, 22885.0, 39665.0, 72626.0, 154317.0, 400625.0, 151348.0, 71551.0, 38893.0, 22635.0, 13435.0, 8359.0, 5174.0, 3301.0, 2162.0, 1417.0, 934.0, 625.0, 446.0, 316.0, 206.0, 128.0, 118.0, 68.0, 35.0, 46.0, 27.0, 15.0, 13.0, 9.0, 8.0, 6.0, 1.0, 4.0, 2.0, 0.0, 3.0], "bins": [-0.018798828125, -0.018220186233520508, -0.017641544342041016, -0.017062902450561523, -0.01648426055908203, -0.01590561866760254, -0.015326976776123047, -0.014748334884643555, -0.014169692993164062, -0.01359105110168457, -0.013012409210205078, -0.012433767318725586, -0.011855125427246094, -0.011276483535766602, -0.01069784164428711, -0.010119199752807617, -0.009540557861328125, -0.008961915969848633, -0.00838327407836914, -0.0078046321868896484, -0.007225990295410156, -0.006647348403930664, -0.006068706512451172, -0.00549006462097168, -0.0049114227294921875, -0.004332780838012695, -0.003754138946533203, -0.003175497055053711, -0.0025968551635742188, -0.0020182132720947266, -0.0014395713806152344, -0.0008609294891357422, -0.00028228759765625, 0.0002963542938232422, 0.0008749961853027344, 0.0014536380767822266, 0.0020322799682617188, 0.002610921859741211, 0.003189563751220703, 0.0037682056427001953, 0.0043468475341796875, 0.00492548942565918, 0.005504131317138672, 0.006082773208618164, 0.006661415100097656, 0.0072400569915771484, 0.00781869888305664, 0.008397340774536133, 0.008975982666015625, 0.009554624557495117, 0.01013326644897461, 0.010711908340454102, 0.011290550231933594, 0.011869192123413086, 0.012447834014892578, 0.01302647590637207, 0.013605117797851562, 0.014183759689331055, 0.014762401580810547, 0.015341043472290039, 0.01591968536376953, 0.016498327255249023, 0.017076969146728516, 0.017655611038208008, 0.0182342529296875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 1.0, 11.0, 8.0, 11.0, 11.0, 12.0, 12.0, 14.0, 19.0, 18.0, 17.0, 29.0, 36.0, 32.0, 37.0, 31.0, 35.0, 36.0, 44.0, 37.0, 45.0, 47.0, 41.0, 45.0, 34.0, 39.0, 23.0, 31.0, 23.0, 28.0, 27.0, 20.0, 24.0, 23.0, 14.0, 9.0, 11.0, 10.0, 13.0, 9.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 4.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.0178070068359375, -0.017276525497436523, -0.016746044158935547, -0.01621556282043457, -0.015685081481933594, -0.015154600143432617, -0.01462411880493164, -0.014093637466430664, -0.013563156127929688, -0.013032674789428711, -0.012502193450927734, -0.011971712112426758, -0.011441230773925781, -0.010910749435424805, -0.010380268096923828, -0.009849786758422852, -0.009319305419921875, -0.008788824081420898, -0.008258342742919922, -0.007727861404418945, -0.007197380065917969, -0.006666898727416992, -0.006136417388916016, -0.005605936050415039, -0.0050754547119140625, -0.004544973373413086, -0.004014492034912109, -0.003484010696411133, -0.0029535293579101562, -0.0024230480194091797, -0.0018925666809082031, -0.0013620853424072266, -0.00083160400390625, -0.00030112266540527344, 0.00022935867309570312, 0.0007598400115966797, 0.0012903213500976562, 0.0018208026885986328, 0.0023512840270996094, 0.002881765365600586, 0.0034122467041015625, 0.003942728042602539, 0.004473209381103516, 0.005003690719604492, 0.005534172058105469, 0.006064653396606445, 0.006595134735107422, 0.0071256160736083984, 0.007656097412109375, 0.008186578750610352, 0.008717060089111328, 0.009247541427612305, 0.009778022766113281, 0.010308504104614258, 0.010838985443115234, 0.011369466781616211, 0.011899948120117188, 0.012430429458618164, 0.01296091079711914, 0.013491392135620117, 0.014021873474121094, 0.01455235481262207, 0.015082836151123047, 0.015613317489624023, 0.016143798828125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 8.0, 11.0, 18.0, 37.0, 64.0, 114.0, 201.0, 363.0, 685.0, 1436.0, 3017.0, 7874.0, 31131.0, 625046.0, 340634.0, 25354.0, 7061.0, 2795.0, 1282.0, 648.0, 332.0, 190.0, 95.0, 59.0, 30.0, 22.0, 14.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042319297790527344, -0.00040905922651290894, -0.00039492547512054443, -0.00038079172372817993, -0.00036665797233581543, -0.00035252422094345093, -0.0003383904695510864, -0.0003242567181587219, -0.0003101229667663574, -0.0002959892153739929, -0.0002818554639816284, -0.0002677217125892639, -0.0002535879611968994, -0.0002394542098045349, -0.0002253204584121704, -0.0002111867070198059, -0.0001970529556274414, -0.0001829192042350769, -0.0001687854528427124, -0.0001546517014503479, -0.0001405179500579834, -0.0001263841986656189, -0.0001122504472732544, -9.811669588088989e-05, -8.398294448852539e-05, -6.984919309616089e-05, -5.571544170379639e-05, -4.1581690311431885e-05, -2.7447938919067383e-05, -1.3314187526702881e-05, 8.195638656616211e-07, 1.4953315258026123e-05, 2.9087066650390625e-05, 4.322081804275513e-05, 5.735456943511963e-05, 7.148832082748413e-05, 8.562207221984863e-05, 9.975582361221313e-05, 0.00011388957500457764, 0.00012802332639694214, 0.00014215707778930664, 0.00015629082918167114, 0.00017042458057403564, 0.00018455833196640015, 0.00019869208335876465, 0.00021282583475112915, 0.00022695958614349365, 0.00024109333753585815, 0.00025522708892822266, 0.00026936084032058716, 0.00028349459171295166, 0.00029762834310531616, 0.00031176209449768066, 0.00032589584589004517, 0.00034002959728240967, 0.00035416334867477417, 0.00036829710006713867, 0.0003824308514595032, 0.0003965646028518677, 0.0004106983542442322, 0.0004248321056365967, 0.0004389658570289612, 0.0004530996084213257, 0.0004672333598136902, 0.0004813671112060547]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 5.0, 2.0, 6.0, 6.0, 8.0, 14.0, 20.0, 34.0, 43.0, 59.0, 128.0, 184.0, 180.0, 114.0, 52.0, 25.0, 28.0, 26.0, 19.0, 9.0, 2.0, 4.0, 4.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.792213439941406e-05, -4.6319328248500824e-05, -4.4716522097587585e-05, -4.311371594667435e-05, -4.151090979576111e-05, -3.990810364484787e-05, -3.830529749393463e-05, -3.670249134302139e-05, -3.5099685192108154e-05, -3.3496879041194916e-05, -3.189407289028168e-05, -3.029126673936844e-05, -2.86884605884552e-05, -2.708565443754196e-05, -2.5482848286628723e-05, -2.3880042135715485e-05, -2.2277235984802246e-05, -2.0674429833889008e-05, -1.907162368297577e-05, -1.746881753206253e-05, -1.5866011381149292e-05, -1.4263205230236053e-05, -1.2660399079322815e-05, -1.1057592928409576e-05, -9.454786777496338e-06, -7.8519806265831e-06, -6.249174475669861e-06, -4.646368324756622e-06, -3.043562173843384e-06, -1.4407560229301453e-06, 1.6205012798309326e-07, 1.7648562788963318e-06, 3.3676624298095703e-06, 4.970468580722809e-06, 6.573274731636047e-06, 8.176080882549286e-06, 9.778887033462524e-06, 1.1381693184375763e-05, 1.2984499335289001e-05, 1.458730548620224e-05, 1.619011163711548e-05, 1.7792917788028717e-05, 1.9395723938941956e-05, 2.0998530089855194e-05, 2.2601336240768433e-05, 2.420414239168167e-05, 2.580694854259491e-05, 2.7409754693508148e-05, 2.9012560844421387e-05, 3.0615366995334625e-05, 3.2218173146247864e-05, 3.38209792971611e-05, 3.542378544807434e-05, 3.702659159898758e-05, 3.862939774990082e-05, 4.0232203900814056e-05, 4.1835010051727295e-05, 4.3437816202640533e-05, 4.504062235355377e-05, 4.664342850446701e-05, 4.824623465538025e-05, 4.984904080629349e-05, 5.1451846957206726e-05, 5.3054653108119965e-05, 5.46574592590332e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 5.0, 11.0, 9.0, 20.0, 21.0, 33.0, 39.0, 52.0, 72.0, 105.0, 162.0, 201.0, 329.0, 472.0, 707.0, 1231.0, 2001.0, 3647.0, 7495.0, 18097.0, 59091.0, 439480.0, 423268.0, 57682.0, 17847.0, 7423.0, 3642.0, 1993.0, 1166.0, 721.0, 452.0, 320.0, 219.0, 157.0, 97.0, 80.0, 55.0, 38.0, 33.0, 19.0, 17.0, 10.0, 11.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00023794174194335938, -0.00023050419986248016, -0.00022306665778160095, -0.00021562911570072174, -0.00020819157361984253, -0.00020075403153896332, -0.0001933164894580841, -0.0001858789473772049, -0.00017844140529632568, -0.00017100386321544647, -0.00016356632113456726, -0.00015612877905368805, -0.00014869123697280884, -0.00014125369489192963, -0.00013381615281105042, -0.0001263786107301712, -0.00011894106864929199, -0.00011150352656841278, -0.00010406598448753357, -9.662844240665436e-05, -8.919090032577515e-05, -8.175335824489594e-05, -7.431581616401672e-05, -6.687827408313751e-05, -5.94407320022583e-05, -5.200318992137909e-05, -4.456564784049988e-05, -3.7128105759620667e-05, -2.9690563678741455e-05, -2.2253021597862244e-05, -1.4815479516983032e-05, -7.377937436103821e-06, 5.960464477539063e-08, 7.497146725654602e-06, 1.4934688806533813e-05, 2.2372230887413025e-05, 2.9809772968292236e-05, 3.724731504917145e-05, 4.468485713005066e-05, 5.212239921092987e-05, 5.955994129180908e-05, 6.69974833726883e-05, 7.44350254535675e-05, 8.187256753444672e-05, 8.931010961532593e-05, 9.674765169620514e-05, 0.00010418519377708435, 0.00011162273585796356, 0.00011906027793884277, 0.00012649782001972198, 0.0001339353621006012, 0.0001413729041814804, 0.00014881044626235962, 0.00015624798834323883, 0.00016368553042411804, 0.00017112307250499725, 0.00017856061458587646, 0.00018599815666675568, 0.0001934356987476349, 0.0002008732408285141, 0.0002083107829093933, 0.00021574832499027252, 0.00022318586707115173, 0.00023062340915203094, 0.00023806095123291016]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 4.0, 7.0, 4.0, 10.0, 6.0, 12.0, 17.0, 21.0, 45.0, 50.0, 65.0, 109.0, 140.0, 127.0, 107.0, 87.0, 71.0, 39.0, 29.0, 10.0, 5.0, 11.0, 10.0, 2.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00022721290588378906, -0.00022012554109096527, -0.00021303817629814148, -0.0002059508115053177, -0.0001988634467124939, -0.0001917760819196701, -0.0001846887171268463, -0.00017760135233402252, -0.00017051398754119873, -0.00016342662274837494, -0.00015633925795555115, -0.00014925189316272736, -0.00014216452836990356, -0.00013507716357707977, -0.00012798979878425598, -0.00012090243399143219, -0.0001138150691986084, -0.00010672770440578461, -9.964033961296082e-05, -9.255297482013702e-05, -8.546561002731323e-05, -7.837824523448944e-05, -7.129088044166565e-05, -6.420351564884186e-05, -5.7116150856018066e-05, -5.0028786063194275e-05, -4.2941421270370483e-05, -3.585405647754669e-05, -2.87666916847229e-05, -2.167932689189911e-05, -1.4591962099075317e-05, -7.504597306251526e-06, -4.172325134277344e-07, 6.670132279396057e-06, 1.3757497072219849e-05, 2.084486186504364e-05, 2.793222665786743e-05, 3.501959145069122e-05, 4.2106956243515015e-05, 4.9194321036338806e-05, 5.62816858291626e-05, 6.336905062198639e-05, 7.045641541481018e-05, 7.754378020763397e-05, 8.463114500045776e-05, 9.171850979328156e-05, 9.880587458610535e-05, 0.00010589323937892914, 0.00011298060417175293, 0.00012006796896457672, 0.0001271553337574005, 0.0001342426985502243, 0.0001413300633430481, 0.0001484174281358719, 0.00015550479292869568, 0.00016259215772151947, 0.00016967952251434326, 0.00017676688730716705, 0.00018385425209999084, 0.00019094161689281464, 0.00019802898168563843, 0.00020511634647846222, 0.000212203711271286, 0.0002192910760641098, 0.0002263784408569336]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 9.0, 18.0, 21.0, 55.0, 132.0, 368.0, 154.0, 85.0, 48.0, 32.0, 28.0, 16.0, 12.0, 9.0, 6.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13259384036064148, -0.12279576063156128, -0.11299768835306168, -0.10319961607456207, -0.09340153634548187, -0.08360345661640167, -0.07380538433790207, -0.06400731205940247, -0.054209232330322266, -0.044411156326532364, -0.03461308032274246, -0.02481500431895256, -0.015016928315162659, -0.005218852311372757, 0.004579223692417145, 0.014377295970916748, 0.024175375699996948, 0.03397345170378685, 0.04377152770757675, 0.05356960371136665, 0.06336767971515656, 0.07316575944423676, 0.08296383172273636, 0.09276190400123596, 0.10255998373031616, 0.11235806345939636, 0.12215613573789597, 0.13195420801639557, 0.14175228774547577, 0.15155036747455597, 0.16134843230247498, 0.17114651203155518, 0.18094459176063538, 0.19074267148971558, 0.20054075121879578, 0.21033881604671478, 0.22013689577579498, 0.22993497550487518, 0.2397330403327942, 0.2495311200618744, 0.2593291997909546, 0.2691272795200348, 0.278925359249115, 0.2887234389781952, 0.2985215187072754, 0.3083195686340332, 0.3181176483631134, 0.3279157280921936, 0.3377138078212738, 0.347511887550354, 0.3573099672794342, 0.3671080470085144, 0.3769060969352722, 0.3867041766643524, 0.3965022563934326, 0.4063003361225128, 0.416098415851593, 0.4258964955806732, 0.4356945753097534, 0.4454926550388336, 0.4552907347679138, 0.46508878469467163, 0.47488686442375183, 0.48468494415283203, 0.49448302388191223]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 14.0, 6.0, 13.0, 16.0, 16.0, 21.0, 31.0, 39.0, 37.0, 43.0, 40.0, 54.0, 57.0, 55.0, 71.0, 74.0, 50.0, 67.0, 48.0, 38.0, 39.0, 42.0, 27.0, 23.0, 22.0, 13.0, 19.0, 7.0, 6.0, 4.0, 7.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10395467281341553, -0.09981619566679001, -0.09567771852016449, -0.09153924882411957, -0.08740077167749405, -0.08326229453086853, -0.07912382483482361, -0.07498534768819809, -0.07084687054157257, -0.06670839339494705, -0.06256991624832153, -0.05843144655227661, -0.05429296940565109, -0.050154492259025574, -0.04601601883769035, -0.04187754541635513, -0.037739068269729614, -0.033600591123104095, -0.029462117701768875, -0.025323642417788506, -0.021185167133808136, -0.017046691849827766, -0.012908216565847397, -0.008769741281867027, -0.004631265997886658, -0.0004927907139062881, 0.0036456845700740814, 0.007784159854054451, 0.01192263513803482, 0.01606111042201519, 0.02019958570599556, 0.02433806098997593, 0.0284765362739563, 0.03261501342058182, 0.03675348684191704, 0.04089196026325226, 0.04503043740987778, 0.049168914556503296, 0.053307387977838516, 0.05744586139917374, 0.061584338545799255, 0.06572281569242477, 0.06986129283905029, 0.07399976253509521, 0.07813823968172073, 0.08227671682834625, 0.08641518652439117, 0.0905536636710167, 0.09469214081764221, 0.09883061796426773, 0.10296909511089325, 0.10710756480693817, 0.11124604195356369, 0.11538451910018921, 0.11952298879623413, 0.12366146594285965, 0.12779994308948517, 0.1319384127855301, 0.1360768973827362, 0.14021536707878113, 0.14435383677482605, 0.14849232137203217, 0.1526307910680771, 0.1567692756652832, 0.16090774536132812]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 10.0, 14.0, 20.0, 52.0, 90.0, 226.0, 667.0, 2674.0, 261496.0, 3925126.0, 2808.0, 661.0, 220.0, 98.0, 51.0, 29.0, 12.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1260986328125, -0.12341594696044922, -0.12073326110839844, -0.11805057525634766, -0.11536788940429688, -0.1126852035522461, -0.11000251770019531, -0.10731983184814453, -0.10463714599609375, -0.10195446014404297, -0.09927177429199219, -0.0965890884399414, -0.09390640258789062, -0.09122371673583984, -0.08854103088378906, -0.08585834503173828, -0.0831756591796875, -0.08049297332763672, -0.07781028747558594, -0.07512760162353516, -0.07244491577148438, -0.0697622299194336, -0.06707954406738281, -0.06439685821533203, -0.06171417236328125, -0.05903148651123047, -0.05634880065917969, -0.053666114807128906, -0.050983428955078125, -0.048300743103027344, -0.04561805725097656, -0.04293537139892578, -0.040252685546875, -0.03756999969482422, -0.03488731384277344, -0.032204627990722656, -0.029521942138671875, -0.026839256286621094, -0.024156570434570312, -0.02147388458251953, -0.01879119873046875, -0.01610851287841797, -0.013425827026367188, -0.010743141174316406, -0.008060455322265625, -0.005377769470214844, -0.0026950836181640625, -1.239776611328125e-05, 0.0026702880859375, 0.005352973937988281, 0.008035659790039062, 0.010718345642089844, 0.013401031494140625, 0.016083717346191406, 0.018766403198242188, 0.02144908905029297, 0.02413177490234375, 0.02681446075439453, 0.029497146606445312, 0.032179832458496094, 0.034862518310546875, 0.037545204162597656, 0.04022789001464844, 0.04291057586669922, 0.04559326171875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 6.0, 21.0, 23.0, 51.0, 82.0, 127.0, 180.0, 151.0, 152.0, 77.0, 63.0, 31.0, 16.0, 13.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01666259765625, -0.016308367252349854, -0.015954136848449707, -0.01559990644454956, -0.015245676040649414, -0.014891445636749268, -0.014537215232849121, -0.014182984828948975, -0.013828754425048828, -0.013474524021148682, -0.013120293617248535, -0.012766063213348389, -0.012411832809448242, -0.012057602405548096, -0.01170337200164795, -0.011349141597747803, -0.010994911193847656, -0.01064068078994751, -0.010286450386047363, -0.009932219982147217, -0.00957798957824707, -0.009223759174346924, -0.008869528770446777, -0.00851529836654663, -0.008161067962646484, -0.007806837558746338, -0.007452607154846191, -0.007098376750946045, -0.0067441463470458984, -0.006389915943145752, -0.0060356855392456055, -0.005681455135345459, -0.0053272247314453125, -0.004972994327545166, -0.0046187639236450195, -0.004264533519744873, -0.0039103031158447266, -0.00355607271194458, -0.0032018423080444336, -0.002847611904144287, -0.0024933815002441406, -0.002139151096343994, -0.0017849206924438477, -0.0014306902885437012, -0.0010764598846435547, -0.0007222294807434082, -0.0003679990768432617, -1.3768672943115234e-05, 0.00034046173095703125, 0.0006946921348571777, 0.0010489225387573242, 0.0014031529426574707, 0.0017573833465576172, 0.0021116137504577637, 0.00246584415435791, 0.0028200745582580566, 0.003174304962158203, 0.0035285353660583496, 0.003882765769958496, 0.004236996173858643, 0.004591226577758789, 0.0049454569816589355, 0.005299687385559082, 0.0056539177894592285, 0.006008148193359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 10.0, 6.0, 5.0, 6.0, 5.0, 12.0, 15.0, 19.0, 24.0, 35.0, 49.0, 83.0, 83.0, 125.0, 210.0, 342.0, 651.0, 1142.0, 2365.0, 5404.0, 19290.0, 4123117.0, 28558.0, 6520.0, 2818.0, 1314.0, 774.0, 456.0, 233.0, 156.0, 114.0, 86.0, 41.0, 63.0, 34.0, 26.0, 22.0, 17.0, 13.0, 10.0, 3.0, 6.0, 5.0, 3.0, 4.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038543701171875, -0.03714609146118164, -0.03574848175048828, -0.03435087203979492, -0.03295326232910156, -0.0315556526184082, -0.030158042907714844, -0.028760433197021484, -0.027362823486328125, -0.025965213775634766, -0.024567604064941406, -0.023169994354248047, -0.021772384643554688, -0.020374774932861328, -0.01897716522216797, -0.01757955551147461, -0.01618194580078125, -0.01478433609008789, -0.013386726379394531, -0.011989116668701172, -0.010591506958007812, -0.009193897247314453, -0.007796287536621094, -0.006398677825927734, -0.005001068115234375, -0.0036034584045410156, -0.0022058486938476562, -0.0008082389831542969, 0.0005893707275390625, 0.001986980438232422, 0.0033845901489257812, 0.004782199859619141, 0.0061798095703125, 0.007577419281005859, 0.008975028991699219, 0.010372638702392578, 0.011770248413085938, 0.013167858123779297, 0.014565467834472656, 0.015963077545166016, 0.017360687255859375, 0.018758296966552734, 0.020155906677246094, 0.021553516387939453, 0.022951126098632812, 0.024348735809326172, 0.02574634552001953, 0.02714395523071289, 0.02854156494140625, 0.02993917465209961, 0.03133678436279297, 0.03273439407348633, 0.03413200378417969, 0.03552961349487305, 0.036927223205566406, 0.038324832916259766, 0.039722442626953125, 0.041120052337646484, 0.042517662048339844, 0.0439152717590332, 0.04531288146972656, 0.04671049118041992, 0.04810810089111328, 0.04950571060180664, 0.0509033203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 5.0, 18.0, 63.0, 3744.0, 147.0, 33.0, 14.0, 9.0, 7.0, 4.0, 6.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006134033203125, -0.005685091018676758, -0.005236148834228516, -0.0047872066497802734, -0.004338264465332031, -0.003889322280883789, -0.003440380096435547, -0.0029914379119873047, -0.0025424957275390625, -0.0020935535430908203, -0.0016446113586425781, -0.001195669174194336, -0.0007467269897460938, -0.00029778480529785156, 0.00015115737915039062, 0.0006000995635986328, 0.001049041748046875, 0.0014979839324951172, 0.0019469261169433594, 0.0023958683013916016, 0.0028448104858398438, 0.003293752670288086, 0.003742694854736328, 0.00419163703918457, 0.0046405792236328125, 0.005089521408081055, 0.005538463592529297, 0.005987405776977539, 0.006436347961425781, 0.0068852901458740234, 0.007334232330322266, 0.007783174514770508, 0.00823211669921875, 0.008681058883666992, 0.009130001068115234, 0.009578943252563477, 0.010027885437011719, 0.010476827621459961, 0.010925769805908203, 0.011374711990356445, 0.011823654174804688, 0.01227259635925293, 0.012721538543701172, 0.013170480728149414, 0.013619422912597656, 0.014068365097045898, 0.01451730728149414, 0.014966249465942383, 0.015415191650390625, 0.015864133834838867, 0.01631307601928711, 0.01676201820373535, 0.017210960388183594, 0.017659902572631836, 0.018108844757080078, 0.01855778694152832, 0.019006729125976562, 0.019455671310424805, 0.019904613494873047, 0.02035355567932129, 0.02080249786376953, 0.021251440048217773, 0.021700382232666016, 0.022149324417114258, 0.0225982666015625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 15.0, 25.0, 67.0, 176.0, 444.0, 119.0, 62.0, 28.0, 22.0, 9.0, 8.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07073025405406952, -0.06793145835399628, -0.06513265520334244, -0.062333859503269196, -0.05953506380319595, -0.05673626437783241, -0.05393746495246887, -0.05113866925239563, -0.04833986982703209, -0.04554107040166855, -0.042742274701595306, -0.039943475276231766, -0.037144675850868225, -0.03434588015079498, -0.03154708072543144, -0.02874828316271305, -0.02594948559999466, -0.023150688037276268, -0.020351890474557877, -0.017553091049194336, -0.014754293486475945, -0.011955495923757553, -0.009156696498394012, -0.006357898935675621, -0.0035591013729572296, -0.0007603033445775509, 0.002038494683802128, 0.004837293177843094, 0.007636090740561485, 0.010434888303279877, 0.013233687728643417, 0.01603248529136181, 0.018831275403499603, 0.021630072966217995, 0.024428870528936386, 0.027227669954299927, 0.030026467517018318, 0.03282526507973671, 0.03562406450510025, 0.03842286020517349, 0.04122165963053703, 0.044020459055900574, 0.046819254755973816, 0.04961805418133736, 0.0524168536067009, 0.05521564930677414, 0.05801444873213768, 0.06081324815750122, 0.06361204385757446, 0.0664108395576477, 0.06920964270830154, 0.07200843840837479, 0.07480723410844803, 0.07760603725910187, 0.08040483295917511, 0.08320362865924835, 0.0860024243593216, 0.08880122005939484, 0.09160002321004868, 0.09439881891012192, 0.09719761461019516, 0.099996417760849, 0.10279521346092224, 0.10559400916099548, 0.10839281231164932]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 6.0, 11.0, 9.0, 18.0, 32.0, 21.0, 40.0, 38.0, 63.0, 56.0, 71.0, 62.0, 73.0, 77.0, 82.0, 60.0, 61.0, 46.0, 40.0, 28.0, 21.0, 18.0, 17.0, 13.0, 13.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.02626824378967285, -0.02526085451245308, -0.024253465235233307, -0.023246075958013535, -0.022238686680793762, -0.02123129740357399, -0.020223908126354218, -0.019216518849134445, -0.018209129571914673, -0.0172017402946949, -0.016194351017475128, -0.015186961740255356, -0.014179572463035583, -0.013172183185815811, -0.012164793908596039, -0.011157404631376266, -0.010150015354156494, -0.009142626076936722, -0.00813523679971695, -0.007127847522497177, -0.006120458245277405, -0.0051130689680576324, -0.00410567969083786, -0.0030982904136180878, -0.0020909011363983154, -0.001083511859178543, -7.612258195877075e-05, 0.0009312666952610016, 0.001938655972480774, 0.0029460452497005463, 0.003953434526920319, 0.004960823804140091, 0.005968213081359863, 0.006975602358579636, 0.007982991635799408, 0.00899038091301918, 0.009997770190238953, 0.011005159467458725, 0.012012548744678497, 0.01301993802189827, 0.014027327299118042, 0.015034716576337814, 0.016042105853557587, 0.01704949513077736, 0.01805688440799713, 0.019064273685216904, 0.020071662962436676, 0.02107905223965645, 0.02208644151687622, 0.023093830794095993, 0.024101220071315765, 0.025108609348535538, 0.02611599862575531, 0.027123387902975082, 0.028130777180194855, 0.029138166457414627, 0.0301455557346344, 0.031152945011854172, 0.032160334289073944, 0.033167723566293716, 0.03417511284351349, 0.03518250212073326, 0.03618989139795303, 0.037197280675172806, 0.03820466995239258]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 5.0, 6.0, 7.0, 10.0, 15.0, 15.0, 19.0, 21.0, 28.0, 29.0, 46.0, 62.0, 124.0, 216.0, 525.0, 1570.0, 5578.0, 29341.0, 355221.0, 607628.0, 38414.0, 6594.0, 1744.0, 601.0, 270.0, 125.0, 76.0, 52.0, 46.0, 32.0, 24.0, 15.0, 14.0, 18.0, 8.0, 6.0, 8.0, 8.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0628662109375, -0.06084251403808594, -0.058818817138671875, -0.05679512023925781, -0.05477142333984375, -0.05274772644042969, -0.050724029541015625, -0.04870033264160156, -0.0466766357421875, -0.04465293884277344, -0.042629241943359375, -0.04060554504394531, -0.03858184814453125, -0.03655815124511719, -0.034534454345703125, -0.03251075744628906, -0.030487060546875, -0.028463363647460938, -0.026439666748046875, -0.024415969848632812, -0.02239227294921875, -0.020368576049804688, -0.018344879150390625, -0.016321182250976562, -0.0142974853515625, -0.012273788452148438, -0.010250091552734375, -0.008226394653320312, -0.00620269775390625, -0.0041790008544921875, -0.002155303955078125, -0.0001316070556640625, 0.00189208984375, 0.0039157867431640625, 0.005939483642578125, 0.007963180541992188, 0.00998687744140625, 0.012010574340820312, 0.014034271240234375, 0.016057968139648438, 0.0180816650390625, 0.020105361938476562, 0.022129058837890625, 0.024152755737304688, 0.02617645263671875, 0.028200149536132812, 0.030223846435546875, 0.03224754333496094, 0.034271240234375, 0.03629493713378906, 0.038318634033203125, 0.04034233093261719, 0.04236602783203125, 0.04438972473144531, 0.046413421630859375, 0.04843711853027344, 0.0504608154296875, 0.05248451232910156, 0.054508209228515625, 0.05653190612792969, 0.05855560302734375, 0.06057929992675781, 0.06260299682617188, 0.06462669372558594, 0.066650390625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 22.0, 15.0, 55.0, 80.0, 115.0, 172.0, 146.0, 160.0, 92.0, 63.0, 37.0, 14.0, 17.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.016632080078125, -0.016279637813568115, -0.01592719554901123, -0.015574753284454346, -0.015222311019897461, -0.014869868755340576, -0.014517426490783691, -0.014164984226226807, -0.013812541961669922, -0.013460099697113037, -0.013107657432556152, -0.012755215167999268, -0.012402772903442383, -0.012050330638885498, -0.011697888374328613, -0.011345446109771729, -0.010993003845214844, -0.010640561580657959, -0.010288119316101074, -0.00993567705154419, -0.009583234786987305, -0.00923079252243042, -0.008878350257873535, -0.00852590799331665, -0.008173465728759766, -0.00782102346420288, -0.007468581199645996, -0.007116138935089111, -0.0067636966705322266, -0.006411254405975342, -0.006058812141418457, -0.005706369876861572, -0.0053539276123046875, -0.005001485347747803, -0.004649043083190918, -0.004296600818634033, -0.0039441585540771484, -0.0035917162895202637, -0.003239274024963379, -0.002886831760406494, -0.0025343894958496094, -0.0021819472312927246, -0.0018295049667358398, -0.001477062702178955, -0.0011246204376220703, -0.0007721781730651855, -0.0004197359085083008, -6.729364395141602e-05, 0.00028514862060546875, 0.0006375908851623535, 0.0009900331497192383, 0.001342475414276123, 0.0016949176788330078, 0.0020473599433898926, 0.0023998022079467773, 0.002752244472503662, 0.003104686737060547, 0.0034571290016174316, 0.0038095712661743164, 0.004162013530731201, 0.004514455795288086, 0.004866898059844971, 0.0052193403244018555, 0.00557178258895874, 0.005924224853515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 9.0, 9.0, 23.0, 24.0, 24.0, 46.0, 66.0, 108.0, 155.0, 247.0, 372.0, 567.0, 820.0, 1380.0, 2206.0, 3455.0, 5764.0, 9485.0, 15755.0, 27945.0, 49823.0, 93439.0, 211462.0, 355976.0, 122116.0, 62960.0, 34931.0, 19863.0, 11314.0, 6884.0, 4127.0, 2548.0, 1627.0, 1032.0, 657.0, 459.0, 290.0, 225.0, 129.0, 75.0, 59.0, 29.0, 28.0, 20.0, 7.0, 10.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0165557861328125, -0.01604151725769043, -0.01552724838256836, -0.015012979507446289, -0.014498710632324219, -0.013984441757202148, -0.013470172882080078, -0.012955904006958008, -0.012441635131835938, -0.011927366256713867, -0.011413097381591797, -0.010898828506469727, -0.010384559631347656, -0.009870290756225586, -0.009356021881103516, -0.008841753005981445, -0.008327484130859375, -0.007813215255737305, -0.007298946380615234, -0.006784677505493164, -0.006270408630371094, -0.0057561397552490234, -0.005241870880126953, -0.004727602005004883, -0.0042133331298828125, -0.003699064254760742, -0.003184795379638672, -0.0026705265045166016, -0.0021562576293945312, -0.001641988754272461, -0.0011277198791503906, -0.0006134510040283203, -9.918212890625e-05, 0.0004150867462158203, 0.0009293556213378906, 0.001443624496459961, 0.0019578933715820312, 0.0024721622467041016, 0.002986431121826172, 0.003500699996948242, 0.0040149688720703125, 0.004529237747192383, 0.005043506622314453, 0.0055577754974365234, 0.006072044372558594, 0.006586313247680664, 0.007100582122802734, 0.007614850997924805, 0.008129119873046875, 0.008643388748168945, 0.009157657623291016, 0.009671926498413086, 0.010186195373535156, 0.010700464248657227, 0.011214733123779297, 0.011729001998901367, 0.012243270874023438, 0.012757539749145508, 0.013271808624267578, 0.013786077499389648, 0.014300346374511719, 0.014814615249633789, 0.01532888412475586, 0.01584315299987793, 0.016357421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 4.0, 5.0, 7.0, 10.0, 11.0, 22.0, 14.0, 19.0, 24.0, 27.0, 28.0, 32.0, 32.0, 44.0, 37.0, 38.0, 51.0, 37.0, 50.0, 37.0, 39.0, 35.0, 37.0, 52.0, 32.0, 46.0, 37.0, 24.0, 29.0, 28.0, 23.0, 23.0, 16.0, 11.0, 9.0, 5.0, 6.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016265869140625, -0.015728235244750977, -0.015190601348876953, -0.01465296745300293, -0.014115333557128906, -0.013577699661254883, -0.01304006576538086, -0.012502431869506836, -0.011964797973632812, -0.011427164077758789, -0.010889530181884766, -0.010351896286010742, -0.009814262390136719, -0.009276628494262695, -0.008738994598388672, -0.008201360702514648, -0.007663726806640625, -0.0071260929107666016, -0.006588459014892578, -0.006050825119018555, -0.005513191223144531, -0.004975557327270508, -0.004437923431396484, -0.003900289535522461, -0.0033626556396484375, -0.002825021743774414, -0.0022873878479003906, -0.0017497539520263672, -0.0012121200561523438, -0.0006744861602783203, -0.00013685226440429688, 0.00040078163146972656, 0.00093841552734375, 0.0014760494232177734, 0.002013683319091797, 0.0025513172149658203, 0.0030889511108398438, 0.003626585006713867, 0.004164218902587891, 0.004701852798461914, 0.0052394866943359375, 0.005777120590209961, 0.006314754486083984, 0.006852388381958008, 0.007390022277832031, 0.007927656173706055, 0.008465290069580078, 0.009002923965454102, 0.009540557861328125, 0.010078191757202148, 0.010615825653076172, 0.011153459548950195, 0.011691093444824219, 0.012228727340698242, 0.012766361236572266, 0.013303995132446289, 0.013841629028320312, 0.014379262924194336, 0.01491689682006836, 0.015454530715942383, 0.015992164611816406, 0.01652979850769043, 0.017067432403564453, 0.017605066299438477, 0.0181427001953125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 7.0, 11.0, 21.0, 39.0, 33.0, 70.0, 124.0, 239.0, 401.0, 956.0, 2325.0, 6648.0, 22746.0, 132681.0, 773197.0, 83559.0, 16848.0, 5105.0, 1883.0, 793.0, 396.0, 183.0, 106.0, 63.0, 37.0, 34.0, 14.0, 10.0, 7.0, 9.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00041937828063964844, -0.0004087314009666443, -0.00039808452129364014, -0.000387437641620636, -0.00037679076194763184, -0.0003661438822746277, -0.00035549700260162354, -0.0003448501229286194, -0.00033420324325561523, -0.0003235563635826111, -0.00031290948390960693, -0.0003022626042366028, -0.00029161572456359863, -0.0002809688448905945, -0.00027032196521759033, -0.0002596750855445862, -0.00024902820587158203, -0.00023838132619857788, -0.00022773444652557373, -0.00021708756685256958, -0.00020644068717956543, -0.00019579380750656128, -0.00018514692783355713, -0.00017450004816055298, -0.00016385316848754883, -0.00015320628881454468, -0.00014255940914154053, -0.00013191252946853638, -0.00012126564979553223, -0.00011061877012252808, -9.997189044952393e-05, -8.932501077651978e-05, -7.867813110351562e-05, -6.803125143051147e-05, -5.7384371757507324e-05, -4.6737492084503174e-05, -3.6090612411499023e-05, -2.5443732738494873e-05, -1.4796853065490723e-05, -4.149973392486572e-06, 6.496906280517578e-06, 1.714378595352173e-05, 2.779066562652588e-05, 3.843754529953003e-05, 4.908442497253418e-05, 5.973130464553833e-05, 7.037818431854248e-05, 8.102506399154663e-05, 9.167194366455078e-05, 0.00010231882333755493, 0.00011296570301055908, 0.00012361258268356323, 0.00013425946235656738, 0.00014490634202957153, 0.00015555322170257568, 0.00016620010137557983, 0.00017684698104858398, 0.00018749386072158813, 0.00019814074039459229, 0.00020878762006759644, 0.00021943449974060059, 0.00023008137941360474, 0.0002407282590866089, 0.00025137513875961304, 0.0002620220184326172]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 7.0, 7.0, 12.0, 15.0, 20.0, 22.0, 41.0, 46.0, 63.0, 93.0, 166.0, 152.0, 93.0, 67.0, 52.0, 43.0, 28.0, 20.0, 12.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.594160079956055e-05, -3.4918077290058136e-05, -3.3894553780555725e-05, -3.2871030271053314e-05, -3.18475067615509e-05, -3.082398325204849e-05, -2.980045974254608e-05, -2.877693623304367e-05, -2.775341272354126e-05, -2.672988921403885e-05, -2.5706365704536438e-05, -2.4682842195034027e-05, -2.3659318685531616e-05, -2.2635795176029205e-05, -2.1612271666526794e-05, -2.0588748157024384e-05, -1.9565224647521973e-05, -1.8541701138019562e-05, -1.751817762851715e-05, -1.649465411901474e-05, -1.547113060951233e-05, -1.4447607100009918e-05, -1.3424083590507507e-05, -1.2400560081005096e-05, -1.1377036571502686e-05, -1.0353513062000275e-05, -9.329989552497864e-06, -8.306466042995453e-06, -7.282942533493042e-06, -6.259419023990631e-06, -5.23589551448822e-06, -4.212372004985809e-06, -3.1888484954833984e-06, -2.1653249859809875e-06, -1.1418014764785767e-06, -1.1827796697616577e-07, 9.052455425262451e-07, 1.928769052028656e-06, 2.952292561531067e-06, 3.975816071033478e-06, 4.999339580535889e-06, 6.0228630900382996e-06, 7.0463865995407104e-06, 8.069910109043121e-06, 9.093433618545532e-06, 1.0116957128047943e-05, 1.1140480637550354e-05, 1.2164004147052765e-05, 1.3187527656555176e-05, 1.4211051166057587e-05, 1.5234574675559998e-05, 1.625809818506241e-05, 1.728162169456482e-05, 1.830514520406723e-05, 1.932866871356964e-05, 2.0352192223072052e-05, 2.1375715732574463e-05, 2.2399239242076874e-05, 2.3422762751579285e-05, 2.4446286261081696e-05, 2.5469809770584106e-05, 2.6493333280086517e-05, 2.7516856789588928e-05, 2.854038029909134e-05, 2.956390380859375e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 5.0, 8.0, 4.0, 11.0, 12.0, 19.0, 19.0, 26.0, 43.0, 68.0, 72.0, 115.0, 197.0, 302.0, 608.0, 1361.0, 3839.0, 13713.0, 66733.0, 749198.0, 175046.0, 26383.0, 6700.0, 2107.0, 869.0, 392.0, 232.0, 114.0, 78.0, 75.0, 45.0, 37.0, 32.0, 23.0, 20.0, 12.0, 10.0, 10.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00036072731018066406, -0.00034970417618751526, -0.00033868104219436646, -0.00032765790820121765, -0.00031663477420806885, -0.00030561164021492004, -0.00029458850622177124, -0.00028356537222862244, -0.00027254223823547363, -0.00026151910424232483, -0.000250495970249176, -0.00023947283625602722, -0.00022844970226287842, -0.00021742656826972961, -0.0002064034342765808, -0.000195380300283432, -0.0001843571662902832, -0.0001733340322971344, -0.0001623108983039856, -0.0001512877643108368, -0.000140264630317688, -0.00012924149632453918, -0.00011821836233139038, -0.00010719522833824158, -9.617209434509277e-05, -8.514896035194397e-05, -7.412582635879517e-05, -6.310269236564636e-05, -5.207955837249756e-05, -4.1056424379348755e-05, -3.003329038619995e-05, -1.9010156393051147e-05, -7.987022399902344e-06, 3.03611159324646e-06, 1.4059245586395264e-05, 2.5082379579544067e-05, 3.610551357269287e-05, 4.7128647565841675e-05, 5.815178155899048e-05, 6.917491555213928e-05, 8.019804954528809e-05, 9.122118353843689e-05, 0.0001022443175315857, 0.0001132674515247345, 0.0001242905855178833, 0.0001353137195110321, 0.0001463368535041809, 0.0001573599874973297, 0.00016838312149047852, 0.00017940625548362732, 0.00019042938947677612, 0.00020145252346992493, 0.00021247565746307373, 0.00022349879145622253, 0.00023452192544937134, 0.00024554505944252014, 0.00025656819343566895, 0.00026759132742881775, 0.00027861446142196655, 0.00028963759541511536, 0.00030066072940826416, 0.00031168386340141296, 0.00032270699739456177, 0.00033373013138771057, 0.0003447532653808594]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 3.0, 7.0, 13.0, 28.0, 39.0, 62.0, 94.0, 127.0, 202.0, 166.0, 104.0, 62.0, 32.0, 30.0, 14.0, 10.0, 8.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000274658203125, -0.00026436150074005127, -0.00025406479835510254, -0.0002437680959701538, -0.00023347139358520508, -0.00022317469120025635, -0.00021287798881530762, -0.0002025812864303589, -0.00019228458404541016, -0.00018198788166046143, -0.0001716911792755127, -0.00016139447689056396, -0.00015109777450561523, -0.0001408010721206665, -0.00013050436973571777, -0.00012020766735076904, -0.00010991096496582031, -9.961426258087158e-05, -8.931756019592285e-05, -7.902085781097412e-05, -6.872415542602539e-05, -5.842745304107666e-05, -4.813075065612793e-05, -3.78340482711792e-05, -2.753734588623047e-05, -1.7240643501281738e-05, -6.943941116333008e-06, 3.3527612686157227e-06, 1.3649463653564453e-05, 2.3946166038513184e-05, 3.4242868423461914e-05, 4.4539570808410645e-05, 5.4836273193359375e-05, 6.51329755783081e-05, 7.542967796325684e-05, 8.572638034820557e-05, 9.60230827331543e-05, 0.00010631978511810303, 0.00011661648750305176, 0.0001269131898880005, 0.00013720989227294922, 0.00014750659465789795, 0.00015780329704284668, 0.0001680999994277954, 0.00017839670181274414, 0.00018869340419769287, 0.0001989901065826416, 0.00020928680896759033, 0.00021958351135253906, 0.0002298802137374878, 0.00024017691612243652, 0.00025047361850738525, 0.000260770320892334, 0.0002710670232772827, 0.00028136372566223145, 0.0002916604280471802, 0.0003019571304321289, 0.00031225383281707764, 0.00032255053520202637, 0.0003328472375869751, 0.00034314393997192383, 0.00035344064235687256, 0.0003637373447418213, 0.00037403404712677, 0.00038433074951171875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 12.0, 13.0, 18.0, 32.0, 61.0, 110.0, 272.0, 199.0, 91.0, 58.0, 31.0, 35.0, 16.0, 15.0, 11.0, 6.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1721349060535431, -0.16547891497612, -0.1588229387998581, -0.152166947722435, -0.1455109715461731, -0.13885498046875, -0.1321989893913269, -0.125543013215065, -0.1188870221376419, -0.11223103851079941, -0.10557505488395691, -0.09891906380653381, -0.09226308017969131, -0.08560709655284882, -0.07895111292600632, -0.07229512929916382, -0.06563914567232132, -0.05898316204547882, -0.052327174693346024, -0.045671191066503525, -0.03901520371437073, -0.03235922008752823, -0.02570323646068573, -0.019047249108552933, -0.012391265481710434, -0.005735280457884073, 0.0009207045659422874, 0.007576689124107361, 0.014232674613595009, 0.020888660103082657, 0.027544643729925156, 0.03420063108205795, 0.04085661470890045, 0.04751259833574295, 0.05416858568787575, 0.060824569314718246, 0.06748055666685104, 0.07413654029369354, 0.08079252392053604, 0.08744850754737854, 0.09410449862480164, 0.10076048225164413, 0.10741646587848663, 0.11407245695590973, 0.12072844058275223, 0.12738442420959473, 0.13404041528701782, 0.14069639146327972, 0.14735236763954163, 0.15400835871696472, 0.16066433489322662, 0.16732032597064972, 0.17397630214691162, 0.18063229322433472, 0.1872882843017578, 0.19394426047801971, 0.2006002515554428, 0.2072562426328659, 0.2139122188091278, 0.2205682098865509, 0.2272241860628128, 0.2338801771402359, 0.2405361533164978, 0.2471921443939209, 0.253848135471344]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 8.0, 8.0, 9.0, 10.0, 13.0, 16.0, 18.0, 18.0, 18.0, 30.0, 34.0, 34.0, 36.0, 42.0, 30.0, 40.0, 48.0, 47.0, 53.0, 47.0, 50.0, 55.0, 43.0, 42.0, 39.0, 32.0, 27.0, 16.0, 22.0, 19.0, 12.0, 24.0, 14.0, 7.0, 9.0, 11.0, 5.0, 9.0, 3.0, 1.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07878965139389038, -0.0760628879070282, -0.07333612442016602, -0.07060935348272324, -0.06788258999586105, -0.06515582650899887, -0.06242905929684639, -0.05970229208469391, -0.056975528597831726, -0.05424876511096954, -0.05152199789881706, -0.04879523068666458, -0.0460684671998024, -0.043341703712940216, -0.040614936500787735, -0.037888169288635254, -0.03516140580177307, -0.03243464231491089, -0.029707875102758408, -0.026981109753251076, -0.024254344403743744, -0.021527579054236412, -0.01880081370472908, -0.01607404835522175, -0.013347283005714417, -0.010620517656207085, -0.007893752306699753, -0.005166986957192421, -0.002440221607685089, 0.00028654374182224274, 0.0030133090913295746, 0.005740074440836906, 0.008466839790344238, 0.01119360513985157, 0.013920370489358902, 0.016647135838866234, 0.019373901188373566, 0.022100666537880898, 0.02482743188738823, 0.02755419723689556, 0.030280962586402893, 0.033007726073265076, 0.03573449328541756, 0.03846126049757004, 0.04118802398443222, 0.0439147874712944, 0.046641554683446884, 0.049368321895599365, 0.05209508538246155, 0.05482184886932373, 0.05754861608147621, 0.06027538329362869, 0.06300214678049088, 0.06572891026735306, 0.06845568120479584, 0.07118244469165802, 0.0739092081785202, 0.07663597166538239, 0.07936273515224457, 0.08208950608968735, 0.08481626957654953, 0.08754303306341171, 0.09026980400085449, 0.09299656748771667, 0.09572333097457886]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 8.0, 16.0, 32.0, 50.0, 121.0, 218.0, 498.0, 1306.0, 3994.0, 4165003.0, 18324.0, 2910.0, 1024.0, 395.0, 166.0, 85.0, 43.0, 27.0, 11.0, 15.0, 10.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.0994873046875, -0.09736394882202148, -0.09524059295654297, -0.09311723709106445, -0.09099388122558594, -0.08887052536010742, -0.0867471694946289, -0.08462381362915039, -0.08250045776367188, -0.08037710189819336, -0.07825374603271484, -0.07613039016723633, -0.07400703430175781, -0.0718836784362793, -0.06976032257080078, -0.06763696670532227, -0.06551361083984375, -0.06339025497436523, -0.06126689910888672, -0.0591435432434082, -0.05702018737792969, -0.05489683151245117, -0.052773475646972656, -0.05065011978149414, -0.048526763916015625, -0.04640340805053711, -0.044280052185058594, -0.04215669631958008, -0.04003334045410156, -0.03790998458862305, -0.03578662872314453, -0.033663272857666016, -0.0315399169921875, -0.029416561126708984, -0.02729320526123047, -0.025169849395751953, -0.023046493530273438, -0.020923137664794922, -0.018799781799316406, -0.01667642593383789, -0.014553070068359375, -0.01242971420288086, -0.010306358337402344, -0.008183002471923828, -0.0060596466064453125, -0.003936290740966797, -0.0018129348754882812, 0.0003104209899902344, 0.00243377685546875, 0.004557132720947266, 0.006680488586425781, 0.008803844451904297, 0.010927200317382812, 0.013050556182861328, 0.015173912048339844, 0.01729726791381836, 0.019420623779296875, 0.02154397964477539, 0.023667335510253906, 0.025790691375732422, 0.027914047241210938, 0.030037403106689453, 0.03216075897216797, 0.034284114837646484, 0.036407470703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 8.0, 13.0, 14.0, 39.0, 45.0, 93.0, 139.0, 168.0, 152.0, 136.0, 76.0, 50.0, 38.0, 20.0, 9.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0161285400390625, -0.015784502029418945, -0.01544046401977539, -0.015096426010131836, -0.014752388000488281, -0.014408349990844727, -0.014064311981201172, -0.013720273971557617, -0.013376235961914062, -0.013032197952270508, -0.012688159942626953, -0.012344121932983398, -0.012000083923339844, -0.011656045913696289, -0.011312007904052734, -0.01096796989440918, -0.010623931884765625, -0.01027989387512207, -0.009935855865478516, -0.009591817855834961, -0.009247779846191406, -0.008903741836547852, -0.008559703826904297, -0.008215665817260742, -0.007871627807617188, -0.007527589797973633, -0.007183551788330078, -0.0068395137786865234, -0.006495475769042969, -0.006151437759399414, -0.005807399749755859, -0.005463361740112305, -0.00511932373046875, -0.004775285720825195, -0.004431247711181641, -0.004087209701538086, -0.0037431716918945312, -0.0033991336822509766, -0.003055095672607422, -0.002711057662963867, -0.0023670196533203125, -0.002022981643676758, -0.0016789436340332031, -0.0013349056243896484, -0.0009908676147460938, -0.0006468296051025391, -0.0003027915954589844, 4.124641418457031e-05, 0.000385284423828125, 0.0007293224334716797, 0.0010733604431152344, 0.001417398452758789, 0.0017614364624023438, 0.0021054744720458984, 0.002449512481689453, 0.002793550491333008, 0.0031375885009765625, 0.003481626510620117, 0.003825664520263672, 0.0041697025299072266, 0.004513740539550781, 0.004857778549194336, 0.005201816558837891, 0.005545854568481445, 0.005889892578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 6.0, 9.0, 15.0, 18.0, 23.0, 29.0, 36.0, 41.0, 52.0, 61.0, 91.0, 100.0, 117.0, 182.0, 217.0, 250.0, 356.0, 429.0, 554.0, 786.0, 931.0, 1284.0, 1712.0, 2466.0, 4002.0, 7339.0, 21642.0, 4061054.0, 62206.0, 11324.0, 5289.0, 3118.0, 2091.0, 1504.0, 1123.0, 858.0, 646.0, 507.0, 387.0, 305.0, 244.0, 184.0, 149.0, 133.0, 83.0, 61.0, 74.0, 56.0, 33.0, 31.0, 23.0, 25.0, 13.0, 5.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.01861572265625, -0.018029212951660156, -0.017442703247070312, -0.01685619354248047, -0.016269683837890625, -0.01568317413330078, -0.015096664428710938, -0.014510154724121094, -0.01392364501953125, -0.013337135314941406, -0.012750625610351562, -0.012164115905761719, -0.011577606201171875, -0.010991096496582031, -0.010404586791992188, -0.009818077087402344, -0.0092315673828125, -0.008645057678222656, -0.008058547973632812, -0.007472038269042969, -0.006885528564453125, -0.006299018859863281, -0.0057125091552734375, -0.005125999450683594, -0.00453948974609375, -0.003952980041503906, -0.0033664703369140625, -0.0027799606323242188, -0.002193450927734375, -0.0016069412231445312, -0.0010204315185546875, -0.00043392181396484375, 0.000152587890625, 0.0007390975952148438, 0.0013256072998046875, 0.0019121170043945312, 0.002498626708984375, 0.0030851364135742188, 0.0036716461181640625, 0.004258155822753906, 0.00484466552734375, 0.005431175231933594, 0.0060176849365234375, 0.006604194641113281, 0.007190704345703125, 0.007777214050292969, 0.008363723754882812, 0.008950233459472656, 0.0095367431640625, 0.010123252868652344, 0.010709762573242188, 0.011296272277832031, 0.011882781982421875, 0.012469291687011719, 0.013055801391601562, 0.013642311096191406, 0.01422882080078125, 0.014815330505371094, 0.015401840209960938, 0.01598834991455078, 0.016574859619140625, 0.01716136932373047, 0.017747879028320312, 0.018334388732910156, 0.0189208984375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 16.0, 74.0, 3765.0, 101.0, 31.0, 14.0, 10.0, 7.0, 4.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0084228515625, -0.008157014846801758, -0.007891178131103516, -0.0076253414154052734, -0.007359504699707031, -0.007093667984008789, -0.006827831268310547, -0.006561994552612305, -0.0062961578369140625, -0.00603032112121582, -0.005764484405517578, -0.005498647689819336, -0.005232810974121094, -0.0049669742584228516, -0.004701137542724609, -0.004435300827026367, -0.004169464111328125, -0.003903627395629883, -0.0036377906799316406, -0.0033719539642333984, -0.0031061172485351562, -0.002840280532836914, -0.002574443817138672, -0.0023086071014404297, -0.0020427703857421875, -0.0017769336700439453, -0.0015110969543457031, -0.001245260238647461, -0.0009794235229492188, -0.0007135868072509766, -0.0004477500915527344, -0.0001819133758544922, 8.392333984375e-05, 0.0003497600555419922, 0.0006155967712402344, 0.0008814334869384766, 0.0011472702026367188, 0.001413106918334961, 0.0016789436340332031, 0.0019447803497314453, 0.0022106170654296875, 0.0024764537811279297, 0.002742290496826172, 0.003008127212524414, 0.0032739639282226562, 0.0035398006439208984, 0.0038056373596191406, 0.004071474075317383, 0.004337310791015625, 0.004603147506713867, 0.004868984222412109, 0.0051348209381103516, 0.005400657653808594, 0.005666494369506836, 0.005932331085205078, 0.00619816780090332, 0.0064640045166015625, 0.006729841232299805, 0.006995677947998047, 0.007261514663696289, 0.007527351379394531, 0.0077931880950927734, 0.008059024810791016, 0.008324861526489258, 0.0085906982421875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 5.0, 5.0, 6.0, 9.0, 15.0, 20.0, 41.0, 56.0, 118.0, 309.0, 183.0, 93.0, 54.0, 28.0, 14.0, 9.0, 13.0, 6.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.06678162515163422, -0.06535442918539047, -0.06392724066972733, -0.06250004470348358, -0.061072852462530136, -0.05964566022157669, -0.05821846425533295, -0.0567912720143795, -0.055364079773426056, -0.05393688753247261, -0.052509695291519165, -0.05108249932527542, -0.049655307084321976, -0.04822811484336853, -0.046800918877124786, -0.04537372663617134, -0.043946534395217896, -0.04251934215426445, -0.041092149913311005, -0.03966495394706726, -0.038237761706113815, -0.03681056946516037, -0.035383373498916626, -0.03395618125796318, -0.032528989017009735, -0.03110179677605629, -0.029674602672457695, -0.0282474085688591, -0.026820216327905655, -0.02539302408695221, -0.023965829983353615, -0.02253863587975502, -0.021111439913511276, -0.01968424767255783, -0.018257053568959236, -0.01682985946536064, -0.015402667224407196, -0.013975474052131176, -0.012548280879855156, -0.011121087707579136, -0.009693894535303116, -0.008266701363027096, -0.006839508190751076, -0.005412315018475056, -0.003985121846199036, -0.0025579286739230156, -0.0011307355016469955, 0.0002964576706290245, 0.0017236508429050446, 0.0031508440151810646, 0.004578037187457085, 0.006005230359733105, 0.007432423532009125, 0.008859616704285145, 0.010286809876561165, 0.011714003048837185, 0.013141196221113205, 0.014568389393389225, 0.015995582565665245, 0.01742277666926384, 0.018849968910217285, 0.02027716115117073, 0.021704355254769325, 0.02313154935836792, 0.024558741599321365]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 0.0, 6.0, 9.0, 7.0, 10.0, 8.0, 16.0, 22.0, 21.0, 24.0, 24.0, 40.0, 43.0, 25.0, 54.0, 41.0, 64.0, 48.0, 46.0, 51.0, 60.0, 46.0, 58.0, 34.0, 48.0, 28.0, 24.0, 27.0, 21.0, 19.0, 14.0, 16.0, 13.0, 8.0, 7.0, 2.0, 6.0, 4.0, 4.0, 0.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018233835697174072, -0.01767660304903984, -0.01711937040090561, -0.016562137752771378, -0.016004905104637146, -0.015447672456502914, -0.014890439808368683, -0.014333207160234451, -0.01377597451210022, -0.013218741863965988, -0.012661509215831757, -0.012104276567697525, -0.011547043919563293, -0.010989811271429062, -0.01043257862329483, -0.009875345975160599, -0.009318113327026367, -0.008760880678892136, -0.008203648030757904, -0.0076464153826236725, -0.007089182734489441, -0.006531950086355209, -0.005974717438220978, -0.005417484790086746, -0.004860252141952515, -0.004303019493818283, -0.0037457868456840515, -0.00318855419754982, -0.0026313215494155884, -0.002074088901281357, -0.0015168562531471252, -0.0009596236050128937, -0.0004023909568786621, 0.00015484169125556946, 0.000712074339389801, 0.0012693069875240326, 0.0018265396356582642, 0.0023837722837924957, 0.0029410049319267273, 0.003498237580060959, 0.00405547022819519, 0.004612702876329422, 0.0051699355244636536, 0.005727168172597885, 0.006284400820732117, 0.006841633468866348, 0.00739886611700058, 0.007956098765134811, 0.008513331413269043, 0.009070564061403275, 0.009627796709537506, 0.010185029357671738, 0.01074226200580597, 0.0112994946539402, 0.011856727302074432, 0.012413959950208664, 0.012971192598342896, 0.013528425246477127, 0.014085657894611359, 0.01464289054274559, 0.015200123190879822, 0.015757355839014053, 0.016314588487148285, 0.016871821135282516, 0.017429053783416748]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 11.0, 11.0, 4.0, 15.0, 17.0, 28.0, 35.0, 49.0, 76.0, 131.0, 380.0, 1102.0, 5249.0, 51688.0, 877786.0, 101161.0, 8422.0, 1518.0, 400.0, 172.0, 83.0, 54.0, 38.0, 27.0, 31.0, 16.0, 17.0, 6.0, 9.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0848388671875, -0.08187389373779297, -0.07890892028808594, -0.0759439468383789, -0.07297897338867188, -0.07001399993896484, -0.06704902648925781, -0.06408405303955078, -0.06111907958984375, -0.05815410614013672, -0.05518913269042969, -0.052224159240722656, -0.049259185791015625, -0.046294212341308594, -0.04332923889160156, -0.04036426544189453, -0.0373992919921875, -0.03443431854248047, -0.03146934509277344, -0.028504371643066406, -0.025539398193359375, -0.022574424743652344, -0.019609451293945312, -0.01664447784423828, -0.01367950439453125, -0.010714530944824219, -0.0077495574951171875, -0.004784584045410156, -0.001819610595703125, 0.0011453628540039062, 0.0041103363037109375, 0.007075309753417969, 0.010040283203125, 0.013005256652832031, 0.015970230102539062, 0.018935203552246094, 0.021900177001953125, 0.024865150451660156, 0.027830123901367188, 0.03079509735107422, 0.03376007080078125, 0.03672504425048828, 0.03969001770019531, 0.042654991149902344, 0.045619964599609375, 0.048584938049316406, 0.05154991149902344, 0.05451488494873047, 0.0574798583984375, 0.06044483184814453, 0.06340980529785156, 0.0663747787475586, 0.06933975219726562, 0.07230472564697266, 0.07526969909667969, 0.07823467254638672, 0.08119964599609375, 0.08416461944580078, 0.08712959289550781, 0.09009456634521484, 0.09305953979492188, 0.0960245132446289, 0.09898948669433594, 0.10195446014404297, 0.10491943359375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 13.0, 17.0, 39.0, 45.0, 106.0, 138.0, 164.0, 146.0, 134.0, 78.0, 49.0, 37.0, 17.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01605224609375, -0.015709340572357178, -0.015366435050964355, -0.015023529529571533, -0.014680624008178711, -0.014337718486785889, -0.013994812965393066, -0.013651907444000244, -0.013309001922607422, -0.0129660964012146, -0.012623190879821777, -0.012280285358428955, -0.011937379837036133, -0.01159447431564331, -0.011251568794250488, -0.010908663272857666, -0.010565757751464844, -0.010222852230072021, -0.0098799467086792, -0.009537041187286377, -0.009194135665893555, -0.008851230144500732, -0.00850832462310791, -0.008165419101715088, -0.007822513580322266, -0.007479608058929443, -0.007136702537536621, -0.006793797016143799, -0.0064508914947509766, -0.006107985973358154, -0.005765080451965332, -0.00542217493057251, -0.0050792694091796875, -0.004736363887786865, -0.004393458366394043, -0.004050552845001221, -0.0037076473236083984, -0.003364741802215576, -0.003021836280822754, -0.0026789307594299316, -0.0023360252380371094, -0.001993119716644287, -0.0016502141952514648, -0.0013073086738586426, -0.0009644031524658203, -0.000621497631072998, -0.0002785921096801758, 6.431341171264648e-05, 0.00040721893310546875, 0.000750124454498291, 0.0010930299758911133, 0.0014359354972839355, 0.0017788410186767578, 0.00212174654006958, 0.0024646520614624023, 0.0028075575828552246, 0.003150463104248047, 0.003493368625640869, 0.0038362741470336914, 0.004179179668426514, 0.004522085189819336, 0.004864990711212158, 0.0052078962326049805, 0.005550801753997803, 0.005893707275390625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 9.0, 22.0, 26.0, 48.0, 41.0, 67.0, 120.0, 163.0, 243.0, 379.0, 614.0, 912.0, 1531.0, 2450.0, 3927.0, 6747.0, 11417.0, 19397.0, 34899.0, 65991.0, 138496.0, 416367.0, 172730.0, 77180.0, 40269.0, 22282.0, 12963.0, 7487.0, 4582.0, 2651.0, 1656.0, 991.0, 683.0, 401.0, 257.0, 180.0, 115.0, 77.0, 57.0, 34.0, 24.0, 16.0, 14.0, 9.0, 9.0, 5.0, 4.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0], "bins": [-0.01629638671875, -0.015746116638183594, -0.015195846557617188, -0.014645576477050781, -0.014095306396484375, -0.013545036315917969, -0.012994766235351562, -0.012444496154785156, -0.01189422607421875, -0.011343955993652344, -0.010793685913085938, -0.010243415832519531, -0.009693145751953125, -0.009142875671386719, -0.008592605590820312, -0.008042335510253906, -0.0074920654296875, -0.006941795349121094, -0.0063915252685546875, -0.005841255187988281, -0.005290985107421875, -0.004740715026855469, -0.0041904449462890625, -0.0036401748657226562, -0.00308990478515625, -0.0025396347045898438, -0.0019893646240234375, -0.0014390945434570312, -0.000888824462890625, -0.00033855438232421875, 0.0002117156982421875, 0.0007619857788085938, 0.001312255859375, 0.0018625259399414062, 0.0024127960205078125, 0.0029630661010742188, 0.003513336181640625, 0.004063606262207031, 0.0046138763427734375, 0.005164146423339844, 0.00571441650390625, 0.006264686584472656, 0.0068149566650390625, 0.007365226745605469, 0.007915496826171875, 0.008465766906738281, 0.009016036987304688, 0.009566307067871094, 0.0101165771484375, 0.010666847229003906, 0.011217117309570312, 0.011767387390136719, 0.012317657470703125, 0.012867927551269531, 0.013418197631835938, 0.013968467712402344, 0.01451873779296875, 0.015069007873535156, 0.015619277954101562, 0.01616954803466797, 0.016719818115234375, 0.01727008819580078, 0.017820358276367188, 0.018370628356933594, 0.0189208984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 3.0, 4.0, 13.0, 7.0, 13.0, 12.0, 13.0, 29.0, 22.0, 16.0, 26.0, 20.0, 28.0, 47.0, 35.0, 37.0, 46.0, 33.0, 45.0, 47.0, 50.0, 42.0, 38.0, 37.0, 40.0, 47.0, 30.0, 29.0, 31.0, 25.0, 29.0, 19.0, 15.0, 11.0, 16.0, 8.0, 6.0, 8.0, 7.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0185546875, -0.018015384674072266, -0.01747608184814453, -0.016936779022216797, -0.016397476196289062, -0.015858173370361328, -0.015318870544433594, -0.01477956771850586, -0.014240264892578125, -0.01370096206665039, -0.013161659240722656, -0.012622356414794922, -0.012083053588867188, -0.011543750762939453, -0.011004447937011719, -0.010465145111083984, -0.00992584228515625, -0.009386539459228516, -0.008847236633300781, -0.008307933807373047, -0.0077686309814453125, -0.007229328155517578, -0.006690025329589844, -0.006150722503662109, -0.005611419677734375, -0.005072116851806641, -0.004532814025878906, -0.003993511199951172, -0.0034542083740234375, -0.002914905548095703, -0.0023756027221679688, -0.0018362998962402344, -0.0012969970703125, -0.0007576942443847656, -0.00021839141845703125, 0.0003209114074707031, 0.0008602142333984375, 0.0013995170593261719, 0.0019388198852539062, 0.0024781227111816406, 0.003017425537109375, 0.0035567283630371094, 0.004096031188964844, 0.004635334014892578, 0.0051746368408203125, 0.005713939666748047, 0.006253242492675781, 0.006792545318603516, 0.00733184814453125, 0.007871150970458984, 0.008410453796386719, 0.008949756622314453, 0.009489059448242188, 0.010028362274169922, 0.010567665100097656, 0.01110696792602539, 0.011646270751953125, 0.01218557357788086, 0.012724876403808594, 0.013264179229736328, 0.013803482055664062, 0.014342784881591797, 0.014882087707519531, 0.015421390533447266, 0.015960693359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 8.0, 4.0, 6.0, 3.0, 3.0, 1.0, 10.0, 16.0, 20.0, 33.0, 36.0, 79.0, 97.0, 187.0, 295.0, 526.0, 990.0, 1949.0, 4529.0, 11483.0, 39247.0, 303514.0, 611247.0, 50348.0, 13924.0, 5175.0, 2237.0, 1100.0, 595.0, 342.0, 207.0, 127.0, 87.0, 33.0, 26.0, 22.0, 21.0, 13.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0002655982971191406, -0.0002567693591117859, -0.00024794042110443115, -0.00023911148309707642, -0.00023028254508972168, -0.00022145360708236694, -0.0002126246690750122, -0.00020379573106765747, -0.00019496679306030273, -0.000186137855052948, -0.00017730891704559326, -0.00016847997903823853, -0.0001596510410308838, -0.00015082210302352905, -0.00014199316501617432, -0.00013316422700881958, -0.00012433528900146484, -0.00011550635099411011, -0.00010667741298675537, -9.784847497940063e-05, -8.90195369720459e-05, -8.019059896469116e-05, -7.136166095733643e-05, -6.253272294998169e-05, -5.370378494262695e-05, -4.487484693527222e-05, -3.604590892791748e-05, -2.7216970920562744e-05, -1.8388032913208008e-05, -9.559094905853271e-06, -7.301568984985352e-07, 8.098781108856201e-06, 1.6927719116210938e-05, 2.5756657123565674e-05, 3.458559513092041e-05, 4.3414533138275146e-05, 5.224347114562988e-05, 6.107240915298462e-05, 6.990134716033936e-05, 7.873028516769409e-05, 8.755922317504883e-05, 9.638816118240356e-05, 0.0001052170991897583, 0.00011404603719711304, 0.00012287497520446777, 0.0001317039132118225, 0.00014053285121917725, 0.00014936178922653198, 0.00015819072723388672, 0.00016701966524124146, 0.0001758486032485962, 0.00018467754125595093, 0.00019350647926330566, 0.0002023354172706604, 0.00021116435527801514, 0.00021999329328536987, 0.0002288222312927246, 0.00023765116930007935, 0.0002464801073074341, 0.0002553090453147888, 0.00026413798332214355, 0.0002729669213294983, 0.00028179585933685303, 0.00029062479734420776, 0.0002994537353515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 4.0, 5.0, 9.0, 7.0, 18.0, 28.0, 27.0, 24.0, 35.0, 49.0, 55.0, 94.0, 118.0, 119.0, 101.0, 78.0, 54.0, 26.0, 33.0, 28.0, 10.0, 17.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1696090698242188e-05, -2.103857696056366e-05, -2.0381063222885132e-05, -1.9723549485206604e-05, -1.9066035747528076e-05, -1.840852200984955e-05, -1.775100827217102e-05, -1.7093494534492493e-05, -1.6435980796813965e-05, -1.5778467059135437e-05, -1.512095332145691e-05, -1.4463439583778381e-05, -1.3805925846099854e-05, -1.3148412108421326e-05, -1.2490898370742798e-05, -1.183338463306427e-05, -1.1175870895385742e-05, -1.0518357157707214e-05, -9.860843420028687e-06, -9.203329682350159e-06, -8.545815944671631e-06, -7.888302206993103e-06, -7.230788469314575e-06, -6.573274731636047e-06, -5.9157609939575195e-06, -5.258247256278992e-06, -4.600733518600464e-06, -3.943219780921936e-06, -3.285706043243408e-06, -2.6281923055648804e-06, -1.9706785678863525e-06, -1.3131648302078247e-06, -6.556510925292969e-07, 1.862645149230957e-09, 6.593763828277588e-07, 1.3168901205062866e-06, 1.9744038581848145e-06, 2.6319175958633423e-06, 3.28943133354187e-06, 3.946945071220398e-06, 4.604458808898926e-06, 5.261972546577454e-06, 5.9194862842559814e-06, 6.577000021934509e-06, 7.234513759613037e-06, 7.892027497291565e-06, 8.549541234970093e-06, 9.20705497264862e-06, 9.864568710327148e-06, 1.0522082448005676e-05, 1.1179596185684204e-05, 1.1837109923362732e-05, 1.249462366104126e-05, 1.3152137398719788e-05, 1.3809651136398315e-05, 1.4467164874076843e-05, 1.5124678611755371e-05, 1.57821923494339e-05, 1.6439706087112427e-05, 1.7097219824790955e-05, 1.7754733562469482e-05, 1.841224730014801e-05, 1.9069761037826538e-05, 1.9727274775505066e-05, 2.0384788513183594e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 11.0, 14.0, 21.0, 16.0, 30.0, 35.0, 52.0, 88.0, 159.0, 347.0, 647.0, 1227.0, 2528.0, 5457.0, 12950.0, 36790.0, 175159.0, 692687.0, 80868.0, 22749.0, 8829.0, 3893.0, 1937.0, 951.0, 464.0, 246.0, 149.0, 72.0, 46.0, 37.0, 22.0, 11.0, 13.0, 13.0, 8.0, 4.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00029730796813964844, -0.0002893339842557907, -0.000281360000371933, -0.00027338601648807526, -0.00026541203260421753, -0.0002574380487203598, -0.0002494640648365021, -0.00024149008095264435, -0.00023351609706878662, -0.0002255421131849289, -0.00021756812930107117, -0.00020959414541721344, -0.0002016201615333557, -0.00019364617764949799, -0.00018567219376564026, -0.00017769820988178253, -0.0001697242259979248, -0.00016175024211406708, -0.00015377625823020935, -0.00014580227434635162, -0.0001378282904624939, -0.00012985430657863617, -0.00012188032269477844, -0.00011390633881092072, -0.00010593235492706299, -9.795837104320526e-05, -8.998438715934753e-05, -8.201040327548981e-05, -7.403641939163208e-05, -6.606243550777435e-05, -5.8088451623916626e-05, -5.01144677400589e-05, -4.214048385620117e-05, -3.4166499972343445e-05, -2.6192516088485718e-05, -1.821853220462799e-05, -1.0244548320770264e-05, -2.2705644369125366e-06, 5.7034194469451904e-06, 1.3677403330802917e-05, 2.1651387214660645e-05, 2.962537109851837e-05, 3.75993549823761e-05, 4.5573338866233826e-05, 5.354732275009155e-05, 6.152130663394928e-05, 6.949529051780701e-05, 7.746927440166473e-05, 8.544325828552246e-05, 9.341724216938019e-05, 0.00010139122605323792, 0.00010936520993709564, 0.00011733919382095337, 0.0001253131777048111, 0.00013328716158866882, 0.00014126114547252655, 0.00014923512935638428, 0.000157209113240242, 0.00016518309712409973, 0.00017315708100795746, 0.00018113106489181519, 0.0001891050487756729, 0.00019707903265953064, 0.00020505301654338837, 0.0002130270004272461]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 10.0, 7.0, 6.0, 16.0, 19.0, 23.0, 40.0, 44.0, 70.0, 93.0, 173.0, 109.0, 106.0, 77.0, 59.0, 26.0, 36.0, 14.0, 14.0, 14.0, 13.0, 5.0, 5.0, 4.0, 2.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015163421630859375, -0.00014471635222434998, -0.0001377984881401062, -0.00013088062405586243, -0.00012396275997161865, -0.00011704489588737488, -0.0001101270318031311, -0.00010320916771888733, -9.629130363464355e-05, -8.937343955039978e-05, -8.2455575466156e-05, -7.553771138191223e-05, -6.861984729766846e-05, -6.170198321342468e-05, -5.478411912918091e-05, -4.7866255044937134e-05, -4.094839096069336e-05, -3.4030526876449585e-05, -2.711266279220581e-05, -2.0194798707962036e-05, -1.3276934623718262e-05, -6.359070539474487e-06, 5.587935447692871e-07, 7.4766576290130615e-06, 1.4394521713256836e-05, 2.131238579750061e-05, 2.8230249881744385e-05, 3.514811396598816e-05, 4.2065978050231934e-05, 4.898384213447571e-05, 5.590170621871948e-05, 6.281957030296326e-05, 6.973743438720703e-05, 7.66552984714508e-05, 8.357316255569458e-05, 9.049102663993835e-05, 9.740889072418213e-05, 0.0001043267548084259, 0.00011124461889266968, 0.00011816248297691345, 0.00012508034706115723, 0.000131998211145401, 0.00013891607522964478, 0.00014583393931388855, 0.00015275180339813232, 0.0001596696674823761, 0.00016658753156661987, 0.00017350539565086365, 0.00018042325973510742, 0.0001873411238193512, 0.00019425898790359497, 0.00020117685198783875, 0.00020809471607208252, 0.0002150125801563263, 0.00022193044424057007, 0.00022884830832481384, 0.00023576617240905762, 0.0002426840364933014, 0.00024960190057754517, 0.00025651976466178894, 0.0002634376287460327, 0.0002703554928302765, 0.00027727335691452026, 0.00028419122099876404, 0.0002911090850830078]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 10.0, 5.0, 12.0, 15.0, 22.0, 39.0, 73.0, 151.0, 293.0, 122.0, 76.0, 46.0, 34.0, 31.0, 21.0, 18.0, 11.0, 10.0, 6.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14017176628112793, -0.1336183100938797, -0.12706485390663147, -0.12051139026880264, -0.11395792663097382, -0.10740447044372559, -0.10085101425647736, -0.09429755806922913, -0.0877440944314003, -0.08119063824415207, -0.07463717460632324, -0.06808371841907501, -0.061530258506536484, -0.054976798593997955, -0.048423342406749725, -0.0418698824942112, -0.03531642258167267, -0.02876296266913414, -0.02220950461924076, -0.01565604656934738, -0.009102586656808853, -0.0025491267442703247, 0.004004329442977905, 0.010557789355516434, 0.017111249268054962, 0.02366470918059349, 0.03021816723048687, 0.03677162528038025, 0.04332508519291878, 0.049878545105457306, 0.056432001292705536, 0.06298546493053436, 0.06953892111778259, 0.07609237730503082, 0.08264584094285965, 0.08919929713010788, 0.0957527607679367, 0.10230621695518494, 0.10885967314243317, 0.1154131293296814, 0.12196659296751022, 0.12852005660533905, 0.13507351279258728, 0.1416269689798355, 0.14818042516708374, 0.15473389625549316, 0.1612873375415802, 0.16784080862998962, 0.17439426481723785, 0.18094772100448608, 0.18750117719173431, 0.19405463337898254, 0.20060810446739197, 0.2071615606546402, 0.21371501684188843, 0.22026847302913666, 0.2268219292163849, 0.23337538540363312, 0.23992884159088135, 0.24648231267929077, 0.2530357539653778, 0.25958922505378723, 0.26614266633987427, 0.2726961374282837, 0.2792496085166931]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 2.0, 6.0, 10.0, 7.0, 16.0, 24.0, 25.0, 32.0, 30.0, 38.0, 45.0, 48.0, 50.0, 69.0, 63.0, 65.0, 66.0, 59.0, 53.0, 45.0, 42.0, 36.0, 33.0, 25.0, 19.0, 20.0, 13.0, 13.0, 11.0, 11.0, 5.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09801137447357178, -0.09446129202842712, -0.09091120958328247, -0.08736112713813782, -0.08381104469299316, -0.08026096224784851, -0.07671087235212326, -0.07316078990697861, -0.06961070746183395, -0.0660606250166893, -0.06251054257154465, -0.058960456401109695, -0.05541037395596504, -0.05186029151082039, -0.04831020534038544, -0.044760122895240784, -0.04121004045009613, -0.03765995800495148, -0.034109875559806824, -0.030559789389371872, -0.02700970694422722, -0.023459624499082565, -0.019909540191292763, -0.01635945588350296, -0.012809373438358307, -0.009259290061891079, -0.005709206685423851, -0.002159123308956623, 0.0013909600675106049, 0.004941042512655258, 0.00849112682044506, 0.012041211128234863, 0.015591293573379517, 0.01914137601852417, 0.022691460326313972, 0.026241544634103775, 0.02979162707924843, 0.03334170952439308, 0.03689179569482803, 0.04044187813997269, 0.04399196058511734, 0.04754204303026199, 0.05109212547540665, 0.0546422116458416, 0.05819229409098625, 0.061742376536130905, 0.06529246270656586, 0.06884254515171051, 0.07239262759685516, 0.07594271004199982, 0.07949279248714447, 0.08304287493228912, 0.08659295737743378, 0.09014303982257843, 0.09369312971830368, 0.09724321216344833, 0.10079329460859299, 0.10434337705373764, 0.1078934594988823, 0.11144354194402695, 0.1149936318397522, 0.11854371428489685, 0.1220937967300415, 0.12564387917518616, 0.1291939616203308]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 10.0, 22.0, 32.0, 53.0, 122.0, 272.0, 648.0, 2028.0, 13411.0, 4172109.0, 3808.0, 1018.0, 407.0, 156.0, 79.0, 39.0, 17.0, 16.0, 8.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.095458984375, -0.09339284896850586, -0.09132671356201172, -0.08926057815551758, -0.08719444274902344, -0.0851283073425293, -0.08306217193603516, -0.08099603652954102, -0.07892990112304688, -0.07686376571655273, -0.0747976303100586, -0.07273149490356445, -0.07066535949707031, -0.06859922409057617, -0.06653308868408203, -0.06446695327758789, -0.06240081787109375, -0.06033468246459961, -0.05826854705810547, -0.05620241165161133, -0.05413627624511719, -0.05207014083862305, -0.050004005432128906, -0.047937870025634766, -0.045871734619140625, -0.043805599212646484, -0.041739463806152344, -0.0396733283996582, -0.03760719299316406, -0.03554105758666992, -0.03347492218017578, -0.03140878677368164, -0.0293426513671875, -0.02727651596069336, -0.02521038055419922, -0.023144245147705078, -0.021078109741210938, -0.019011974334716797, -0.016945838928222656, -0.014879703521728516, -0.012813568115234375, -0.010747432708740234, -0.008681297302246094, -0.006615161895751953, -0.0045490264892578125, -0.002482891082763672, -0.00041675567626953125, 0.0016493797302246094, 0.00371551513671875, 0.005781650543212891, 0.007847785949707031, 0.009913921356201172, 0.011980056762695312, 0.014046192169189453, 0.016112327575683594, 0.018178462982177734, 0.020244598388671875, 0.022310733795166016, 0.024376869201660156, 0.026443004608154297, 0.028509140014648438, 0.030575275421142578, 0.03264141082763672, 0.03470754623413086, 0.036773681640625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 13.0, 16.0, 35.0, 49.0, 92.0, 135.0, 165.0, 136.0, 146.0, 81.0, 53.0, 43.0, 17.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0153350830078125, -0.015001475811004639, -0.014667868614196777, -0.014334261417388916, -0.014000654220581055, -0.013667047023773193, -0.013333439826965332, -0.01299983263015747, -0.01266622543334961, -0.012332618236541748, -0.011999011039733887, -0.011665403842926025, -0.011331796646118164, -0.010998189449310303, -0.010664582252502441, -0.01033097505569458, -0.009997367858886719, -0.009663760662078857, -0.009330153465270996, -0.008996546268463135, -0.008662939071655273, -0.008329331874847412, -0.00799572467803955, -0.0076621174812316895, -0.007328510284423828, -0.006994903087615967, -0.0066612958908081055, -0.006327688694000244, -0.005994081497192383, -0.0056604743003845215, -0.00532686710357666, -0.004993259906768799, -0.0046596527099609375, -0.004326045513153076, -0.003992438316345215, -0.0036588311195373535, -0.003325223922729492, -0.002991616725921631, -0.0026580095291137695, -0.002324402332305908, -0.001990795135498047, -0.0016571879386901855, -0.0013235807418823242, -0.0009899735450744629, -0.0006563663482666016, -0.00032275915145874023, 1.0848045349121094e-05, 0.0003444552421569824, 0.0006780624389648438, 0.001011669635772705, 0.0013452768325805664, 0.0016788840293884277, 0.002012491226196289, 0.0023460984230041504, 0.0026797056198120117, 0.003013312816619873, 0.0033469200134277344, 0.0036805272102355957, 0.004014134407043457, 0.004347741603851318, 0.00468134880065918, 0.005014955997467041, 0.005348563194274902, 0.005682170391082764, 0.006015777587890625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 6.0, 4.0, 8.0, 11.0, 11.0, 9.0, 13.0, 16.0, 27.0, 28.0, 37.0, 45.0, 70.0, 162.0, 269.0, 570.0, 1055.0, 2129.0, 5006.0, 20478.0, 4140119.0, 15628.0, 4400.0, 2005.0, 978.0, 487.0, 249.0, 147.0, 79.0, 58.0, 43.0, 20.0, 22.0, 11.0, 17.0, 7.0, 17.0, 9.0, 5.0, 1.0, 6.0, 2.0, 7.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0], "bins": [-0.043853759765625, -0.04261636734008789, -0.04137897491455078, -0.04014158248901367, -0.03890419006347656, -0.03766679763793945, -0.036429405212402344, -0.035192012786865234, -0.033954620361328125, -0.032717227935791016, -0.031479835510253906, -0.030242443084716797, -0.029005050659179688, -0.027767658233642578, -0.02653026580810547, -0.02529287338256836, -0.02405548095703125, -0.02281808853149414, -0.02158069610595703, -0.020343303680419922, -0.019105911254882812, -0.017868518829345703, -0.016631126403808594, -0.015393733978271484, -0.014156341552734375, -0.012918949127197266, -0.011681556701660156, -0.010444164276123047, -0.009206771850585938, -0.007969379425048828, -0.006731986999511719, -0.005494594573974609, -0.0042572021484375, -0.0030198097229003906, -0.0017824172973632812, -0.0005450248718261719, 0.0006923675537109375, 0.0019297599792480469, 0.0031671524047851562, 0.004404544830322266, 0.005641937255859375, 0.006879329681396484, 0.008116722106933594, 0.009354114532470703, 0.010591506958007812, 0.011828899383544922, 0.013066291809082031, 0.01430368423461914, 0.01554107666015625, 0.01677846908569336, 0.01801586151123047, 0.019253253936767578, 0.020490646362304688, 0.021728038787841797, 0.022965431213378906, 0.024202823638916016, 0.025440216064453125, 0.026677608489990234, 0.027915000915527344, 0.029152393341064453, 0.030389785766601562, 0.03162717819213867, 0.03286457061767578, 0.03410196304321289, 0.03533935546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 10.0, 14.0, 85.0, 3840.0, 78.0, 13.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00949859619140625, -0.009011626243591309, -0.008524656295776367, -0.008037686347961426, -0.007550716400146484, -0.007063746452331543, -0.0065767765045166016, -0.00608980655670166, -0.005602836608886719, -0.005115866661071777, -0.004628896713256836, -0.0041419267654418945, -0.003654956817626953, -0.0031679868698120117, -0.0026810169219970703, -0.002194046974182129, -0.0017070770263671875, -0.001220107078552246, -0.0007331371307373047, -0.0002461671829223633, 0.00024080276489257812, 0.0007277727127075195, 0.001214742660522461, 0.0017017126083374023, 0.0021886825561523438, 0.002675652503967285, 0.0031626224517822266, 0.003649592399597168, 0.004136562347412109, 0.004623532295227051, 0.005110502243041992, 0.005597472190856934, 0.006084442138671875, 0.006571412086486816, 0.007058382034301758, 0.007545351982116699, 0.00803232192993164, 0.008519291877746582, 0.009006261825561523, 0.009493231773376465, 0.009980201721191406, 0.010467171669006348, 0.010954141616821289, 0.01144111156463623, 0.011928081512451172, 0.012415051460266113, 0.012902021408081055, 0.013388991355895996, 0.013875961303710938, 0.014362931251525879, 0.01484990119934082, 0.015336871147155762, 0.015823841094970703, 0.016310811042785645, 0.016797780990600586, 0.017284750938415527, 0.01777172088623047, 0.01825869083404541, 0.01874566078186035, 0.019232630729675293, 0.019719600677490234, 0.020206570625305176, 0.020693540573120117, 0.02118051052093506, 0.02166748046875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 4.0, 11.0, 14.0, 19.0, 18.0, 23.0, 37.0, 66.0, 78.0, 119.0, 236.0, 112.0, 76.0, 40.0, 33.0, 20.0, 31.0, 22.0, 5.0, 4.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.03700931370258331, -0.03596419841051102, -0.03491908311843872, -0.03387397155165672, -0.03282885625958443, -0.03178374096751213, -0.030738625675439835, -0.029693512246012688, -0.02864839881658554, -0.027603283524513245, -0.026558170095086098, -0.0255130548030138, -0.024467941373586655, -0.02342282608151436, -0.022377710789442062, -0.021332597360014915, -0.02028748206794262, -0.019242366775870323, -0.018197253346443176, -0.01715213805437088, -0.016107024624943733, -0.015061909332871437, -0.014016794972121716, -0.012971680611371994, -0.011926566250622272, -0.010881451889872551, -0.00983633752912283, -0.008791223168373108, -0.007746108341962099, -0.0067009939812123775, -0.005655879154801369, -0.004610764794051647, -0.003565652295947075, -0.0025205379351973534, -0.0014754233416169882, -0.000430308748036623, 0.0006148056127130985, 0.00165991997346282, 0.002705034799873829, 0.0037501491606235504, 0.004795263521373272, 0.0058403778821229935, 0.006885492242872715, 0.007930606603622437, 0.008975721895694733, 0.01002083532512188, 0.011065950617194176, 0.012111064977943897, 0.013156179338693619, 0.01420129369944334, 0.015246408060193062, 0.016291523352265358, 0.017336636781692505, 0.0183817520737648, 0.019426867365837097, 0.020471980795264244, 0.02151709422469139, 0.022562209516763687, 0.023607322946190834, 0.02465243823826313, 0.025697551667690277, 0.026742666959762573, 0.02778778225183487, 0.028832895681262016, 0.029878010973334312]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 4.0, 7.0, 12.0, 11.0, 14.0, 18.0, 13.0, 21.0, 24.0, 18.0, 33.0, 33.0, 31.0, 25.0, 42.0, 53.0, 33.0, 40.0, 35.0, 35.0, 44.0, 32.0, 45.0, 34.0, 36.0, 38.0, 35.0, 34.0, 24.0, 22.0, 24.0, 27.0, 19.0, 13.0, 11.0, 9.0, 11.0, 9.0, 9.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.017805039882659912, -0.017306458204984665, -0.016807876527309418, -0.01630929484963417, -0.015810713171958923, -0.015312131494283676, -0.014813549816608429, -0.014314968138933182, -0.013816386461257935, -0.013317804783582687, -0.01281922310590744, -0.012320641428232193, -0.011822059750556946, -0.011323478072881699, -0.010824896395206451, -0.010326314717531204, -0.009827733039855957, -0.00932915136218071, -0.008830569684505463, -0.008331988006830215, -0.007833406329154968, -0.007334824651479721, -0.006836242973804474, -0.006337661296129227, -0.0058390796184539795, -0.005340497940778732, -0.004841916263103485, -0.004343334585428238, -0.0038447529077529907, -0.0033461712300777435, -0.0028475895524024963, -0.002349007874727249, -0.001850426197052002, -0.0013518445193767548, -0.0008532628417015076, -0.0003546811640262604, 0.00014390051364898682, 0.000642482191324234, 0.0011410638689994812, 0.0016396455466747284, 0.0021382272243499756, 0.0026368089020252228, 0.00313539057970047, 0.003633972257375717, 0.004132553935050964, 0.0046311356127262115, 0.005129717290401459, 0.005628298968076706, 0.006126880645751953, 0.0066254623234272, 0.0071240440011024475, 0.007622625678777695, 0.008121207356452942, 0.008619789034128189, 0.009118370711803436, 0.009616952389478683, 0.01011553406715393, 0.010614115744829178, 0.011112697422504425, 0.011611279100179672, 0.01210986077785492, 0.012608442455530167, 0.013107024133205414, 0.013605605810880661, 0.014104187488555908]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 5.0, 6.0, 13.0, 14.0, 8.0, 6.0, 12.0, 20.0, 28.0, 40.0, 31.0, 50.0, 84.0, 149.0, 293.0, 711.0, 2137.0, 8592.0, 49654.0, 704470.0, 248186.0, 26176.0, 5267.0, 1428.0, 509.0, 223.0, 141.0, 78.0, 50.0, 31.0, 29.0, 22.0, 11.0, 16.0, 13.0, 9.0, 8.0, 8.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06402587890625, -0.06201457977294922, -0.06000328063964844, -0.057991981506347656, -0.055980682373046875, -0.053969383239746094, -0.05195808410644531, -0.04994678497314453, -0.04793548583984375, -0.04592418670654297, -0.04391288757324219, -0.041901588439941406, -0.039890289306640625, -0.037878990173339844, -0.03586769104003906, -0.03385639190673828, -0.0318450927734375, -0.02983379364013672, -0.027822494506835938, -0.025811195373535156, -0.023799896240234375, -0.021788597106933594, -0.019777297973632812, -0.01776599884033203, -0.01575469970703125, -0.013743400573730469, -0.011732101440429688, -0.009720802307128906, -0.007709503173828125, -0.005698204040527344, -0.0036869049072265625, -0.0016756057739257812, 0.000335693359375, 0.0023469924926757812, 0.0043582916259765625, 0.006369590759277344, 0.008380889892578125, 0.010392189025878906, 0.012403488159179688, 0.014414787292480469, 0.01642608642578125, 0.01843738555908203, 0.020448684692382812, 0.022459983825683594, 0.024471282958984375, 0.026482582092285156, 0.028493881225585938, 0.03050518035888672, 0.0325164794921875, 0.03452777862548828, 0.03653907775878906, 0.038550376892089844, 0.040561676025390625, 0.042572975158691406, 0.04458427429199219, 0.04659557342529297, 0.04860687255859375, 0.05061817169189453, 0.05262947082519531, 0.054640769958496094, 0.056652069091796875, 0.058663368225097656, 0.06067466735839844, 0.06268596649169922, 0.064697265625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 14.0, 15.0, 33.0, 56.0, 95.0, 132.0, 164.0, 147.0, 134.0, 80.0, 57.0, 40.0, 14.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.015289306640625, -0.014956295490264893, -0.014623284339904785, -0.014290273189544678, -0.01395726203918457, -0.013624250888824463, -0.013291239738464355, -0.012958228588104248, -0.01262521743774414, -0.012292206287384033, -0.011959195137023926, -0.011626183986663818, -0.011293172836303711, -0.010960161685943604, -0.010627150535583496, -0.010294139385223389, -0.009961128234863281, -0.009628117084503174, -0.009295105934143066, -0.008962094783782959, -0.008629083633422852, -0.008296072483062744, -0.007963061332702637, -0.007630050182342529, -0.007297039031982422, -0.0069640278816223145, -0.006631016731262207, -0.0062980055809021, -0.005964994430541992, -0.005631983280181885, -0.005298972129821777, -0.00496596097946167, -0.0046329498291015625, -0.004299938678741455, -0.003966927528381348, -0.0036339163780212402, -0.003300905227661133, -0.0029678940773010254, -0.002634882926940918, -0.0023018717765808105, -0.001968860626220703, -0.0016358494758605957, -0.0013028383255004883, -0.0009698271751403809, -0.0006368160247802734, -0.000303804874420166, 2.9206275939941406e-05, 0.00036221742630004883, 0.0006952285766601562, 0.0010282397270202637, 0.001361250877380371, 0.0016942620277404785, 0.002027273178100586, 0.0023602843284606934, 0.0026932954788208008, 0.003026306629180908, 0.0033593177795410156, 0.003692328929901123, 0.0040253400802612305, 0.004358351230621338, 0.004691362380981445, 0.005024373531341553, 0.00535738468170166, 0.005690395832061768, 0.006023406982421875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 11.0, 2.0, 8.0, 16.0, 23.0, 57.0, 52.0, 84.0, 182.0, 342.0, 692.0, 1217.0, 2533.0, 5101.0, 10876.0, 24884.0, 61214.0, 177679.0, 529174.0, 143136.0, 51588.0, 21100.0, 9539.0, 4374.0, 2185.0, 1126.0, 591.0, 290.0, 153.0, 119.0, 71.0, 42.0, 33.0, 23.0, 12.0, 4.0, 4.0, 8.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0251617431640625, -0.02436065673828125, -0.0235595703125, -0.02275848388671875, -0.0219573974609375, -0.02115631103515625, -0.020355224609375, -0.01955413818359375, -0.0187530517578125, -0.01795196533203125, -0.01715087890625, -0.01634979248046875, -0.0155487060546875, -0.01474761962890625, -0.013946533203125, -0.01314544677734375, -0.0123443603515625, -0.01154327392578125, -0.0107421875, -0.00994110107421875, -0.0091400146484375, -0.00833892822265625, -0.007537841796875, -0.00673675537109375, -0.0059356689453125, -0.00513458251953125, -0.00433349609375, -0.00353240966796875, -0.0027313232421875, -0.00193023681640625, -0.001129150390625, -0.00032806396484375, 0.0004730224609375, 0.00127410888671875, 0.0020751953125, 0.00287628173828125, 0.0036773681640625, 0.00447845458984375, 0.005279541015625, 0.00608062744140625, 0.0068817138671875, 0.00768280029296875, 0.00848388671875, 0.00928497314453125, 0.0100860595703125, 0.01088714599609375, 0.011688232421875, 0.01248931884765625, 0.0132904052734375, 0.01409149169921875, 0.014892578125, 0.01569366455078125, 0.0164947509765625, 0.01729583740234375, 0.018096923828125, 0.01889801025390625, 0.0196990966796875, 0.02050018310546875, 0.02130126953125, 0.02210235595703125, 0.0229034423828125, 0.02370452880859375, 0.024505615234375, 0.02530670166015625, 0.0261077880859375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 2.0, 11.0, 15.0, 9.0, 10.0, 17.0, 24.0, 19.0, 32.0, 20.0, 33.0, 43.0, 38.0, 45.0, 51.0, 41.0, 66.0, 49.0, 51.0, 45.0, 51.0, 44.0, 43.0, 35.0, 39.0, 40.0, 28.0, 22.0, 16.0, 11.0, 9.0, 9.0, 9.0, 4.0, 1.0, 5.0, 9.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0201568603515625, -0.01953864097595215, -0.018920421600341797, -0.018302202224731445, -0.017683982849121094, -0.017065763473510742, -0.01644754409790039, -0.01582932472229004, -0.015211105346679688, -0.014592885971069336, -0.013974666595458984, -0.013356447219848633, -0.012738227844238281, -0.01212000846862793, -0.011501789093017578, -0.010883569717407227, -0.010265350341796875, -0.009647130966186523, -0.009028911590576172, -0.00841069221496582, -0.007792472839355469, -0.007174253463745117, -0.006556034088134766, -0.005937814712524414, -0.0053195953369140625, -0.004701375961303711, -0.004083156585693359, -0.003464937210083008, -0.0028467178344726562, -0.0022284984588623047, -0.0016102790832519531, -0.0009920597076416016, -0.00037384033203125, 0.00024437904357910156, 0.0008625984191894531, 0.0014808177947998047, 0.0020990371704101562, 0.002717256546020508, 0.0033354759216308594, 0.003953695297241211, 0.0045719146728515625, 0.005190134048461914, 0.005808353424072266, 0.006426572799682617, 0.007044792175292969, 0.00766301155090332, 0.008281230926513672, 0.008899450302124023, 0.009517669677734375, 0.010135889053344727, 0.010754108428955078, 0.01137232780456543, 0.011990547180175781, 0.012608766555786133, 0.013226985931396484, 0.013845205307006836, 0.014463424682617188, 0.015081644058227539, 0.01569986343383789, 0.016318082809448242, 0.016936302185058594, 0.017554521560668945, 0.018172740936279297, 0.01879096031188965, 0.0194091796875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 10.0, 11.0, 24.0, 32.0, 66.0, 108.0, 197.0, 340.0, 728.0, 1495.0, 3532.0, 9364.0, 30597.0, 183959.0, 720734.0, 69993.0, 16986.0, 5812.0, 2364.0, 1069.0, 479.0, 254.0, 159.0, 71.0, 60.0, 36.0, 22.0, 13.0, 9.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003070831298828125, -0.00029582157731056213, -0.00028456002473831177, -0.0002732984721660614, -0.00026203691959381104, -0.00025077536702156067, -0.0002395138144493103, -0.00022825226187705994, -0.00021699070930480957, -0.0002057291567325592, -0.00019446760416030884, -0.00018320605158805847, -0.0001719444990158081, -0.00016068294644355774, -0.00014942139387130737, -0.000138159841299057, -0.00012689828872680664, -0.00011563673615455627, -0.00010437518358230591, -9.311363101005554e-05, -8.185207843780518e-05, -7.059052586555481e-05, -5.932897329330444e-05, -4.806742072105408e-05, -3.680586814880371e-05, -2.5544315576553345e-05, -1.4282763004302979e-05, -3.0212104320526123e-06, 8.240342140197754e-06, 1.950189471244812e-05, 3.0763447284698486e-05, 4.202499985694885e-05, 5.328655242919922e-05, 6.454810500144958e-05, 7.580965757369995e-05, 8.707121014595032e-05, 9.833276271820068e-05, 0.00010959431529045105, 0.00012085586786270142, 0.00013211742043495178, 0.00014337897300720215, 0.00015464052557945251, 0.00016590207815170288, 0.00017716363072395325, 0.0001884251832962036, 0.00019968673586845398, 0.00021094828844070435, 0.0002222098410129547, 0.00023347139358520508, 0.00024473294615745544, 0.0002559944987297058, 0.0002672560513019562, 0.00027851760387420654, 0.0002897791564464569, 0.0003010407090187073, 0.00031230226159095764, 0.000323563814163208, 0.0003348253667354584, 0.00034608691930770874, 0.0003573484718799591, 0.00036861002445220947, 0.00037987157702445984, 0.0003911331295967102, 0.00040239468216896057, 0.00041365623474121094]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 5.0, 1.0, 7.0, 7.0, 7.0, 7.0, 7.0, 11.0, 16.0, 15.0, 20.0, 17.0, 13.0, 15.0, 36.0, 45.0, 46.0, 65.0, 113.0, 114.0, 101.0, 72.0, 39.0, 43.0, 33.0, 23.0, 15.0, 15.0, 22.0, 12.0, 8.0, 17.0, 7.0, 8.0, 4.0, 8.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.0934810638427734e-05, -3.0083581805229187e-05, -2.923235297203064e-05, -2.8381124138832092e-05, -2.7529895305633545e-05, -2.6678666472434998e-05, -2.582743763923645e-05, -2.4976208806037903e-05, -2.4124979972839355e-05, -2.3273751139640808e-05, -2.242252230644226e-05, -2.1571293473243713e-05, -2.0720064640045166e-05, -1.986883580684662e-05, -1.901760697364807e-05, -1.8166378140449524e-05, -1.7315149307250977e-05, -1.646392047405243e-05, -1.5612691640853882e-05, -1.4761462807655334e-05, -1.3910233974456787e-05, -1.305900514125824e-05, -1.2207776308059692e-05, -1.1356547474861145e-05, -1.0505318641662598e-05, -9.65408980846405e-06, -8.802860975265503e-06, -7.951632142066956e-06, -7.100403308868408e-06, -6.249174475669861e-06, -5.3979456424713135e-06, -4.546716809272766e-06, -3.6954879760742188e-06, -2.8442591428756714e-06, -1.993030309677124e-06, -1.1418014764785767e-06, -2.905726432800293e-07, 5.606561899185181e-07, 1.4118850231170654e-06, 2.263113856315613e-06, 3.11434268951416e-06, 3.9655715227127075e-06, 4.816800355911255e-06, 5.668029189109802e-06, 6.51925802230835e-06, 7.370486855506897e-06, 8.221715688705444e-06, 9.072944521903992e-06, 9.924173355102539e-06, 1.0775402188301086e-05, 1.1626631021499634e-05, 1.2477859854698181e-05, 1.3329088687896729e-05, 1.4180317521095276e-05, 1.5031546354293823e-05, 1.588277518749237e-05, 1.6734004020690918e-05, 1.7585232853889465e-05, 1.8436461687088013e-05, 1.928769052028656e-05, 2.0138919353485107e-05, 2.0990148186683655e-05, 2.1841377019882202e-05, 2.269260585308075e-05, 2.3543834686279297e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 9.0, 14.0, 12.0, 15.0, 24.0, 58.0, 79.0, 161.0, 212.0, 342.0, 705.0, 1503.0, 3169.0, 7403.0, 19202.0, 62978.0, 480768.0, 382358.0, 58254.0, 18357.0, 6954.0, 2926.0, 1388.0, 743.0, 375.0, 201.0, 138.0, 69.0, 41.0, 21.0, 21.0, 15.0, 15.0, 10.0, 9.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019693374633789062, -0.0001887194812297821, -0.00018050521612167358, -0.00017229095101356506, -0.00016407668590545654, -0.00015586242079734802, -0.0001476481556892395, -0.00013943389058113098, -0.00013121962547302246, -0.00012300536036491394, -0.00011479109525680542, -0.0001065768301486969, -9.836256504058838e-05, -9.014829993247986e-05, -8.193403482437134e-05, -7.371976971626282e-05, -6.55055046081543e-05, -5.7291239500045776e-05, -4.9076974391937256e-05, -4.0862709283828735e-05, -3.2648444175720215e-05, -2.4434179067611694e-05, -1.6219913959503174e-05, -8.005648851394653e-06, 2.086162567138672e-07, 8.422881364822388e-06, 1.6637146472930908e-05, 2.485141158103943e-05, 3.306567668914795e-05, 4.127994179725647e-05, 4.949420690536499e-05, 5.770847201347351e-05, 6.592273712158203e-05, 7.413700222969055e-05, 8.235126733779907e-05, 9.056553244590759e-05, 9.877979755401611e-05, 0.00010699406266212463, 0.00011520832777023315, 0.00012342259287834167, 0.0001316368579864502, 0.00013985112309455872, 0.00014806538820266724, 0.00015627965331077576, 0.00016449391841888428, 0.0001727081835269928, 0.00018092244863510132, 0.00018913671374320984, 0.00019735097885131836, 0.00020556524395942688, 0.0002137795090675354, 0.00022199377417564392, 0.00023020803928375244, 0.00023842230439186096, 0.0002466365694999695, 0.000254850834608078, 0.0002630650997161865, 0.00027127936482429504, 0.00027949362993240356, 0.0002877078950405121, 0.0002959221601486206, 0.0003041364252567291, 0.00031235069036483765, 0.00032056495547294617, 0.0003287792205810547]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 6.0, 1.0, 4.0, 9.0, 20.0, 19.0, 20.0, 24.0, 35.0, 42.0, 44.0, 57.0, 83.0, 85.0, 95.0, 83.0, 83.0, 66.0, 46.0, 37.0, 32.0, 25.0, 11.0, 15.0, 11.0, 8.0, 13.0, 4.0, 7.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.0002536773681640625, -0.00024774298071861267, -0.00024180859327316284, -0.000235874205827713, -0.00022993981838226318, -0.00022400543093681335, -0.00021807104349136353, -0.0002121366560459137, -0.00020620226860046387, -0.00020026788115501404, -0.0001943334937095642, -0.00018839910626411438, -0.00018246471881866455, -0.00017653033137321472, -0.0001705959439277649, -0.00016466155648231506, -0.00015872716903686523, -0.0001527927815914154, -0.00014685839414596558, -0.00014092400670051575, -0.00013498961925506592, -0.0001290552318096161, -0.00012312084436416626, -0.00011718645691871643, -0.0001112520694732666, -0.00010531768202781677, -9.938329458236694e-05, -9.344890713691711e-05, -8.751451969146729e-05, -8.158013224601746e-05, -7.564574480056763e-05, -6.97113573551178e-05, -6.377696990966797e-05, -5.784258246421814e-05, -5.190819501876831e-05, -4.597380757331848e-05, -4.003942012786865e-05, -3.410503268241882e-05, -2.8170645236968994e-05, -2.2236257791519165e-05, -1.6301870346069336e-05, -1.0367482900619507e-05, -4.433095455169678e-06, 1.5012919902801514e-06, 7.4356794357299805e-06, 1.337006688117981e-05, 1.930445432662964e-05, 2.5238841772079468e-05, 3.11732292175293e-05, 3.7107616662979126e-05, 4.3042004108428955e-05, 4.8976391553878784e-05, 5.491077899932861e-05, 6.084516644477844e-05, 6.677955389022827e-05, 7.27139413356781e-05, 7.864832878112793e-05, 8.458271622657776e-05, 9.051710367202759e-05, 9.645149111747742e-05, 0.00010238587856292725, 0.00010832026600837708, 0.0001142546534538269, 0.00012018904089927673, 0.00012612342834472656]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 2.0, 7.0, 5.0, 9.0, 9.0, 14.0, 16.0, 27.0, 25.0, 49.0, 50.0, 79.0, 120.0, 166.0, 74.0, 62.0, 48.0, 41.0, 34.0, 30.0, 26.0, 21.0, 13.0, 11.0, 6.0, 7.0, 8.0, 4.0, 4.0, 4.0, 4.0, 0.0, 5.0, 2.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.06922060251235962, -0.0657728835940361, -0.062325168401002884, -0.058877453207969666, -0.05542973801493645, -0.05198202282190323, -0.04853430390357971, -0.045086588710546494, -0.041638873517513275, -0.03819115832448006, -0.03474343940615654, -0.03129572421312332, -0.027848009020090103, -0.024400291964411736, -0.020952574908733368, -0.01750485971570015, -0.014057140797376633, -0.01060942467302084, -0.007161708083003759, -0.003713991492986679, -0.0002662753686308861, 0.003181440755724907, 0.0066291578114032745, 0.010076873004436493, 0.01352459006011486, 0.016972307115793228, 0.020420022308826447, 0.023867739364504814, 0.027315456420183182, 0.0307631716132164, 0.03421089053153992, 0.03765860199928284, 0.041106320917606354, 0.04455403611063957, 0.04800175502896309, 0.05144947022199631, 0.054897185415029526, 0.058344900608062744, 0.06179261952638626, 0.06524033844470978, 0.0686880499124527, 0.07213576883077621, 0.07558348029851913, 0.07903119921684265, 0.08247891813516617, 0.08592662960290909, 0.0893743485212326, 0.09282205998897552, 0.09626978635787964, 0.09971750527620316, 0.10316521674394608, 0.10661293566226959, 0.11006065458059311, 0.11350836604833603, 0.11695608496665955, 0.12040379643440247, 0.12385151535272598, 0.1272992342710495, 0.13074694573879242, 0.13419467210769653, 0.13764238357543945, 0.14109009504318237, 0.1445378065109253, 0.1479855328798294, 0.15143324434757233]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 8.0, 12.0, 6.0, 9.0, 12.0, 8.0, 17.0, 17.0, 27.0, 23.0, 26.0, 40.0, 37.0, 48.0, 39.0, 48.0, 53.0, 53.0, 68.0, 45.0, 46.0, 43.0, 44.0, 41.0, 25.0, 27.0, 33.0, 19.0, 24.0, 18.0, 21.0, 16.0, 14.0, 13.0, 9.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.10321676731109619, -0.10011403262615204, -0.09701129794120789, -0.09390856325626373, -0.09080582857131958, -0.08770310133695602, -0.08460036665201187, -0.08149763196706772, -0.07839489728212357, -0.07529216259717941, -0.07218942791223526, -0.06908669322729111, -0.06598396599292755, -0.0628812313079834, -0.059778496623039246, -0.05667576193809509, -0.05357302725315094, -0.05047029256820679, -0.047367557883262634, -0.04426482692360878, -0.04116209223866463, -0.038059357553720474, -0.03495662659406662, -0.03185389190912247, -0.028751157224178314, -0.02564842253923416, -0.022545689716935158, -0.019442956894636154, -0.016340222209692, -0.013237488456070423, -0.010134754702448845, -0.007032021880149841, -0.0039292871952056885, -0.0008265534415841103, 0.002276180312037468, 0.005378914065659046, 0.008481647819280624, 0.011584381572902203, 0.01468711532652378, 0.017789848148822784, 0.020892582833766937, 0.02399531751871109, 0.027098050341010094, 0.030200783163309097, 0.03330351784825325, 0.0364062525331974, 0.03950898349285126, 0.04261171817779541, 0.04571445286273956, 0.048817187547683716, 0.05191992223262787, 0.05502265319228172, 0.058125387877225876, 0.06122812256217003, 0.06433085352182388, 0.06743358820676804, 0.07053632289171219, 0.07363905757665634, 0.0767417922616005, 0.07984452694654465, 0.0829472541809082, 0.08604998886585236, 0.08915272355079651, 0.09225545823574066, 0.09535819292068481]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 15.0, 23.0, 39.0, 73.0, 115.0, 208.0, 446.0, 4192303.0, 502.0, 245.0, 129.0, 89.0, 46.0, 21.0, 9.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.08258056640625, -0.08076810836791992, -0.07895565032958984, -0.07714319229125977, -0.07533073425292969, -0.07351827621459961, -0.07170581817626953, -0.06989336013793945, -0.06808090209960938, -0.0662684440612793, -0.06445598602294922, -0.06264352798461914, -0.06083106994628906, -0.059018611907958984, -0.057206153869628906, -0.05539369583129883, -0.05358123779296875, -0.05176877975463867, -0.049956321716308594, -0.048143863677978516, -0.04633140563964844, -0.04451894760131836, -0.04270648956298828, -0.0408940315246582, -0.039081573486328125, -0.03726911544799805, -0.03545665740966797, -0.03364419937133789, -0.03183174133300781, -0.030019283294677734, -0.028206825256347656, -0.026394367218017578, -0.0245819091796875, -0.022769451141357422, -0.020956993103027344, -0.019144535064697266, -0.017332077026367188, -0.01551961898803711, -0.013707160949707031, -0.011894702911376953, -0.010082244873046875, -0.008269786834716797, -0.006457328796386719, -0.004644870758056641, -0.0028324127197265625, -0.0010199546813964844, 0.0007925033569335938, 0.002604961395263672, 0.00441741943359375, 0.006229877471923828, 0.008042335510253906, 0.009854793548583984, 0.011667251586914062, 0.01347970962524414, 0.015292167663574219, 0.017104625701904297, 0.018917083740234375, 0.020729541778564453, 0.02254199981689453, 0.02435445785522461, 0.026166915893554688, 0.027979373931884766, 0.029791831970214844, 0.03160429000854492, 0.033416748046875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 9.0, 15.0, 26.0, 48.0, 61.0, 116.0, 156.0, 144.0, 154.0, 112.0, 54.0, 55.0, 24.0, 15.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01470947265625, -0.014385521411895752, -0.014061570167541504, -0.013737618923187256, -0.013413667678833008, -0.01308971643447876, -0.012765765190124512, -0.012441813945770264, -0.012117862701416016, -0.011793911457061768, -0.01146996021270752, -0.011146008968353271, -0.010822057723999023, -0.010498106479644775, -0.010174155235290527, -0.00985020399093628, -0.009526252746582031, -0.009202301502227783, -0.008878350257873535, -0.008554399013519287, -0.008230447769165039, -0.007906496524810791, -0.007582545280456543, -0.007258594036102295, -0.006934642791748047, -0.006610691547393799, -0.006286740303039551, -0.005962789058685303, -0.005638837814331055, -0.005314886569976807, -0.004990935325622559, -0.0046669840812683105, -0.0043430328369140625, -0.0040190815925598145, -0.0036951303482055664, -0.0033711791038513184, -0.0030472278594970703, -0.0027232766151428223, -0.0023993253707885742, -0.002075374126434326, -0.0017514228820800781, -0.00142747163772583, -0.001103520393371582, -0.000779569149017334, -0.00045561790466308594, -0.0001316666603088379, 0.00019228458404541016, 0.0005162358283996582, 0.0008401870727539062, 0.0011641383171081543, 0.0014880895614624023, 0.0018120408058166504, 0.0021359920501708984, 0.0024599432945251465, 0.0027838945388793945, 0.0031078457832336426, 0.0034317970275878906, 0.0037557482719421387, 0.004079699516296387, 0.004403650760650635, 0.004727602005004883, 0.005051553249359131, 0.005375504493713379, 0.005699455738067627, 0.006023406982421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 9.0, 10.0, 8.0, 19.0, 15.0, 21.0, 26.0, 19.0, 28.0, 38.0, 47.0, 72.0, 72.0, 91.0, 106.0, 177.0, 254.0, 565.0, 2820.0, 4188066.0, 755.0, 310.0, 184.0, 121.0, 88.0, 61.0, 64.0, 41.0, 34.0, 36.0, 25.0, 23.0, 11.0, 17.0, 10.0, 15.0, 3.0, 2.0, 3.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00641632080078125, -0.006216764450073242, -0.006017208099365234, -0.0058176517486572266, -0.005618095397949219, -0.005418539047241211, -0.005218982696533203, -0.005019426345825195, -0.0048198699951171875, -0.00462031364440918, -0.004420757293701172, -0.004221200942993164, -0.004021644592285156, -0.0038220882415771484, -0.0036225318908691406, -0.003422975540161133, -0.003223419189453125, -0.003023862838745117, -0.0028243064880371094, -0.0026247501373291016, -0.0024251937866210938, -0.002225637435913086, -0.002026081085205078, -0.0018265247344970703, -0.0016269683837890625, -0.0014274120330810547, -0.0012278556823730469, -0.001028299331665039, -0.0008287429809570312, -0.0006291866302490234, -0.0004296302795410156, -0.0002300739288330078, -3.0517578125e-05, 0.0001690387725830078, 0.0003685951232910156, 0.0005681514739990234, 0.0007677078247070312, 0.0009672641754150391, 0.0011668205261230469, 0.0013663768768310547, 0.0015659332275390625, 0.0017654895782470703, 0.001965045928955078, 0.002164602279663086, 0.0023641586303710938, 0.0025637149810791016, 0.0027632713317871094, 0.002962827682495117, 0.003162384033203125, 0.003361940383911133, 0.0035614967346191406, 0.0037610530853271484, 0.003960609436035156, 0.004160165786743164, 0.004359722137451172, 0.00455927848815918, 0.0047588348388671875, 0.004958391189575195, 0.005157947540283203, 0.005357503890991211, 0.005557060241699219, 0.0057566165924072266, 0.005956172943115234, 0.006155729293823242, 0.00635528564453125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4084.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013742446899414062, -0.0013476237654685974, -0.0013210028409957886, -0.0012943819165229797, -0.001267760992050171, -0.001241140067577362, -0.0012145191431045532, -0.0011878982186317444, -0.0011612772941589355, -0.0011346563696861267, -0.0011080354452133179, -0.001081414520740509, -0.0010547935962677002, -0.0010281726717948914, -0.0010015517473220825, -0.0009749308228492737, -0.0009483098983764648, -0.000921688973903656, -0.0008950680494308472, -0.0008684471249580383, -0.0008418262004852295, -0.0008152052760124207, -0.0007885843515396118, -0.000761963427066803, -0.0007353425025939941, -0.0007087215781211853, -0.0006821006536483765, -0.0006554797291755676, -0.0006288588047027588, -0.00060223788022995, -0.0005756169557571411, -0.0005489960312843323, -0.0005223751068115234, -0.0004957541823387146, -0.00046913325786590576, -0.0004425123333930969, -0.0004158914089202881, -0.00038927048444747925, -0.0003626495599746704, -0.00033602863550186157, -0.00030940771102905273, -0.0002827867865562439, -0.00025616586208343506, -0.00022954493761062622, -0.00020292401313781738, -0.00017630308866500854, -0.0001496821641921997, -0.00012306123971939087, -9.644031524658203e-05, -6.98193907737732e-05, -4.3198466300964355e-05, -1.6577541828155518e-05, 1.004338264465332e-05, 3.666430711746216e-05, 6.3285231590271e-05, 8.990615606307983e-05, 0.00011652708053588867, 0.0001431480050086975, 0.00016976892948150635, 0.00019638985395431519, 0.00022301077842712402, 0.00024963170289993286, 0.0002762526273727417, 0.00030287355184555054, 0.0003294944763183594]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 5.0, 2.0, 9.0, 10.0, 10.0, 13.0, 22.0, 31.0, 25.0, 42.0, 77.0, 132.0, 252.0, 125.0, 86.0, 41.0, 34.0, 30.0, 11.0, 10.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013026318047195673, -0.0012625500094145536, -0.00122246821410954, -0.0011823864188045263, -0.0011423046234995127, -0.001102222828194499, -0.0010621410328894854, -0.0010220592375844717, -0.000981977442279458, -0.0009418956469744444, -0.0009018138516694307, -0.0008617320563644171, -0.0008216502610594034, -0.0007815684657543898, -0.0007414866122417152, -0.0007014048169367015, -0.000661322963424027, -0.0006212411681190133, -0.0005811593728139997, -0.000541077577508986, -0.0005009957822039723, -0.0004609139577951282, -0.0004208321333862841, -0.00038075033808127046, -0.0003406685427762568, -0.00030058674747124314, -0.0002605049521662295, -0.00022042312775738537, -0.00018034133245237172, -0.00014025953714735806, -0.00010017772729042917, -6.009591743350029e-05, -2.0014005713164806e-05, 2.0067796867806464e-05, 6.0149599448777735e-05, 0.000100231402029749, 0.00014031320461072028, 0.00018039499991573393, 0.00022047680977266282, 0.0002605586196295917, 0.00030064041493460536, 0.000340722210239619, 0.0003808040055446327, 0.0004208858299534768, 0.00046096762525849044, 0.0005010494496673346, 0.0005411312449723482, 0.0005812130402773619, 0.0006212948355823755, 0.0006613766308873892, 0.0007014584261924028, 0.0007415402214974165, 0.0007816220168024302, 0.0008217038121074438, 0.0008617856656201184, 0.000901867460925132, 0.0009419492562301457, 0.0009820311097428203, 0.001022112905047834, 0.0010621947003528476, 0.0011022764956578612, 0.0011423582909628749, 0.0011824400862678885, 0.0012225218815729022, 0.0012626036768779159]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 6.0, 10.0, 13.0, 14.0, 15.0, 27.0, 33.0, 31.0, 32.0, 50.0, 28.0, 35.0, 45.0, 49.0, 59.0, 58.0, 62.0, 45.0, 49.0, 52.0, 40.0, 37.0, 41.0, 14.0, 22.0, 19.0, 25.0, 17.0, 12.0, 9.0, 11.0, 6.0, 8.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0007683038711547852, -0.000745994970202446, -0.0007236860692501068, -0.0007013771682977676, -0.0006790682673454285, -0.0006567593663930893, -0.0006344504654407501, -0.000612141564488411, -0.0005898326635360718, -0.0005675237625837326, -0.0005452148616313934, -0.0005229059606790543, -0.0005005970597267151, -0.0004782881587743759, -0.00045597925782203674, -0.00043367035686969757, -0.0004113614559173584, -0.0003890525549650192, -0.00036674365401268005, -0.0003444347530603409, -0.0003221258521080017, -0.00029981695115566254, -0.00027750805020332336, -0.0002551991492509842, -0.00023289024829864502, -0.00021058134734630585, -0.00018827244639396667, -0.0001659635454416275, -0.00014365464448928833, -0.00012134574353694916, -9.903684258460999e-05, -7.672794163227081e-05, -5.441904067993164e-05, -3.211013972759247e-05, -9.801238775253296e-06, 1.2507662177085876e-05, 3.481656312942505e-05, 5.712546408176422e-05, 7.94343650341034e-05, 0.00010174326598644257, 0.00012405216693878174, 0.0001463610678911209, 0.00016866996884346008, 0.00019097886979579926, 0.00021328777074813843, 0.0002355966717004776, 0.00025790557265281677, 0.00028021447360515594, 0.0003025233745574951, 0.0003248322755098343, 0.00034714117646217346, 0.00036945007741451263, 0.0003917589783668518, 0.000414067879319191, 0.00043637678027153015, 0.0004586856812238693, 0.0004809945821762085, 0.0005033034831285477, 0.0005256123840808868, 0.000547921285033226, 0.0005702301859855652, 0.0005925390869379044, 0.0006148479878902435, 0.0006371568888425827, 0.0006594657897949219]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 4.0, 3.0, 7.0, 15.0, 10.0, 16.0, 17.0, 19.0, 19.0, 44.0, 44.0, 52.0, 72.0, 127.0, 248.0, 564.0, 1369.0, 4366.0, 17615.0, 102174.0, 764607.0, 128539.0, 20725.0, 4978.0, 1541.0, 590.0, 268.0, 145.0, 85.0, 63.0, 43.0, 34.0, 26.0, 24.0, 19.0, 10.0, 10.0, 11.0, 4.0, 6.0, 10.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.05377197265625, -0.0521693229675293, -0.050566673278808594, -0.04896402359008789, -0.04736137390136719, -0.045758724212646484, -0.04415607452392578, -0.04255342483520508, -0.040950775146484375, -0.03934812545776367, -0.03774547576904297, -0.036142826080322266, -0.03454017639160156, -0.03293752670288086, -0.031334877014160156, -0.029732227325439453, -0.02812957763671875, -0.026526927947998047, -0.024924278259277344, -0.02332162857055664, -0.021718978881835938, -0.020116329193115234, -0.01851367950439453, -0.016911029815673828, -0.015308380126953125, -0.013705730438232422, -0.012103080749511719, -0.010500431060791016, -0.008897781372070312, -0.007295131683349609, -0.005692481994628906, -0.004089832305908203, -0.0024871826171875, -0.0008845329284667969, 0.0007181167602539062, 0.0023207664489746094, 0.0039234161376953125, 0.005526065826416016, 0.007128715515136719, 0.008731365203857422, 0.010334014892578125, 0.011936664581298828, 0.013539314270019531, 0.015141963958740234, 0.016744613647460938, 0.01834726333618164, 0.019949913024902344, 0.021552562713623047, 0.02315521240234375, 0.024757862091064453, 0.026360511779785156, 0.02796316146850586, 0.029565811157226562, 0.031168460845947266, 0.03277111053466797, 0.03437376022338867, 0.035976409912109375, 0.03757905960083008, 0.03918170928955078, 0.040784358978271484, 0.04238700866699219, 0.04398965835571289, 0.045592308044433594, 0.0471949577331543, 0.048797607421875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 9.0, 15.0, 27.0, 47.0, 61.0, 117.0, 157.0, 144.0, 153.0, 111.0, 55.0, 53.0, 25.0, 15.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01470184326171875, -0.014378011226654053, -0.014054179191589355, -0.013730347156524658, -0.013406515121459961, -0.013082683086395264, -0.012758851051330566, -0.01243501901626587, -0.012111186981201172, -0.011787354946136475, -0.011463522911071777, -0.01113969087600708, -0.010815858840942383, -0.010492026805877686, -0.010168194770812988, -0.009844362735748291, -0.009520530700683594, -0.009196698665618896, -0.0088728666305542, -0.008549034595489502, -0.008225202560424805, -0.007901370525360107, -0.00757753849029541, -0.007253706455230713, -0.006929874420166016, -0.006606042385101318, -0.006282210350036621, -0.005958378314971924, -0.0056345462799072266, -0.005310714244842529, -0.004986882209777832, -0.004663050174713135, -0.0043392181396484375, -0.00401538610458374, -0.003691554069519043, -0.0033677220344543457, -0.0030438899993896484, -0.002720057964324951, -0.002396225929260254, -0.0020723938941955566, -0.0017485618591308594, -0.0014247298240661621, -0.0011008977890014648, -0.0007770657539367676, -0.0004532337188720703, -0.00012940168380737305, 0.00019443035125732422, 0.0005182623863220215, 0.0008420944213867188, 0.001165926456451416, 0.0014897584915161133, 0.0018135905265808105, 0.002137422561645508, 0.002461254596710205, 0.0027850866317749023, 0.0031089186668395996, 0.003432750701904297, 0.003756582736968994, 0.004080414772033691, 0.004404246807098389, 0.004728078842163086, 0.005051910877227783, 0.0053757429122924805, 0.005699574947357178, 0.006023406982421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 6.0, 8.0, 7.0, 8.0, 14.0, 25.0, 22.0, 42.0, 66.0, 117.0, 231.0, 452.0, 989.0, 2147.0, 5119.0, 12595.0, 32997.0, 95336.0, 504491.0, 278019.0, 72425.0, 25877.0, 9967.0, 4140.0, 1802.0, 796.0, 386.0, 186.0, 90.0, 66.0, 30.0, 26.0, 17.0, 11.0, 14.0, 9.0, 2.0, 3.0, 5.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0281219482421875, -0.027315616607666016, -0.02650928497314453, -0.025702953338623047, -0.024896621704101562, -0.024090290069580078, -0.023283958435058594, -0.02247762680053711, -0.021671295166015625, -0.02086496353149414, -0.020058631896972656, -0.019252300262451172, -0.018445968627929688, -0.017639636993408203, -0.01683330535888672, -0.016026973724365234, -0.01522064208984375, -0.014414310455322266, -0.013607978820800781, -0.012801647186279297, -0.011995315551757812, -0.011188983917236328, -0.010382652282714844, -0.00957632064819336, -0.008769989013671875, -0.00796365737915039, -0.007157325744628906, -0.006350994110107422, -0.0055446624755859375, -0.004738330841064453, -0.003931999206542969, -0.0031256675720214844, -0.0023193359375, -0.0015130043029785156, -0.0007066726684570312, 9.965896606445312e-05, 0.0009059906005859375, 0.0017123222351074219, 0.0025186538696289062, 0.0033249855041503906, 0.004131317138671875, 0.004937648773193359, 0.005743980407714844, 0.006550312042236328, 0.0073566436767578125, 0.008162975311279297, 0.008969306945800781, 0.009775638580322266, 0.01058197021484375, 0.011388301849365234, 0.012194633483886719, 0.013000965118408203, 0.013807296752929688, 0.014613628387451172, 0.015419960021972656, 0.01622629165649414, 0.017032623291015625, 0.01783895492553711, 0.018645286560058594, 0.019451618194580078, 0.020257949829101562, 0.021064281463623047, 0.02187061309814453, 0.022676944732666016, 0.0234832763671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 2.0, 3.0, 10.0, 12.0, 8.0, 14.0, 17.0, 20.0, 26.0, 27.0, 28.0, 36.0, 32.0, 38.0, 42.0, 44.0, 36.0, 51.0, 50.0, 36.0, 43.0, 40.0, 42.0, 44.0, 37.0, 34.0, 42.0, 28.0, 28.0, 22.0, 22.0, 12.0, 21.0, 12.0, 7.0, 5.0, 10.0, 4.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01557159423828125, -0.01503598690032959, -0.01450037956237793, -0.01396477222442627, -0.01342916488647461, -0.01289355754852295, -0.012357950210571289, -0.011822342872619629, -0.011286735534667969, -0.010751128196716309, -0.010215520858764648, -0.009679913520812988, -0.009144306182861328, -0.008608698844909668, -0.008073091506958008, -0.007537484169006348, -0.0070018768310546875, -0.006466269493103027, -0.005930662155151367, -0.005395054817199707, -0.004859447479248047, -0.004323840141296387, -0.0037882328033447266, -0.0032526254653930664, -0.0027170181274414062, -0.002181410789489746, -0.001645803451538086, -0.0011101961135864258, -0.0005745887756347656, -3.898143768310547e-05, 0.0004966259002685547, 0.0010322332382202148, 0.001567840576171875, 0.002103447914123535, 0.0026390552520751953, 0.0031746625900268555, 0.0037102699279785156, 0.004245877265930176, 0.004781484603881836, 0.005317091941833496, 0.005852699279785156, 0.006388306617736816, 0.0069239139556884766, 0.007459521293640137, 0.007995128631591797, 0.008530735969543457, 0.009066343307495117, 0.009601950645446777, 0.010137557983398438, 0.010673165321350098, 0.011208772659301758, 0.011744379997253418, 0.012279987335205078, 0.012815594673156738, 0.013351202011108398, 0.013886809349060059, 0.014422416687011719, 0.014958024024963379, 0.015493631362915039, 0.0160292387008667, 0.01656484603881836, 0.01710045337677002, 0.01763606071472168, 0.01817166805267334, 0.018707275390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 8.0, 10.0, 15.0, 14.0, 31.0, 43.0, 56.0, 71.0, 124.0, 194.0, 340.0, 538.0, 1006.0, 1919.0, 3980.0, 9443.0, 28239.0, 153148.0, 747631.0, 71012.0, 17612.0, 6664.0, 2940.0, 1502.0, 795.0, 426.0, 277.0, 162.0, 103.0, 79.0, 46.0, 42.0, 24.0, 13.0, 10.0, 10.0, 5.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00021350383758544922, -0.00020689517259597778, -0.00020028650760650635, -0.0001936778426170349, -0.00018706917762756348, -0.00018046051263809204, -0.0001738518476486206, -0.00016724318265914917, -0.00016063451766967773, -0.0001540258526802063, -0.00014741718769073486, -0.00014080852270126343, -0.000134199857711792, -0.00012759119272232056, -0.00012098252773284912, -0.00011437386274337769, -0.00010776519775390625, -0.00010115653276443481, -9.454786777496338e-05, -8.793920278549194e-05, -8.133053779602051e-05, -7.472187280654907e-05, -6.811320781707764e-05, -6.15045428276062e-05, -5.4895877838134766e-05, -4.828721284866333e-05, -4.1678547859191895e-05, -3.506988286972046e-05, -2.8461217880249023e-05, -2.1852552890777588e-05, -1.5243887901306152e-05, -8.635222911834717e-06, -2.0265579223632812e-06, 4.582107067108154e-06, 1.119077205657959e-05, 1.7799437046051025e-05, 2.440810203552246e-05, 3.1016767024993896e-05, 3.762543201446533e-05, 4.423409700393677e-05, 5.08427619934082e-05, 5.745142698287964e-05, 6.406009197235107e-05, 7.066875696182251e-05, 7.727742195129395e-05, 8.388608694076538e-05, 9.049475193023682e-05, 9.710341691970825e-05, 0.00010371208190917969, 0.00011032074689865112, 0.00011692941188812256, 0.000123538076877594, 0.00013014674186706543, 0.00013675540685653687, 0.0001433640718460083, 0.00014997273683547974, 0.00015658140182495117, 0.0001631900668144226, 0.00016979873180389404, 0.00017640739679336548, 0.00018301606178283691, 0.00018962472677230835, 0.00019623339176177979, 0.00020284205675125122, 0.00020945072174072266]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 9.0, 7.0, 13.0, 26.0, 35.0, 36.0, 54.0, 84.0, 107.0, 122.0, 134.0, 77.0, 73.0, 51.0, 26.0, 30.0, 12.0, 18.0, 7.0, 8.0, 3.0, 9.0, 2.0, 2.0, 5.0, 8.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9371509552001953e-05, -1.870095729827881e-05, -1.8030405044555664e-05, -1.735985279083252e-05, -1.6689300537109375e-05, -1.601874828338623e-05, -1.5348196029663086e-05, -1.4677643775939941e-05, -1.4007091522216797e-05, -1.3336539268493652e-05, -1.2665987014770508e-05, -1.1995434761047363e-05, -1.1324882507324219e-05, -1.0654330253601074e-05, -9.98377799987793e-06, -9.313225746154785e-06, -8.64267349243164e-06, -7.972121238708496e-06, -7.3015689849853516e-06, -6.631016731262207e-06, -5.9604644775390625e-06, -5.289912223815918e-06, -4.6193599700927734e-06, -3.948807716369629e-06, -3.2782554626464844e-06, -2.60770320892334e-06, -1.9371509552001953e-06, -1.2665987014770508e-06, -5.960464477539062e-07, 7.450580596923828e-08, 7.450580596923828e-07, 1.4156103134155273e-06, 2.086162567138672e-06, 2.7567148208618164e-06, 3.427267074584961e-06, 4.0978193283081055e-06, 4.76837158203125e-06, 5.4389238357543945e-06, 6.109476089477539e-06, 6.780028343200684e-06, 7.450580596923828e-06, 8.121132850646973e-06, 8.791685104370117e-06, 9.462237358093262e-06, 1.0132789611816406e-05, 1.080334186553955e-05, 1.1473894119262695e-05, 1.214444637298584e-05, 1.2814998626708984e-05, 1.3485550880432129e-05, 1.4156103134155273e-05, 1.4826655387878418e-05, 1.5497207641601562e-05, 1.6167759895324707e-05, 1.683831214904785e-05, 1.7508864402770996e-05, 1.817941665649414e-05, 1.8849968910217285e-05, 1.952052116394043e-05, 2.0191073417663574e-05, 2.086162567138672e-05, 2.1532177925109863e-05, 2.2202730178833008e-05, 2.2873282432556152e-05, 2.3543834686279297e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 12.0, 15.0, 43.0, 55.0, 128.0, 236.0, 416.0, 882.0, 1872.0, 4613.0, 13911.0, 85613.0, 848803.0, 71396.0, 12767.0, 4215.0, 1812.0, 851.0, 426.0, 212.0, 108.0, 73.0, 31.0, 23.0, 11.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032591819763183594, -0.0003152191638946533, -0.0003045201301574707, -0.0002938210964202881, -0.00028312206268310547, -0.00027242302894592285, -0.00026172399520874023, -0.0002510249614715576, -0.000240325927734375, -0.00022962689399719238, -0.00021892786026000977, -0.00020822882652282715, -0.00019752979278564453, -0.00018683075904846191, -0.0001761317253112793, -0.00016543269157409668, -0.00015473365783691406, -0.00014403462409973145, -0.00013333559036254883, -0.0001226365566253662, -0.0001119375228881836, -0.00010123848915100098, -9.053945541381836e-05, -7.984042167663574e-05, -6.914138793945312e-05, -5.844235420227051e-05, -4.774332046508789e-05, -3.7044286727905273e-05, -2.6345252990722656e-05, -1.564621925354004e-05, -4.947185516357422e-06, 5.751848220825195e-06, 1.6450881958007812e-05, 2.714991569519043e-05, 3.784894943237305e-05, 4.8547983169555664e-05, 5.924701690673828e-05, 6.99460506439209e-05, 8.064508438110352e-05, 9.134411811828613e-05, 0.00010204315185546875, 0.00011274218559265137, 0.00012344121932983398, 0.0001341402530670166, 0.00014483928680419922, 0.00015553832054138184, 0.00016623735427856445, 0.00017693638801574707, 0.0001876354217529297, 0.0001983344554901123, 0.00020903348922729492, 0.00021973252296447754, 0.00023043155670166016, 0.00024113059043884277, 0.0002518296241760254, 0.000262528657913208, 0.0002732276916503906, 0.00028392672538757324, 0.00029462575912475586, 0.0003053247928619385, 0.0003160238265991211, 0.0003267228603363037, 0.00033742189407348633, 0.00034812092781066895, 0.00035881996154785156]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 5.0, 13.0, 11.0, 9.0, 21.0, 26.0, 49.0, 57.0, 100.0, 132.0, 137.0, 134.0, 99.0, 57.0, 49.0, 27.0, 13.0, 12.0, 8.0, 5.0, 4.0, 2.0, 5.0, 1.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023818016052246094, -0.0002310723066329956, -0.00022396445274353027, -0.00021685659885406494, -0.0002097487449645996, -0.00020264089107513428, -0.00019553303718566895, -0.0001884251832962036, -0.00018131732940673828, -0.00017420947551727295, -0.00016710162162780762, -0.00015999376773834229, -0.00015288591384887695, -0.00014577805995941162, -0.0001386702060699463, -0.00013156235218048096, -0.00012445449829101562, -0.00011734664440155029, -0.00011023879051208496, -0.00010313093662261963, -9.60230827331543e-05, -8.891522884368896e-05, -8.180737495422363e-05, -7.46995210647583e-05, -6.759166717529297e-05, -6.048381328582764e-05, -5.3375959396362305e-05, -4.626810550689697e-05, -3.916025161743164e-05, -3.205239772796631e-05, -2.4944543838500977e-05, -1.7836689949035645e-05, -1.0728836059570312e-05, -3.6209821701049805e-06, 3.4868717193603516e-06, 1.0594725608825684e-05, 1.7702579498291016e-05, 2.4810433387756348e-05, 3.191828727722168e-05, 3.902614116668701e-05, 4.6133995056152344e-05, 5.3241848945617676e-05, 6.034970283508301e-05, 6.745755672454834e-05, 7.456541061401367e-05, 8.1673264503479e-05, 8.878111839294434e-05, 9.588897228240967e-05, 0.000102996826171875, 0.00011010468006134033, 0.00011721253395080566, 0.000124320387840271, 0.00013142824172973633, 0.00013853609561920166, 0.000145643949508667, 0.00015275180339813232, 0.00015985965728759766, 0.000166967511177063, 0.00017407536506652832, 0.00018118321895599365, 0.00018829107284545898, 0.00019539892673492432, 0.00020250678062438965, 0.00020961463451385498, 0.0002167224884033203]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 7.0, 7.0, 11.0, 12.0, 30.0, 38.0, 51.0, 99.0, 266.0, 191.0, 87.0, 58.0, 27.0, 33.0, 24.0, 21.0, 11.0, 10.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11800666153430939, -0.11201057583093643, -0.10601448267698288, -0.10001839697360992, -0.09402230381965637, -0.08802621811628342, -0.08203013241291046, -0.07603403925895691, -0.07003795355558395, -0.064041867852211, -0.058045774698257446, -0.05204968899488449, -0.04605359956622124, -0.04005751013755798, -0.03406142443418503, -0.028065335005521774, -0.02206924557685852, -0.016073156148195267, -0.010077068582177162, -0.004080981016159058, 0.0019151084125041962, 0.00791119784116745, 0.013907283544540405, 0.01990337297320366, 0.025899462401866913, 0.03189555183053017, 0.03789164125919342, 0.043887726962566376, 0.04988381639122963, 0.05587990581989288, 0.06187599152326584, 0.0678720772266388, 0.07386815547943115, 0.07986424118280411, 0.08586033433675766, 0.09185642004013062, 0.09785251319408417, 0.10384859889745712, 0.10984468460083008, 0.11584077775478363, 0.12183686345815659, 0.12783294916152954, 0.1338290423154831, 0.13982513546943665, 0.145821213722229, 0.15181730687618256, 0.1578134000301361, 0.16380947828292847, 0.16980557143688202, 0.17580166459083557, 0.18179774284362793, 0.18779383599758148, 0.19378992915153503, 0.1997860074043274, 0.20578210055828094, 0.2117781937122345, 0.21777427196502686, 0.2237703651189804, 0.22976644337177277, 0.23576253652572632, 0.24175862967967987, 0.24775472283363342, 0.2537508010864258, 0.25974687933921814, 0.2657429873943329]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 14.0, 8.0, 12.0, 13.0, 20.0, 30.0, 35.0, 40.0, 50.0, 50.0, 54.0, 54.0, 83.0, 63.0, 79.0, 64.0, 58.0, 38.0, 57.0, 39.0, 31.0, 24.0, 27.0, 15.0, 14.0, 9.0, 9.0, 4.0, 3.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0791899561882019, -0.07535061240196228, -0.07151126116514206, -0.06767190992832184, -0.06383256614208221, -0.05999321863055229, -0.05615387111902237, -0.05231452360749245, -0.048475176095962524, -0.0446358285844326, -0.04079648107290268, -0.03695713356137276, -0.033117786049842834, -0.029278438538312912, -0.02543909102678299, -0.021599743515253067, -0.017760396003723145, -0.013921048492193222, -0.0100817009806633, -0.006242353469133377, -0.0024030059576034546, 0.001436341553926468, 0.00527568906545639, 0.009115036576986313, 0.012954384088516235, 0.016793731600046158, 0.02063307911157608, 0.024472426623106003, 0.028311774134635925, 0.03215112164616585, 0.03599046915769577, 0.03982981666922569, 0.043669164180755615, 0.04750851169228554, 0.05134785920381546, 0.05518720671534538, 0.059026554226875305, 0.06286589801311493, 0.06670524924993515, 0.07054460048675537, 0.074383944272995, 0.07822328805923462, 0.08206263929605484, 0.08590199053287506, 0.08974133431911469, 0.09358067810535431, 0.09742002934217453, 0.10125938057899475, 0.10509872436523438, 0.108938068151474, 0.11277741938829422, 0.11661677062511444, 0.12045611441135406, 0.12429545819759369, 0.1281348168849945, 0.13197416067123413, 0.13581350445747375, 0.13965284824371338, 0.143492192029953, 0.14733155071735382, 0.15117089450359344, 0.15501023828983307, 0.1588495969772339, 0.1626889407634735, 0.16652828454971313]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 11.0, 24.0, 36.0, 71.0, 151.0, 306.0, 682.0, 4190710.0, 1404.0, 453.0, 210.0, 97.0, 52.0, 27.0, 19.0, 11.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02984619140625, -0.029147982597351074, -0.02844977378845215, -0.027751564979553223, -0.027053356170654297, -0.02635514736175537, -0.025656938552856445, -0.02495872974395752, -0.024260520935058594, -0.023562312126159668, -0.022864103317260742, -0.022165894508361816, -0.02146768569946289, -0.020769476890563965, -0.02007126808166504, -0.019373059272766113, -0.018674850463867188, -0.01797664165496826, -0.017278432846069336, -0.01658022403717041, -0.015882015228271484, -0.015183806419372559, -0.014485597610473633, -0.013787388801574707, -0.013089179992675781, -0.012390971183776855, -0.01169276237487793, -0.010994553565979004, -0.010296344757080078, -0.009598135948181152, -0.008899927139282227, -0.0082017183303833, -0.007503509521484375, -0.006805300712585449, -0.0061070919036865234, -0.005408883094787598, -0.004710674285888672, -0.004012465476989746, -0.0033142566680908203, -0.0026160478591918945, -0.0019178390502929688, -0.001219630241394043, -0.0005214214324951172, 0.0001767873764038086, 0.0008749961853027344, 0.0015732049942016602, 0.002271413803100586, 0.0029696226119995117, 0.0036678314208984375, 0.004366040229797363, 0.005064249038696289, 0.005762457847595215, 0.006460666656494141, 0.007158875465393066, 0.007857084274291992, 0.008555293083190918, 0.009253501892089844, 0.00995171070098877, 0.010649919509887695, 0.011348128318786621, 0.012046337127685547, 0.012744545936584473, 0.013442754745483398, 0.014140963554382324, 0.01483917236328125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 14.0, 12.0, 27.0, 39.0, 70.0, 118.0, 144.0, 143.0, 147.0, 118.0, 53.0, 58.0, 27.0, 16.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0137481689453125, -0.01343923807144165, -0.0131303071975708, -0.012821376323699951, -0.012512445449829102, -0.012203514575958252, -0.011894583702087402, -0.011585652828216553, -0.011276721954345703, -0.010967791080474854, -0.010658860206604004, -0.010349929332733154, -0.010040998458862305, -0.009732067584991455, -0.009423136711120605, -0.009114205837249756, -0.008805274963378906, -0.008496344089508057, -0.008187413215637207, -0.007878482341766357, -0.007569551467895508, -0.007260620594024658, -0.006951689720153809, -0.006642758846282959, -0.006333827972412109, -0.00602489709854126, -0.00571596622467041, -0.0054070353507995605, -0.005098104476928711, -0.004789173603057861, -0.004480242729187012, -0.004171311855316162, -0.0038623809814453125, -0.003553450107574463, -0.0032445192337036133, -0.0029355883598327637, -0.002626657485961914, -0.0023177266120910645, -0.002008795738220215, -0.0016998648643493652, -0.0013909339904785156, -0.001082003116607666, -0.0007730722427368164, -0.0004641413688659668, -0.0001552104949951172, 0.00015372037887573242, 0.00046265125274658203, 0.0007715821266174316, 0.0010805130004882812, 0.0013894438743591309, 0.0016983747482299805, 0.00200730562210083, 0.0023162364959716797, 0.0026251673698425293, 0.002934098243713379, 0.0032430291175842285, 0.003551959991455078, 0.0038608908653259277, 0.004169821739196777, 0.004478752613067627, 0.0047876834869384766, 0.005096614360809326, 0.005405545234680176, 0.005714476108551025, 0.006023406982421875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 6.0, 1.0, 6.0, 9.0, 17.0, 16.0, 18.0, 39.0, 40.0, 50.0, 73.0, 105.0, 116.0, 155.0, 194.0, 246.0, 313.0, 438.0, 924.0, 4183281.0, 5930.0, 654.0, 382.0, 266.0, 244.0, 164.0, 138.0, 134.0, 78.0, 66.0, 48.0, 30.0, 37.0, 21.0, 10.0, 10.0, 8.0, 8.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0164031982421875, -0.015768766403198242, -0.015134334564208984, -0.014499902725219727, -0.013865470886230469, -0.013231039047241211, -0.012596607208251953, -0.011962175369262695, -0.011327743530273438, -0.01069331169128418, -0.010058879852294922, -0.009424448013305664, -0.008790016174316406, -0.008155584335327148, -0.007521152496337891, -0.006886720657348633, -0.006252288818359375, -0.005617856979370117, -0.004983425140380859, -0.0043489933013916016, -0.0037145614624023438, -0.003080129623413086, -0.002445697784423828, -0.0018112659454345703, -0.0011768341064453125, -0.0005424022674560547, 9.202957153320312e-05, 0.0007264614105224609, 0.0013608932495117188, 0.0019953250885009766, 0.0026297569274902344, 0.003264188766479492, 0.00389862060546875, 0.004533052444458008, 0.005167484283447266, 0.0058019161224365234, 0.006436347961425781, 0.007070779800415039, 0.007705211639404297, 0.008339643478393555, 0.008974075317382812, 0.00960850715637207, 0.010242938995361328, 0.010877370834350586, 0.011511802673339844, 0.012146234512329102, 0.01278066635131836, 0.013415098190307617, 0.014049530029296875, 0.014683961868286133, 0.01531839370727539, 0.01595282554626465, 0.016587257385253906, 0.017221689224243164, 0.017856121063232422, 0.01849055290222168, 0.019124984741210938, 0.019759416580200195, 0.020393848419189453, 0.02102828025817871, 0.02166271209716797, 0.022297143936157227, 0.022931575775146484, 0.023566007614135742, 0.024200439453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 4065.0, 11.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00484466552734375, -0.004720181226730347, -0.004595696926116943, -0.00447121262550354, -0.004346728324890137, -0.004222244024276733, -0.00409775972366333, -0.003973275423049927, -0.0038487911224365234, -0.00372430682182312, -0.003599822521209717, -0.0034753382205963135, -0.00335085391998291, -0.003226369619369507, -0.0031018853187561035, -0.0029774010181427, -0.002852916717529297, -0.0027284324169158936, -0.0026039481163024902, -0.002479463815689087, -0.0023549795150756836, -0.0022304952144622803, -0.002106010913848877, -0.0019815266132354736, -0.0018570423126220703, -0.001732558012008667, -0.0016080737113952637, -0.0014835894107818604, -0.001359105110168457, -0.0012346208095550537, -0.0011101365089416504, -0.000985652208328247, -0.0008611679077148438, -0.0007366836071014404, -0.0006121993064880371, -0.0004877150058746338, -0.00036323070526123047, -0.00023874640464782715, -0.00011426210403442383, 1.0222196578979492e-05, 0.0001347064971923828, 0.00025919079780578613, 0.00038367509841918945, 0.0005081593990325928, 0.0006326436996459961, 0.0007571280002593994, 0.0008816123008728027, 0.001006096601486206, 0.0011305809020996094, 0.0012550652027130127, 0.001379549503326416, 0.0015040338039398193, 0.0016285181045532227, 0.001753002405166626, 0.0018774867057800293, 0.0020019710063934326, 0.002126455307006836, 0.0022509396076202393, 0.0023754239082336426, 0.002499908208847046, 0.0026243925094604492, 0.0027488768100738525, 0.002873361110687256, 0.002997845411300659, 0.0031223297119140625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 8.0, 3.0, 12.0, 7.0, 13.0, 19.0, 20.0, 15.0, 50.0, 59.0, 92.0, 154.0, 250.0, 108.0, 52.0, 53.0, 23.0, 14.0, 14.0, 12.0, 5.0, 6.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.01142862904816866, -0.011192009784281254, -0.010955390520393848, -0.010718772187829018, -0.010482152923941612, -0.010245533660054207, -0.010008914396166801, -0.009772295132279396, -0.00953567586839199, -0.009299056604504585, -0.00906243734061718, -0.008825818076729774, -0.008589199744164944, -0.008352580480277538, -0.008115961216390133, -0.007879341952502728, -0.007642723154276609, -0.007406103890389204, -0.007169485092163086, -0.0069328658282756805, -0.006696246564388275, -0.00645962730050087, -0.006223008502274752, -0.005986389238387346, -0.005749770440161228, -0.005513151176273823, -0.005276532378047705, -0.005039913114160299, -0.004803293850272894, -0.004566675052046776, -0.00433005578815937, -0.004093436524271965, -0.0038568174932152033, -0.0036201984621584415, -0.003383579198271036, -0.0031469601672142744, -0.0029103411361575127, -0.0026737218722701073, -0.0024371028412133455, -0.002200483810156584, -0.0019638645462691784, -0.0017272453987970948, -0.0014906262513250113, -0.0012540072202682495, -0.001017388072796166, -0.0007807689253240824, -0.0005441498942673206, -0.00030753074679523706, -7.09115993231535e-05, 0.00016570751904509962, 0.00040232663741335273, 0.0006389457266777754, 0.000875564874149859, 0.0011121840216219425, 0.0013488030526787043, 0.0015854222001507878, 0.0018220413476228714, 0.002058660378679633, 0.0022952796425670385, 0.0025318986736238003, 0.0027685179375112057, 0.0030051369685679674, 0.003241755999624729, 0.0034783752635121346, 0.0037149942945688963]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 5.0, 8.0, 8.0, 8.0, 7.0, 6.0, 18.0, 14.0, 17.0, 17.0, 17.0, 20.0, 22.0, 32.0, 37.0, 27.0, 29.0, 44.0, 36.0, 40.0, 38.0, 48.0, 38.0, 42.0, 40.0, 38.0, 40.0, 42.0, 37.0, 29.0, 20.0, 27.0, 27.0, 22.0, 17.0, 16.0, 16.0, 9.0, 6.0, 6.0, 5.0, 12.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0029709339141845703, -0.002868802286684513, -0.002766670659184456, -0.0026645390316843987, -0.0025624074041843414, -0.002460275776684284, -0.002358144149184227, -0.0022560125216841698, -0.0021538808941841125, -0.0020517492666840553, -0.001949617639183998, -0.0018474860116839409, -0.0017453543841838837, -0.0016432227566838264, -0.0015410911291837692, -0.001438959501683712, -0.0013368278741836548, -0.0012346962466835976, -0.0011325646191835403, -0.0010304329916834831, -0.0009283013641834259, -0.0008261697366833687, -0.0007240381091833115, -0.0006219064816832542, -0.000519774854183197, -0.0004176432266831398, -0.0003155115991830826, -0.00021337997168302536, -0.00011124834418296814, -9.11671668291092e-06, 9.30149108171463e-05, 0.00019514653831720352, 0.00029727816581726074, 0.00039940979331731796, 0.0005015414208173752, 0.0006036730483174324, 0.0007058046758174896, 0.0008079363033175468, 0.0009100679308176041, 0.0010121995583176613, 0.0011143311858177185, 0.0012164628133177757, 0.001318594440817833, 0.0014207260683178902, 0.0015228576958179474, 0.0016249893233180046, 0.0017271209508180618, 0.001829252578318119, 0.0019313842058181763, 0.0020335158333182335, 0.0021356474608182907, 0.002237779088318348, 0.002339910715818405, 0.0024420423433184624, 0.0025441739708185196, 0.002646305598318577, 0.002748437225818634, 0.0028505688533186913, 0.0029527004808187485, 0.0030548321083188057, 0.003156963735818863, 0.00325909536331892, 0.0033612269908189774, 0.0034633586183190346, 0.003565490245819092]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 3.0, 4.0, 6.0, 17.0, 13.0, 13.0, 14.0, 24.0, 28.0, 41.0, 57.0, 65.0, 120.0, 146.0, 344.0, 720.0, 2004.0, 7181.0, 33353.0, 267701.0, 660562.0, 59791.0, 11322.0, 2921.0, 1059.0, 426.0, 194.0, 139.0, 58.0, 54.0, 29.0, 28.0, 20.0, 18.0, 10.0, 10.0, 12.0, 10.0, 12.0, 7.0, 5.0, 3.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0406494140625, -0.03920602798461914, -0.03776264190673828, -0.03631925582885742, -0.03487586975097656, -0.0334324836730957, -0.031989097595214844, -0.030545711517333984, -0.029102325439453125, -0.027658939361572266, -0.026215553283691406, -0.024772167205810547, -0.023328781127929688, -0.021885395050048828, -0.02044200897216797, -0.01899862289428711, -0.01755523681640625, -0.01611185073852539, -0.014668464660644531, -0.013225078582763672, -0.011781692504882812, -0.010338306427001953, -0.008894920349121094, -0.007451534271240234, -0.006008148193359375, -0.004564762115478516, -0.0031213760375976562, -0.0016779899597167969, -0.0002346038818359375, 0.0012087821960449219, 0.0026521682739257812, 0.004095554351806641, 0.0055389404296875, 0.006982326507568359, 0.008425712585449219, 0.009869098663330078, 0.011312484741210938, 0.012755870819091797, 0.014199256896972656, 0.015642642974853516, 0.017086029052734375, 0.018529415130615234, 0.019972801208496094, 0.021416187286376953, 0.022859573364257812, 0.024302959442138672, 0.02574634552001953, 0.02718973159790039, 0.02863311767578125, 0.03007650375366211, 0.03151988983154297, 0.03296327590942383, 0.03440666198730469, 0.03585004806518555, 0.037293434143066406, 0.038736820220947266, 0.040180206298828125, 0.041623592376708984, 0.043066978454589844, 0.0445103645324707, 0.04595375061035156, 0.04739713668823242, 0.04884052276611328, 0.05028390884399414, 0.051727294921875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 13.0, 13.0, 29.0, 39.0, 69.0, 119.0, 145.0, 142.0, 152.0, 112.0, 54.0, 57.0, 27.0, 16.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01372528076171875, -0.013416707515716553, -0.013108134269714355, -0.012799561023712158, -0.012490987777709961, -0.012182414531707764, -0.011873841285705566, -0.01156526803970337, -0.011256694793701172, -0.010948121547698975, -0.010639548301696777, -0.01033097505569458, -0.010022401809692383, -0.009713828563690186, -0.009405255317687988, -0.009096682071685791, -0.008788108825683594, -0.008479535579681396, -0.0081709623336792, -0.007862389087677002, -0.007553815841674805, -0.007245242595672607, -0.00693666934967041, -0.006628096103668213, -0.006319522857666016, -0.006010949611663818, -0.005702376365661621, -0.005393803119659424, -0.0050852298736572266, -0.004776656627655029, -0.004468083381652832, -0.004159510135650635, -0.0038509368896484375, -0.0035423636436462402, -0.003233790397644043, -0.0029252171516418457, -0.0026166439056396484, -0.002308070659637451, -0.001999497413635254, -0.0016909241676330566, -0.0013823509216308594, -0.0010737776756286621, -0.0007652044296264648, -0.0004566311836242676, -0.0001480579376220703, 0.00016051530838012695, 0.0004690885543823242, 0.0007776618003845215, 0.0010862350463867188, 0.001394808292388916, 0.0017033815383911133, 0.0020119547843933105, 0.002320528030395508, 0.002629101276397705, 0.0029376745223999023, 0.0032462477684020996, 0.003554821014404297, 0.003863394260406494, 0.004171967506408691, 0.004480540752410889, 0.004789113998413086, 0.005097687244415283, 0.0054062604904174805, 0.005714833736419678, 0.006023406982421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 9.0, 5.0, 12.0, 12.0, 14.0, 31.0, 27.0, 45.0, 66.0, 105.0, 275.0, 625.0, 1350.0, 3284.0, 8301.0, 22350.0, 69154.0, 357827.0, 469990.0, 75670.0, 24197.0, 8915.0, 3521.0, 1473.0, 632.0, 281.0, 139.0, 69.0, 34.0, 37.0, 27.0, 14.0, 14.0, 12.0, 12.0, 5.0, 8.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0191497802734375, -0.018384933471679688, -0.017620086669921875, -0.016855239868164062, -0.01609039306640625, -0.015325546264648438, -0.014560699462890625, -0.013795852661132812, -0.013031005859375, -0.012266159057617188, -0.011501312255859375, -0.010736465454101562, -0.00997161865234375, -0.009206771850585938, -0.008441925048828125, -0.0076770782470703125, -0.0069122314453125, -0.0061473846435546875, -0.005382537841796875, -0.0046176910400390625, -0.00385284423828125, -0.0030879974365234375, -0.002323150634765625, -0.0015583038330078125, -0.00079345703125, -2.86102294921875e-05, 0.000736236572265625, 0.0015010833740234375, 0.00226593017578125, 0.0030307769775390625, 0.003795623779296875, 0.0045604705810546875, 0.0053253173828125, 0.0060901641845703125, 0.006855010986328125, 0.0076198577880859375, 0.00838470458984375, 0.009149551391601562, 0.009914398193359375, 0.010679244995117188, 0.011444091796875, 0.012208938598632812, 0.012973785400390625, 0.013738632202148438, 0.01450347900390625, 0.015268325805664062, 0.016033172607421875, 0.016798019409179688, 0.0175628662109375, 0.018327713012695312, 0.019092559814453125, 0.019857406616210938, 0.02062225341796875, 0.021387100219726562, 0.022151947021484375, 0.022916793823242188, 0.023681640625, 0.024446487426757812, 0.025211334228515625, 0.025976181030273438, 0.02674102783203125, 0.027505874633789062, 0.028270721435546875, 0.029035568237304688, 0.0298004150390625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 5.0, 11.0, 10.0, 14.0, 9.0, 19.0, 22.0, 19.0, 17.0, 31.0, 39.0, 33.0, 44.0, 41.0, 44.0, 33.0, 43.0, 46.0, 37.0, 56.0, 49.0, 49.0, 43.0, 34.0, 44.0, 36.0, 24.0, 20.0, 25.0, 17.0, 23.0, 13.0, 8.0, 12.0, 4.0, 9.0, 2.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.019287109375, -0.018793940544128418, -0.018300771713256836, -0.017807602882385254, -0.017314434051513672, -0.01682126522064209, -0.016328096389770508, -0.015834927558898926, -0.015341758728027344, -0.014848589897155762, -0.01435542106628418, -0.013862252235412598, -0.013369083404541016, -0.012875914573669434, -0.012382745742797852, -0.01188957691192627, -0.011396408081054688, -0.010903239250183105, -0.010410070419311523, -0.009916901588439941, -0.00942373275756836, -0.008930563926696777, -0.008437395095825195, -0.007944226264953613, -0.007451057434082031, -0.006957888603210449, -0.006464719772338867, -0.005971550941467285, -0.005478382110595703, -0.004985213279724121, -0.004492044448852539, -0.003998875617980957, -0.003505706787109375, -0.003012537956237793, -0.002519369125366211, -0.002026200294494629, -0.0015330314636230469, -0.0010398626327514648, -0.0005466938018798828, -5.352497100830078e-05, 0.00043964385986328125, 0.0009328126907348633, 0.0014259815216064453, 0.0019191503524780273, 0.0024123191833496094, 0.0029054880142211914, 0.0033986568450927734, 0.0038918256759643555, 0.0043849945068359375, 0.0048781633377075195, 0.0053713321685791016, 0.005864500999450684, 0.006357669830322266, 0.006850838661193848, 0.00734400749206543, 0.007837176322937012, 0.008330345153808594, 0.008823513984680176, 0.009316682815551758, 0.00980985164642334, 0.010303020477294922, 0.010796189308166504, 0.011289358139038086, 0.011782526969909668, 0.01227569580078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 9.0, 11.0, 23.0, 20.0, 34.0, 69.0, 101.0, 201.0, 371.0, 941.0, 2613.0, 9302.0, 57128.0, 865194.0, 94546.0, 12700.0, 3159.0, 1137.0, 479.0, 221.0, 108.0, 81.0, 29.0, 26.0, 19.0, 8.0, 2.0, 8.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002770423889160156, -0.0002692602574825287, -0.00026147812604904175, -0.0002536959946155548, -0.00024591386318206787, -0.00023813173174858093, -0.000230349600315094, -0.00022256746888160706, -0.00021478533744812012, -0.00020700320601463318, -0.00019922107458114624, -0.0001914389431476593, -0.00018365681171417236, -0.00017587468028068542, -0.00016809254884719849, -0.00016031041741371155, -0.0001525282859802246, -0.00014474615454673767, -0.00013696402311325073, -0.0001291818916797638, -0.00012139976024627686, -0.00011361762881278992, -0.00010583549737930298, -9.805336594581604e-05, -9.02712345123291e-05, -8.248910307884216e-05, -7.470697164535522e-05, -6.692484021186829e-05, -5.914270877838135e-05, -5.136057734489441e-05, -4.357844591140747e-05, -3.579631447792053e-05, -2.8014183044433594e-05, -2.0232051610946655e-05, -1.2449920177459717e-05, -4.667788743972778e-06, 3.11434268951416e-06, 1.0896474123001099e-05, 1.8678605556488037e-05, 2.6460736989974976e-05, 3.4242868423461914e-05, 4.202499985694885e-05, 4.980713129043579e-05, 5.758926272392273e-05, 6.537139415740967e-05, 7.31535255908966e-05, 8.093565702438354e-05, 8.871778845787048e-05, 9.649991989135742e-05, 0.00010428205132484436, 0.0001120641827583313, 0.00011984631419181824, 0.00012762844562530518, 0.00013541057705879211, 0.00014319270849227905, 0.000150974839925766, 0.00015875697135925293, 0.00016653910279273987, 0.0001743212342262268, 0.00018210336565971375, 0.00018988549709320068, 0.00019766762852668762, 0.00020544975996017456, 0.0002132318913936615, 0.00022101402282714844]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 4.0, 3.0, 4.0, 5.0, 10.0, 14.0, 11.0, 26.0, 31.0, 39.0, 62.0, 95.0, 148.0, 147.0, 111.0, 91.0, 55.0, 40.0, 24.0, 14.0, 12.0, 12.0, 3.0, 12.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-05, -1.9078142940998077e-05, -1.848675310611725e-05, -1.789536327123642e-05, -1.730397343635559e-05, -1.6712583601474762e-05, -1.6121193766593933e-05, -1.5529803931713104e-05, -1.4938414096832275e-05, -1.4347024261951447e-05, -1.3755634427070618e-05, -1.3164244592189789e-05, -1.257285475730896e-05, -1.1981464922428131e-05, -1.1390075087547302e-05, -1.0798685252666473e-05, -1.0207295417785645e-05, -9.615905582904816e-06, -9.024515748023987e-06, -8.433125913143158e-06, -7.841736078262329e-06, -7.2503462433815e-06, -6.658956408500671e-06, -6.0675665736198425e-06, -5.476176738739014e-06, -4.884786903858185e-06, -4.293397068977356e-06, -3.702007234096527e-06, -3.1106173992156982e-06, -2.5192275643348694e-06, -1.9278377294540405e-06, -1.3364478945732117e-06, -7.450580596923828e-07, -1.5366822481155396e-07, 4.377216100692749e-07, 1.0291114449501038e-06, 1.6205012798309326e-06, 2.2118911147117615e-06, 2.8032809495925903e-06, 3.394670784473419e-06, 3.986060619354248e-06, 4.577450454235077e-06, 5.168840289115906e-06, 5.760230123996735e-06, 6.3516199588775635e-06, 6.943009793758392e-06, 7.534399628639221e-06, 8.12578946352005e-06, 8.717179298400879e-06, 9.308569133281708e-06, 9.899958968162537e-06, 1.0491348803043365e-05, 1.1082738637924194e-05, 1.1674128472805023e-05, 1.2265518307685852e-05, 1.2856908142566681e-05, 1.344829797744751e-05, 1.4039687812328339e-05, 1.4631077647209167e-05, 1.5222467482089996e-05, 1.5813857316970825e-05, 1.6405247151851654e-05, 1.6996636986732483e-05, 1.7588026821613312e-05, 1.817941665649414e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 5.0, 1.0, 7.0, 10.0, 14.0, 12.0, 18.0, 29.0, 40.0, 74.0, 141.0, 360.0, 1129.0, 4910.0, 32497.0, 892389.0, 104238.0, 9747.0, 1955.0, 534.0, 192.0, 95.0, 39.0, 36.0, 27.0, 19.0, 13.0, 9.0, 9.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020456314086914062, -0.00019362568855285645, -0.00018268823623657227, -0.00017175078392028809, -0.0001608133316040039, -0.00014987587928771973, -0.00013893842697143555, -0.00012800097465515137, -0.00011706352233886719, -0.00010612607002258301, -9.518861770629883e-05, -8.425116539001465e-05, -7.331371307373047e-05, -6.237626075744629e-05, -5.143880844116211e-05, -4.050135612487793e-05, -2.956390380859375e-05, -1.862645149230957e-05, -7.68899917602539e-06, 3.248453140258789e-06, 1.4185905456542969e-05, 2.512335777282715e-05, 3.606081008911133e-05, 4.699826240539551e-05, 5.793571472167969e-05, 6.887316703796387e-05, 7.981061935424805e-05, 9.074807167053223e-05, 0.0001016855239868164, 0.00011262297630310059, 0.00012356042861938477, 0.00013449788093566895, 0.00014543533325195312, 0.0001563727855682373, 0.00016731023788452148, 0.00017824769020080566, 0.00018918514251708984, 0.00020012259483337402, 0.0002110600471496582, 0.00022199749946594238, 0.00023293495178222656, 0.00024387240409851074, 0.0002548098564147949, 0.0002657473087310791, 0.0002766847610473633, 0.00028762221336364746, 0.00029855966567993164, 0.0003094971179962158, 0.0003204345703125, 0.0003313720226287842, 0.00034230947494506836, 0.00035324692726135254, 0.0003641843795776367, 0.0003751218318939209, 0.0003860592842102051, 0.00039699673652648926, 0.00040793418884277344, 0.0004188716411590576, 0.0004298090934753418, 0.000440746545791626, 0.00045168399810791016, 0.00046262145042419434, 0.0004735589027404785, 0.0004844963550567627, 0.0004954338073730469]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 9.0, 7.0, 9.0, 14.0, 14.0, 23.0, 36.0, 67.0, 102.0, 173.0, 153.0, 138.0, 93.0, 57.0, 38.0, 24.0, 19.0, 10.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0003204345703125, -0.0003137849271297455, -0.00030713528394699097, -0.00030048564076423645, -0.00029383599758148193, -0.0002871863543987274, -0.0002805367112159729, -0.0002738870680332184, -0.00026723742485046387, -0.00026058778166770935, -0.00025393813848495483, -0.0002472884953022003, -0.0002406388521194458, -0.00023398920893669128, -0.00022733956575393677, -0.00022068992257118225, -0.00021404027938842773, -0.00020739063620567322, -0.0002007409930229187, -0.00019409134984016418, -0.00018744170665740967, -0.00018079206347465515, -0.00017414242029190063, -0.00016749277710914612, -0.0001608431339263916, -0.00015419349074363708, -0.00014754384756088257, -0.00014089420437812805, -0.00013424456119537354, -0.00012759491801261902, -0.0001209452748298645, -0.00011429563164710999, -0.00010764598846435547, -0.00010099634528160095, -9.434670209884644e-05, -8.769705891609192e-05, -8.10474157333374e-05, -7.439777255058289e-05, -6.774812936782837e-05, -6.109848618507385e-05, -5.4448843002319336e-05, -4.779919981956482e-05, -4.11495566368103e-05, -3.4499913454055786e-05, -2.785027027130127e-05, -2.1200627088546753e-05, -1.4550983905792236e-05, -7.90134072303772e-06, -1.2516975402832031e-06, 5.3979456424713135e-06, 1.204758882522583e-05, 1.8697232007980347e-05, 2.5346875190734863e-05, 3.199651837348938e-05, 3.8646161556243896e-05, 4.529580473899841e-05, 5.194544792175293e-05, 5.8595091104507446e-05, 6.524473428726196e-05, 7.189437747001648e-05, 7.8544020652771e-05, 8.519366383552551e-05, 9.184330701828003e-05, 9.849295020103455e-05, 0.00010514259338378906]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 8.0, 10.0, 11.0, 10.0, 16.0, 32.0, 19.0, 42.0, 72.0, 96.0, 230.0, 134.0, 87.0, 51.0, 35.0, 38.0, 25.0, 14.0, 11.0, 11.0, 9.0, 10.0, 0.0, 3.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11983984708786011, -0.11593308299779892, -0.11202631890773773, -0.10811954736709595, -0.10421278327703476, -0.10030601918697357, -0.09639924764633179, -0.0924924835562706, -0.08858571946620941, -0.08467895537614822, -0.08077219128608704, -0.07686541974544525, -0.07295865565538406, -0.06905189156532288, -0.06514512002468109, -0.061238355934619904, -0.057331591844558716, -0.05342482775449753, -0.04951805993914604, -0.045611292123794556, -0.04170452803373337, -0.03779776394367218, -0.033890996128320694, -0.029984230175614357, -0.02607746422290802, -0.022170698270201683, -0.018263932317495346, -0.014357166364789009, -0.010450400412082672, -0.006543634459376335, -0.002636868506669998, 0.0012698974460363388, 0.005176663398742676, 0.009083429351449013, 0.01299019530415535, 0.016896961256861687, 0.020803727209568024, 0.02471049316227436, 0.028617259114980698, 0.032524026930332184, 0.03643079102039337, 0.04033755511045456, 0.044244322925806046, 0.04815109074115753, 0.05205785483121872, 0.05596461892127991, 0.05987138673663139, 0.06377815455198288, 0.06768491864204407, 0.07159168273210526, 0.07549844682216644, 0.07940521836280823, 0.08331198245286942, 0.0872187465429306, 0.09112551808357239, 0.09503228217363358, 0.09893904626369476, 0.10284581035375595, 0.10675257444381714, 0.11065934598445892, 0.11456611007452011, 0.1184728741645813, 0.12237964570522308, 0.12628640234470367, 0.13019317388534546]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 11.0, 6.0, 8.0, 13.0, 11.0, 19.0, 36.0, 37.0, 36.0, 36.0, 54.0, 54.0, 64.0, 59.0, 67.0, 67.0, 52.0, 57.0, 46.0, 45.0, 45.0, 35.0, 26.0, 24.0, 22.0, 20.0, 8.0, 9.0, 12.0, 6.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0989154577255249, -0.09587566554546356, -0.09283588081598282, -0.08979608863592148, -0.08675630390644073, -0.0837165117263794, -0.08067671954631805, -0.07763692736625671, -0.07459714263677597, -0.07155735045671463, -0.06851756572723389, -0.06547777354717255, -0.062437985092401505, -0.05939819663763046, -0.05635840445756912, -0.05331861600279808, -0.05027882754802704, -0.047239039093256, -0.044199250638484955, -0.041159458458423615, -0.03811967000365257, -0.03507988154888153, -0.03204008936882019, -0.02900030091404915, -0.025960512459278107, -0.022920724004507065, -0.019880933687090874, -0.016841143369674683, -0.01380135491490364, -0.010761565528810024, -0.007721776142716408, -0.004681985825300217, -0.0016421973705291748, 0.0013975920155644417, 0.004437381401658058, 0.007477170787751675, 0.010516960173845291, 0.013556749559938908, 0.016596538946032524, 0.019636329263448715, 0.022676117718219757, 0.0257159061729908, 0.02875569649040699, 0.03179548680782318, 0.03483527526259422, 0.037875063717365265, 0.040914855897426605, 0.04395464435219765, 0.04699443280696869, 0.05003422126173973, 0.05307400971651077, 0.05611380189657211, 0.059153590351343155, 0.0621933788061142, 0.06523317098617554, 0.06827296316623688, 0.07131274789571762, 0.07435254007577896, 0.0773923248052597, 0.08043211698532104, 0.08347190916538239, 0.08651169389486313, 0.08955148607492447, 0.09259127080440521, 0.09563106298446655]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 12.0, 8.0, 33.0, 49.0, 98.0, 170.0, 350.0, 634.0, 1368.0, 4188926.0, 1270.0, 620.0, 344.0, 196.0, 92.0, 47.0, 21.0, 13.0, 7.0, 6.0, 7.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.10223388671875, -0.09993505477905273, -0.09763622283935547, -0.0953373908996582, -0.09303855895996094, -0.09073972702026367, -0.0884408950805664, -0.08614206314086914, -0.08384323120117188, -0.08154439926147461, -0.07924556732177734, -0.07694673538208008, -0.07464790344238281, -0.07234907150268555, -0.07005023956298828, -0.06775140762329102, -0.06545257568359375, -0.06315374374389648, -0.06085491180419922, -0.05855607986450195, -0.05625724792480469, -0.05395841598510742, -0.051659584045410156, -0.04936075210571289, -0.047061920166015625, -0.04476308822631836, -0.042464256286621094, -0.04016542434692383, -0.03786659240722656, -0.0355677604675293, -0.03326892852783203, -0.030970096588134766, -0.0286712646484375, -0.026372432708740234, -0.02407360076904297, -0.021774768829345703, -0.019475936889648438, -0.017177104949951172, -0.014878273010253906, -0.01257944107055664, -0.010280609130859375, -0.00798177719116211, -0.005682945251464844, -0.003384113311767578, -0.0010852813720703125, 0.0012135505676269531, 0.0035123825073242188, 0.005811214447021484, 0.00811004638671875, 0.010408878326416016, 0.012707710266113281, 0.015006542205810547, 0.017305374145507812, 0.019604206085205078, 0.021903038024902344, 0.02420186996459961, 0.026500701904296875, 0.02879953384399414, 0.031098365783691406, 0.03339719772338867, 0.03569602966308594, 0.0379948616027832, 0.04029369354248047, 0.042592525482177734, 0.044891357421875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 10.0, 10.0, 24.0, 36.0, 53.0, 81.0, 141.0, 152.0, 144.0, 131.0, 78.0, 47.0, 52.0, 20.0, 14.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01323699951171875, -0.012936055660247803, -0.012635111808776855, -0.012334167957305908, -0.012033224105834961, -0.011732280254364014, -0.011431336402893066, -0.01113039255142212, -0.010829448699951172, -0.010528504848480225, -0.010227560997009277, -0.00992661714553833, -0.009625673294067383, -0.009324729442596436, -0.009023785591125488, -0.008722841739654541, -0.008421897888183594, -0.008120954036712646, -0.0078200101852417, -0.007519066333770752, -0.007218122482299805, -0.006917178630828857, -0.00661623477935791, -0.006315290927886963, -0.006014347076416016, -0.005713403224945068, -0.005412459373474121, -0.005111515522003174, -0.0048105716705322266, -0.004509627819061279, -0.004208683967590332, -0.003907740116119385, -0.0036067962646484375, -0.0033058524131774902, -0.003004908561706543, -0.0027039647102355957, -0.0024030208587646484, -0.002102077007293701, -0.001801133155822754, -0.0015001893043518066, -0.0011992454528808594, -0.0008983016014099121, -0.0005973577499389648, -0.0002964138984680176, 4.5299530029296875e-06, 0.00030547380447387695, 0.0006064176559448242, 0.0009073615074157715, 0.0012083053588867188, 0.001509249210357666, 0.0018101930618286133, 0.0021111369132995605, 0.002412080764770508, 0.002713024616241455, 0.0030139684677124023, 0.0033149123191833496, 0.003615856170654297, 0.003916800022125244, 0.004217743873596191, 0.004518687725067139, 0.004819631576538086, 0.005120575428009033, 0.0054215192794799805, 0.005722463130950928, 0.006023406982421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 7.0, 6.0, 17.0, 13.0, 15.0, 26.0, 36.0, 33.0, 75.0, 84.0, 135.0, 200.0, 245.0, 378.0, 495.0, 776.0, 2198.0, 4183250.0, 3328.0, 955.0, 570.0, 391.0, 306.0, 216.0, 147.0, 119.0, 65.0, 68.0, 35.0, 26.0, 18.0, 20.0, 3.0, 8.0, 10.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.01739501953125, -0.016956090927124023, -0.016517162322998047, -0.01607823371887207, -0.015639305114746094, -0.015200376510620117, -0.01476144790649414, -0.014322519302368164, -0.013883590698242188, -0.013444662094116211, -0.013005733489990234, -0.012566804885864258, -0.012127876281738281, -0.011688947677612305, -0.011250019073486328, -0.010811090469360352, -0.010372161865234375, -0.009933233261108398, -0.009494304656982422, -0.009055376052856445, -0.008616447448730469, -0.008177518844604492, -0.007738590240478516, -0.007299661636352539, -0.0068607330322265625, -0.006421804428100586, -0.005982875823974609, -0.005543947219848633, -0.005105018615722656, -0.00466609001159668, -0.004227161407470703, -0.0037882328033447266, -0.00334930419921875, -0.0029103755950927734, -0.002471446990966797, -0.0020325183868408203, -0.0015935897827148438, -0.0011546611785888672, -0.0007157325744628906, -0.00027680397033691406, 0.0001621246337890625, 0.0006010532379150391, 0.0010399818420410156, 0.0014789104461669922, 0.0019178390502929688, 0.0023567676544189453, 0.002795696258544922, 0.0032346248626708984, 0.003673553466796875, 0.0041124820709228516, 0.004551410675048828, 0.004990339279174805, 0.005429267883300781, 0.005868196487426758, 0.006307125091552734, 0.006746053695678711, 0.0071849822998046875, 0.007623910903930664, 0.00806283950805664, 0.008501768112182617, 0.008940696716308594, 0.00937962532043457, 0.009818553924560547, 0.010257482528686523, 0.0106964111328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4072.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019664764404296875, -0.0018892288208007812, -0.001811981201171875, -0.0017347335815429688, -0.0016574859619140625, -0.0015802383422851562, -0.00150299072265625, -0.0014257431030273438, -0.0013484954833984375, -0.0012712478637695312, -0.001194000244140625, -0.0011167526245117188, -0.0010395050048828125, -0.0009622573852539062, -0.000885009765625, -0.0008077621459960938, -0.0007305145263671875, -0.0006532669067382812, -0.000576019287109375, -0.0004987716674804688, -0.0004215240478515625, -0.00034427642822265625, -0.00026702880859375, -0.00018978118896484375, -0.0001125335693359375, -3.528594970703125e-05, 4.1961669921875e-05, 0.00011920928955078125, 0.0001964569091796875, 0.00027370452880859375, 0.0003509521484375, 0.00042819976806640625, 0.0005054473876953125, 0.0005826950073242188, 0.000659942626953125, 0.0007371902465820312, 0.0008144378662109375, 0.0008916854858398438, 0.00096893310546875, 0.0010461807250976562, 0.0011234283447265625, 0.0012006759643554688, 0.001277923583984375, 0.0013551712036132812, 0.0014324188232421875, 0.0015096664428710938, 0.0015869140625, 0.0016641616821289062, 0.0017414093017578125, 0.0018186569213867188, 0.001895904541015625, 0.0019731521606445312, 0.0020503997802734375, 0.0021276473999023438, 0.00220489501953125, 0.0022821426391601562, 0.0023593902587890625, 0.0024366378784179688, 0.002513885498046875, 0.0025911331176757812, 0.0026683807373046875, 0.0027456283569335938, 0.0028228759765625, 0.0029001235961914062, 0.0029773712158203125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 9.0, 10.0, 5.0, 15.0, 14.0, 27.0, 27.0, 41.0, 82.0, 118.0, 226.0, 129.0, 71.0, 49.0, 40.0, 28.0, 25.0, 16.0, 20.0, 8.0, 9.0, 7.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0033214713912457228, -0.0031969347037374973, -0.0030723982490599155, -0.00294786156155169, -0.0028233248740434647, -0.002698788419365883, -0.0025742517318576574, -0.002449715044349432, -0.00232517858967185, -0.0022006419021636248, -0.002076105447486043, -0.0019515687599778175, -0.001827032072469592, -0.0017024955013766885, -0.0015779589302837849, -0.0014534222427755594, -0.001328885555267334, -0.0012043489841744304, -0.001079812296666205, -0.0009552757255733013, -0.0008307390962727368, -0.0007062024669721723, -0.0005816658958792686, -0.0004571292665787041, -0.0003325926372781396, -0.0002080560225294903, -8.351940778084099e-05, 4.101719241589308e-05, 0.0001655538217164576, 0.00029009045101702213, 0.00041462702210992575, 0.0005391636514104903, 0.0006637000478804111, 0.0007882366771809757, 0.0009127733064815402, 0.0010373098775744438, 0.0011618465650826693, 0.0012863831361755729, 0.0014109197072684765, 0.001535456394776702, 0.0016599929658696055, 0.0017845295369625092, 0.0019090662244707346, 0.00203360291197896, 0.002158139366656542, 0.0022826760541647673, 0.0024072127416729927, 0.0025317491963505745, 0.0026562858838588, 0.0027808225713670254, 0.002905359026044607, 0.0030298957135528326, 0.003154432401061058, 0.00327896885573864, 0.0034035055432468653, 0.0035280422307550907, 0.0036525786854326725, 0.003777115372940898, 0.0039016518276184797, 0.004026188515126705, 0.004150724969804287, 0.004275261890143156, 0.004399798344820738, 0.00452433479949832, 0.004648871719837189]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 12.0, 7.0, 4.0, 10.0, 10.0, 11.0, 14.0, 17.0, 15.0, 22.0, 30.0, 22.0, 27.0, 36.0, 42.0, 40.0, 44.0, 39.0, 45.0, 48.0, 36.0, 42.0, 37.0, 33.0, 34.0, 31.0, 37.0, 32.0, 30.0, 27.0, 19.0, 26.0, 24.0, 17.0, 16.0, 9.0, 11.0, 5.0, 12.0, 5.0, 7.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.0022591352462768555, -0.0021954048424959183, -0.002131674438714981, -0.002067944034934044, -0.0020042136311531067, -0.0019404832273721695, -0.0018767528235912323, -0.001813022419810295, -0.001749292016029358, -0.0016855616122484207, -0.0016218312084674835, -0.0015581008046865463, -0.0014943704009056091, -0.001430639997124672, -0.0013669095933437347, -0.0013031791895627975, -0.0012394487857818604, -0.0011757183820009232, -0.001111987978219986, -0.0010482575744390488, -0.0009845271706581116, -0.0009207967668771744, -0.0008570663630962372, -0.0007933359593153, -0.0007296055555343628, -0.0006658751517534256, -0.0006021447479724884, -0.0005384143441915512, -0.000474683940410614, -0.0004109535366296768, -0.0003472231328487396, -0.00028349272906780243, -0.00021976232528686523, -0.00015603192150592804, -9.230151772499084e-05, -2.857111394405365e-05, 3.5159289836883545e-05, 9.888969361782074e-05, 0.00016262009739875793, 0.00022635050117969513, 0.0002900809049606323, 0.0003538113087415695, 0.0004175417125225067, 0.0004812721163034439, 0.0005450025200843811, 0.0006087329238653183, 0.0006724633276462555, 0.0007361937314271927, 0.0007999241352081299, 0.0008636545389890671, 0.0009273849427700043, 0.0009911153465509415, 0.0010548457503318787, 0.0011185761541128159, 0.001182306557893753, 0.0012460369616746902, 0.0013097673654556274, 0.0013734977692365646, 0.0014372281730175018, 0.001500958576798439, 0.0015646889805793762, 0.0016284193843603134, 0.0016921497881412506, 0.0017558801919221878, 0.001819610595703125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 10.0, 10.0, 12.0, 9.0, 15.0, 18.0, 25.0, 38.0, 46.0, 57.0, 133.0, 212.0, 455.0, 1088.0, 3445.0, 15578.0, 106363.0, 795482.0, 104426.0, 15571.0, 3453.0, 1076.0, 439.0, 188.0, 127.0, 70.0, 50.0, 33.0, 28.0, 13.0, 19.0, 17.0, 10.0, 12.0, 8.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.051025390625, -0.04945516586303711, -0.04788494110107422, -0.04631471633911133, -0.04474449157714844, -0.04317426681518555, -0.041604042053222656, -0.040033817291259766, -0.038463592529296875, -0.036893367767333984, -0.035323143005371094, -0.0337529182434082, -0.03218269348144531, -0.030612468719482422, -0.02904224395751953, -0.02747201919555664, -0.02590179443359375, -0.02433156967163086, -0.02276134490966797, -0.021191120147705078, -0.019620895385742188, -0.018050670623779297, -0.016480445861816406, -0.014910221099853516, -0.013339996337890625, -0.011769771575927734, -0.010199546813964844, -0.008629322052001953, -0.0070590972900390625, -0.005488872528076172, -0.003918647766113281, -0.0023484230041503906, -0.0007781982421875, 0.0007920265197753906, 0.0023622512817382812, 0.003932476043701172, 0.0055027008056640625, 0.007072925567626953, 0.008643150329589844, 0.010213375091552734, 0.011783599853515625, 0.013353824615478516, 0.014924049377441406, 0.016494274139404297, 0.018064498901367188, 0.019634723663330078, 0.02120494842529297, 0.02277517318725586, 0.02434539794921875, 0.02591562271118164, 0.02748584747314453, 0.029056072235107422, 0.030626296997070312, 0.0321965217590332, 0.033766746520996094, 0.035336971282958984, 0.036907196044921875, 0.038477420806884766, 0.040047645568847656, 0.04161787033081055, 0.04318809509277344, 0.04475831985473633, 0.04632854461669922, 0.04789876937866211, 0.049468994140625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 10.0, 10.0, 27.0, 34.0, 56.0, 79.0, 138.0, 158.0, 145.0, 130.0, 73.0, 46.0, 52.0, 21.0, 14.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.013214111328125, -0.012913644313812256, -0.012613177299499512, -0.012312710285186768, -0.012012243270874023, -0.01171177625656128, -0.011411309242248535, -0.011110842227935791, -0.010810375213623047, -0.010509908199310303, -0.010209441184997559, -0.009908974170684814, -0.00960850715637207, -0.009308040142059326, -0.009007573127746582, -0.008707106113433838, -0.008406639099121094, -0.00810617208480835, -0.0078057050704956055, -0.007505238056182861, -0.007204771041870117, -0.006904304027557373, -0.006603837013244629, -0.006303369998931885, -0.006002902984619141, -0.0057024359703063965, -0.005401968955993652, -0.005101501941680908, -0.004801034927368164, -0.00450056791305542, -0.004200100898742676, -0.0038996338844299316, -0.0035991668701171875, -0.0032986998558044434, -0.0029982328414916992, -0.002697765827178955, -0.002397298812866211, -0.002096831798553467, -0.0017963647842407227, -0.0014958977699279785, -0.0011954307556152344, -0.0008949637413024902, -0.0005944967269897461, -0.00029402971267700195, 6.4373016357421875e-06, 0.00030690431594848633, 0.0006073713302612305, 0.0009078383445739746, 0.0012083053588867188, 0.0015087723731994629, 0.001809239387512207, 0.002109706401824951, 0.0024101734161376953, 0.0027106404304504395, 0.0030111074447631836, 0.0033115744590759277, 0.003612041473388672, 0.003912508487701416, 0.00421297550201416, 0.004513442516326904, 0.0048139095306396484, 0.005114376544952393, 0.005414843559265137, 0.005715310573577881, 0.006015777587890625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 4.0, 10.0, 11.0, 14.0, 16.0, 20.0, 19.0, 26.0, 37.0, 59.0, 110.0, 207.0, 359.0, 755.0, 1837.0, 4633.0, 12652.0, 39816.0, 176740.0, 671153.0, 98667.0, 26504.0, 8864.0, 3296.0, 1387.0, 633.0, 292.0, 123.0, 75.0, 40.0, 32.0, 28.0, 16.0, 15.0, 19.0, 13.0, 10.0, 8.0, 7.0, 9.0, 9.0, 1.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024566650390625, -0.023699522018432617, -0.022832393646240234, -0.02196526527404785, -0.02109813690185547, -0.020231008529663086, -0.019363880157470703, -0.01849675178527832, -0.017629623413085938, -0.016762495040893555, -0.015895366668701172, -0.015028238296508789, -0.014161109924316406, -0.013293981552124023, -0.01242685317993164, -0.011559724807739258, -0.010692596435546875, -0.009825468063354492, -0.00895833969116211, -0.008091211318969727, -0.007224082946777344, -0.006356954574584961, -0.005489826202392578, -0.004622697830200195, -0.0037555694580078125, -0.0028884410858154297, -0.002021312713623047, -0.001154184341430664, -0.00028705596923828125, 0.0005800724029541016, 0.0014472007751464844, 0.002314329147338867, 0.00318145751953125, 0.004048585891723633, 0.004915714263916016, 0.0057828426361083984, 0.006649971008300781, 0.007517099380493164, 0.008384227752685547, 0.00925135612487793, 0.010118484497070312, 0.010985612869262695, 0.011852741241455078, 0.012719869613647461, 0.013586997985839844, 0.014454126358032227, 0.01532125473022461, 0.016188383102416992, 0.017055511474609375, 0.017922639846801758, 0.01878976821899414, 0.019656896591186523, 0.020524024963378906, 0.02139115333557129, 0.022258281707763672, 0.023125410079956055, 0.023992538452148438, 0.02485966682434082, 0.025726795196533203, 0.026593923568725586, 0.02746105194091797, 0.02832818031311035, 0.029195308685302734, 0.030062437057495117, 0.0309295654296875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 2.0, 8.0, 8.0, 8.0, 9.0, 9.0, 13.0, 18.0, 14.0, 15.0, 23.0, 21.0, 16.0, 25.0, 25.0, 33.0, 36.0, 30.0, 38.0, 38.0, 37.0, 40.0, 43.0, 40.0, 33.0, 31.0, 34.0, 56.0, 25.0, 30.0, 38.0, 28.0, 20.0, 20.0, 19.0, 17.0, 18.0, 17.0, 15.0, 10.0, 10.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0], "bins": [-0.01488494873046875, -0.014469146728515625, -0.0140533447265625, -0.013637542724609375, -0.01322174072265625, -0.012805938720703125, -0.01239013671875, -0.011974334716796875, -0.01155853271484375, -0.011142730712890625, -0.0107269287109375, -0.010311126708984375, -0.00989532470703125, -0.009479522705078125, -0.009063720703125, -0.008647918701171875, -0.00823211669921875, -0.007816314697265625, -0.0074005126953125, -0.006984710693359375, -0.00656890869140625, -0.006153106689453125, -0.0057373046875, -0.005321502685546875, -0.00490570068359375, -0.004489898681640625, -0.0040740966796875, -0.003658294677734375, -0.00324249267578125, -0.002826690673828125, -0.002410888671875, -0.001995086669921875, -0.00157928466796875, -0.001163482666015625, -0.0007476806640625, -0.000331878662109375, 8.392333984375e-05, 0.000499725341796875, 0.00091552734375, 0.001331329345703125, 0.00174713134765625, 0.002162933349609375, 0.0025787353515625, 0.002994537353515625, 0.00341033935546875, 0.003826141357421875, 0.004241943359375, 0.004657745361328125, 0.00507354736328125, 0.005489349365234375, 0.0059051513671875, 0.006320953369140625, 0.00673675537109375, 0.007152557373046875, 0.007568359375, 0.007984161376953125, 0.00839996337890625, 0.008815765380859375, 0.0092315673828125, 0.009647369384765625, 0.01006317138671875, 0.010478973388671875, 0.010894775390625, 0.011310577392578125, 0.01172637939453125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 10.0, 14.0, 16.0, 25.0, 50.0, 66.0, 83.0, 118.0, 201.0, 367.0, 732.0, 1552.0, 3476.0, 10729.0, 46841.0, 746321.0, 200501.0, 25544.0, 6769.0, 2584.0, 1106.0, 595.0, 307.0, 176.0, 118.0, 72.0, 53.0, 33.0, 28.0, 13.0, 13.0, 9.0, 3.0, 9.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00019037723541259766, -0.00018419884145259857, -0.0001780204474925995, -0.0001718420535326004, -0.00016566365957260132, -0.00015948526561260223, -0.00015330687165260315, -0.00014712847769260406, -0.00014095008373260498, -0.0001347716897726059, -0.0001285932958126068, -0.00012241490185260773, -0.00011623650789260864, -0.00011005811393260956, -0.00010387971997261047, -9.770132601261139e-05, -9.15229320526123e-05, -8.534453809261322e-05, -7.916614413261414e-05, -7.298775017261505e-05, -6.680935621261597e-05, -6.063096225261688e-05, -5.44525682926178e-05, -4.827417433261871e-05, -4.209578037261963e-05, -3.5917386412620544e-05, -2.973899245262146e-05, -2.3560598492622375e-05, -1.738220453262329e-05, -1.1203810572624207e-05, -5.025416612625122e-06, 1.1529773473739624e-06, 7.331371307373047e-06, 1.3509765267372131e-05, 1.9688159227371216e-05, 2.58665531873703e-05, 3.2044947147369385e-05, 3.822334110736847e-05, 4.4401735067367554e-05, 5.058012902736664e-05, 5.675852298736572e-05, 6.293691694736481e-05, 6.911531090736389e-05, 7.529370486736298e-05, 8.147209882736206e-05, 8.765049278736115e-05, 9.382888674736023e-05, 0.00010000728070735931, 0.0001061856746673584, 0.00011236406862735748, 0.00011854246258735657, 0.00012472085654735565, 0.00013089925050735474, 0.00013707764446735382, 0.0001432560384273529, 0.000149434432387352, 0.00015561282634735107, 0.00016179122030735016, 0.00016796961426734924, 0.00017414800822734833, 0.0001803264021873474, 0.0001865047961473465, 0.00019268319010734558, 0.00019886158406734467, 0.00020503997802734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 4.0, 2.0, 10.0, 5.0, 10.0, 10.0, 10.0, 10.0, 17.0, 12.0, 24.0, 34.0, 47.0, 46.0, 60.0, 84.0, 136.0, 109.0, 69.0, 53.0, 50.0, 37.0, 43.0, 20.0, 16.0, 9.0, 20.0, 9.0, 9.0, 8.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8656253814697266e-05, -1.8149614334106445e-05, -1.7642974853515625e-05, -1.7136335372924805e-05, -1.6629695892333984e-05, -1.6123056411743164e-05, -1.5616416931152344e-05, -1.5109777450561523e-05, -1.4603137969970703e-05, -1.4096498489379883e-05, -1.3589859008789062e-05, -1.3083219528198242e-05, -1.2576580047607422e-05, -1.2069940567016602e-05, -1.1563301086425781e-05, -1.1056661605834961e-05, -1.055002212524414e-05, -1.004338264465332e-05, -9.5367431640625e-06, -9.03010368347168e-06, -8.52346420288086e-06, -8.016824722290039e-06, -7.510185241699219e-06, -7.0035457611083984e-06, -6.496906280517578e-06, -5.990266799926758e-06, -5.4836273193359375e-06, -4.976987838745117e-06, -4.470348358154297e-06, -3.9637088775634766e-06, -3.4570693969726562e-06, -2.950429916381836e-06, -2.4437904357910156e-06, -1.9371509552001953e-06, -1.430511474609375e-06, -9.238719940185547e-07, -4.172325134277344e-07, 8.940696716308594e-08, 5.960464477539062e-07, 1.1026859283447266e-06, 1.6093254089355469e-06, 2.115964889526367e-06, 2.6226043701171875e-06, 3.129243850708008e-06, 3.635883331298828e-06, 4.1425228118896484e-06, 4.649162292480469e-06, 5.155801773071289e-06, 5.662441253662109e-06, 6.16908073425293e-06, 6.67572021484375e-06, 7.18235969543457e-06, 7.68899917602539e-06, 8.195638656616211e-06, 8.702278137207031e-06, 9.208917617797852e-06, 9.715557098388672e-06, 1.0222196578979492e-05, 1.0728836059570312e-05, 1.1235475540161133e-05, 1.1742115020751953e-05, 1.2248754501342773e-05, 1.2755393981933594e-05, 1.3262033462524414e-05, 1.3768672943115234e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 13.0, 15.0, 27.0, 57.0, 92.0, 159.0, 323.0, 645.0, 1552.0, 4290.0, 14916.0, 76702.0, 803787.0, 117586.0, 19535.0, 5353.0, 1912.0, 773.0, 345.0, 152.0, 87.0, 60.0, 37.0, 33.0, 18.0, 16.0, 14.0, 2.0, 2.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021064281463623047, -0.00020397640764713287, -0.00019731000065803528, -0.00019064359366893768, -0.0001839771866798401, -0.0001773107796907425, -0.0001706443727016449, -0.0001639779657125473, -0.0001573115587234497, -0.0001506451517343521, -0.00014397874474525452, -0.00013731233775615692, -0.00013064593076705933, -0.00012397952377796173, -0.00011731311678886414, -0.00011064670979976654, -0.00010398030281066895, -9.731389582157135e-05, -9.064748883247375e-05, -8.398108184337616e-05, -7.731467485427856e-05, -7.064826786518097e-05, -6.398186087608337e-05, -5.731545388698578e-05, -5.0649046897888184e-05, -4.398263990879059e-05, -3.731623291969299e-05, -3.06498259305954e-05, -2.3983418941497803e-05, -1.7317011952400208e-05, -1.0650604963302612e-05, -3.984197974205017e-06, 2.682209014892578e-06, 9.348616003990173e-06, 1.601502299308777e-05, 2.2681429982185364e-05, 2.934783697128296e-05, 3.6014243960380554e-05, 4.268065094947815e-05, 4.9347057938575745e-05, 5.601346492767334e-05, 6.267987191677094e-05, 6.934627890586853e-05, 7.601268589496613e-05, 8.267909288406372e-05, 8.934549987316132e-05, 9.601190686225891e-05, 0.0001026783138513565, 0.0001093447208404541, 0.0001160111278295517, 0.0001226775348186493, 0.0001293439418077469, 0.00013601034879684448, 0.00014267675578594208, 0.00014934316277503967, 0.00015600956976413727, 0.00016267597675323486, 0.00016934238374233246, 0.00017600879073143005, 0.00018267519772052765, 0.00018934160470962524, 0.00019600801169872284, 0.00020267441868782043, 0.00020934082567691803, 0.00021600723266601562]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 2.0, 3.0, 13.0, 8.0, 15.0, 18.0, 18.0, 15.0, 22.0, 30.0, 34.0, 46.0, 47.0, 51.0, 58.0, 77.0, 80.0, 58.0, 56.0, 71.0, 52.0, 42.0, 30.0, 20.0, 23.0, 29.0, 18.0, 9.0, 9.0, 6.0, 5.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00010389089584350586, -0.00010070577263832092, -9.752064943313599e-05, -9.433552622795105e-05, -9.115040302276611e-05, -8.796527981758118e-05, -8.478015661239624e-05, -8.15950334072113e-05, -7.840991020202637e-05, -7.522478699684143e-05, -7.20396637916565e-05, -6.885454058647156e-05, -6.566941738128662e-05, -6.248429417610168e-05, -5.929917097091675e-05, -5.611404776573181e-05, -5.2928924560546875e-05, -4.974380135536194e-05, -4.6558678150177e-05, -4.3373554944992065e-05, -4.018843173980713e-05, -3.700330853462219e-05, -3.3818185329437256e-05, -3.063306212425232e-05, -2.7447938919067383e-05, -2.4262815713882446e-05, -2.107769250869751e-05, -1.7892569303512573e-05, -1.4707446098327637e-05, -1.15223228931427e-05, -8.337199687957764e-06, -5.152076482772827e-06, -1.9669532775878906e-06, 1.218169927597046e-06, 4.403293132781982e-06, 7.588416337966919e-06, 1.0773539543151855e-05, 1.3958662748336792e-05, 1.714378595352173e-05, 2.0328909158706665e-05, 2.35140323638916e-05, 2.6699155569076538e-05, 2.9884278774261475e-05, 3.306940197944641e-05, 3.625452518463135e-05, 3.9439648389816284e-05, 4.262477159500122e-05, 4.580989480018616e-05, 4.8995018005371094e-05, 5.218014121055603e-05, 5.536526441574097e-05, 5.85503876209259e-05, 6.173551082611084e-05, 6.492063403129578e-05, 6.810575723648071e-05, 7.129088044166565e-05, 7.447600364685059e-05, 7.766112685203552e-05, 8.084625005722046e-05, 8.40313732624054e-05, 8.721649646759033e-05, 9.040161967277527e-05, 9.35867428779602e-05, 9.677186608314514e-05, 9.995698928833008e-05]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 7.0, 5.0, 10.0, 16.0, 13.0, 22.0, 28.0, 38.0, 62.0, 88.0, 184.0, 197.0, 90.0, 60.0, 38.0, 30.0, 22.0, 21.0, 19.0, 8.0, 6.0, 10.0, 5.0, 7.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.12331752479076385, -0.1196894645690918, -0.11606140434741974, -0.11243334412574768, -0.10880528390407562, -0.10517722368240356, -0.10154915601015091, -0.09792109578847885, -0.0942930355668068, -0.09066497534513474, -0.08703691512346268, -0.08340885490179062, -0.07978078722953796, -0.0761527270078659, -0.07252466678619385, -0.06889660656452179, -0.06526854634284973, -0.06164048612117767, -0.058012425899505615, -0.05438436195254326, -0.0507563017308712, -0.04712824150919914, -0.043500177562236786, -0.03987211734056473, -0.03624405711889267, -0.03261599689722061, -0.028987934812903404, -0.025359872728586197, -0.02173181250691414, -0.01810375228524208, -0.014475690200924873, -0.010847628116607666, -0.007219560444355011, -0.0035914992913603783, 3.6561861634254456e-05, 0.003664623014628887, 0.00729268416762352, 0.010920744389295578, 0.014548806473612785, 0.018176868557929993, 0.02180492877960205, 0.02543298900127411, 0.029061051085591316, 0.032689113169908524, 0.03631717339158058, 0.03994523361325264, 0.043573297560214996, 0.047201357781887054, 0.05082941800355911, 0.05445747822523117, 0.05808553844690323, 0.061713602393865585, 0.06534166634082794, 0.0689697265625, 0.07259778678417206, 0.07622584700584412, 0.07985390722751617, 0.08348196744918823, 0.08711002767086029, 0.09073808789253235, 0.0943661481142044, 0.09799420833587646, 0.10162227600812912, 0.10525033622980118, 0.10887839645147324]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 13.0, 12.0, 14.0, 15.0, 19.0, 25.0, 19.0, 37.0, 36.0, 30.0, 48.0, 42.0, 58.0, 52.0, 61.0, 60.0, 64.0, 55.0, 53.0, 36.0, 40.0, 37.0, 30.0, 29.0, 26.0, 17.0, 16.0, 12.0, 12.0, 8.0, 9.0, 5.0, 6.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07691287994384766, -0.07434757053852081, -0.07178226858377457, -0.06921695917844772, -0.06665165722370148, -0.06408634781837463, -0.06152103841304779, -0.058955732733011246, -0.0563904270529747, -0.053825121372938156, -0.05125981569290161, -0.04869450628757477, -0.04612920060753822, -0.04356389492750168, -0.040998585522174835, -0.03843327984213829, -0.035867974162101746, -0.0333026684820652, -0.030737360939383507, -0.028172053396701813, -0.025606747716665268, -0.023041442036628723, -0.02047613449394703, -0.017910826951265335, -0.01534552127122879, -0.012780214659869671, -0.010214908048510551, -0.007649601437151432, -0.005084294825792313, -0.002518988214433193, 4.631839692592621e-05, 0.0026116259396076202, 0.005176931619644165, 0.0077422382310032845, 0.010307544842362404, 0.012872851453721523, 0.015438158065080643, 0.018003463745117188, 0.02056877128779888, 0.023134078830480576, 0.02569938451051712, 0.028264690190553665, 0.03082999773323536, 0.03339530527591705, 0.0359606109559536, 0.03852591663599014, 0.041091226041316986, 0.04365653172135353, 0.046221837401390076, 0.04878714308142662, 0.051352448761463165, 0.05391775816679001, 0.05648306384682655, 0.0590483695268631, 0.06161367893218994, 0.06417898833751678, 0.06674429029226303, 0.06930959969758987, 0.07187490165233612, 0.07444021105766296, 0.07700552046298981, 0.07957082241773605, 0.0821361318230629, 0.08470143377780914, 0.08726674318313599]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 2.0, 6.0, 5.0, 11.0, 23.0, 30.0, 61.0, 121.0, 276.0, 779.0, 3012.0, 4183585.0, 4618.0, 1100.0, 321.0, 151.0, 81.0, 54.0, 19.0, 10.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.08831787109375, -0.08629274368286133, -0.08426761627197266, -0.08224248886108398, -0.08021736145019531, -0.07819223403930664, -0.07616710662841797, -0.0741419792175293, -0.07211685180664062, -0.07009172439575195, -0.06806659698486328, -0.06604146957397461, -0.06401634216308594, -0.061991214752197266, -0.059966087341308594, -0.05794095993041992, -0.05591583251953125, -0.05389070510864258, -0.051865577697753906, -0.049840450286865234, -0.04781532287597656, -0.04579019546508789, -0.04376506805419922, -0.04173994064331055, -0.039714813232421875, -0.0376896858215332, -0.03566455841064453, -0.03363943099975586, -0.03161430358886719, -0.029589176177978516, -0.027564048767089844, -0.025538921356201172, -0.0235137939453125, -0.021488666534423828, -0.019463539123535156, -0.017438411712646484, -0.015413284301757812, -0.01338815689086914, -0.011363029479980469, -0.009337902069091797, -0.007312774658203125, -0.005287647247314453, -0.0032625198364257812, -0.0012373924255371094, 0.0007877349853515625, 0.0028128623962402344, 0.004837989807128906, 0.006863117218017578, 0.00888824462890625, 0.010913372039794922, 0.012938499450683594, 0.014963626861572266, 0.016988754272460938, 0.01901388168334961, 0.02103900909423828, 0.023064136505126953, 0.025089263916015625, 0.027114391326904297, 0.02913951873779297, 0.03116464614868164, 0.03318977355957031, 0.035214900970458984, 0.037240028381347656, 0.03926515579223633, 0.041290283203125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 2.0, 13.0, 20.0, 29.0, 45.0, 57.0, 119.0, 156.0, 148.0, 129.0, 106.0, 62.0, 46.0, 34.0, 17.0, 13.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01268768310546875, -0.01239544153213501, -0.01210319995880127, -0.01181095838546753, -0.011518716812133789, -0.011226475238800049, -0.010934233665466309, -0.010641992092132568, -0.010349750518798828, -0.010057508945465088, -0.009765267372131348, -0.009473025798797607, -0.009180784225463867, -0.008888542652130127, -0.008596301078796387, -0.008304059505462646, -0.008011817932128906, -0.007719576358795166, -0.007427334785461426, -0.0071350932121276855, -0.006842851638793945, -0.006550610065460205, -0.006258368492126465, -0.005966126918792725, -0.005673885345458984, -0.005381643772125244, -0.005089402198791504, -0.004797160625457764, -0.0045049190521240234, -0.004212677478790283, -0.003920435905456543, -0.0036281943321228027, -0.0033359527587890625, -0.0030437111854553223, -0.002751469612121582, -0.002459228038787842, -0.0021669864654541016, -0.0018747448921203613, -0.001582503318786621, -0.0012902617454528809, -0.0009980201721191406, -0.0007057785987854004, -0.00041353702545166016, -0.00012129545211791992, 0.0001709461212158203, 0.00046318769454956055, 0.0007554292678833008, 0.001047670841217041, 0.0013399124145507812, 0.0016321539878845215, 0.0019243955612182617, 0.002216637134552002, 0.002508878707885742, 0.0028011202812194824, 0.0030933618545532227, 0.003385603427886963, 0.003677845001220703, 0.003970086574554443, 0.004262328147888184, 0.004554569721221924, 0.004846811294555664, 0.005139052867889404, 0.0054312944412231445, 0.005723536014556885, 0.006015777587890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 3.0, 3.0, 6.0, 7.0, 27.0, 24.0, 32.0, 49.0, 71.0, 102.0, 163.0, 278.0, 476.0, 1145.0, 3562.0, 24316.0, 4155127.0, 5707.0, 1655.0, 658.0, 326.0, 204.0, 117.0, 69.0, 54.0, 31.0, 31.0, 11.0, 12.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0217437744140625, -0.020763635635375977, -0.019783496856689453, -0.01880335807800293, -0.017823219299316406, -0.016843080520629883, -0.01586294174194336, -0.014882802963256836, -0.013902664184570312, -0.012922525405883789, -0.011942386627197266, -0.010962247848510742, -0.009982109069824219, -0.009001970291137695, -0.008021831512451172, -0.0070416927337646484, -0.006061553955078125, -0.0050814151763916016, -0.004101276397705078, -0.0031211376190185547, -0.0021409988403320312, -0.0011608600616455078, -0.00018072128295898438, 0.0007994174957275391, 0.0017795562744140625, 0.002759695053100586, 0.0037398338317871094, 0.004719972610473633, 0.005700111389160156, 0.00668025016784668, 0.007660388946533203, 0.008640527725219727, 0.00962066650390625, 0.010600805282592773, 0.011580944061279297, 0.01256108283996582, 0.013541221618652344, 0.014521360397338867, 0.01550149917602539, 0.016481637954711914, 0.017461776733398438, 0.01844191551208496, 0.019422054290771484, 0.020402193069458008, 0.02138233184814453, 0.022362470626831055, 0.023342609405517578, 0.0243227481842041, 0.025302886962890625, 0.02628302574157715, 0.027263164520263672, 0.028243303298950195, 0.02922344207763672, 0.030203580856323242, 0.031183719635009766, 0.03216385841369629, 0.03314399719238281, 0.034124135971069336, 0.03510427474975586, 0.03608441352844238, 0.037064552307128906, 0.03804469108581543, 0.03902482986450195, 0.04000496864318848, 0.040985107421875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 0.0, 2.0, 11.0, 37.0, 3955.0, 33.0, 14.0, 6.0, 2.0, 1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009918212890625, -0.009700655937194824, -0.009483098983764648, -0.009265542030334473, -0.009047985076904297, -0.008830428123474121, -0.008612871170043945, -0.00839531421661377, -0.008177757263183594, -0.007960200309753418, -0.007742643356323242, -0.007525086402893066, -0.007307529449462891, -0.007089972496032715, -0.006872415542602539, -0.006654858589172363, -0.0064373016357421875, -0.006219744682312012, -0.006002187728881836, -0.00578463077545166, -0.005567073822021484, -0.005349516868591309, -0.005131959915161133, -0.004914402961730957, -0.004696846008300781, -0.0044792890548706055, -0.00426173210144043, -0.004044175148010254, -0.003826618194580078, -0.0036090612411499023, -0.0033915042877197266, -0.0031739473342895508, -0.002956390380859375, -0.0027388334274291992, -0.0025212764739990234, -0.0023037195205688477, -0.002086162567138672, -0.001868605613708496, -0.0016510486602783203, -0.0014334917068481445, -0.0012159347534179688, -0.000998377799987793, -0.0007808208465576172, -0.0005632638931274414, -0.0003457069396972656, -0.00012814998626708984, 8.940696716308594e-05, 0.0003069639205932617, 0.0005245208740234375, 0.0007420778274536133, 0.0009596347808837891, 0.0011771917343139648, 0.0013947486877441406, 0.0016123056411743164, 0.0018298625946044922, 0.002047419548034668, 0.0022649765014648438, 0.0024825334548950195, 0.0027000904083251953, 0.002917647361755371, 0.003135204315185547, 0.0033527612686157227, 0.0035703182220458984, 0.0037878751754760742, 0.00400543212890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 12.0, 11.0, 32.0, 36.0, 55.0, 86.0, 195.0, 286.0, 105.0, 65.0, 36.0, 23.0, 19.0, 9.0, 5.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.032492250204086304, -0.03175739571452141, -0.031022541224956512, -0.030287686735391617, -0.02955283224582672, -0.028817977756261826, -0.02808312326669693, -0.027348268777132034, -0.02661341428756714, -0.025878559798002243, -0.025143705308437347, -0.024408850818872452, -0.023673996329307556, -0.02293914183974266, -0.022204287350177765, -0.02146943286061287, -0.020734576508402824, -0.01999972201883793, -0.019264867529273033, -0.018530013039708138, -0.017795158550143242, -0.017060304060578346, -0.0163254477083683, -0.01559059415012598, -0.014855739660561085, -0.014120885170996189, -0.013386030681431293, -0.012651175260543823, -0.011916320770978928, -0.011181466281414032, -0.010446611791849136, -0.00971175730228424, -0.00897690374404192, -0.008242049254477024, -0.0075071947649121284, -0.0067723398096859455, -0.00603748532012105, -0.005302630830556154, -0.004567775875329971, -0.0038329213857650757, -0.00309806689620018, -0.0023632124066352844, -0.0016283576842397451, -0.0008935029618442059, -0.00015864847227931023, 0.0005762060172855854, 0.0013110609725117683, 0.002045915462076664, 0.0027807699516415596, 0.0035156244412064552, 0.004250478930771351, 0.004985333885997534, 0.005720188375562429, 0.006455042865127325, 0.007189897820353508, 0.007924752309918404, 0.0086596067994833, 0.009394461289048195, 0.01012931577861309, 0.010864170268177986, 0.011599024757742882, 0.012333879247307777, 0.013068734668195248, 0.013803589157760143, 0.014538443647325039]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 16.0, 17.0, 24.0, 33.0, 41.0, 46.0, 74.0, 92.0, 73.0, 94.0, 86.0, 77.0, 70.0, 61.0, 55.0, 49.0, 28.0, 19.0, 13.0, 7.0, 7.0, 5.0, 8.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016002535820007324, -0.015486223623156548, -0.014969911426305771, -0.014453599229454994, -0.013937287032604218, -0.01342097483575344, -0.012904662638902664, -0.012388350442051888, -0.01187203824520111, -0.011355726048350334, -0.010839413851499557, -0.01032310165464878, -0.009806789457798004, -0.009290477260947227, -0.00877416506409645, -0.008257852867245674, -0.0077415406703948975, -0.007225228473544121, -0.006708916276693344, -0.0061926040798425674, -0.005676291882991791, -0.005159979686141014, -0.004643667489290237, -0.004127355292439461, -0.003611043095588684, -0.0030947308987379074, -0.0025784187018871307, -0.002062106505036354, -0.0015457943081855774, -0.0010294821113348007, -0.000513169914484024, 3.1422823667526245e-06, 0.0005194544792175293, 0.001035766676068306, 0.0015520788729190826, 0.0020683910697698593, 0.002584703266620636, 0.0031010154634714127, 0.0036173276603221893, 0.004133639857172966, 0.004649952054023743, 0.005166264250874519, 0.005682576447725296, 0.006198888644576073, 0.006715200841426849, 0.007231513038277626, 0.007747825235128403, 0.00826413743197918, 0.008780449628829956, 0.009296761825680733, 0.00981307402253151, 0.010329386219382286, 0.010845698416233063, 0.01136201061308384, 0.011878322809934616, 0.012394635006785393, 0.01291094720363617, 0.013427259400486946, 0.013943571597337723, 0.0144598837941885, 0.014976195991039276, 0.015492508187890053, 0.01600882038474083, 0.016525132581591606, 0.017041444778442383]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 4.0, 6.0, 4.0, 7.0, 13.0, 8.0, 15.0, 24.0, 31.0, 42.0, 80.0, 130.0, 229.0, 574.0, 1588.0, 5980.0, 35461.0, 662902.0, 309768.0, 24720.0, 4656.0, 1275.0, 434.0, 215.0, 125.0, 78.0, 53.0, 44.0, 22.0, 18.0, 7.0, 11.0, 14.0, 3.0, 5.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0390625, -0.037428855895996094, -0.03579521179199219, -0.03416156768798828, -0.032527923583984375, -0.03089427947998047, -0.029260635375976562, -0.027626991271972656, -0.02599334716796875, -0.024359703063964844, -0.022726058959960938, -0.02109241485595703, -0.019458770751953125, -0.01782512664794922, -0.016191482543945312, -0.014557838439941406, -0.0129241943359375, -0.011290550231933594, -0.009656906127929688, -0.008023262023925781, -0.006389617919921875, -0.004755973815917969, -0.0031223297119140625, -0.0014886856079101562, 0.00014495849609375, 0.0017786026000976562, 0.0034122467041015625, 0.005045890808105469, 0.006679534912109375, 0.008313179016113281, 0.009946823120117188, 0.011580467224121094, 0.013214111328125, 0.014847755432128906, 0.016481399536132812, 0.01811504364013672, 0.019748687744140625, 0.02138233184814453, 0.023015975952148438, 0.024649620056152344, 0.02628326416015625, 0.027916908264160156, 0.029550552368164062, 0.03118419647216797, 0.032817840576171875, 0.03445148468017578, 0.03608512878417969, 0.037718772888183594, 0.0393524169921875, 0.040986061096191406, 0.04261970520019531, 0.04425334930419922, 0.045886993408203125, 0.04752063751220703, 0.04915428161621094, 0.050787925720214844, 0.05242156982421875, 0.054055213928222656, 0.05568885803222656, 0.05732250213623047, 0.058956146240234375, 0.06058979034423828, 0.06222343444824219, 0.0638570785522461, 0.06549072265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 12.0, 19.0, 28.0, 41.0, 58.0, 118.0, 152.0, 148.0, 135.0, 107.0, 63.0, 46.0, 36.0, 18.0, 13.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01274871826171875, -0.012455523014068604, -0.012162327766418457, -0.01186913251876831, -0.011575937271118164, -0.011282742023468018, -0.010989546775817871, -0.010696351528167725, -0.010403156280517578, -0.010109961032867432, -0.009816765785217285, -0.009523570537567139, -0.009230375289916992, -0.008937180042266846, -0.0086439847946167, -0.008350789546966553, -0.008057594299316406, -0.00776439905166626, -0.007471203804016113, -0.007178008556365967, -0.00688481330871582, -0.006591618061065674, -0.006298422813415527, -0.006005227565765381, -0.005712032318115234, -0.005418837070465088, -0.005125641822814941, -0.004832446575164795, -0.0045392513275146484, -0.004246056079864502, -0.0039528608322143555, -0.003659665584564209, -0.0033664703369140625, -0.003073275089263916, -0.0027800798416137695, -0.002486884593963623, -0.0021936893463134766, -0.00190049409866333, -0.0016072988510131836, -0.0013141036033630371, -0.0010209083557128906, -0.0007277131080627441, -0.00043451786041259766, -0.00014132261276245117, 0.0001518726348876953, 0.0004450678825378418, 0.0007382631301879883, 0.0010314583778381348, 0.0013246536254882812, 0.0016178488731384277, 0.0019110441207885742, 0.0022042393684387207, 0.002497434616088867, 0.0027906298637390137, 0.00308382511138916, 0.0033770203590393066, 0.003670215606689453, 0.0039634108543396, 0.004256606101989746, 0.004549801349639893, 0.004842996597290039, 0.0051361918449401855, 0.005429387092590332, 0.0057225823402404785, 0.006015777587890625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 10.0, 5.0, 12.0, 15.0, 23.0, 30.0, 22.0, 40.0, 60.0, 90.0, 169.0, 344.0, 644.0, 1411.0, 3304.0, 8286.0, 23952.0, 87123.0, 645774.0, 209662.0, 44208.0, 13984.0, 5206.0, 2108.0, 969.0, 460.0, 220.0, 150.0, 67.0, 58.0, 32.0, 30.0, 17.0, 9.0, 6.0, 14.0, 8.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0222320556640625, -0.021458864212036133, -0.020685672760009766, -0.0199124813079834, -0.01913928985595703, -0.018366098403930664, -0.017592906951904297, -0.01681971549987793, -0.016046524047851562, -0.015273332595825195, -0.014500141143798828, -0.013726949691772461, -0.012953758239746094, -0.012180566787719727, -0.01140737533569336, -0.010634183883666992, -0.009860992431640625, -0.009087800979614258, -0.00831460952758789, -0.0075414180755615234, -0.006768226623535156, -0.005995035171508789, -0.005221843719482422, -0.004448652267456055, -0.0036754608154296875, -0.0029022693634033203, -0.002129077911376953, -0.001355886459350586, -0.0005826950073242188, 0.00019049644470214844, 0.0009636878967285156, 0.0017368793487548828, 0.00251007080078125, 0.003283262252807617, 0.004056453704833984, 0.0048296451568603516, 0.005602836608886719, 0.006376028060913086, 0.007149219512939453, 0.00792241096496582, 0.008695602416992188, 0.009468793869018555, 0.010241985321044922, 0.011015176773071289, 0.011788368225097656, 0.012561559677124023, 0.01333475112915039, 0.014107942581176758, 0.014881134033203125, 0.015654325485229492, 0.01642751693725586, 0.017200708389282227, 0.017973899841308594, 0.01874709129333496, 0.019520282745361328, 0.020293474197387695, 0.021066665649414062, 0.02183985710144043, 0.022613048553466797, 0.023386240005493164, 0.02415943145751953, 0.0249326229095459, 0.025705814361572266, 0.026479005813598633, 0.027252197265625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 6.0, 3.0, 5.0, 8.0, 13.0, 6.0, 11.0, 13.0, 20.0, 20.0, 27.0, 18.0, 25.0, 25.0, 33.0, 36.0, 44.0, 51.0, 46.0, 42.0, 43.0, 34.0, 37.0, 32.0, 49.0, 44.0, 43.0, 27.0, 36.0, 31.0, 27.0, 27.0, 13.0, 15.0, 16.0, 19.0, 15.0, 9.0, 5.0, 10.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.01445770263671875, -0.014046192169189453, -0.013634681701660156, -0.01322317123413086, -0.012811660766601562, -0.012400150299072266, -0.011988639831542969, -0.011577129364013672, -0.011165618896484375, -0.010754108428955078, -0.010342597961425781, -0.009931087493896484, -0.009519577026367188, -0.00910806655883789, -0.008696556091308594, -0.008285045623779297, -0.00787353515625, -0.007462024688720703, -0.007050514221191406, -0.006639003753662109, -0.0062274932861328125, -0.005815982818603516, -0.005404472351074219, -0.004992961883544922, -0.004581451416015625, -0.004169940948486328, -0.0037584304809570312, -0.0033469200134277344, -0.0029354095458984375, -0.0025238990783691406, -0.0021123886108398438, -0.0017008781433105469, -0.00128936767578125, -0.0008778572082519531, -0.00046634674072265625, -5.4836273193359375e-05, 0.0003566741943359375, 0.0007681846618652344, 0.0011796951293945312, 0.0015912055969238281, 0.002002716064453125, 0.002414226531982422, 0.0028257369995117188, 0.0032372474670410156, 0.0036487579345703125, 0.004060268402099609, 0.004471778869628906, 0.004883289337158203, 0.0052947998046875, 0.005706310272216797, 0.006117820739746094, 0.006529331207275391, 0.0069408416748046875, 0.007352352142333984, 0.007763862609863281, 0.008175373077392578, 0.008586883544921875, 0.008998394012451172, 0.009409904479980469, 0.009821414947509766, 0.010232925415039062, 0.01064443588256836, 0.011055946350097656, 0.011467456817626953, 0.01187896728515625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 9.0, 6.0, 11.0, 13.0, 26.0, 30.0, 38.0, 56.0, 70.0, 135.0, 177.0, 269.0, 409.0, 654.0, 1242.0, 2056.0, 4167.0, 9197.0, 25575.0, 112620.0, 768749.0, 84691.0, 21261.0, 8348.0, 3722.0, 2056.0, 1111.0, 668.0, 400.0, 260.0, 163.0, 107.0, 80.0, 51.0, 40.0, 30.0, 17.0, 8.0, 5.0, 8.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.548664093017578e-05, -9.224191308021545e-05, -8.899718523025513e-05, -8.57524573802948e-05, -8.250772953033447e-05, -7.926300168037415e-05, -7.601827383041382e-05, -7.277354598045349e-05, -6.952881813049316e-05, -6.628409028053284e-05, -6.303936243057251e-05, -5.979463458061218e-05, -5.6549906730651855e-05, -5.330517888069153e-05, -5.00604510307312e-05, -4.6815723180770874e-05, -4.357099533081055e-05, -4.032626748085022e-05, -3.708153963088989e-05, -3.3836811780929565e-05, -3.059208393096924e-05, -2.734735608100891e-05, -2.4102628231048584e-05, -2.0857900381088257e-05, -1.761317253112793e-05, -1.4368444681167603e-05, -1.1123716831207275e-05, -7.878988981246948e-06, -4.634261131286621e-06, -1.389533281326294e-06, 1.8551945686340332e-06, 5.09992241859436e-06, 8.344650268554688e-06, 1.1589378118515015e-05, 1.4834105968475342e-05, 1.807883381843567e-05, 2.1323561668395996e-05, 2.4568289518356323e-05, 2.781301736831665e-05, 3.105774521827698e-05, 3.4302473068237305e-05, 3.754720091819763e-05, 4.079192876815796e-05, 4.4036656618118286e-05, 4.728138446807861e-05, 5.052611231803894e-05, 5.377084016799927e-05, 5.7015568017959595e-05, 6.026029586791992e-05, 6.350502371788025e-05, 6.674975156784058e-05, 6.99944794178009e-05, 7.323920726776123e-05, 7.648393511772156e-05, 7.972866296768188e-05, 8.297339081764221e-05, 8.621811866760254e-05, 8.946284651756287e-05, 9.27075743675232e-05, 9.595230221748352e-05, 9.919703006744385e-05, 0.00010244175791740417, 0.0001056864857673645, 0.00010893121361732483, 0.00011217594146728516]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 4.0, 6.0, 5.0, 9.0, 5.0, 17.0, 23.0, 12.0, 22.0, 50.0, 51.0, 99.0, 120.0, 161.0, 126.0, 83.0, 64.0, 35.0, 25.0, 14.0, 15.0, 9.0, 13.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.8656253814697266e-05, -1.8156133592128754e-05, -1.7656013369560242e-05, -1.715589314699173e-05, -1.6655772924423218e-05, -1.6155652701854706e-05, -1.5655532479286194e-05, -1.5155412256717682e-05, -1.465529203414917e-05, -1.4155171811580658e-05, -1.3655051589012146e-05, -1.3154931366443634e-05, -1.2654811143875122e-05, -1.215469092130661e-05, -1.1654570698738098e-05, -1.1154450476169586e-05, -1.0654330253601074e-05, -1.0154210031032562e-05, -9.65408980846405e-06, -9.153969585895538e-06, -8.653849363327026e-06, -8.153729140758514e-06, -7.653608918190002e-06, -7.1534886956214905e-06, -6.6533684730529785e-06, -6.1532482504844666e-06, -5.653128027915955e-06, -5.153007805347443e-06, -4.652887582778931e-06, -4.152767360210419e-06, -3.6526471376419067e-06, -3.1525269150733948e-06, -2.652406692504883e-06, -2.152286469936371e-06, -1.6521662473678589e-06, -1.152046024799347e-06, -6.51925802230835e-07, -1.51805579662323e-07, 3.4831464290618896e-07, 8.484348654747009e-07, 1.3485550880432129e-06, 1.8486753106117249e-06, 2.348795533180237e-06, 2.8489157557487488e-06, 3.3490359783172607e-06, 3.849156200885773e-06, 4.349276423454285e-06, 4.849396646022797e-06, 5.349516868591309e-06, 5.8496370911598206e-06, 6.3497573137283325e-06, 6.8498775362968445e-06, 7.3499977588653564e-06, 7.850117981433868e-06, 8.35023820400238e-06, 8.850358426570892e-06, 9.350478649139404e-06, 9.850598871707916e-06, 1.0350719094276428e-05, 1.085083931684494e-05, 1.1350959539413452e-05, 1.1851079761981964e-05, 1.2351199984550476e-05, 1.2851320207118988e-05, 1.33514404296875e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 11.0, 12.0, 24.0, 27.0, 45.0, 107.0, 195.0, 446.0, 1336.0, 4693.0, 25701.0, 896418.0, 105299.0, 10410.0, 2446.0, 764.0, 287.0, 125.0, 78.0, 54.0, 18.0, 20.0, 12.0, 5.0, 8.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032806396484375, -0.0003188885748386383, -0.0003097131848335266, -0.0003005377948284149, -0.0002913624048233032, -0.00028218701481819153, -0.00027301162481307983, -0.00026383623480796814, -0.00025466084480285645, -0.00024548545479774475, -0.00023631006479263306, -0.00022713467478752136, -0.00021795928478240967, -0.00020878389477729797, -0.00019960850477218628, -0.00019043311476707458, -0.0001812577247619629, -0.0001720823347568512, -0.0001629069447517395, -0.0001537315547466278, -0.0001445561647415161, -0.00013538077473640442, -0.00012620538473129272, -0.00011702999472618103, -0.00010785460472106934, -9.867921471595764e-05, -8.950382471084595e-05, -8.032843470573425e-05, -7.115304470062256e-05, -6.197765469551086e-05, -5.280226469039917e-05, -4.3626874685287476e-05, -3.445148468017578e-05, -2.5276094675064087e-05, -1.6100704669952393e-05, -6.925314664840698e-06, 2.250075340270996e-06, 1.142546534538269e-05, 2.0600855350494385e-05, 2.977624535560608e-05, 3.8951635360717773e-05, 4.812702536582947e-05, 5.730241537094116e-05, 6.647780537605286e-05, 7.565319538116455e-05, 8.482858538627625e-05, 9.400397539138794e-05, 0.00010317936539649963, 0.00011235475540161133, 0.00012153014540672302, 0.00013070553541183472, 0.0001398809254169464, 0.0001490563154220581, 0.0001582317054271698, 0.0001674070954322815, 0.0001765824854373932, 0.00018575787544250488, 0.00019493326544761658, 0.00020410865545272827, 0.00021328404545783997, 0.00022245943546295166, 0.00023163482546806335, 0.00024081021547317505, 0.00024998560547828674, 0.00025916099548339844]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 2.0, 7.0, 14.0, 6.0, 10.0, 13.0, 11.0, 25.0, 30.0, 51.0, 93.0, 166.0, 209.0, 118.0, 81.0, 48.0, 34.0, 16.0, 24.0, 15.0, 4.0, 8.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013828277587890625, -0.0001334063708782196, -0.00012852996587753296, -0.0001236535608768463, -0.00011877715587615967, -0.00011390075087547302, -0.00010902434587478638, -0.00010414794087409973, -9.927153587341309e-05, -9.439513087272644e-05, -8.95187258720398e-05, -8.464232087135315e-05, -7.97659158706665e-05, -7.488951086997986e-05, -7.001310586929321e-05, -6.513670086860657e-05, -6.026029586791992e-05, -5.5383890867233276e-05, -5.050748586654663e-05, -4.5631080865859985e-05, -4.075467586517334e-05, -3.5878270864486694e-05, -3.100186586380005e-05, -2.6125460863113403e-05, -2.1249055862426758e-05, -1.6372650861740112e-05, -1.1496245861053467e-05, -6.619840860366821e-06, -1.7434358596801758e-06, 3.1329691410064697e-06, 8.009374141693115e-06, 1.288577914237976e-05, 1.7762184143066406e-05, 2.2638589143753052e-05, 2.7514994144439697e-05, 3.239139914512634e-05, 3.726780414581299e-05, 4.2144209146499634e-05, 4.702061414718628e-05, 5.1897019147872925e-05, 5.677342414855957e-05, 6.164982914924622e-05, 6.652623414993286e-05, 7.140263915061951e-05, 7.627904415130615e-05, 8.11554491519928e-05, 8.603185415267944e-05, 9.090825915336609e-05, 9.578466415405273e-05, 0.00010066106915473938, 0.00010553747415542603, 0.00011041387915611267, 0.00011529028415679932, 0.00012016668915748596, 0.0001250430941581726, 0.00012991949915885925, 0.0001347959041595459, 0.00013967230916023254, 0.0001445487141609192, 0.00014942511916160583, 0.00015430152416229248, 0.00015917792916297913, 0.00016405433416366577, 0.00016893073916435242, 0.00017380714416503906]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 5.0, 5.0, 9.0, 9.0, 10.0, 22.0, 29.0, 22.0, 32.0, 68.0, 108.0, 203.0, 139.0, 95.0, 70.0, 36.0, 41.0, 26.0, 20.0, 13.0, 12.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09341301023960114, -0.08993567526340485, -0.08645833283662796, -0.08298099040985107, -0.07950365543365479, -0.0760263204574585, -0.07254897803068161, -0.06907163560390472, -0.06559430062770844, -0.06211696192622185, -0.05863962322473526, -0.05516228452324867, -0.051684945821762085, -0.0482076071202755, -0.04473026841878891, -0.04125292971730232, -0.037775591015815735, -0.03429825231432915, -0.03082091361284256, -0.027343574911355972, -0.023866236209869385, -0.020388897508382797, -0.01691155880689621, -0.013434220105409622, -0.009956881403923035, -0.006479542702436447, -0.0030022040009498596, 0.0004751347005367279, 0.003952473402023315, 0.007429812103509903, 0.01090715080499649, 0.014384489506483078, 0.017861828207969666, 0.021339166909456253, 0.02481650561094284, 0.028293844312429428, 0.031771183013916016, 0.0352485217154026, 0.03872586041688919, 0.04220319911837578, 0.045680537819862366, 0.04915787652134895, 0.05263521522283554, 0.05611255392432213, 0.059589892625808716, 0.063067227602005, 0.06654457002878189, 0.07002191245555878, 0.07349924743175507, 0.07697658240795135, 0.08045392483472824, 0.08393126726150513, 0.08740860223770142, 0.0908859372138977, 0.09436327964067459, 0.09784062206745148, 0.10131795704364777, 0.10479529201984406, 0.10827263444662094, 0.11174997687339783, 0.11522731184959412, 0.1187046468257904, 0.12218198925256729, 0.12565933167934418, 0.12913666665554047]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 17.0, 9.0, 16.0, 19.0, 17.0, 32.0, 39.0, 35.0, 44.0, 35.0, 59.0, 82.0, 51.0, 51.0, 59.0, 55.0, 72.0, 38.0, 47.0, 38.0, 49.0, 30.0, 17.0, 26.0, 20.0, 13.0, 12.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05144846439361572, -0.048815228044986725, -0.04618199169635773, -0.04354875534772873, -0.04091551899909973, -0.038282282650470734, -0.035649046301841736, -0.03301580995321274, -0.03038257360458374, -0.027749337255954742, -0.025116100907325745, -0.022482864558696747, -0.01984962821006775, -0.01721639186143875, -0.014583155512809753, -0.011949919164180756, -0.009316682815551758, -0.00668344646692276, -0.004050210118293762, -0.0014169737696647644, 0.0012162625789642334, 0.003849498927593231, 0.006482735276222229, 0.009115971624851227, 0.011749207973480225, 0.014382444322109222, 0.01701568067073822, 0.019648917019367218, 0.022282153367996216, 0.024915389716625214, 0.02754862606525421, 0.03018186241388321, 0.03281509876251221, 0.035448335111141205, 0.0380815714597702, 0.0407148078083992, 0.0433480441570282, 0.045981280505657196, 0.048614516854286194, 0.05124775320291519, 0.05388098955154419, 0.05651422590017319, 0.059147462248802185, 0.06178069859743118, 0.06441393494606018, 0.06704717129468918, 0.06968040764331818, 0.07231364399194717, 0.07494688034057617, 0.07758011668920517, 0.08021335303783417, 0.08284658938646317, 0.08547982573509216, 0.08811306208372116, 0.09074629843235016, 0.09337953478097916, 0.09601277112960815, 0.09864600747823715, 0.10127924382686615, 0.10391248017549515, 0.10654571652412415, 0.10917895287275314, 0.11181218922138214, 0.11444542557001114, 0.11707866191864014]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 12.0, 13.0, 28.0, 36.0, 66.0, 115.0, 241.0, 421.0, 942.0, 2312.0, 9857.0, 3856913.0, 312319.0, 6658.0, 2559.0, 895.0, 416.0, 194.0, 102.0, 49.0, 25.0, 26.0, 17.0, 14.0, 4.0, 5.0, 8.0, 5.0, 1.0, 3.0, 0.0, 4.0, 1.0], "bins": [-0.030670166015625, -0.029955267906188965, -0.02924036979675293, -0.028525471687316895, -0.02781057357788086, -0.027095675468444824, -0.02638077735900879, -0.025665879249572754, -0.02495098114013672, -0.024236083030700684, -0.02352118492126465, -0.022806286811828613, -0.022091388702392578, -0.021376490592956543, -0.020661592483520508, -0.019946694374084473, -0.019231796264648438, -0.018516898155212402, -0.017802000045776367, -0.017087101936340332, -0.016372203826904297, -0.01565730571746826, -0.014942407608032227, -0.014227509498596191, -0.013512611389160156, -0.012797713279724121, -0.012082815170288086, -0.01136791706085205, -0.010653018951416016, -0.00993812084197998, -0.009223222732543945, -0.00850832462310791, -0.007793426513671875, -0.00707852840423584, -0.006363630294799805, -0.0056487321853637695, -0.004933834075927734, -0.004218935966491699, -0.003504037857055664, -0.002789139747619629, -0.0020742416381835938, -0.0013593435287475586, -0.0006444454193115234, 7.045269012451172e-05, 0.0007853507995605469, 0.001500248908996582, 0.002215147018432617, 0.0029300451278686523, 0.0036449432373046875, 0.004359841346740723, 0.005074739456176758, 0.005789637565612793, 0.006504535675048828, 0.007219433784484863, 0.007934331893920898, 0.008649230003356934, 0.009364128112792969, 0.010079026222229004, 0.010793924331665039, 0.011508822441101074, 0.01222372055053711, 0.012938618659973145, 0.01365351676940918, 0.014368414878845215, 0.01508331298828125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 14.0, 17.0, 23.0, 39.0, 58.0, 93.0, 157.0, 144.0, 136.0, 115.0, 69.0, 47.0, 43.0, 22.0, 14.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0120697021484375, -0.011787116527557373, -0.011504530906677246, -0.01122194528579712, -0.010939359664916992, -0.010656774044036865, -0.010374188423156738, -0.010091602802276611, -0.009809017181396484, -0.009526431560516357, -0.00924384593963623, -0.008961260318756104, -0.008678674697875977, -0.00839608907699585, -0.008113503456115723, -0.007830917835235596, -0.007548332214355469, -0.007265746593475342, -0.006983160972595215, -0.006700575351715088, -0.006417989730834961, -0.006135404109954834, -0.005852818489074707, -0.00557023286819458, -0.005287647247314453, -0.005005061626434326, -0.004722476005554199, -0.004439890384674072, -0.004157304763793945, -0.0038747191429138184, -0.0035921335220336914, -0.0033095479011535645, -0.0030269622802734375, -0.0027443766593933105, -0.0024617910385131836, -0.0021792054176330566, -0.0018966197967529297, -0.0016140341758728027, -0.0013314485549926758, -0.0010488629341125488, -0.0007662773132324219, -0.0004836916923522949, -0.00020110607147216797, 8.147954940795898e-05, 0.00036406517028808594, 0.0006466507911682129, 0.0009292364120483398, 0.0012118220329284668, 0.0014944076538085938, 0.0017769932746887207, 0.0020595788955688477, 0.0023421645164489746, 0.0026247501373291016, 0.0029073357582092285, 0.0031899213790893555, 0.0034725069999694824, 0.0037550926208496094, 0.004037678241729736, 0.004320263862609863, 0.00460284948348999, 0.004885435104370117, 0.005168020725250244, 0.005450606346130371, 0.005733191967010498, 0.006015777587890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 6.0, 4.0, 4.0, 6.0, 10.0, 9.0, 32.0, 58.0, 84.0, 111.0, 212.0, 323.0, 637.0, 1036.0, 1805.0, 3388.0, 7177.0, 23617.0, 3731841.0, 393772.0, 17299.0, 5940.0, 2930.0, 1674.0, 865.0, 542.0, 367.0, 205.0, 115.0, 74.0, 38.0, 29.0, 25.0, 18.0, 9.0, 9.0, 8.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.0205230712890625, -0.019995450973510742, -0.019467830657958984, -0.018940210342407227, -0.01841259002685547, -0.01788496971130371, -0.017357349395751953, -0.016829729080200195, -0.016302108764648438, -0.01577448844909668, -0.015246868133544922, -0.014719247817993164, -0.014191627502441406, -0.013664007186889648, -0.01313638687133789, -0.012608766555786133, -0.012081146240234375, -0.011553525924682617, -0.01102590560913086, -0.010498285293579102, -0.009970664978027344, -0.009443044662475586, -0.008915424346923828, -0.00838780403137207, -0.007860183715820312, -0.007332563400268555, -0.006804943084716797, -0.006277322769165039, -0.005749702453613281, -0.0052220821380615234, -0.004694461822509766, -0.004166841506958008, -0.00363922119140625, -0.003111600875854492, -0.0025839805603027344, -0.0020563602447509766, -0.0015287399291992188, -0.001001119613647461, -0.0004734992980957031, 5.412101745605469e-05, 0.0005817413330078125, 0.0011093616485595703, 0.0016369819641113281, 0.002164602279663086, 0.0026922225952148438, 0.0032198429107666016, 0.0037474632263183594, 0.004275083541870117, 0.004802703857421875, 0.005330324172973633, 0.005857944488525391, 0.0063855648040771484, 0.006913185119628906, 0.007440805435180664, 0.007968425750732422, 0.00849604606628418, 0.009023666381835938, 0.009551286697387695, 0.010078907012939453, 0.010606527328491211, 0.011134147644042969, 0.011661767959594727, 0.012189388275146484, 0.012717008590698242, 0.01324462890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 8.0, 9.0, 3.0, 8.0, 18.0, 22.0, 47.0, 195.0, 741.0, 2466.0, 348.0, 91.0, 32.0, 18.0, 14.0, 7.0, 5.0, 2.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.008697509765625, -0.008352041244506836, -0.008006572723388672, -0.007661104202270508, -0.007315635681152344, -0.00697016716003418, -0.006624698638916016, -0.0062792301177978516, -0.0059337615966796875, -0.0055882930755615234, -0.005242824554443359, -0.004897356033325195, -0.004551887512207031, -0.004206418991088867, -0.003860950469970703, -0.003515481948852539, -0.003170013427734375, -0.002824544906616211, -0.002479076385498047, -0.002133607864379883, -0.0017881393432617188, -0.0014426708221435547, -0.0010972023010253906, -0.0007517337799072266, -0.0004062652587890625, -6.079673767089844e-05, 0.0002846717834472656, 0.0006301403045654297, 0.0009756088256835938, 0.0013210773468017578, 0.0016665458679199219, 0.002012014389038086, 0.00235748291015625, 0.002702951431274414, 0.003048419952392578, 0.003393888473510742, 0.0037393569946289062, 0.00408482551574707, 0.004430294036865234, 0.0047757625579833984, 0.0051212310791015625, 0.0054666996002197266, 0.005812168121337891, 0.006157636642456055, 0.006503105163574219, 0.006848573684692383, 0.007194042205810547, 0.007539510726928711, 0.007884979248046875, 0.008230447769165039, 0.008575916290283203, 0.008921384811401367, 0.009266853332519531, 0.009612321853637695, 0.00995779037475586, 0.010303258895874023, 0.010648727416992188, 0.010994195938110352, 0.011339664459228516, 0.01168513298034668, 0.012030601501464844, 0.012376070022583008, 0.012721538543701172, 0.013067007064819336, 0.0134124755859375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 5.0, 12.0, 19.0, 18.0, 26.0, 40.0, 52.0, 59.0, 128.0, 231.0, 115.0, 69.0, 60.0, 22.0, 28.0, 21.0, 17.0, 19.0, 13.0, 9.0, 6.0, 3.0, 2.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.06320729851722717, -0.06151523068547249, -0.059823162853717804, -0.05813109502196312, -0.056439027190208435, -0.05474695935845375, -0.053054891526699066, -0.05136282369494438, -0.0496707558631897, -0.04797868803143501, -0.04628662019968033, -0.044594552367925644, -0.04290248453617096, -0.041210416704416275, -0.03951834887266159, -0.037826281040906906, -0.03613421320915222, -0.03444214537739754, -0.03275007754564285, -0.03105800971388817, -0.029365941882133484, -0.0276738740503788, -0.025981806218624115, -0.02428973838686943, -0.022597670555114746, -0.02090560272336006, -0.019213534891605377, -0.017521467059850693, -0.01582939922809601, -0.014137331396341324, -0.01244526356458664, -0.010753195732831955, -0.009061131626367569, -0.0073690637946128845, -0.0056769959628582, -0.003984928131103516, -0.002292860299348831, -0.0006007924675941467, 0.0010912753641605377, 0.002783343195915222, 0.004475411027669907, 0.006167478859424591, 0.007859546691179276, 0.00955161452293396, 0.011243682354688644, 0.012935750186443329, 0.014627818018198013, 0.016319885849952698, 0.018011953681707382, 0.019704021513462067, 0.02139608934521675, 0.023088157176971436, 0.02478022500872612, 0.026472292840480804, 0.02816436067223549, 0.029856428503990173, 0.03154849633574486, 0.03324056416749954, 0.03493263199925423, 0.03662469983100891, 0.038316767662763596, 0.04000883549451828, 0.041700903326272964, 0.04339297115802765, 0.04508503898978233]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 3.0, 3.0, 5.0, 14.0, 7.0, 8.0, 10.0, 17.0, 11.0, 26.0, 18.0, 23.0, 21.0, 29.0, 35.0, 39.0, 43.0, 48.0, 46.0, 52.0, 36.0, 51.0, 41.0, 49.0, 47.0, 37.0, 28.0, 33.0, 29.0, 21.0, 30.0, 23.0, 23.0, 21.0, 18.0, 14.0, 15.0, 9.0, 7.0, 2.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.030657470226287842, -0.029674887657165527, -0.028692305088043213, -0.0277097225189209, -0.026727139949798584, -0.02574455738067627, -0.024761974811553955, -0.02377939224243164, -0.022796809673309326, -0.02181422710418701, -0.020831644535064697, -0.019849061965942383, -0.01886647939682007, -0.017883896827697754, -0.01690131425857544, -0.015918731689453125, -0.01493614912033081, -0.013953566551208496, -0.012970983982086182, -0.011988401412963867, -0.011005818843841553, -0.010023236274719238, -0.009040653705596924, -0.00805807113647461, -0.007075488567352295, -0.0060929059982299805, -0.005110323429107666, -0.0041277408599853516, -0.003145158290863037, -0.0021625757217407227, -0.0011799931526184082, -0.00019741058349609375, 0.0007851719856262207, 0.0017677545547485352, 0.0027503371238708496, 0.003732919692993164, 0.0047155022621154785, 0.005698084831237793, 0.006680667400360107, 0.007663249969482422, 0.008645832538604736, 0.00962841510772705, 0.010610997676849365, 0.01159358024597168, 0.012576162815093994, 0.013558745384216309, 0.014541327953338623, 0.015523910522460938, 0.016506493091583252, 0.017489075660705566, 0.01847165822982788, 0.019454240798950195, 0.02043682336807251, 0.021419405937194824, 0.02240198850631714, 0.023384571075439453, 0.024367153644561768, 0.025349736213684082, 0.026332318782806396, 0.02731490135192871, 0.028297483921051025, 0.02928006649017334, 0.030262649059295654, 0.03124523162841797, 0.03222781419754028]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 4.0, 9.0, 9.0, 12.0, 22.0, 22.0, 18.0, 27.0, 34.0, 77.0, 148.0, 229.0, 470.0, 1193.0, 3497.0, 15180.0, 96535.0, 793993.0, 113791.0, 17115.0, 3828.0, 1195.0, 461.0, 249.0, 149.0, 66.0, 65.0, 44.0, 26.0, 13.0, 17.0, 12.0, 9.0, 17.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037200927734375, -0.035897254943847656, -0.03459358215332031, -0.03328990936279297, -0.031986236572265625, -0.03068256378173828, -0.029378890991210938, -0.028075218200683594, -0.02677154541015625, -0.025467872619628906, -0.024164199829101562, -0.02286052703857422, -0.021556854248046875, -0.02025318145751953, -0.018949508666992188, -0.017645835876464844, -0.0163421630859375, -0.015038490295410156, -0.013734817504882812, -0.012431144714355469, -0.011127471923828125, -0.009823799133300781, -0.008520126342773438, -0.007216453552246094, -0.00591278076171875, -0.004609107971191406, -0.0033054351806640625, -0.0020017623901367188, -0.000698089599609375, 0.0006055831909179688, 0.0019092559814453125, 0.0032129287719726562, 0.0045166015625, 0.005820274353027344, 0.0071239471435546875, 0.008427619934082031, 0.009731292724609375, 0.011034965515136719, 0.012338638305664062, 0.013642311096191406, 0.01494598388671875, 0.016249656677246094, 0.017553329467773438, 0.01885700225830078, 0.020160675048828125, 0.02146434783935547, 0.022768020629882812, 0.024071693420410156, 0.0253753662109375, 0.026679039001464844, 0.027982711791992188, 0.02928638458251953, 0.030590057373046875, 0.03189373016357422, 0.03319740295410156, 0.034501075744628906, 0.03580474853515625, 0.037108421325683594, 0.03841209411621094, 0.03971576690673828, 0.041019439697265625, 0.04232311248779297, 0.04362678527832031, 0.044930458068847656, 0.046234130859375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 12.0, 16.0, 28.0, 40.0, 58.0, 103.0, 152.0, 146.0, 134.0, 110.0, 69.0, 45.0, 42.0, 22.0, 14.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01202392578125, -0.011742055416107178, -0.011460185050964355, -0.011178314685821533, -0.010896444320678711, -0.010614573955535889, -0.010332703590393066, -0.010050833225250244, -0.009768962860107422, -0.0094870924949646, -0.009205222129821777, -0.008923351764678955, -0.008641481399536133, -0.00835961103439331, -0.008077740669250488, -0.007795870304107666, -0.007513999938964844, -0.0072321295738220215, -0.006950259208679199, -0.006668388843536377, -0.006386518478393555, -0.006104648113250732, -0.00582277774810791, -0.005540907382965088, -0.005259037017822266, -0.004977166652679443, -0.004695296287536621, -0.004413425922393799, -0.0041315555572509766, -0.0038496851921081543, -0.003567814826965332, -0.0032859444618225098, -0.0030040740966796875, -0.0027222037315368652, -0.002440333366394043, -0.0021584630012512207, -0.0018765926361083984, -0.0015947222709655762, -0.001312851905822754, -0.0010309815406799316, -0.0007491111755371094, -0.0004672408103942871, -0.00018537044525146484, 9.649991989135742e-05, 0.0003783702850341797, 0.000660240650177002, 0.0009421110153198242, 0.0012239813804626465, 0.0015058517456054688, 0.001787722110748291, 0.0020695924758911133, 0.0023514628410339355, 0.002633333206176758, 0.00291520357131958, 0.0031970739364624023, 0.0034789443016052246, 0.003760814666748047, 0.004042685031890869, 0.004324555397033691, 0.004606425762176514, 0.004888296127319336, 0.005170166492462158, 0.0054520368576049805, 0.005733907222747803, 0.006015777587890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 4.0, 6.0, 8.0, 17.0, 11.0, 17.0, 17.0, 31.0, 51.0, 66.0, 109.0, 157.0, 262.0, 492.0, 950.0, 1857.0, 3936.0, 8370.0, 19496.0, 52860.0, 213564.0, 602734.0, 90879.0, 29748.0, 11996.0, 5359.0, 2678.0, 1292.0, 645.0, 330.0, 187.0, 132.0, 84.0, 50.0, 37.0, 21.0, 23.0, 16.0, 12.0, 9.0, 9.0, 6.0, 11.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02056884765625, -0.019910097122192383, -0.019251346588134766, -0.01859259605407715, -0.01793384552001953, -0.017275094985961914, -0.016616344451904297, -0.01595759391784668, -0.015298843383789062, -0.014640092849731445, -0.013981342315673828, -0.013322591781616211, -0.012663841247558594, -0.012005090713500977, -0.01134634017944336, -0.010687589645385742, -0.010028839111328125, -0.009370088577270508, -0.00871133804321289, -0.008052587509155273, -0.007393836975097656, -0.006735086441040039, -0.006076335906982422, -0.005417585372924805, -0.0047588348388671875, -0.00410008430480957, -0.003441333770751953, -0.002782583236694336, -0.0021238327026367188, -0.0014650821685791016, -0.0008063316345214844, -0.0001475811004638672, 0.00051116943359375, 0.0011699199676513672, 0.0018286705017089844, 0.0024874210357666016, 0.0031461715698242188, 0.003804922103881836, 0.004463672637939453, 0.00512242317199707, 0.0057811737060546875, 0.006439924240112305, 0.007098674774169922, 0.007757425308227539, 0.008416175842285156, 0.009074926376342773, 0.00973367691040039, 0.010392427444458008, 0.011051177978515625, 0.011709928512573242, 0.01236867904663086, 0.013027429580688477, 0.013686180114746094, 0.014344930648803711, 0.015003681182861328, 0.015662431716918945, 0.016321182250976562, 0.01697993278503418, 0.017638683319091797, 0.018297433853149414, 0.01895618438720703, 0.01961493492126465, 0.020273685455322266, 0.020932435989379883, 0.0215911865234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 3.0, 9.0, 6.0, 8.0, 10.0, 9.0, 13.0, 12.0, 11.0, 14.0, 13.0, 29.0, 28.0, 19.0, 28.0, 31.0, 32.0, 33.0, 36.0, 39.0, 44.0, 34.0, 35.0, 44.0, 42.0, 45.0, 31.0, 37.0, 48.0, 29.0, 33.0, 21.0, 17.0, 26.0, 28.0, 18.0, 12.0, 12.0, 9.0, 9.0, 15.0, 6.0, 6.0, 4.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0126953125, -0.012306928634643555, -0.01191854476928711, -0.011530160903930664, -0.011141777038574219, -0.010753393173217773, -0.010365009307861328, -0.009976625442504883, -0.009588241577148438, -0.009199857711791992, -0.008811473846435547, -0.008423089981079102, -0.008034706115722656, -0.007646322250366211, -0.007257938385009766, -0.00686955451965332, -0.006481170654296875, -0.00609278678894043, -0.005704402923583984, -0.005316019058227539, -0.004927635192871094, -0.0045392513275146484, -0.004150867462158203, -0.003762483596801758, -0.0033740997314453125, -0.002985715866088867, -0.002597332000732422, -0.0022089481353759766, -0.0018205642700195312, -0.001432180404663086, -0.0010437965393066406, -0.0006554126739501953, -0.00026702880859375, 0.00012135505676269531, 0.0005097389221191406, 0.0008981227874755859, 0.0012865066528320312, 0.0016748905181884766, 0.002063274383544922, 0.002451658248901367, 0.0028400421142578125, 0.003228425979614258, 0.003616809844970703, 0.0040051937103271484, 0.004393577575683594, 0.004781961441040039, 0.005170345306396484, 0.00555872917175293, 0.005947113037109375, 0.00633549690246582, 0.006723880767822266, 0.007112264633178711, 0.007500648498535156, 0.007889032363891602, 0.008277416229248047, 0.008665800094604492, 0.009054183959960938, 0.009442567825317383, 0.009830951690673828, 0.010219335556030273, 0.010607719421386719, 0.010996103286743164, 0.01138448715209961, 0.011772871017456055, 0.0121612548828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 7.0, 4.0, 16.0, 17.0, 26.0, 28.0, 53.0, 78.0, 104.0, 160.0, 231.0, 391.0, 605.0, 1056.0, 2071.0, 4793.0, 15846.0, 122320.0, 840176.0, 44127.0, 9253.0, 3364.0, 1554.0, 813.0, 477.0, 295.0, 177.0, 145.0, 87.0, 77.0, 51.0, 28.0, 30.0, 16.0, 22.0, 7.0, 18.0, 5.0, 4.0, 6.0, 3.0, 4.0, 0.0, 1.0], "bins": [-0.00022220611572265625, -0.00021640397608280182, -0.0002106018364429474, -0.00020479969680309296, -0.00019899755716323853, -0.0001931954175233841, -0.00018739327788352966, -0.00018159113824367523, -0.0001757889986038208, -0.00016998685896396637, -0.00016418471932411194, -0.0001583825796842575, -0.00015258044004440308, -0.00014677830040454865, -0.00014097616076469421, -0.00013517402112483978, -0.00012937188148498535, -0.00012356974184513092, -0.00011776760220527649, -0.00011196546256542206, -0.00010616332292556763, -0.0001003611832857132, -9.455904364585876e-05, -8.875690400600433e-05, -8.29547643661499e-05, -7.715262472629547e-05, -7.135048508644104e-05, -6.554834544658661e-05, -5.974620580673218e-05, -5.3944066166877747e-05, -4.8141926527023315e-05, -4.2339786887168884e-05, -3.653764724731445e-05, -3.073550760746002e-05, -2.493336796760559e-05, -1.913122832775116e-05, -1.3329088687896729e-05, -7.526949048042297e-06, -1.7248094081878662e-06, 4.077330231666565e-06, 9.879469871520996e-06, 1.5681609511375427e-05, 2.148374915122986e-05, 2.728588879108429e-05, 3.308802843093872e-05, 3.889016807079315e-05, 4.469230771064758e-05, 5.0494447350502014e-05, 5.6296586990356445e-05, 6.209872663021088e-05, 6.790086627006531e-05, 7.370300590991974e-05, 7.950514554977417e-05, 8.53072851896286e-05, 9.110942482948303e-05, 9.691156446933746e-05, 0.0001027137041091919, 0.00010851584374904633, 0.00011431798338890076, 0.00012012012302875519, 0.00012592226266860962, 0.00013172440230846405, 0.00013752654194831848, 0.0001433286815881729, 0.00014913082122802734]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 2.0, 6.0, 5.0, 7.0, 10.0, 19.0, 16.0, 28.0, 33.0, 67.0, 132.0, 134.0, 158.0, 120.0, 79.0, 58.0, 43.0, 24.0, 10.0, 10.0, 7.0, 5.0, 7.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7418136596679688e-05, -2.6565976440906525e-05, -2.5713816285133362e-05, -2.48616561293602e-05, -2.4009495973587036e-05, -2.3157335817813873e-05, -2.230517566204071e-05, -2.1453015506267548e-05, -2.0600855350494385e-05, -1.9748695194721222e-05, -1.889653503894806e-05, -1.8044374883174896e-05, -1.7192214727401733e-05, -1.634005457162857e-05, -1.5487894415855408e-05, -1.4635734260082245e-05, -1.3783574104309082e-05, -1.293141394853592e-05, -1.2079253792762756e-05, -1.1227093636989594e-05, -1.037493348121643e-05, -9.522773325443268e-06, -8.670613169670105e-06, -7.818453013896942e-06, -6.966292858123779e-06, -6.1141327023506165e-06, -5.261972546577454e-06, -4.409812390804291e-06, -3.557652235031128e-06, -2.705492079257965e-06, -1.8533319234848022e-06, -1.0011717677116394e-06, -1.4901161193847656e-07, 7.031485438346863e-07, 1.5553086996078491e-06, 2.407468855381012e-06, 3.259629011154175e-06, 4.111789166927338e-06, 4.9639493227005005e-06, 5.816109478473663e-06, 6.668269634246826e-06, 7.520429790019989e-06, 8.372589945793152e-06, 9.224750101566315e-06, 1.0076910257339478e-05, 1.092907041311264e-05, 1.1781230568885803e-05, 1.2633390724658966e-05, 1.3485550880432129e-05, 1.4337711036205292e-05, 1.5189871191978455e-05, 1.6042031347751617e-05, 1.689419150352478e-05, 1.7746351659297943e-05, 1.8598511815071106e-05, 1.945067197084427e-05, 2.030283212661743e-05, 2.1154992282390594e-05, 2.2007152438163757e-05, 2.285931259393692e-05, 2.3711472749710083e-05, 2.4563632905483246e-05, 2.541579306125641e-05, 2.626795321702957e-05, 2.7120113372802734e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 6.0, 11.0, 17.0, 29.0, 41.0, 66.0, 134.0, 207.0, 444.0, 927.0, 2134.0, 6855.0, 296182.0, 729632.0, 7596.0, 2305.0, 956.0, 452.0, 257.0, 114.0, 79.0, 43.0, 16.0, 20.0, 10.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007357597351074219, -0.0007147565484046936, -0.0006937533617019653, -0.0006727501749992371, -0.0006517469882965088, -0.0006307438015937805, -0.0006097406148910522, -0.000588737428188324, -0.0005677342414855957, -0.0005467310547828674, -0.0005257278680801392, -0.0005047246813774109, -0.0004837214946746826, -0.00046271830797195435, -0.0004417151212692261, -0.0004207119345664978, -0.00039970874786376953, -0.00037870556116104126, -0.000357702374458313, -0.0003366991877555847, -0.00031569600105285645, -0.0002946928143501282, -0.0002736896276473999, -0.00025268644094467163, -0.00023168325424194336, -0.0002106800675392151, -0.00018967688083648682, -0.00016867369413375854, -0.00014767050743103027, -0.000126667320728302, -0.00010566413402557373, -8.466094732284546e-05, -6.365776062011719e-05, -4.2654573917388916e-05, -2.1651387214660645e-05, -6.48200511932373e-07, 2.03549861907959e-05, 4.135817289352417e-05, 6.236135959625244e-05, 8.336454629898071e-05, 0.00010436773300170898, 0.00012537091970443726, 0.00014637410640716553, 0.0001673772931098938, 0.00018838047981262207, 0.00020938366651535034, 0.0002303868532180786, 0.0002513900399208069, 0.00027239322662353516, 0.00029339641332626343, 0.0003143996000289917, 0.00033540278673171997, 0.00035640597343444824, 0.0003774091601371765, 0.0003984123468399048, 0.00041941553354263306, 0.00044041872024536133, 0.0004614219069480896, 0.00048242509365081787, 0.0005034282803535461, 0.0005244314670562744, 0.0005454346537590027, 0.000566437840461731, 0.0005874410271644592, 0.0006084442138671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 17.0, 49.0, 133.0, 267.0, 280.0, 139.0, 48.0, 18.0, 8.0, 4.0, 6.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003552436828613281, -0.0003429800271987915, -0.0003307163715362549, -0.00031845271587371826, -0.00030618906021118164, -0.000293925404548645, -0.0002816617488861084, -0.0002693980932235718, -0.00025713443756103516, -0.00024487078189849854, -0.00023260712623596191, -0.0002203434705734253, -0.00020807981491088867, -0.00019581615924835205, -0.00018355250358581543, -0.0001712888479232788, -0.0001590251922607422, -0.00014676153659820557, -0.00013449788093566895, -0.00012223422527313232, -0.0001099705696105957, -9.770691394805908e-05, -8.544325828552246e-05, -7.317960262298584e-05, -6.091594696044922e-05, -4.86522912979126e-05, -3.6388635635375977e-05, -2.4124979972839355e-05, -1.1861324310302734e-05, 4.023313522338867e-07, 1.2665987014770508e-05, 2.492964267730713e-05, 3.719329833984375e-05, 4.945695400238037e-05, 6.172060966491699e-05, 7.398426532745361e-05, 8.624792098999023e-05, 9.851157665252686e-05, 0.00011077523231506348, 0.0001230388879776001, 0.00013530254364013672, 0.00014756619930267334, 0.00015982985496520996, 0.00017209351062774658, 0.0001843571662902832, 0.00019662082195281982, 0.00020888447761535645, 0.00022114813327789307, 0.0002334117889404297, 0.0002456754446029663, 0.00025793910026550293, 0.00027020275592803955, 0.00028246641159057617, 0.0002947300672531128, 0.0003069937229156494, 0.00031925737857818604, 0.00033152103424072266, 0.0003437846899032593, 0.0003560483455657959, 0.0003683120012283325, 0.00038057565689086914, 0.00039283931255340576, 0.0004051029682159424, 0.000417366623878479, 0.0004296302795410156]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 5.0, 8.0, 5.0, 6.0, 13.0, 26.0, 27.0, 34.0, 54.0, 82.0, 127.0, 252.0, 114.0, 48.0, 50.0, 40.0, 23.0, 26.0, 10.0, 9.0, 8.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08876732736825943, -0.08564143627882004, -0.08251554518938065, -0.07938964664936066, -0.07626375555992126, -0.07313786447048187, -0.07001197338104248, -0.06688608229160309, -0.0637601912021637, -0.060634300112724304, -0.057508405297994614, -0.05438251420855522, -0.05125661939382553, -0.04813072830438614, -0.04500483721494675, -0.041878946125507355, -0.038753047585487366, -0.035627156496047974, -0.03250126168131828, -0.02937537059187889, -0.02624947763979435, -0.02312358468770981, -0.019997693598270416, -0.016871800646185875, -0.013745907694101334, -0.010620014742016792, -0.007494122721254826, -0.004368230700492859, -0.0012423377484083176, 0.0018835552036762238, 0.005009446293115616, 0.008135339245200157, 0.011261239647865295, 0.014387132599949837, 0.017513025552034378, 0.02063891664147377, 0.02376480959355831, 0.026890702545642853, 0.030016593635082245, 0.03314248472452164, 0.03626837953925133, 0.03939427062869072, 0.04252016544342041, 0.0456460565328598, 0.048771947622299194, 0.051897842437028885, 0.05502373352646828, 0.05814962834119797, 0.06127551943063736, 0.06440141052007675, 0.06752730160951614, 0.07065320014953613, 0.07377909123897552, 0.07690498232841492, 0.08003087341785431, 0.0831567645072937, 0.0862826555967331, 0.08940854668617249, 0.09253443777561188, 0.09566032886505127, 0.09878622740507126, 0.10191211849451065, 0.10503800958395004, 0.10816390067338943, 0.11128979921340942]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 9.0, 11.0, 19.0, 10.0, 31.0, 33.0, 33.0, 43.0, 47.0, 42.0, 78.0, 50.0, 75.0, 57.0, 65.0, 66.0, 53.0, 55.0, 39.0, 45.0, 22.0, 35.0, 18.0, 14.0, 13.0, 8.0, 9.0, 9.0, 4.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05976712703704834, -0.05738585442304611, -0.055004578083753586, -0.05262330174446106, -0.05024202913045883, -0.047860756516456604, -0.04547948017716408, -0.04309820383787155, -0.040716931223869324, -0.038335658609867096, -0.03595438227057457, -0.03357310593128204, -0.031191833317279816, -0.02881055884063244, -0.02642928436398506, -0.024048009887337685, -0.021666735410690308, -0.01928546093404293, -0.016904186457395554, -0.014522911980748177, -0.0121416375041008, -0.009760363027453423, -0.0073790885508060455, -0.0049978140741586685, -0.0026165395975112915, -0.0002352651208639145, 0.0021460093557834625, 0.0045272838324308395, 0.0069085583090782166, 0.009289832785725594, 0.01167110726237297, 0.014052381739020348, 0.016433656215667725, 0.0188149306923151, 0.02119620516896248, 0.023577479645609856, 0.025958754122257233, 0.02834002859890461, 0.030721303075551987, 0.03310257941484451, 0.03548385202884674, 0.03786512464284897, 0.040246400982141495, 0.04262767732143402, 0.04500894993543625, 0.04739022254943848, 0.049771498888731, 0.05215277522802353, 0.05453404784202576, 0.056915320456027985, 0.05929659679532051, 0.06167787313461304, 0.06405914574861526, 0.06644041836261749, 0.06882169842720032, 0.07120297104120255, 0.07358424365520477, 0.075965516269207, 0.07834678888320923, 0.08072806894779205, 0.08310934156179428, 0.08549061417579651, 0.08787189424037933, 0.09025316685438156, 0.09263443946838379]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 9.0, 7.0, 4.0, 14.0, 24.0, 44.0, 67.0, 98.0, 221.0, 432.0, 801.0, 1783.0, 5506.0, 77302.0, 4085961.0, 15023.0, 3743.0, 1796.0, 691.0, 337.0, 162.0, 73.0, 45.0, 37.0, 24.0, 12.0, 11.0, 18.0, 2.0, 3.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.02392578125, -0.023360252380371094, -0.022794723510742188, -0.02222919464111328, -0.021663665771484375, -0.02109813690185547, -0.020532608032226562, -0.019967079162597656, -0.01940155029296875, -0.018836021423339844, -0.018270492553710938, -0.01770496368408203, -0.017139434814453125, -0.01657390594482422, -0.016008377075195312, -0.015442848205566406, -0.0148773193359375, -0.014311790466308594, -0.013746261596679688, -0.013180732727050781, -0.012615203857421875, -0.012049674987792969, -0.011484146118164062, -0.010918617248535156, -0.01035308837890625, -0.009787559509277344, -0.009222030639648438, -0.008656501770019531, -0.008090972900390625, -0.007525444030761719, -0.0069599151611328125, -0.006394386291503906, -0.005828857421875, -0.005263328552246094, -0.0046977996826171875, -0.004132270812988281, -0.003566741943359375, -0.0030012130737304688, -0.0024356842041015625, -0.0018701553344726562, -0.00130462646484375, -0.0007390975952148438, -0.0001735687255859375, 0.00039196014404296875, 0.000957489013671875, 0.0015230178833007812, 0.0020885467529296875, 0.0026540756225585938, 0.0032196044921875, 0.0037851333618164062, 0.0043506622314453125, 0.004916191101074219, 0.005481719970703125, 0.006047248840332031, 0.0066127777099609375, 0.007178306579589844, 0.00774383544921875, 0.008309364318847656, 0.008874893188476562, 0.009440422058105469, 0.010005950927734375, 0.010571479797363281, 0.011137008666992188, 0.011702537536621094, 0.01226806640625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 7.0, 19.0, 26.0, 28.0, 50.0, 98.0, 140.0, 146.0, 137.0, 110.0, 93.0, 43.0, 43.0, 30.0, 16.0, 8.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01143646240234375, -0.011163830757141113, -0.010891199111938477, -0.01061856746673584, -0.010345935821533203, -0.010073304176330566, -0.00980067253112793, -0.009528040885925293, -0.009255409240722656, -0.00898277759552002, -0.008710145950317383, -0.008437514305114746, -0.00816488265991211, -0.007892251014709473, -0.007619619369506836, -0.007346987724304199, -0.0070743560791015625, -0.006801724433898926, -0.006529092788696289, -0.006256461143493652, -0.005983829498291016, -0.005711197853088379, -0.005438566207885742, -0.0051659345626831055, -0.004893302917480469, -0.004620671272277832, -0.004348039627075195, -0.004075407981872559, -0.003802776336669922, -0.003530144691467285, -0.0032575130462646484, -0.0029848814010620117, -0.002712249755859375, -0.0024396181106567383, -0.0021669864654541016, -0.0018943548202514648, -0.0016217231750488281, -0.0013490915298461914, -0.0010764598846435547, -0.000803828239440918, -0.0005311965942382812, -0.00025856494903564453, 1.4066696166992188e-05, 0.0002866983413696289, 0.0005593299865722656, 0.0008319616317749023, 0.001104593276977539, 0.0013772249221801758, 0.0016498565673828125, 0.0019224882125854492, 0.002195119857788086, 0.0024677515029907227, 0.0027403831481933594, 0.003013014793395996, 0.003285646438598633, 0.0035582780838012695, 0.0038309097290039062, 0.004103541374206543, 0.00437617301940918, 0.004648804664611816, 0.004921436309814453, 0.00519406795501709, 0.0054666996002197266, 0.005739331245422363, 0.006011962890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 1.0, 4.0, 4.0, 2.0, 11.0, 17.0, 13.0, 24.0, 27.0, 41.0, 81.0, 100.0, 246.0, 700.0, 2797.0, 34131.0, 4145258.0, 8203.0, 1584.0, 466.0, 221.0, 121.0, 62.0, 42.0, 43.0, 22.0, 24.0, 17.0, 6.0, 9.0, 4.0, 1.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053070068359375, -0.05164623260498047, -0.05022239685058594, -0.048798561096191406, -0.047374725341796875, -0.045950889587402344, -0.04452705383300781, -0.04310321807861328, -0.04167938232421875, -0.04025554656982422, -0.03883171081542969, -0.037407875061035156, -0.035984039306640625, -0.034560203552246094, -0.03313636779785156, -0.03171253204345703, -0.0302886962890625, -0.02886486053466797, -0.027441024780273438, -0.026017189025878906, -0.024593353271484375, -0.023169517517089844, -0.021745681762695312, -0.02032184600830078, -0.01889801025390625, -0.01747417449951172, -0.016050338745117188, -0.014626502990722656, -0.013202667236328125, -0.011778831481933594, -0.010354995727539062, -0.008931159973144531, -0.00750732421875, -0.006083488464355469, -0.0046596527099609375, -0.0032358169555664062, -0.001811981201171875, -0.00038814544677734375, 0.0010356903076171875, 0.0024595260620117188, 0.00388336181640625, 0.005307197570800781, 0.0067310333251953125, 0.008154869079589844, 0.009578704833984375, 0.011002540588378906, 0.012426376342773438, 0.013850212097167969, 0.0152740478515625, 0.01669788360595703, 0.018121719360351562, 0.019545555114746094, 0.020969390869140625, 0.022393226623535156, 0.023817062377929688, 0.02524089813232422, 0.02666473388671875, 0.02808856964111328, 0.029512405395507812, 0.030936241149902344, 0.032360076904296875, 0.033783912658691406, 0.03520774841308594, 0.03663158416748047, 0.038055419921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 2.0, 12.0, 31.0, 171.0, 3399.0, 382.0, 40.0, 12.0, 5.0, 4.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01165008544921875, -0.010950684547424316, -0.010251283645629883, -0.00955188274383545, -0.008852481842041016, -0.008153080940246582, -0.0074536800384521484, -0.006754279136657715, -0.006054878234863281, -0.005355477333068848, -0.004656076431274414, -0.0039566755294799805, -0.003257274627685547, -0.0025578737258911133, -0.0018584728240966797, -0.001159071922302246, -0.0004596710205078125, 0.0002397298812866211, 0.0009391307830810547, 0.0016385316848754883, 0.002337932586669922, 0.0030373334884643555, 0.003736734390258789, 0.004436135292053223, 0.005135536193847656, 0.00583493709564209, 0.0065343379974365234, 0.007233738899230957, 0.00793313980102539, 0.008632540702819824, 0.009331941604614258, 0.010031342506408691, 0.010730743408203125, 0.011430144309997559, 0.012129545211791992, 0.012828946113586426, 0.01352834701538086, 0.014227747917175293, 0.014927148818969727, 0.01562654972076416, 0.016325950622558594, 0.017025351524353027, 0.01772475242614746, 0.018424153327941895, 0.019123554229736328, 0.01982295513153076, 0.020522356033325195, 0.02122175693511963, 0.021921157836914062, 0.022620558738708496, 0.02331995964050293, 0.024019360542297363, 0.024718761444091797, 0.02541816234588623, 0.026117563247680664, 0.026816964149475098, 0.02751636505126953, 0.028215765953063965, 0.0289151668548584, 0.029614567756652832, 0.030313968658447266, 0.0310133695602417, 0.03171277046203613, 0.032412171363830566, 0.033111572265625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 5.0, 5.0, 11.0, 14.0, 16.0, 21.0, 42.0, 56.0, 123.0, 322.0, 155.0, 94.0, 53.0, 30.0, 22.0, 6.0, 9.0, 10.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12957608699798584, -0.12130890786647797, -0.1130417212843895, -0.10477453470230103, -0.09650735557079315, -0.08824017643928528, -0.07997298985719681, -0.07170580327510834, -0.06343862414360046, -0.05517144128680229, -0.04690425843000412, -0.03863707557320595, -0.030369892716407776, -0.022102709859609604, -0.013835527002811432, -0.00556834414601326, 0.002698838710784912, 0.010966021567583084, 0.019233204424381256, 0.027500387281179428, 0.0357675701379776, 0.04403475299477577, 0.052301935851573944, 0.060569118708372116, 0.06883630156517029, 0.07710348069667816, 0.08537066727876663, 0.0936378538608551, 0.10190503299236298, 0.11017221212387085, 0.11843939870595932, 0.1267065852880478, 0.13497373461723328, 0.14324091374874115, 0.15150809288024902, 0.1597752869129181, 0.16804246604442596, 0.17630964517593384, 0.1845768392086029, 0.19284401834011078, 0.20111119747161865, 0.20937837660312653, 0.2176455557346344, 0.22591274976730347, 0.23417992889881134, 0.2424471080303192, 0.2507143020629883, 0.25898146629333496, 0.26724866032600403, 0.2755158543586731, 0.2837830185890198, 0.29205021262168884, 0.3003174066543579, 0.3085845708847046, 0.31685176491737366, 0.32511892914772034, 0.3333861231803894, 0.34165331721305847, 0.34992048144340515, 0.3581876754760742, 0.3664548397064209, 0.37472203373908997, 0.38298922777175903, 0.3912563920021057, 0.3995235860347748]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 9.0, 8.0, 16.0, 15.0, 19.0, 32.0, 39.0, 56.0, 59.0, 81.0, 90.0, 95.0, 96.0, 85.0, 73.0, 44.0, 45.0, 36.0, 30.0, 22.0, 12.0, 4.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.22167569398880005, -0.21580113470554352, -0.209926575422287, -0.20405200123786926, -0.19817744195461273, -0.1923028826713562, -0.18642832338809967, -0.18055376410484314, -0.17467918992042542, -0.16880463063716888, -0.16293007135391235, -0.15705549716949463, -0.1511809378862381, -0.14530637860298157, -0.13943181931972504, -0.1335572600364685, -0.12768270075321198, -0.12180814146995544, -0.11593357473611832, -0.11005901545286179, -0.10418444871902466, -0.09830988943576813, -0.0924353301525116, -0.08656077086925507, -0.08068620413541794, -0.07481164485216141, -0.06893707811832428, -0.06306251883506775, -0.05718795582652092, -0.05131339281797409, -0.04543883353471756, -0.03956427052617073, -0.0336897075176239, -0.027815144509077072, -0.021940583363175392, -0.016066022217273712, -0.010191459208726883, -0.004316896200180054, 0.001557663083076477, 0.007432226091623306, 0.013306789100170135, 0.019181352108716965, 0.025055913254618645, 0.030930474400520325, 0.036805037409067154, 0.04267960041761398, 0.048554159700870514, 0.05442872270941734, 0.06030328571796417, 0.0661778450012207, 0.07205241173505783, 0.07792697101831436, 0.08380153775215149, 0.08967609703540802, 0.09555065631866455, 0.10142521560192108, 0.10729978233575821, 0.11317434161901474, 0.11904890835285187, 0.1249234676361084, 0.13079802691936493, 0.13667258620262146, 0.14254716038703918, 0.14842171967029572, 0.15429627895355225]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 4.0, 14.0, 12.0, 15.0, 26.0, 33.0, 31.0, 51.0, 73.0, 123.0, 221.0, 438.0, 1051.0, 2917.0, 11042.0, 55707.0, 656697.0, 274847.0, 34033.0, 7337.0, 2200.0, 757.0, 375.0, 182.0, 117.0, 62.0, 38.0, 39.0, 26.0, 18.0, 15.0, 19.0, 12.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0340576171875, -0.032877445220947266, -0.03169727325439453, -0.030517101287841797, -0.029336929321289062, -0.028156757354736328, -0.026976585388183594, -0.02579641342163086, -0.024616241455078125, -0.02343606948852539, -0.022255897521972656, -0.021075725555419922, -0.019895553588867188, -0.018715381622314453, -0.01753520965576172, -0.016355037689208984, -0.01517486572265625, -0.013994693756103516, -0.012814521789550781, -0.011634349822998047, -0.010454177856445312, -0.009274005889892578, -0.008093833923339844, -0.006913661956787109, -0.005733489990234375, -0.004553318023681641, -0.0033731460571289062, -0.002192974090576172, -0.0010128021240234375, 0.00016736984252929688, 0.0013475418090820312, 0.0025277137756347656, 0.0037078857421875, 0.004888057708740234, 0.006068229675292969, 0.007248401641845703, 0.008428573608398438, 0.009608745574951172, 0.010788917541503906, 0.01196908950805664, 0.013149261474609375, 0.01432943344116211, 0.015509605407714844, 0.016689777374267578, 0.017869949340820312, 0.019050121307373047, 0.02023029327392578, 0.021410465240478516, 0.02259063720703125, 0.023770809173583984, 0.02495098114013672, 0.026131153106689453, 0.027311325073242188, 0.028491497039794922, 0.029671669006347656, 0.03085184097290039, 0.032032012939453125, 0.03321218490600586, 0.034392356872558594, 0.03557252883911133, 0.03675270080566406, 0.0379328727722168, 0.03911304473876953, 0.040293216705322266, 0.041473388671875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 18.0, 23.0, 31.0, 49.0, 83.0, 130.0, 132.0, 124.0, 134.0, 94.0, 56.0, 48.0, 30.0, 20.0, 13.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01151275634765625, -0.011240065097808838, -0.010967373847961426, -0.010694682598114014, -0.010421991348266602, -0.01014930009841919, -0.009876608848571777, -0.009603917598724365, -0.009331226348876953, -0.009058535099029541, -0.008785843849182129, -0.008513152599334717, -0.008240461349487305, -0.007967770099639893, -0.0076950788497924805, -0.007422387599945068, -0.007149696350097656, -0.006877005100250244, -0.006604313850402832, -0.00633162260055542, -0.006058931350708008, -0.005786240100860596, -0.005513548851013184, -0.0052408576011657715, -0.004968166351318359, -0.004695475101470947, -0.004422783851623535, -0.004150092601776123, -0.003877401351928711, -0.003604710102081299, -0.0033320188522338867, -0.0030593276023864746, -0.0027866363525390625, -0.0025139451026916504, -0.0022412538528442383, -0.001968562602996826, -0.001695871353149414, -0.001423180103302002, -0.0011504888534545898, -0.0008777976036071777, -0.0006051063537597656, -0.0003324151039123535, -5.9723854064941406e-05, 0.0002129673957824707, 0.0004856586456298828, 0.0007583498954772949, 0.001031041145324707, 0.0013037323951721191, 0.0015764236450195312, 0.0018491148948669434, 0.0021218061447143555, 0.0023944973945617676, 0.0026671886444091797, 0.002939879894256592, 0.003212571144104004, 0.003485262393951416, 0.003757953643798828, 0.00403064489364624, 0.004303336143493652, 0.0045760273933410645, 0.0048487186431884766, 0.005121409893035889, 0.005394101142883301, 0.005666792392730713, 0.005939483642578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 10.0, 10.0, 22.0, 19.0, 32.0, 45.0, 70.0, 124.0, 223.0, 422.0, 936.0, 2074.0, 4786.0, 12032.0, 33266.0, 111657.0, 651499.0, 162030.0, 43532.0, 15086.0, 5880.0, 2510.0, 1060.0, 545.0, 253.0, 139.0, 89.0, 61.0, 33.0, 21.0, 16.0, 15.0, 11.0, 4.0, 7.0, 6.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0236663818359375, -0.022917985916137695, -0.02216958999633789, -0.021421194076538086, -0.02067279815673828, -0.019924402236938477, -0.019176006317138672, -0.018427610397338867, -0.017679214477539062, -0.016930818557739258, -0.016182422637939453, -0.015434026718139648, -0.014685630798339844, -0.013937234878540039, -0.013188838958740234, -0.01244044303894043, -0.011692047119140625, -0.01094365119934082, -0.010195255279541016, -0.009446859359741211, -0.008698463439941406, -0.007950067520141602, -0.007201671600341797, -0.006453275680541992, -0.0057048797607421875, -0.004956483840942383, -0.004208087921142578, -0.0034596920013427734, -0.0027112960815429688, -0.001962900161743164, -0.0012145042419433594, -0.0004661083221435547, 0.00028228759765625, 0.0010306835174560547, 0.0017790794372558594, 0.002527475357055664, 0.0032758712768554688, 0.0040242671966552734, 0.004772663116455078, 0.005521059036254883, 0.0062694549560546875, 0.007017850875854492, 0.007766246795654297, 0.008514642715454102, 0.009263038635253906, 0.010011434555053711, 0.010759830474853516, 0.01150822639465332, 0.012256622314453125, 0.01300501823425293, 0.013753414154052734, 0.014501810073852539, 0.015250205993652344, 0.01599860191345215, 0.016746997833251953, 0.017495393753051758, 0.018243789672851562, 0.018992185592651367, 0.019740581512451172, 0.020488977432250977, 0.02123737335205078, 0.021985769271850586, 0.02273416519165039, 0.023482561111450195, 0.02423095703125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 7.0, 6.0, 3.0, 6.0, 15.0, 12.0, 12.0, 17.0, 23.0, 33.0, 38.0, 34.0, 41.0, 40.0, 34.0, 44.0, 45.0, 40.0, 54.0, 43.0, 50.0, 40.0, 43.0, 43.0, 26.0, 39.0, 40.0, 27.0, 23.0, 24.0, 16.0, 13.0, 14.0, 17.0, 7.0, 8.0, 7.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01381683349609375, -0.01339268684387207, -0.01296854019165039, -0.012544393539428711, -0.012120246887207031, -0.011696100234985352, -0.011271953582763672, -0.010847806930541992, -0.010423660278320312, -0.009999513626098633, -0.009575366973876953, -0.009151220321655273, -0.008727073669433594, -0.008302927017211914, -0.007878780364990234, -0.007454633712768555, -0.007030487060546875, -0.006606340408325195, -0.006182193756103516, -0.005758047103881836, -0.005333900451660156, -0.0049097537994384766, -0.004485607147216797, -0.004061460494995117, -0.0036373138427734375, -0.003213167190551758, -0.002789020538330078, -0.0023648738861083984, -0.0019407272338867188, -0.001516580581665039, -0.0010924339294433594, -0.0006682872772216797, -0.000244140625, 0.0001800060272216797, 0.0006041526794433594, 0.001028299331665039, 0.0014524459838867188, 0.0018765926361083984, 0.002300739288330078, 0.002724885940551758, 0.0031490325927734375, 0.003573179244995117, 0.003997325897216797, 0.0044214725494384766, 0.004845619201660156, 0.005269765853881836, 0.005693912506103516, 0.006118059158325195, 0.006542205810546875, 0.006966352462768555, 0.007390499114990234, 0.007814645767211914, 0.008238792419433594, 0.008662939071655273, 0.009087085723876953, 0.009511232376098633, 0.009935379028320312, 0.010359525680541992, 0.010783672332763672, 0.011207818984985352, 0.011631965637207031, 0.012056112289428711, 0.01248025894165039, 0.01290440559387207, 0.01332855224609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 7.0, 8.0, 14.0, 14.0, 28.0, 37.0, 54.0, 80.0, 159.0, 265.0, 414.0, 821.0, 1444.0, 3230.0, 8408.0, 28140.0, 409247.0, 552396.0, 28673.0, 8454.0, 3302.0, 1545.0, 761.0, 397.0, 256.0, 115.0, 101.0, 64.0, 45.0, 25.0, 9.0, 12.0, 13.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002887248992919922, -0.00027877092361450195, -0.0002688169479370117, -0.0002588629722595215, -0.00024890899658203125, -0.00023895502090454102, -0.00022900104522705078, -0.00021904706954956055, -0.0002090930938720703, -0.00019913911819458008, -0.00018918514251708984, -0.0001792311668395996, -0.00016927719116210938, -0.00015932321548461914, -0.0001493692398071289, -0.00013941526412963867, -0.00012946128845214844, -0.0001195073127746582, -0.00010955333709716797, -9.959936141967773e-05, -8.96453857421875e-05, -7.969141006469727e-05, -6.973743438720703e-05, -5.97834587097168e-05, -4.982948303222656e-05, -3.987550735473633e-05, -2.9921531677246094e-05, -1.996755599975586e-05, -1.0013580322265625e-05, -5.960464477539063e-08, 9.894371032714844e-06, 1.9848346710205078e-05, 2.9802322387695312e-05, 3.975629806518555e-05, 4.971027374267578e-05, 5.9664249420166016e-05, 6.961822509765625e-05, 7.957220077514648e-05, 8.952617645263672e-05, 9.948015213012695e-05, 0.00010943412780761719, 0.00011938810348510742, 0.00012934207916259766, 0.0001392960548400879, 0.00014925003051757812, 0.00015920400619506836, 0.0001691579818725586, 0.00017911195755004883, 0.00018906593322753906, 0.0001990199089050293, 0.00020897388458251953, 0.00021892786026000977, 0.0002288818359375, 0.00023883581161499023, 0.00024878978729248047, 0.0002587437629699707, 0.00026869773864746094, 0.00027865171432495117, 0.0002886056900024414, 0.00029855966567993164, 0.0003085136413574219, 0.0003184676170349121, 0.00032842159271240234, 0.0003383755683898926, 0.0003483295440673828]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 9.0, 13.0, 8.0, 13.0, 11.0, 21.0, 31.0, 38.0, 70.0, 103.0, 91.0, 143.0, 121.0, 84.0, 90.0, 42.0, 34.0, 24.0, 11.0, 22.0, 7.0, 9.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8312206268310547e-05, -2.7497299015522003e-05, -2.668239176273346e-05, -2.5867484509944916e-05, -2.5052577257156372e-05, -2.423767000436783e-05, -2.3422762751579285e-05, -2.260785549879074e-05, -2.1792948246002197e-05, -2.0978040993213654e-05, -2.016313374042511e-05, -1.9348226487636566e-05, -1.8533319234848022e-05, -1.771841198205948e-05, -1.6903504729270935e-05, -1.608859747648239e-05, -1.5273690223693848e-05, -1.4458782970905304e-05, -1.364387571811676e-05, -1.2828968465328217e-05, -1.2014061212539673e-05, -1.1199153959751129e-05, -1.0384246706962585e-05, -9.569339454174042e-06, -8.754432201385498e-06, -7.939524948596954e-06, -7.124617695808411e-06, -6.309710443019867e-06, -5.494803190231323e-06, -4.6798959374427795e-06, -3.864988684654236e-06, -3.050081431865692e-06, -2.2351741790771484e-06, -1.4202669262886047e-06, -6.05359673500061e-07, 2.0954757928848267e-07, 1.0244548320770264e-06, 1.83936208486557e-06, 2.6542693376541138e-06, 3.4691765904426575e-06, 4.284083843231201e-06, 5.098991096019745e-06, 5.9138983488082886e-06, 6.728805601596832e-06, 7.543712854385376e-06, 8.35862010717392e-06, 9.173527359962463e-06, 9.988434612751007e-06, 1.080334186553955e-05, 1.1618249118328094e-05, 1.2433156371116638e-05, 1.3248063623905182e-05, 1.4062970876693726e-05, 1.487787812948227e-05, 1.5692785382270813e-05, 1.6507692635059357e-05, 1.73225998878479e-05, 1.8137507140636444e-05, 1.8952414393424988e-05, 1.976732164621353e-05, 2.0582228899002075e-05, 2.139713615179062e-05, 2.2212043404579163e-05, 2.3026950657367706e-05, 2.384185791015625e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 8.0, 6.0, 10.0, 20.0, 24.0, 42.0, 85.0, 145.0, 269.0, 512.0, 965.0, 2078.0, 4705.0, 12752.0, 51965.0, 855955.0, 90841.0, 17108.0, 5993.0, 2514.0, 1204.0, 596.0, 318.0, 176.0, 83.0, 64.0, 34.0, 25.0, 17.0, 6.0, 5.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000507354736328125, -0.000491313636302948, -0.000475272536277771, -0.000459231436252594, -0.000443190336227417, -0.00042714923620224, -0.000411108136177063, -0.000395067036151886, -0.000379025936126709, -0.000362984836101532, -0.000346943736076355, -0.000330902636051178, -0.000314861536026001, -0.000298820436000824, -0.00028277933597564697, -0.00026673823595046997, -0.00025069713592529297, -0.00023465603590011597, -0.00021861493587493896, -0.00020257383584976196, -0.00018653273582458496, -0.00017049163579940796, -0.00015445053577423096, -0.00013840943574905396, -0.00012236833572387695, -0.00010632723569869995, -9.028613567352295e-05, -7.424503564834595e-05, -5.8203935623168945e-05, -4.216283559799194e-05, -2.612173557281494e-05, -1.008063554763794e-05, 5.9604644775390625e-06, 2.2001564502716064e-05, 3.8042664527893066e-05, 5.408376455307007e-05, 7.012486457824707e-05, 8.616596460342407e-05, 0.00010220706462860107, 0.00011824816465377808, 0.00013428926467895508, 0.00015033036470413208, 0.00016637146472930908, 0.00018241256475448608, 0.00019845366477966309, 0.0002144947648048401, 0.0002305358648300171, 0.0002465769648551941, 0.0002626180648803711, 0.0002786591649055481, 0.0002947002649307251, 0.0003107413649559021, 0.0003267824649810791, 0.0003428235650062561, 0.0003588646650314331, 0.0003749057650566101, 0.0003909468650817871, 0.0004069879651069641, 0.0004230290651321411, 0.0004390701651573181, 0.0004551112651824951, 0.0004711523652076721, 0.0004871934652328491, 0.0005032345652580261, 0.0005192756652832031]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 6.0, 5.0, 12.0, 8.0, 9.0, 16.0, 18.0, 33.0, 33.0, 64.0, 85.0, 144.0, 161.0, 145.0, 65.0, 32.0, 28.0, 20.0, 23.0, 11.0, 13.0, 13.0, 4.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0002949237823486328, -0.0002858005464076996, -0.00027667731046676636, -0.00026755407452583313, -0.0002584308385848999, -0.0002493076026439667, -0.00024018436670303345, -0.00023106113076210022, -0.000221937894821167, -0.00021281465888023376, -0.00020369142293930054, -0.0001945681869983673, -0.00018544495105743408, -0.00017632171511650085, -0.00016719847917556763, -0.0001580752432346344, -0.00014895200729370117, -0.00013982877135276794, -0.00013070553541183472, -0.00012158229947090149, -0.00011245906352996826, -0.00010333582758903503, -9.42125916481018e-05, -8.508935570716858e-05, -7.596611976623535e-05, -6.684288382530212e-05, -5.7719647884368896e-05, -4.859641194343567e-05, -3.947317600250244e-05, -3.0349940061569214e-05, -2.1226704120635986e-05, -1.2103468179702759e-05, -2.9802322387695312e-06, 6.143003702163696e-06, 1.5266239643096924e-05, 2.438947558403015e-05, 3.351271152496338e-05, 4.2635947465896606e-05, 5.1759183406829834e-05, 6.088241934776306e-05, 7.000565528869629e-05, 7.912889122962952e-05, 8.825212717056274e-05, 9.737536311149597e-05, 0.0001064985990524292, 0.00011562183499336243, 0.00012474507093429565, 0.00013386830687522888, 0.0001429915428161621, 0.00015211477875709534, 0.00016123801469802856, 0.0001703612506389618, 0.00017948448657989502, 0.00018860772252082825, 0.00019773095846176147, 0.0002068541944026947, 0.00021597743034362793, 0.00022510066628456116, 0.00023422390222549438, 0.0002433471381664276, 0.00025247037410736084, 0.00026159361004829407, 0.0002707168459892273, 0.0002798400819301605, 0.00028896331787109375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 8.0, 7.0, 4.0, 8.0, 10.0, 20.0, 18.0, 36.0, 65.0, 75.0, 113.0, 267.0, 107.0, 60.0, 55.0, 32.0, 34.0, 18.0, 7.0, 12.0, 8.0, 6.0, 4.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12252210080623627, -0.11933580785989761, -0.11614950746297836, -0.11296321451663971, -0.10977691411972046, -0.1065906211733818, -0.10340432822704315, -0.1002180278301239, -0.09703173488378525, -0.0938454419374466, -0.09065914154052734, -0.08747284859418869, -0.08428655564785004, -0.08110025525093079, -0.07791396230459213, -0.07472766935825348, -0.07154136896133423, -0.06835507601499557, -0.06516877561807632, -0.06198248267173767, -0.05879618600010872, -0.05560988932847977, -0.05242359638214111, -0.04923729971051216, -0.04605100303888321, -0.04286470636725426, -0.039678409695625305, -0.03649211674928665, -0.0333058200776577, -0.030119523406028748, -0.026933228597044945, -0.023746933788061142, -0.020560629665851593, -0.01737433299422264, -0.014188038185238838, -0.01100174244493246, -0.007815446704626083, -0.004629150032997131, -0.0014428552240133286, 0.0017434395849704742, 0.004929736256599426, 0.008116031996905804, 0.011302327737212181, 0.014488623477518559, 0.017674919217824936, 0.020861215889453888, 0.02404751069843769, 0.027233805507421494, 0.030420102179050446, 0.0336063988506794, 0.03679269552230835, 0.039978988468647, 0.043165285140275955, 0.04635158181190491, 0.04953787475824356, 0.05272417142987251, 0.055910468101501465, 0.05909676477313042, 0.06228306144475937, 0.06546935439109802, 0.06865565478801727, 0.07184194773435593, 0.07502824068069458, 0.07821454107761383, 0.08140083402395248]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 7.0, 8.0, 1.0, 8.0, 8.0, 12.0, 19.0, 23.0, 30.0, 22.0, 37.0, 35.0, 47.0, 55.0, 49.0, 80.0, 76.0, 63.0, 62.0, 57.0, 51.0, 38.0, 42.0, 26.0, 36.0, 22.0, 20.0, 16.0, 17.0, 11.0, 7.0, 7.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05956077575683594, -0.05723828822374344, -0.05491579696536064, -0.052593305706977844, -0.050270818173885345, -0.04794833064079285, -0.04562583938241005, -0.04330334812402725, -0.04098086059093475, -0.038658373057842255, -0.03633588179945946, -0.03401339054107666, -0.03169090300798416, -0.029368413612246513, -0.027045924216508865, -0.024723434820771217, -0.02240094542503357, -0.02007845602929592, -0.017755966633558273, -0.015433477237820625, -0.013110987842082977, -0.01078849844634533, -0.008466009050607681, -0.006143519654870033, -0.0038210302591323853, -0.0014985408633947372, 0.0008239485323429108, 0.0031464379280805588, 0.005468927323818207, 0.007791416719555855, 0.010113906115293503, 0.01243639551103115, 0.014758884906768799, 0.017081374302506447, 0.019403863698244095, 0.021726353093981743, 0.02404884248971939, 0.02637133188545704, 0.028693821281194687, 0.031016310676932335, 0.03333880007266998, 0.03566128760576248, 0.03798377886414528, 0.040306270122528076, 0.042628757655620575, 0.044951245188713074, 0.04727373644709587, 0.04959622770547867, 0.05191871523857117, 0.054241202771663666, 0.05656369403004646, 0.05888618528842926, 0.06120867282152176, 0.06353116035461426, 0.06585365533828735, 0.06817614287137985, 0.07049863040447235, 0.07282111793756485, 0.07514360547065735, 0.07746610045433044, 0.07978858798742294, 0.08211107552051544, 0.08443357050418854, 0.08675605803728104, 0.08907854557037354]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 7.0, 7.0, 4.0, 5.0, 8.0, 7.0, 11.0, 11.0, 14.0, 25.0, 39.0, 91.0, 120.0, 267.0, 555.0, 1258.0, 3234.0, 12865.0, 369970.0, 3773310.0, 22324.0, 6082.0, 2515.0, 751.0, 346.0, 167.0, 103.0, 55.0, 38.0, 25.0, 23.0, 10.0, 4.0, 11.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.0252685546875, -0.024669647216796875, -0.02407073974609375, -0.023471832275390625, -0.0228729248046875, -0.022274017333984375, -0.02167510986328125, -0.021076202392578125, -0.020477294921875, -0.019878387451171875, -0.01927947998046875, -0.018680572509765625, -0.0180816650390625, -0.017482757568359375, -0.01688385009765625, -0.016284942626953125, -0.01568603515625, -0.015087127685546875, -0.01448822021484375, -0.013889312744140625, -0.0132904052734375, -0.012691497802734375, -0.01209259033203125, -0.011493682861328125, -0.010894775390625, -0.010295867919921875, -0.00969696044921875, -0.009098052978515625, -0.0084991455078125, -0.007900238037109375, -0.00730133056640625, -0.006702423095703125, -0.006103515625, -0.005504608154296875, -0.00490570068359375, -0.004306793212890625, -0.0037078857421875, -0.003108978271484375, -0.00251007080078125, -0.001911163330078125, -0.001312255859375, -0.000713348388671875, -0.00011444091796875, 0.000484466552734375, 0.0010833740234375, 0.001682281494140625, 0.00228118896484375, 0.002880096435546875, 0.00347900390625, 0.004077911376953125, 0.00467681884765625, 0.005275726318359375, 0.0058746337890625, 0.006473541259765625, 0.00707244873046875, 0.007671356201171875, 0.008270263671875, 0.008869171142578125, 0.00946807861328125, 0.010066986083984375, 0.0106658935546875, 0.011264801025390625, 0.01186370849609375, 0.012462615966796875, 0.0130615234375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 7.0, 4.0, 12.0, 23.0, 27.0, 40.0, 66.0, 105.0, 142.0, 132.0, 126.0, 122.0, 62.0, 51.0, 42.0, 18.0, 17.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01104736328125, -0.010781943798065186, -0.010516524314880371, -0.010251104831695557, -0.009985685348510742, -0.009720265865325928, -0.009454846382141113, -0.009189426898956299, -0.008924007415771484, -0.00865858793258667, -0.008393168449401855, -0.008127748966217041, -0.007862329483032227, -0.007596909999847412, -0.007331490516662598, -0.007066071033477783, -0.006800651550292969, -0.006535232067108154, -0.00626981258392334, -0.006004393100738525, -0.005738973617553711, -0.0054735541343688965, -0.005208134651184082, -0.004942715167999268, -0.004677295684814453, -0.004411876201629639, -0.004146456718444824, -0.0038810372352600098, -0.0036156177520751953, -0.003350198268890381, -0.0030847787857055664, -0.002819359302520752, -0.0025539398193359375, -0.002288520336151123, -0.0020231008529663086, -0.0017576813697814941, -0.0014922618865966797, -0.0012268424034118652, -0.0009614229202270508, -0.0006960034370422363, -0.0004305839538574219, -0.00016516447067260742, 0.00010025501251220703, 0.0003656744956970215, 0.0006310939788818359, 0.0008965134620666504, 0.0011619329452514648, 0.0014273524284362793, 0.0016927719116210938, 0.001958191394805908, 0.0022236108779907227, 0.002489030361175537, 0.0027544498443603516, 0.003019869327545166, 0.0032852888107299805, 0.003550708293914795, 0.0038161277770996094, 0.004081547260284424, 0.004346966743469238, 0.004612386226654053, 0.004877805709838867, 0.005143225193023682, 0.005408644676208496, 0.0056740641593933105, 0.005939483642578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 7.0, 7.0, 20.0, 22.0, 27.0, 48.0, 64.0, 82.0, 162.0, 291.0, 738.0, 2027.0, 8410.0, 59336.0, 4032553.0, 76474.0, 10107.0, 2475.0, 817.0, 307.0, 128.0, 64.0, 46.0, 14.0, 18.0, 14.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021820068359375, -0.021027803421020508, -0.020235538482666016, -0.019443273544311523, -0.01865100860595703, -0.01785874366760254, -0.017066478729248047, -0.016274213790893555, -0.015481948852539062, -0.01468968391418457, -0.013897418975830078, -0.013105154037475586, -0.012312889099121094, -0.011520624160766602, -0.01072835922241211, -0.009936094284057617, -0.009143829345703125, -0.008351564407348633, -0.007559299468994141, -0.0067670345306396484, -0.005974769592285156, -0.005182504653930664, -0.004390239715576172, -0.0035979747772216797, -0.0028057098388671875, -0.0020134449005126953, -0.0012211799621582031, -0.00042891502380371094, 0.00036334991455078125, 0.0011556148529052734, 0.0019478797912597656, 0.002740144729614258, 0.00353240966796875, 0.004324674606323242, 0.005116939544677734, 0.0059092044830322266, 0.006701469421386719, 0.007493734359741211, 0.008285999298095703, 0.009078264236450195, 0.009870529174804688, 0.01066279411315918, 0.011455059051513672, 0.012247323989868164, 0.013039588928222656, 0.013831853866577148, 0.01462411880493164, 0.015416383743286133, 0.016208648681640625, 0.017000913619995117, 0.01779317855834961, 0.0185854434967041, 0.019377708435058594, 0.020169973373413086, 0.020962238311767578, 0.02175450325012207, 0.022546768188476562, 0.023339033126831055, 0.024131298065185547, 0.02492356300354004, 0.02571582794189453, 0.026508092880249023, 0.027300357818603516, 0.028092622756958008, 0.0288848876953125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 13.0, 23.0, 33.0, 29.0, 60.0, 189.0, 1054.0, 2073.0, 350.0, 80.0, 51.0, 33.0, 22.0, 14.0, 12.0, 10.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.02191162109375, -0.021437406539916992, -0.020963191986083984, -0.020488977432250977, -0.02001476287841797, -0.01954054832458496, -0.019066333770751953, -0.018592119216918945, -0.018117904663085938, -0.01764369010925293, -0.017169475555419922, -0.016695261001586914, -0.016221046447753906, -0.0157468318939209, -0.01527261734008789, -0.014798402786254883, -0.014324188232421875, -0.013849973678588867, -0.01337575912475586, -0.012901544570922852, -0.012427330017089844, -0.011953115463256836, -0.011478900909423828, -0.01100468635559082, -0.010530471801757812, -0.010056257247924805, -0.009582042694091797, -0.009107828140258789, -0.008633613586425781, -0.008159399032592773, -0.007685184478759766, -0.007210969924926758, -0.00673675537109375, -0.006262540817260742, -0.005788326263427734, -0.0053141117095947266, -0.004839897155761719, -0.004365682601928711, -0.003891468048095703, -0.0034172534942626953, -0.0029430389404296875, -0.0024688243865966797, -0.001994609832763672, -0.001520395278930664, -0.0010461807250976562, -0.0005719661712646484, -9.775161743164062e-05, 0.0003764629364013672, 0.000850677490234375, 0.0013248920440673828, 0.0017991065979003906, 0.0022733211517333984, 0.0027475357055664062, 0.003221750259399414, 0.003695964813232422, 0.00417017936706543, 0.0046443939208984375, 0.005118608474731445, 0.005592823028564453, 0.006067037582397461, 0.006541252136230469, 0.0070154666900634766, 0.007489681243896484, 0.007963895797729492, 0.0084381103515625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 10.0, 13.0, 21.0, 37.0, 60.0, 82.0, 212.0, 257.0, 110.0, 63.0, 36.0, 27.0, 21.0, 15.0, 14.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06460139900445938, -0.06191864609718323, -0.059235893189907074, -0.05655314028263092, -0.05387038737535477, -0.05118763446807861, -0.04850488156080246, -0.045822128653526306, -0.04313937574625015, -0.040456622838974, -0.037773869931697845, -0.03509111702442169, -0.03240836411714554, -0.029725611209869385, -0.027042856439948082, -0.02436010353267193, -0.021677348762750626, -0.018994595855474472, -0.01631184294819832, -0.01362908910959959, -0.010946336202323437, -0.008263583295047283, -0.005580829456448555, -0.0028980765491724014, -0.00021532364189624786, 0.0024674294982105494, 0.005150182638317347, 0.007832936011254787, 0.010515688918530941, 0.013198441825807095, 0.015881195664405823, 0.018563948571681976, 0.02124670147895813, 0.023929454386234283, 0.026612207293510437, 0.02929496020078659, 0.031977713108062744, 0.0346604660153389, 0.03734321892261505, 0.040025971829891205, 0.04270872473716736, 0.04539147764444351, 0.048074230551719666, 0.05075698345899582, 0.05343973636627197, 0.056122489273548126, 0.05880524218082428, 0.06148799508810043, 0.06417074799537659, 0.06685350090265274, 0.0695362538099289, 0.07221900671720505, 0.0749017596244812, 0.07758451253175735, 0.08026726543903351, 0.08295001834630966, 0.08563277870416641, 0.08831553161144257, 0.09099828451871872, 0.09368103742599487, 0.09636379033327103, 0.09904654324054718, 0.10172929614782333, 0.10441204905509949, 0.10709480196237564]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 7.0, 4.0, 14.0, 10.0, 13.0, 17.0, 21.0, 39.0, 38.0, 39.0, 45.0, 55.0, 52.0, 40.0, 50.0, 37.0, 62.0, 58.0, 55.0, 56.0, 43.0, 38.0, 32.0, 28.0, 30.0, 23.0, 29.0, 16.0, 9.0, 10.0, 10.0, 6.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038012802600860596, -0.03679495304822922, -0.03557710349559784, -0.03435925394296646, -0.03314140439033508, -0.031923554837703705, -0.030705705285072327, -0.02948785573244095, -0.02827000617980957, -0.027052156627178192, -0.025834307074546814, -0.024616457521915436, -0.023398607969284058, -0.02218075841665268, -0.0209629088640213, -0.019745059311389923, -0.018527209758758545, -0.017309360206127167, -0.01609151065349579, -0.01487366110086441, -0.013655811548233032, -0.012437961995601654, -0.011220112442970276, -0.010002262890338898, -0.00878441333770752, -0.007566563785076141, -0.006348714232444763, -0.005130864679813385, -0.003913015127182007, -0.0026951655745506287, -0.0014773160219192505, -0.0002594664692878723, 0.0009583830833435059, 0.002176232635974884, 0.003394082188606262, 0.00461193174123764, 0.0058297812938690186, 0.007047630846500397, 0.008265480399131775, 0.009483329951763153, 0.010701179504394531, 0.01191902905702591, 0.013136878609657288, 0.014354728162288666, 0.015572577714920044, 0.016790427267551422, 0.0180082768201828, 0.01922612637281418, 0.020443975925445557, 0.021661825478076935, 0.022879675030708313, 0.02409752458333969, 0.02531537413597107, 0.026533223688602448, 0.027751073241233826, 0.028968922793865204, 0.030186772346496582, 0.03140462189912796, 0.03262247145175934, 0.03384032100439072, 0.035058170557022095, 0.03627602010965347, 0.03749386966228485, 0.03871171921491623, 0.03992956876754761]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 8.0, 10.0, 20.0, 14.0, 26.0, 36.0, 45.0, 64.0, 88.0, 151.0, 218.0, 439.0, 964.0, 2752.0, 9304.0, 40208.0, 325420.0, 595322.0, 55645.0, 11942.0, 3389.0, 1221.0, 525.0, 273.0, 146.0, 86.0, 64.0, 39.0, 25.0, 22.0, 13.0, 14.0, 13.0, 5.0, 9.0, 6.0, 5.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.034515380859375, -0.033503055572509766, -0.03249073028564453, -0.0314784049987793, -0.030466079711914062, -0.029453754425048828, -0.028441429138183594, -0.02742910385131836, -0.026416778564453125, -0.02540445327758789, -0.024392127990722656, -0.023379802703857422, -0.022367477416992188, -0.021355152130126953, -0.02034282684326172, -0.019330501556396484, -0.01831817626953125, -0.017305850982666016, -0.01629352569580078, -0.015281200408935547, -0.014268875122070312, -0.013256549835205078, -0.012244224548339844, -0.01123189926147461, -0.010219573974609375, -0.00920724868774414, -0.008194923400878906, -0.007182598114013672, -0.0061702728271484375, -0.005157947540283203, -0.004145622253417969, -0.0031332969665527344, -0.0021209716796875, -0.0011086463928222656, -9.632110595703125e-05, 0.0009160041809082031, 0.0019283294677734375, 0.002940654754638672, 0.003952980041503906, 0.004965305328369141, 0.005977630615234375, 0.006989955902099609, 0.008002281188964844, 0.009014606475830078, 0.010026931762695312, 0.011039257049560547, 0.012051582336425781, 0.013063907623291016, 0.01407623291015625, 0.015088558197021484, 0.01610088348388672, 0.017113208770751953, 0.018125534057617188, 0.019137859344482422, 0.020150184631347656, 0.02116250991821289, 0.022174835205078125, 0.02318716049194336, 0.024199485778808594, 0.025211811065673828, 0.026224136352539062, 0.027236461639404297, 0.02824878692626953, 0.029261112213134766, 0.0302734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 5.0, 12.0, 24.0, 26.0, 41.0, 61.0, 103.0, 142.0, 125.0, 134.0, 119.0, 67.0, 53.0, 41.0, 20.0, 18.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0110321044921875, -0.01076728105545044, -0.010502457618713379, -0.010237634181976318, -0.009972810745239258, -0.009707987308502197, -0.009443163871765137, -0.009178340435028076, -0.008913516998291016, -0.008648693561553955, -0.008383870124816895, -0.008119046688079834, -0.007854223251342773, -0.007589399814605713, -0.007324576377868652, -0.007059752941131592, -0.006794929504394531, -0.006530106067657471, -0.00626528263092041, -0.00600045919418335, -0.005735635757446289, -0.0054708123207092285, -0.005205988883972168, -0.004941165447235107, -0.004676342010498047, -0.004411518573760986, -0.004146695137023926, -0.0038818717002868652, -0.0036170482635498047, -0.003352224826812744, -0.0030874013900756836, -0.002822577953338623, -0.0025577545166015625, -0.002292931079864502, -0.0020281076431274414, -0.0017632842063903809, -0.0014984607696533203, -0.0012336373329162598, -0.0009688138961791992, -0.0007039904594421387, -0.0004391670227050781, -0.00017434358596801758, 9.047985076904297e-05, 0.0003553032875061035, 0.0006201267242431641, 0.0008849501609802246, 0.0011497735977172852, 0.0014145970344543457, 0.0016794204711914062, 0.0019442439079284668, 0.0022090673446655273, 0.002473890781402588, 0.0027387142181396484, 0.003003537654876709, 0.0032683610916137695, 0.00353318452835083, 0.0037980079650878906, 0.004062831401824951, 0.004327654838562012, 0.004592478275299072, 0.004857301712036133, 0.005122125148773193, 0.005386948585510254, 0.0056517720222473145, 0.005916595458984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 9.0, 5.0, 3.0, 17.0, 14.0, 16.0, 39.0, 43.0, 67.0, 104.0, 168.0, 302.0, 507.0, 878.0, 1674.0, 3499.0, 6902.0, 14523.0, 32606.0, 84512.0, 549925.0, 237325.0, 65020.0, 26285.0, 12208.0, 5769.0, 2787.0, 1433.0, 806.0, 442.0, 253.0, 143.0, 102.0, 57.0, 48.0, 18.0, 18.0, 6.0, 6.0, 10.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0167236328125, -0.01618194580078125, -0.0156402587890625, -0.01509857177734375, -0.014556884765625, -0.01401519775390625, -0.0134735107421875, -0.01293182373046875, -0.01239013671875, -0.01184844970703125, -0.0113067626953125, -0.01076507568359375, -0.010223388671875, -0.00968170166015625, -0.0091400146484375, -0.00859832763671875, -0.008056640625, -0.00751495361328125, -0.0069732666015625, -0.00643157958984375, -0.005889892578125, -0.00534820556640625, -0.0048065185546875, -0.00426483154296875, -0.00372314453125, -0.00318145751953125, -0.0026397705078125, -0.00209808349609375, -0.001556396484375, -0.00101470947265625, -0.0004730224609375, 6.866455078125e-05, 0.0006103515625, 0.00115203857421875, 0.0016937255859375, 0.00223541259765625, 0.002777099609375, 0.00331878662109375, 0.0038604736328125, 0.00440216064453125, 0.00494384765625, 0.00548553466796875, 0.0060272216796875, 0.00656890869140625, 0.007110595703125, 0.00765228271484375, 0.0081939697265625, 0.00873565673828125, 0.00927734375, 0.00981903076171875, 0.0103607177734375, 0.01090240478515625, 0.011444091796875, 0.01198577880859375, 0.0125274658203125, 0.01306915283203125, 0.01361083984375, 0.01415252685546875, 0.0146942138671875, 0.01523590087890625, 0.015777587890625, 0.01631927490234375, 0.0168609619140625, 0.01740264892578125, 0.0179443359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 4.0, 9.0, 8.0, 21.0, 17.0, 19.0, 25.0, 19.0, 24.0, 27.0, 34.0, 32.0, 36.0, 40.0, 45.0, 49.0, 49.0, 49.0, 41.0, 52.0, 39.0, 40.0, 36.0, 44.0, 31.0, 29.0, 21.0, 26.0, 25.0, 23.0, 16.0, 11.0, 9.0, 9.0, 9.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 4.0, 1.0], "bins": [-0.0157623291015625, -0.015355944633483887, -0.014949560165405273, -0.01454317569732666, -0.014136791229248047, -0.013730406761169434, -0.01332402229309082, -0.012917637825012207, -0.012511253356933594, -0.01210486888885498, -0.011698484420776367, -0.011292099952697754, -0.01088571548461914, -0.010479331016540527, -0.010072946548461914, -0.0096665620803833, -0.009260177612304688, -0.008853793144226074, -0.008447408676147461, -0.008041024208068848, -0.007634639739990234, -0.007228255271911621, -0.006821870803833008, -0.0064154863357543945, -0.006009101867675781, -0.005602717399597168, -0.005196332931518555, -0.004789948463439941, -0.004383563995361328, -0.003977179527282715, -0.0035707950592041016, -0.0031644105911254883, -0.002758026123046875, -0.0023516416549682617, -0.0019452571868896484, -0.0015388727188110352, -0.0011324882507324219, -0.0007261037826538086, -0.0003197193145751953, 8.666515350341797e-05, 0.0004930496215820312, 0.0008994340896606445, 0.0013058185577392578, 0.001712203025817871, 0.0021185874938964844, 0.0025249719619750977, 0.002931356430053711, 0.0033377408981323242, 0.0037441253662109375, 0.004150509834289551, 0.004556894302368164, 0.004963278770446777, 0.005369663238525391, 0.005776047706604004, 0.006182432174682617, 0.0065888166427612305, 0.006995201110839844, 0.007401585578918457, 0.00780797004699707, 0.008214354515075684, 0.008620738983154297, 0.00902712345123291, 0.009433507919311523, 0.009839892387390137, 0.01024627685546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 10.0, 9.0, 10.0, 11.0, 31.0, 36.0, 63.0, 88.0, 108.0, 175.0, 226.0, 344.0, 563.0, 830.0, 1416.0, 2616.0, 5973.0, 17593.0, 139491.0, 831511.0, 30559.0, 8466.0, 3619.0, 1823.0, 1027.0, 667.0, 407.0, 272.0, 180.0, 121.0, 89.0, 51.0, 38.0, 36.0, 21.0, 20.0, 12.0, 9.0, 9.0, 9.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0002884864807128906, -0.0002802889794111252, -0.00027209147810935974, -0.0002638939768075943, -0.00025569647550582886, -0.0002474989742040634, -0.00023930147290229797, -0.00023110397160053253, -0.0002229064702987671, -0.00021470896899700165, -0.0002065114676952362, -0.00019831396639347076, -0.00019011646509170532, -0.00018191896378993988, -0.00017372146248817444, -0.000165523961186409, -0.00015732645988464355, -0.0001491289585828781, -0.00014093145728111267, -0.00013273395597934723, -0.0001245364546775818, -0.00011633895337581635, -0.0001081414520740509, -9.994395077228546e-05, -9.174644947052002e-05, -8.354894816875458e-05, -7.535144686698914e-05, -6.71539455652237e-05, -5.895644426345825e-05, -5.075894296169281e-05, -4.256144165992737e-05, -3.4363940358161926e-05, -2.6166439056396484e-05, -1.7968937754631042e-05, -9.7714364528656e-06, -1.5739351511001587e-06, 6.623566150665283e-06, 1.4821067452430725e-05, 2.3018568754196167e-05, 3.121607005596161e-05, 3.941357135772705e-05, 4.761107265949249e-05, 5.5808573961257935e-05, 6.400607526302338e-05, 7.220357656478882e-05, 8.040107786655426e-05, 8.85985791683197e-05, 9.679608047008514e-05, 0.00010499358177185059, 0.00011319108307361603, 0.00012138858437538147, 0.0001295860856771469, 0.00013778358697891235, 0.0001459810882806778, 0.00015417858958244324, 0.00016237609088420868, 0.00017057359218597412, 0.00017877109348773956, 0.000186968594789505, 0.00019516609609127045, 0.0002033635973930359, 0.00021156109869480133, 0.00021975859999656677, 0.00022795610129833221, 0.00023615360260009766]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 6.0, 4.0, 1.0, 3.0, 8.0, 4.0, 6.0, 21.0, 14.0, 16.0, 27.0, 41.0, 41.0, 77.0, 52.0, 65.0, 100.0, 105.0, 85.0, 69.0, 47.0, 53.0, 33.0, 28.0, 21.0, 19.0, 16.0, 8.0, 5.0, 12.0, 5.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.775161743164062e-06, -9.39890742301941e-06, -9.022653102874756e-06, -8.646398782730103e-06, -8.27014446258545e-06, -7.893890142440796e-06, -7.517635822296143e-06, -7.141381502151489e-06, -6.765127182006836e-06, -6.388872861862183e-06, -6.012618541717529e-06, -5.636364221572876e-06, -5.260109901428223e-06, -4.883855581283569e-06, -4.507601261138916e-06, -4.131346940994263e-06, -3.7550926208496094e-06, -3.378838300704956e-06, -3.0025839805603027e-06, -2.6263296604156494e-06, -2.250075340270996e-06, -1.8738210201263428e-06, -1.4975666999816895e-06, -1.1213123798370361e-06, -7.450580596923828e-07, -3.688037395477295e-07, 7.450580596923828e-09, 3.8370490074157715e-07, 7.599592208862305e-07, 1.1362135410308838e-06, 1.5124678611755371e-06, 1.8887221813201904e-06, 2.2649765014648438e-06, 2.641230821609497e-06, 3.0174851417541504e-06, 3.3937394618988037e-06, 3.769993782043457e-06, 4.14624810218811e-06, 4.522502422332764e-06, 4.898756742477417e-06, 5.27501106262207e-06, 5.651265382766724e-06, 6.027519702911377e-06, 6.40377402305603e-06, 6.780028343200684e-06, 7.156282663345337e-06, 7.53253698348999e-06, 7.908791303634644e-06, 8.285045623779297e-06, 8.66129994392395e-06, 9.037554264068604e-06, 9.413808584213257e-06, 9.79006290435791e-06, 1.0166317224502563e-05, 1.0542571544647217e-05, 1.091882586479187e-05, 1.1295080184936523e-05, 1.1671334505081177e-05, 1.204758882522583e-05, 1.2423843145370483e-05, 1.2800097465515137e-05, 1.317635178565979e-05, 1.3552606105804443e-05, 1.3928860425949097e-05, 1.430511474609375e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 5.0, 0.0, 2.0, 5.0, 6.0, 9.0, 21.0, 24.0, 41.0, 58.0, 114.0, 173.0, 269.0, 350.0, 514.0, 843.0, 1733.0, 3907.0, 12768.0, 140424.0, 856317.0, 20666.0, 5323.0, 2085.0, 1089.0, 608.0, 405.0, 244.0, 184.0, 136.0, 90.0, 52.0, 31.0, 20.0, 17.0, 9.0, 5.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004756450653076172, -0.0004603751003742218, -0.0004451051354408264, -0.00042983517050743103, -0.00041456520557403564, -0.00039929524064064026, -0.0003840252757072449, -0.0003687553107738495, -0.0003534853458404541, -0.0003382153809070587, -0.00032294541597366333, -0.00030767545104026794, -0.00029240548610687256, -0.00027713552117347717, -0.0002618655562400818, -0.0002465955913066864, -0.00023132562637329102, -0.00021605566143989563, -0.00020078569650650024, -0.00018551573157310486, -0.00017024576663970947, -0.0001549758017063141, -0.0001397058367729187, -0.00012443587183952332, -0.00010916590690612793, -9.389594197273254e-05, -7.862597703933716e-05, -6.335601210594177e-05, -4.808604717254639e-05, -3.2816082239151e-05, -1.7546117305755615e-05, -2.2761523723602295e-06, 1.2993812561035156e-05, 2.8263777494430542e-05, 4.353374242782593e-05, 5.8803707361221313e-05, 7.40736722946167e-05, 8.934363722801208e-05, 0.00010461360216140747, 0.00011988356709480286, 0.00013515353202819824, 0.00015042349696159363, 0.00016569346189498901, 0.0001809634268283844, 0.00019623339176177979, 0.00021150335669517517, 0.00022677332162857056, 0.00024204328656196594, 0.00025731325149536133, 0.0002725832164287567, 0.0002878531813621521, 0.0003031231462955475, 0.00031839311122894287, 0.00033366307616233826, 0.00034893304109573364, 0.00036420300602912903, 0.0003794729709625244, 0.0003947429358959198, 0.0004100129008293152, 0.00042528286576271057, 0.00044055283069610596, 0.00045582279562950134, 0.00047109276056289673, 0.0004863627254962921, 0.0005016326904296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 2.0, 10.0, 12.0, 23.0, 27.0, 58.0, 177.0, 320.0, 202.0, 67.0, 30.0, 15.0, 18.0, 10.0, 5.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044536590576171875, -0.0004324689507484436, -0.00041957199573516846, -0.0004066750407218933, -0.00039377808570861816, -0.000380881130695343, -0.00036798417568206787, -0.0003550872206687927, -0.0003421902656555176, -0.00032929331064224243, -0.0003163963556289673, -0.00030349940061569214, -0.000290602445602417, -0.00027770549058914185, -0.0002648085355758667, -0.00025191158056259155, -0.0002390146255493164, -0.00022611767053604126, -0.0002132207155227661, -0.00020032376050949097, -0.00018742680549621582, -0.00017452985048294067, -0.00016163289546966553, -0.00014873594045639038, -0.00013583898544311523, -0.0001229420304298401, -0.00011004507541656494, -9.71481204032898e-05, -8.425116539001465e-05, -7.13542103767395e-05, -5.8457255363464355e-05, -4.556030035018921e-05, -3.266334533691406e-05, -1.9766390323638916e-05, -6.8694353103637695e-06, 6.027519702911377e-06, 1.8924474716186523e-05, 3.182142972946167e-05, 4.4718384742736816e-05, 5.761533975601196e-05, 7.051229476928711e-05, 8.340924978256226e-05, 9.63062047958374e-05, 0.00010920315980911255, 0.0001221001148223877, 0.00013499706983566284, 0.000147894024848938, 0.00016079097986221313, 0.00017368793487548828, 0.00018658488988876343, 0.00019948184490203857, 0.00021237879991531372, 0.00022527575492858887, 0.00023817270994186401, 0.00025106966495513916, 0.0002639666199684143, 0.00027686357498168945, 0.0002897605299949646, 0.00030265748500823975, 0.0003155544400215149, 0.00032845139503479004, 0.0003413483500480652, 0.00035424530506134033, 0.0003671422600746155, 0.0003800392150878906]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 3.0, 9.0, 10.0, 6.0, 12.0, 10.0, 15.0, 23.0, 32.0, 42.0, 58.0, 125.0, 287.0, 110.0, 67.0, 47.0, 28.0, 27.0, 17.0, 19.0, 10.0, 6.0, 8.0, 7.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10940819978713989, -0.10623476654291153, -0.10306132584810257, -0.0998878926038742, -0.09671445190906525, -0.09354101866483688, -0.09036758542060852, -0.08719414472579956, -0.0840207040309906, -0.08084727078676224, -0.07767383009195328, -0.07450039684772491, -0.07132695615291595, -0.06815352290868759, -0.06498008966445923, -0.06180664896965027, -0.058633215725421906, -0.055459778755903244, -0.05228634178638458, -0.04911290854215622, -0.04593946784734726, -0.042766034603118896, -0.039592597633600235, -0.036419160664081573, -0.03324572369456291, -0.03007228672504425, -0.02689884975552559, -0.023725414648652077, -0.020551977679133415, -0.017378540709614754, -0.014205105602741241, -0.01103166863322258, -0.007858231663703918, -0.004684795159846544, -0.00151135865598917, 0.0016620773822069168, 0.004835514351725578, 0.00800895132124424, 0.011182386428117752, 0.014355823397636414, 0.017529260367155075, 0.020702697336673737, 0.023876134306192398, 0.02704956941306591, 0.030223006382584572, 0.03339644521474838, 0.036569878458976746, 0.03974331542849541, 0.04291675239801407, 0.04609018936753273, 0.04926362633705139, 0.052437059581279755, 0.055610500276088715, 0.05878393352031708, 0.06195737048983574, 0.0651308074593544, 0.06830424070358276, 0.07147767394781113, 0.07465111464262009, 0.07782454788684845, 0.08099798858165741, 0.08417142182588577, 0.08734485507011414, 0.0905182957649231, 0.09369173645973206]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 5.0, 5.0, 2.0, 7.0, 5.0, 9.0, 8.0, 11.0, 12.0, 23.0, 13.0, 13.0, 27.0, 22.0, 23.0, 20.0, 30.0, 44.0, 40.0, 29.0, 36.0, 47.0, 57.0, 71.0, 53.0, 42.0, 41.0, 29.0, 27.0, 30.0, 20.0, 24.0, 16.0, 21.0, 23.0, 20.0, 12.0, 16.0, 9.0, 9.0, 12.0, 15.0, 5.0, 3.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04677075147628784, -0.045248404145240784, -0.043726056814193726, -0.042203713208436966, -0.04068136587738991, -0.03915901854634285, -0.03763667494058609, -0.03611432760953903, -0.034591980278491974, -0.033069632947444916, -0.03154728561639786, -0.030024942010641098, -0.02850259467959404, -0.026980247348546982, -0.025457901880145073, -0.023935556411743164, -0.022413209080696106, -0.020890861749649048, -0.01936851628124714, -0.01784617081284523, -0.016323823481798172, -0.014801477082073689, -0.013279130682349205, -0.011756784282624722, -0.010234437882900238, -0.008712091483175755, -0.007189745083451271, -0.005667398683726788, -0.004145052284002304, -0.0026227058842778206, -0.001100359484553337, 0.0004219869151711464, 0.0019443333148956299, 0.0034666797146201134, 0.004989026114344597, 0.00651137251406908, 0.008033718913793564, 0.009556065313518047, 0.01107841171324253, 0.012600758112967014, 0.014123104512691498, 0.015645451843738556, 0.017167797312140465, 0.018690142780542374, 0.020212490111589432, 0.02173483744263649, 0.0232571829110384, 0.024779528379440308, 0.026301875710487366, 0.027824223041534424, 0.029346568509936333, 0.03086891397833824, 0.0323912613093853, 0.03391360864043236, 0.03543595224618912, 0.036958299577236176, 0.038480646908283234, 0.04000299423933029, 0.04152534157037735, 0.04304768517613411, 0.04457003250718117, 0.046092379838228226, 0.047614723443984985, 0.04913707077503204, 0.0506594181060791]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 13.0, 17.0, 16.0, 22.0, 39.0, 81.0, 142.0, 382.0, 1017.0, 3465.0, 20911.0, 4143631.0, 19287.0, 3527.0, 997.0, 365.0, 158.0, 80.0, 51.0, 22.0, 18.0, 10.0, 6.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.048797607421875, -0.04762125015258789, -0.04644489288330078, -0.04526853561401367, -0.04409217834472656, -0.04291582107543945, -0.041739463806152344, -0.040563106536865234, -0.039386749267578125, -0.038210391998291016, -0.037034034729003906, -0.0358576774597168, -0.03468132019042969, -0.03350496292114258, -0.03232860565185547, -0.03115224838256836, -0.02997589111328125, -0.02879953384399414, -0.02762317657470703, -0.026446819305419922, -0.025270462036132812, -0.024094104766845703, -0.022917747497558594, -0.021741390228271484, -0.020565032958984375, -0.019388675689697266, -0.018212318420410156, -0.017035961151123047, -0.015859603881835938, -0.014683246612548828, -0.013506889343261719, -0.01233053207397461, -0.0111541748046875, -0.00997781753540039, -0.008801460266113281, -0.007625102996826172, -0.0064487457275390625, -0.005272388458251953, -0.004096031188964844, -0.0029196739196777344, -0.001743316650390625, -0.0005669593811035156, 0.0006093978881835938, 0.0017857551574707031, 0.0029621124267578125, 0.004138469696044922, 0.005314826965332031, 0.006491184234619141, 0.00766754150390625, 0.00884389877319336, 0.010020256042480469, 0.011196613311767578, 0.012372970581054688, 0.013549327850341797, 0.014725685119628906, 0.015902042388916016, 0.017078399658203125, 0.018254756927490234, 0.019431114196777344, 0.020607471466064453, 0.021783828735351562, 0.022960186004638672, 0.02413654327392578, 0.02531290054321289, 0.0264892578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 17.0, 24.0, 30.0, 38.0, 71.0, 114.0, 147.0, 137.0, 131.0, 101.0, 61.0, 51.0, 34.0, 20.0, 15.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01084136962890625, -0.010579526424407959, -0.010317683219909668, -0.010055840015411377, -0.009793996810913086, -0.009532153606414795, -0.009270310401916504, -0.009008467197418213, -0.008746623992919922, -0.00848478078842163, -0.00822293758392334, -0.007961094379425049, -0.007699251174926758, -0.007437407970428467, -0.007175564765930176, -0.006913721561431885, -0.006651878356933594, -0.006390035152435303, -0.006128191947937012, -0.005866348743438721, -0.00560450553894043, -0.005342662334442139, -0.005080819129943848, -0.004818975925445557, -0.004557132720947266, -0.004295289516448975, -0.004033446311950684, -0.0037716031074523926, -0.0035097599029541016, -0.0032479166984558105, -0.0029860734939575195, -0.0027242302894592285, -0.0024623870849609375, -0.0022005438804626465, -0.0019387006759643555, -0.0016768574714660645, -0.0014150142669677734, -0.0011531710624694824, -0.0008913278579711914, -0.0006294846534729004, -0.0003676414489746094, -0.00010579824447631836, 0.00015604496002197266, 0.00041788816452026367, 0.0006797313690185547, 0.0009415745735168457, 0.0012034177780151367, 0.0014652609825134277, 0.0017271041870117188, 0.0019889473915100098, 0.0022507905960083008, 0.002512633800506592, 0.002774477005004883, 0.003036320209503174, 0.003298163414001465, 0.003560006618499756, 0.003821849822998047, 0.004083693027496338, 0.004345536231994629, 0.00460737943649292, 0.004869222640991211, 0.005131065845489502, 0.005392909049987793, 0.005654752254486084, 0.005916595458984375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 8.0, 8.0, 10.0, 15.0, 28.0, 31.0, 58.0, 70.0, 134.0, 194.0, 270.0, 437.0, 689.0, 1247.0, 2000.0, 3978.0, 8546.0, 22610.0, 192629.0, 3899395.0, 38024.0, 11618.0, 5213.0, 2736.0, 1570.0, 958.0, 570.0, 401.0, 274.0, 170.0, 124.0, 69.0, 64.0, 38.0, 30.0, 22.0, 21.0, 1.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01296234130859375, -0.012546777725219727, -0.012131214141845703, -0.01171565055847168, -0.011300086975097656, -0.010884523391723633, -0.01046895980834961, -0.010053396224975586, -0.009637832641601562, -0.009222269058227539, -0.008806705474853516, -0.008391141891479492, -0.007975578308105469, -0.007560014724731445, -0.007144451141357422, -0.0067288875579833984, -0.006313323974609375, -0.0058977603912353516, -0.005482196807861328, -0.005066633224487305, -0.004651069641113281, -0.004235506057739258, -0.0038199424743652344, -0.003404378890991211, -0.0029888153076171875, -0.002573251724243164, -0.0021576881408691406, -0.0017421245574951172, -0.0013265609741210938, -0.0009109973907470703, -0.0004954338073730469, -7.987022399902344e-05, 0.000335693359375, 0.0007512569427490234, 0.0011668205261230469, 0.0015823841094970703, 0.0019979476928710938, 0.002413511276245117, 0.0028290748596191406, 0.003244638442993164, 0.0036602020263671875, 0.004075765609741211, 0.004491329193115234, 0.004906892776489258, 0.005322456359863281, 0.005738019943237305, 0.006153583526611328, 0.0065691471099853516, 0.006984710693359375, 0.0074002742767333984, 0.007815837860107422, 0.008231401443481445, 0.008646965026855469, 0.009062528610229492, 0.009478092193603516, 0.009893655776977539, 0.010309219360351562, 0.010724782943725586, 0.01114034652709961, 0.011555910110473633, 0.011971473693847656, 0.01238703727722168, 0.012802600860595703, 0.013218164443969727, 0.01363372802734375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 8.0, 7.0, 4.0, 17.0, 15.0, 22.0, 33.0, 78.0, 213.0, 3073.0, 347.0, 116.0, 37.0, 19.0, 13.0, 7.0, 8.0, 10.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.0108642578125, -0.010541200637817383, -0.010218143463134766, -0.009895086288452148, -0.009572029113769531, -0.009248971939086914, -0.008925914764404297, -0.00860285758972168, -0.008279800415039062, -0.007956743240356445, -0.007633686065673828, -0.007310628890991211, -0.006987571716308594, -0.0066645145416259766, -0.006341457366943359, -0.006018400192260742, -0.005695343017578125, -0.005372285842895508, -0.005049228668212891, -0.0047261714935302734, -0.004403114318847656, -0.004080057144165039, -0.003756999969482422, -0.0034339427947998047, -0.0031108856201171875, -0.0027878284454345703, -0.002464771270751953, -0.002141714096069336, -0.0018186569213867188, -0.0014955997467041016, -0.0011725425720214844, -0.0008494853973388672, -0.00052642822265625, -0.0002033710479736328, 0.00011968612670898438, 0.00044274330139160156, 0.0007658004760742188, 0.001088857650756836, 0.0014119148254394531, 0.0017349720001220703, 0.0020580291748046875, 0.0023810863494873047, 0.002704143524169922, 0.003027200698852539, 0.0033502578735351562, 0.0036733150482177734, 0.003996372222900391, 0.004319429397583008, 0.004642486572265625, 0.004965543746948242, 0.005288600921630859, 0.0056116580963134766, 0.005934715270996094, 0.006257772445678711, 0.006580829620361328, 0.006903886795043945, 0.0072269439697265625, 0.00755000114440918, 0.007873058319091797, 0.008196115493774414, 0.008519172668457031, 0.008842229843139648, 0.009165287017822266, 0.009488344192504883, 0.0098114013671875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 5.0, 1.0, 8.0, 6.0, 9.0, 7.0, 13.0, 19.0, 23.0, 40.0, 50.0, 98.0, 222.0, 199.0, 98.0, 66.0, 40.0, 29.0, 14.0, 12.0, 11.0, 10.0, 8.0, 7.0, 1.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04882966727018356, -0.0472487136721611, -0.04566775634884834, -0.04408680275082588, -0.04250584542751312, -0.04092489182949066, -0.0393439382314682, -0.03776298090815544, -0.03618202358484268, -0.03460106998682022, -0.03302011266350746, -0.031439159065485, -0.02985820174217224, -0.02827724814414978, -0.02669629268348217, -0.02511533722281456, -0.0235343836247921, -0.02195342816412449, -0.02037247270345688, -0.018791519105434418, -0.01721056178212166, -0.015629608184099197, -0.014048652723431587, -0.012467697262763977, -0.010886741802096367, -0.009305786341428757, -0.007724831346422434, -0.006143876351416111, -0.004562920890748501, -0.0029819654300808907, -0.001401010900735855, 0.00017994455993175507, 0.0017608962953090668, 0.0033418515231460333, 0.004922806750983, 0.006503761745989323, 0.008084717206656933, 0.009665672667324543, 0.011246627196669579, 0.012827582657337189, 0.014408538118004799, 0.01598949357867241, 0.01757044903934002, 0.01915140450000763, 0.02073235809803009, 0.02231331542134285, 0.02389426901936531, 0.02547522448003292, 0.02705617994070053, 0.02863713540136814, 0.03021809086203575, 0.03179904446005821, 0.03338000178337097, 0.03496095538139343, 0.036541908979415894, 0.03812286630272865, 0.03970382362604141, 0.04128477722406387, 0.04286573454737663, 0.044446688145399094, 0.04602764546871185, 0.047608599066734314, 0.049189552664756775, 0.050770509988069534, 0.052351463586091995]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 6.0, 8.0, 8.0, 10.0, 14.0, 13.0, 16.0, 12.0, 21.0, 30.0, 28.0, 23.0, 31.0, 31.0, 31.0, 43.0, 40.0, 50.0, 40.0, 57.0, 46.0, 44.0, 40.0, 38.0, 47.0, 38.0, 37.0, 27.0, 22.0, 23.0, 16.0, 18.0, 18.0, 18.0, 12.0, 5.0, 6.0, 10.0, 5.0, 4.0, 5.0, 3.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.025822997093200684, -0.02509630098938942, -0.024369603022933006, -0.023642905056476593, -0.02291620895266533, -0.022189512848854065, -0.02146281488239765, -0.02073611691594124, -0.020009420812129974, -0.01928272470831871, -0.018556026741862297, -0.017829328775405884, -0.01710263267159462, -0.016375936567783356, -0.015649238601326942, -0.014922541566193104, -0.014195844531059265, -0.013469147495925426, -0.012742450460791588, -0.01201575342565775, -0.01128905639052391, -0.010562359355390072, -0.009835662320256233, -0.009108965285122395, -0.008382268249988556, -0.007655571214854717, -0.006928874179720879, -0.00620217714458704, -0.005475480109453201, -0.004748783074319363, -0.004022086039185524, -0.0032953890040516853, -0.0025686919689178467, -0.001841994933784008, -0.0011152978986501694, -0.0003886008635163307, 0.00033809617161750793, 0.0010647932067513466, 0.0017914902418851852, 0.002518187277019024, 0.0032448843121528625, 0.003971581347286701, 0.00469827838242054, 0.0054249754175543785, 0.006151672452688217, 0.006878369487822056, 0.0076050665229558945, 0.008331763558089733, 0.009058460593223572, 0.00978515762835741, 0.010511854663491249, 0.011238551698625088, 0.011965248733758926, 0.012691945768892765, 0.013418642804026604, 0.014145339839160442, 0.014872036874294281, 0.01559873390942812, 0.01632543094456196, 0.01705212891101837, 0.017778825014829636, 0.0185055211186409, 0.019232219085097313, 0.019958917051553726, 0.02068561315536499]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 16.0, 15.0, 17.0, 20.0, 35.0, 39.0, 50.0, 95.0, 163.0, 278.0, 521.0, 1238.0, 3521.0, 13161.0, 65029.0, 722318.0, 203885.0, 27540.0, 6781.0, 2102.0, 786.0, 351.0, 178.0, 131.0, 76.0, 52.0, 27.0, 21.0, 17.0, 23.0, 13.0, 9.0, 9.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049713134765625, -0.04804229736328125, -0.0463714599609375, -0.04470062255859375, -0.04302978515625, -0.04135894775390625, -0.0396881103515625, -0.03801727294921875, -0.036346435546875, -0.03467559814453125, -0.0330047607421875, -0.03133392333984375, -0.0296630859375, -0.02799224853515625, -0.0263214111328125, -0.02465057373046875, -0.022979736328125, -0.02130889892578125, -0.0196380615234375, -0.01796722412109375, -0.01629638671875, -0.01462554931640625, -0.0129547119140625, -0.01128387451171875, -0.009613037109375, -0.00794219970703125, -0.0062713623046875, -0.00460052490234375, -0.0029296875, -0.00125885009765625, 0.0004119873046875, 0.00208282470703125, 0.003753662109375, 0.00542449951171875, 0.0070953369140625, 0.00876617431640625, 0.01043701171875, 0.01210784912109375, 0.0137786865234375, 0.01544952392578125, 0.017120361328125, 0.01879119873046875, 0.0204620361328125, 0.02213287353515625, 0.0238037109375, 0.02547454833984375, 0.0271453857421875, 0.02881622314453125, 0.030487060546875, 0.03215789794921875, 0.0338287353515625, 0.03549957275390625, 0.03717041015625, 0.03884124755859375, 0.0405120849609375, 0.04218292236328125, 0.043853759765625, 0.04552459716796875, 0.0471954345703125, 0.04886627197265625, 0.050537109375, 0.05220794677734375, 0.0538787841796875, 0.05554962158203125, 0.057220458984375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 18.0, 23.0, 29.0, 44.0, 73.0, 119.0, 148.0, 128.0, 130.0, 99.0, 64.0, 46.0, 35.0, 24.0, 12.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01082611083984375, -0.01056438684463501, -0.01030266284942627, -0.01004093885421753, -0.009779214859008789, -0.009517490863800049, -0.009255766868591309, -0.008994042873382568, -0.008732318878173828, -0.008470594882965088, -0.008208870887756348, -0.007947146892547607, -0.007685422897338867, -0.007423698902130127, -0.007161974906921387, -0.0069002509117126465, -0.006638526916503906, -0.006376802921295166, -0.006115078926086426, -0.0058533549308776855, -0.005591630935668945, -0.005329906940460205, -0.005068182945251465, -0.004806458950042725, -0.004544734954833984, -0.004283010959625244, -0.004021286964416504, -0.0037595629692077637, -0.0034978389739990234, -0.003236114978790283, -0.002974390983581543, -0.0027126669883728027, -0.0024509429931640625, -0.0021892189979553223, -0.001927495002746582, -0.0016657710075378418, -0.0014040470123291016, -0.0011423230171203613, -0.0008805990219116211, -0.0006188750267028809, -0.0003571510314941406, -9.542703628540039e-05, 0.00016629695892333984, 0.0004280209541320801, 0.0006897449493408203, 0.0009514689445495605, 0.0012131929397583008, 0.001474916934967041, 0.0017366409301757812, 0.0019983649253845215, 0.0022600889205932617, 0.002521812915802002, 0.002783536911010742, 0.0030452609062194824, 0.0033069849014282227, 0.003568708896636963, 0.003830432891845703, 0.004092156887054443, 0.004353880882263184, 0.004615604877471924, 0.004877328872680664, 0.005139052867889404, 0.0054007768630981445, 0.005662500858306885, 0.005924224853515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 10.0, 7.0, 9.0, 13.0, 33.0, 46.0, 62.0, 102.0, 127.0, 254.0, 441.0, 883.0, 1737.0, 3857.0, 9049.0, 22194.0, 64474.0, 503238.0, 342447.0, 61795.0, 21677.0, 8723.0, 3716.0, 1747.0, 844.0, 457.0, 211.0, 156.0, 73.0, 60.0, 39.0, 18.0, 17.0, 15.0, 9.0, 3.0, 11.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.024444580078125, -0.023725271224975586, -0.023005962371826172, -0.022286653518676758, -0.021567344665527344, -0.02084803581237793, -0.020128726959228516, -0.0194094181060791, -0.018690109252929688, -0.017970800399780273, -0.01725149154663086, -0.016532182693481445, -0.01581287384033203, -0.015093564987182617, -0.014374256134033203, -0.013654947280883789, -0.012935638427734375, -0.012216329574584961, -0.011497020721435547, -0.010777711868286133, -0.010058403015136719, -0.009339094161987305, -0.00861978530883789, -0.007900476455688477, -0.0071811676025390625, -0.0064618587493896484, -0.005742549896240234, -0.00502324104309082, -0.004303932189941406, -0.003584623336791992, -0.002865314483642578, -0.002146005630493164, -0.00142669677734375, -0.0007073879241943359, 1.1920928955078125e-05, 0.0007312297821044922, 0.0014505386352539062, 0.0021698474884033203, 0.0028891563415527344, 0.0036084651947021484, 0.0043277740478515625, 0.0050470829010009766, 0.005766391754150391, 0.006485700607299805, 0.007205009460449219, 0.007924318313598633, 0.008643627166748047, 0.009362936019897461, 0.010082244873046875, 0.010801553726196289, 0.011520862579345703, 0.012240171432495117, 0.012959480285644531, 0.013678789138793945, 0.01439809799194336, 0.015117406845092773, 0.015836715698242188, 0.0165560245513916, 0.017275333404541016, 0.01799464225769043, 0.018713951110839844, 0.019433259963989258, 0.020152568817138672, 0.020871877670288086, 0.0215911865234375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 1.0, 8.0, 8.0, 12.0, 7.0, 15.0, 12.0, 16.0, 30.0, 35.0, 24.0, 35.0, 35.0, 48.0, 44.0, 61.0, 56.0, 51.0, 65.0, 52.0, 44.0, 50.0, 52.0, 31.0, 31.0, 36.0, 24.0, 21.0, 28.0, 16.0, 18.0, 14.0, 5.0, 4.0, 4.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.013671875, -0.013216137886047363, -0.012760400772094727, -0.01230466365814209, -0.011848926544189453, -0.011393189430236816, -0.01093745231628418, -0.010481715202331543, -0.010025978088378906, -0.00957024097442627, -0.009114503860473633, -0.008658766746520996, -0.00820302963256836, -0.007747292518615723, -0.007291555404663086, -0.006835818290710449, -0.0063800811767578125, -0.005924344062805176, -0.005468606948852539, -0.005012869834899902, -0.004557132720947266, -0.004101395606994629, -0.003645658493041992, -0.0031899213790893555, -0.0027341842651367188, -0.002278447151184082, -0.0018227100372314453, -0.0013669729232788086, -0.0009112358093261719, -0.00045549869537353516, 2.384185791015625e-07, 0.0004559755325317383, 0.000911712646484375, 0.0013674497604370117, 0.0018231868743896484, 0.002278923988342285, 0.002734661102294922, 0.0031903982162475586, 0.0036461353302001953, 0.004101872444152832, 0.004557609558105469, 0.0050133466720581055, 0.005469083786010742, 0.005924820899963379, 0.006380558013916016, 0.006836295127868652, 0.007292032241821289, 0.007747769355773926, 0.008203506469726562, 0.0086592435836792, 0.009114980697631836, 0.009570717811584473, 0.01002645492553711, 0.010482192039489746, 0.010937929153442383, 0.01139366626739502, 0.011849403381347656, 0.012305140495300293, 0.01276087760925293, 0.013216614723205566, 0.013672351837158203, 0.01412808895111084, 0.014583826065063477, 0.015039563179016113, 0.01549530029296875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 8.0, 14.0, 16.0, 20.0, 32.0, 62.0, 74.0, 98.0, 203.0, 322.0, 547.0, 890.0, 1618.0, 2848.0, 5729.0, 12287.0, 28897.0, 86375.0, 703989.0, 135542.0, 38559.0, 15291.0, 7156.0, 3538.0, 1879.0, 970.0, 641.0, 348.0, 206.0, 117.0, 87.0, 59.0, 46.0, 36.0, 15.0, 13.0, 5.0, 4.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00022220611572265625, -0.00021645613014698029, -0.00021070614457130432, -0.00020495615899562836, -0.0001992061734199524, -0.00019345618784427643, -0.00018770620226860046, -0.0001819562166929245, -0.00017620623111724854, -0.00017045624554157257, -0.0001647062599658966, -0.00015895627439022064, -0.00015320628881454468, -0.0001474563032388687, -0.00014170631766319275, -0.00013595633208751678, -0.00013020634651184082, -0.00012445636093616486, -0.00011870637536048889, -0.00011295638978481293, -0.00010720640420913696, -0.000101456418633461, -9.570643305778503e-05, -8.995644748210907e-05, -8.42064619064331e-05, -7.845647633075714e-05, -7.270649075508118e-05, -6.695650517940521e-05, -6.120651960372925e-05, -5.5456534028053284e-05, -4.970654845237732e-05, -4.3956562876701355e-05, -3.820657730102539e-05, -3.2456591725349426e-05, -2.6706606149673462e-05, -2.0956620573997498e-05, -1.5206634998321533e-05, -9.456649422645569e-06, -3.7066638469696045e-06, 2.04332172870636e-06, 7.793307304382324e-06, 1.3543292880058289e-05, 1.9293278455734253e-05, 2.5043264031410217e-05, 3.079324960708618e-05, 3.6543235182762146e-05, 4.229322075843811e-05, 4.8043206334114075e-05, 5.379319190979004e-05, 5.9543177485466003e-05, 6.529316306114197e-05, 7.104314863681793e-05, 7.67931342124939e-05, 8.254311978816986e-05, 8.829310536384583e-05, 9.404309093952179e-05, 9.979307651519775e-05, 0.00010554306209087372, 0.00011129304766654968, 0.00011704303324222565, 0.0001227930188179016, 0.00012854300439357758, 0.00013429298996925354, 0.0001400429755449295, 0.00014579296112060547]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 9.0, 6.0, 5.0, 3.0, 4.0, 8.0, 24.0, 25.0, 28.0, 59.0, 159.0, 237.0, 179.0, 88.0, 51.0, 19.0, 16.0, 9.0, 8.0, 11.0, 6.0, 3.0, 3.0, 5.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.5762786865234375e-05, -3.473181277513504e-05, -3.3700838685035706e-05, -3.266986459493637e-05, -3.1638890504837036e-05, -3.06079164147377e-05, -2.9576942324638367e-05, -2.8545968234539032e-05, -2.7514994144439697e-05, -2.6484020054340363e-05, -2.5453045964241028e-05, -2.4422071874141693e-05, -2.339109778404236e-05, -2.2360123693943024e-05, -2.132914960384369e-05, -2.0298175513744354e-05, -1.926720142364502e-05, -1.8236227333545685e-05, -1.720525324344635e-05, -1.6174279153347015e-05, -1.514330506324768e-05, -1.4112330973148346e-05, -1.3081356883049011e-05, -1.2050382792949677e-05, -1.1019408702850342e-05, -9.988434612751007e-06, -8.957460522651672e-06, -7.926486432552338e-06, -6.895512342453003e-06, -5.864538252353668e-06, -4.8335641622543335e-06, -3.8025900721549988e-06, -2.771615982055664e-06, -1.7406418919563293e-06, -7.096678018569946e-07, 3.213062882423401e-07, 1.3522803783416748e-06, 2.3832544684410095e-06, 3.4142285585403442e-06, 4.445202648639679e-06, 5.476176738739014e-06, 6.507150828838348e-06, 7.538124918937683e-06, 8.569099009037018e-06, 9.600073099136353e-06, 1.0631047189235687e-05, 1.1662021279335022e-05, 1.2692995369434357e-05, 1.3723969459533691e-05, 1.4754943549633026e-05, 1.578591763973236e-05, 1.6816891729831696e-05, 1.784786581993103e-05, 1.8878839910030365e-05, 1.99098140001297e-05, 2.0940788090229034e-05, 2.197176218032837e-05, 2.3002736270427704e-05, 2.403371036052704e-05, 2.5064684450626373e-05, 2.6095658540725708e-05, 2.7126632630825043e-05, 2.8157606720924377e-05, 2.9188580811023712e-05, 3.0219554901123047e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 10.0, 19.0, 17.0, 22.0, 36.0, 42.0, 88.0, 161.0, 240.0, 459.0, 934.0, 1978.0, 4792.0, 12180.0, 39294.0, 379940.0, 546461.0, 40714.0, 12350.0, 4689.0, 2078.0, 915.0, 489.0, 256.0, 131.0, 78.0, 58.0, 41.0, 20.0, 17.0, 12.0, 14.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00032901763916015625, -0.0003201272338628769, -0.00031123682856559753, -0.0003023464232683182, -0.0002934560179710388, -0.00028456561267375946, -0.0002756752073764801, -0.00026678480207920074, -0.0002578943967819214, -0.00024900399148464203, -0.00024011358618736267, -0.0002312231808900833, -0.00022233277559280396, -0.0002134423702955246, -0.00020455196499824524, -0.00019566155970096588, -0.00018677115440368652, -0.00017788074910640717, -0.0001689903438091278, -0.00016009993851184845, -0.0001512095332145691, -0.00014231912791728973, -0.00013342872262001038, -0.00012453831732273102, -0.00011564791202545166, -0.0001067575067281723, -9.786710143089294e-05, -8.897669613361359e-05, -8.008629083633423e-05, -7.119588553905487e-05, -6.230548024177551e-05, -5.3415074944496155e-05, -4.45246696472168e-05, -3.563426434993744e-05, -2.674385905265808e-05, -1.7853453755378723e-05, -8.963048458099365e-06, -7.264316082000732e-08, 8.81776213645935e-06, 1.770816743373871e-05, 2.6598572731018066e-05, 3.5488978028297424e-05, 4.437938332557678e-05, 5.326978862285614e-05, 6.21601939201355e-05, 7.105059921741486e-05, 7.994100451469421e-05, 8.883140981197357e-05, 9.772181510925293e-05, 0.00010661222040653229, 0.00011550262570381165, 0.000124393031001091, 0.00013328343629837036, 0.00014217384159564972, 0.00015106424689292908, 0.00015995465219020844, 0.0001688450574874878, 0.00017773546278476715, 0.0001866258680820465, 0.00019551627337932587, 0.00020440667867660522, 0.00021329708397388458, 0.00022218748927116394, 0.0002310778945684433, 0.00023996829986572266]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 2.0, 10.0, 13.0, 11.0, 15.0, 13.0, 20.0, 28.0, 40.0, 37.0, 56.0, 83.0, 110.0, 130.0, 105.0, 67.0, 57.0, 35.0, 31.0, 29.0, 17.0, 12.0, 25.0, 10.0, 6.0, 7.0, 4.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00014734268188476562, -0.0001417696475982666, -0.00013619661331176758, -0.00013062357902526855, -0.00012505054473876953, -0.00011947751045227051, -0.00011390447616577148, -0.00010833144187927246, -0.00010275840759277344, -9.718537330627441e-05, -9.161233901977539e-05, -8.603930473327637e-05, -8.046627044677734e-05, -7.489323616027832e-05, -6.93202018737793e-05, -6.374716758728027e-05, -5.817413330078125e-05, -5.2601099014282227e-05, -4.70280647277832e-05, -4.145503044128418e-05, -3.5881996154785156e-05, -3.0308961868286133e-05, -2.473592758178711e-05, -1.9162893295288086e-05, -1.3589859008789062e-05, -8.016824722290039e-06, -2.4437904357910156e-06, 3.129243850708008e-06, 8.702278137207031e-06, 1.4275312423706055e-05, 1.9848346710205078e-05, 2.54213809967041e-05, 3.0994415283203125e-05, 3.656744956970215e-05, 4.214048385620117e-05, 4.7713518142700195e-05, 5.328655242919922e-05, 5.885958671569824e-05, 6.443262100219727e-05, 7.000565528869629e-05, 7.557868957519531e-05, 8.115172386169434e-05, 8.672475814819336e-05, 9.229779243469238e-05, 9.78708267211914e-05, 0.00010344386100769043, 0.00010901689529418945, 0.00011458992958068848, 0.0001201629638671875, 0.00012573599815368652, 0.00013130903244018555, 0.00013688206672668457, 0.0001424551010131836, 0.00014802813529968262, 0.00015360116958618164, 0.00015917420387268066, 0.0001647472381591797, 0.0001703202724456787, 0.00017589330673217773, 0.00018146634101867676, 0.00018703937530517578, 0.0001926124095916748, 0.00019818544387817383, 0.00020375847816467285, 0.00020933151245117188]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 8.0, 11.0, 18.0, 24.0, 32.0, 81.0, 201.0, 339.0, 91.0, 53.0, 36.0, 21.0, 20.0, 22.0, 8.0, 9.0, 10.0, 7.0, 3.0, 0.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.17582225799560547, -0.17174933850765228, -0.1676764190196991, -0.16360348463058472, -0.15953056514263153, -0.15545764565467834, -0.15138471126556396, -0.14731179177761078, -0.1432388722896576, -0.1391659528017044, -0.13509303331375122, -0.13102009892463684, -0.12694717943668365, -0.12287425994873047, -0.11880133301019669, -0.1147284060716629, -0.11065548658370972, -0.10658256709575653, -0.10250964015722275, -0.09843671321868896, -0.09436379373073578, -0.09029087424278259, -0.08621794730424881, -0.08214502036571503, -0.07807210087776184, -0.07399918138980865, -0.06992625445127487, -0.06585332751274109, -0.0617804080247879, -0.05770748481154442, -0.053634561598300934, -0.04956163838505745, -0.045488715171813965, -0.04141579195857048, -0.037342868745326996, -0.03326994553208351, -0.029197022318840027, -0.025124099105596542, -0.021051175892353058, -0.016978252679109573, -0.012905329465866089, -0.008832406252622604, -0.00475948303937912, -0.0006865598261356354, 0.003386363387107849, 0.007459286600351334, 0.011532209813594818, 0.015605133026838303, 0.019678056240081787, 0.02375097945332527, 0.027823902666568756, 0.03189682587981224, 0.035969749093055725, 0.04004267230629921, 0.044115595519542694, 0.04818851873278618, 0.05226144194602966, 0.05633436515927315, 0.06040728837251663, 0.06448021531105042, 0.0685531347990036, 0.07262605428695679, 0.07669898122549057, 0.08077190816402435, 0.08484482765197754]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 7.0, 5.0, 8.0, 11.0, 12.0, 9.0, 13.0, 20.0, 19.0, 25.0, 28.0, 31.0, 39.0, 38.0, 48.0, 75.0, 91.0, 87.0, 55.0, 63.0, 45.0, 43.0, 41.0, 32.0, 19.0, 24.0, 15.0, 17.0, 18.0, 15.0, 9.0, 6.0, 9.0, 6.0, 7.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04868197441101074, -0.04681331291794777, -0.044944651424884796, -0.043075986206531525, -0.04120732471346855, -0.03933866322040558, -0.03746999800205231, -0.035601336508989334, -0.03373267501592636, -0.03186401352286339, -0.029995350167155266, -0.028126686811447144, -0.02625802531838417, -0.024389363825321198, -0.022520700469613075, -0.020652037113904953, -0.01878337562084198, -0.016914714127779007, -0.015046050772070885, -0.013177388347685337, -0.01130872592329979, -0.009440063498914242, -0.007571401074528694, -0.0057027386501431465, -0.003834076225757599, -0.0019654138013720512, -9.67513769865036e-05, 0.001771911047399044, 0.0036405734717845917, 0.005509235896170139, 0.007377898320555687, 0.009246560744941235, 0.011115223169326782, 0.01298388559371233, 0.014852548018097878, 0.016721211373806, 0.018589872866868973, 0.020458534359931946, 0.022327197715640068, 0.02419586107134819, 0.026064522564411163, 0.027933184057474136, 0.02980184741318226, 0.03167051076889038, 0.033539172261953354, 0.03540783375501633, 0.0372764989733696, 0.03914516046643257, 0.041013821959495544, 0.04288248345255852, 0.04475114494562149, 0.04661981016397476, 0.048488471657037735, 0.05035713315010071, 0.05222579836845398, 0.05409445986151695, 0.055963121354579926, 0.0578317828476429, 0.05970044434070587, 0.06156910955905914, 0.06343777477741241, 0.06530643254518509, 0.06717509776353836, 0.06904375553131104, 0.0709124207496643]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 12.0, 15.0, 22.0, 16.0, 22.0, 37.0, 51.0, 57.0, 68.0, 90.0, 106.0, 126.0, 131.0, 174.0, 210.0, 196.0, 323.0, 515.0, 1040.0, 2375.0, 6238.0, 19409.0, 69699.0, 340741.0, 3222740.0, 412410.0, 83659.0, 20775.0, 6464.0, 2715.0, 1538.0, 879.0, 608.0, 314.0, 211.0, 112.0, 75.0, 54.0, 25.0, 12.0, 4.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0804443359375, -0.0784602165222168, -0.0764760971069336, -0.07449197769165039, -0.07250785827636719, -0.07052373886108398, -0.06853961944580078, -0.06655550003051758, -0.06457138061523438, -0.06258726119995117, -0.06060314178466797, -0.058619022369384766, -0.05663490295410156, -0.05465078353881836, -0.052666664123535156, -0.05068254470825195, -0.04869842529296875, -0.04671430587768555, -0.044730186462402344, -0.04274606704711914, -0.04076194763183594, -0.038777828216552734, -0.03679370880126953, -0.03480958938598633, -0.032825469970703125, -0.030841350555419922, -0.02885723114013672, -0.026873111724853516, -0.024888992309570312, -0.02290487289428711, -0.020920753479003906, -0.018936634063720703, -0.0169525146484375, -0.014968395233154297, -0.012984275817871094, -0.01100015640258789, -0.009016036987304688, -0.007031917572021484, -0.005047798156738281, -0.003063678741455078, -0.001079559326171875, 0.0009045600891113281, 0.0028886795043945312, 0.004872798919677734, 0.0068569183349609375, 0.00884103775024414, 0.010825157165527344, 0.012809276580810547, 0.01479339599609375, 0.016777515411376953, 0.018761634826660156, 0.02074575424194336, 0.022729873657226562, 0.024713993072509766, 0.02669811248779297, 0.028682231903076172, 0.030666351318359375, 0.03265047073364258, 0.03463459014892578, 0.036618709564208984, 0.03860282897949219, 0.04058694839477539, 0.042571067810058594, 0.0445551872253418, 0.046539306640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 4.0, 8.0, 25.0, 26.0, 37.0, 61.0, 107.0, 132.0, 141.0, 124.0, 117.0, 80.0, 51.0, 38.0, 21.0, 21.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0103912353515625, -0.010136306285858154, -0.009881377220153809, -0.009626448154449463, -0.009371519088745117, -0.009116590023040771, -0.008861660957336426, -0.00860673189163208, -0.008351802825927734, -0.008096873760223389, -0.007841944694519043, -0.007587015628814697, -0.0073320865631103516, -0.007077157497406006, -0.00682222843170166, -0.0065672993659973145, -0.006312370300292969, -0.006057441234588623, -0.005802512168884277, -0.005547583103179932, -0.005292654037475586, -0.00503772497177124, -0.0047827959060668945, -0.004527866840362549, -0.004272937774658203, -0.004018008708953857, -0.0037630796432495117, -0.003508150577545166, -0.0032532215118408203, -0.0029982924461364746, -0.002743363380432129, -0.002488434314727783, -0.0022335052490234375, -0.001978576183319092, -0.001723647117614746, -0.0014687180519104004, -0.0012137889862060547, -0.000958859920501709, -0.0007039308547973633, -0.0004490017890930176, -0.00019407272338867188, 6.085634231567383e-05, 0.00031578540802001953, 0.0005707144737243652, 0.0008256435394287109, 0.0010805726051330566, 0.0013355016708374023, 0.001590430736541748, 0.0018453598022460938, 0.0021002888679504395, 0.002355217933654785, 0.002610146999359131, 0.0028650760650634766, 0.0031200051307678223, 0.003374934196472168, 0.0036298632621765137, 0.0038847923278808594, 0.004139721393585205, 0.004394650459289551, 0.0046495795249938965, 0.004904508590698242, 0.005159437656402588, 0.005414366722106934, 0.005669295787811279, 0.005924224853515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 2.0, 7.0, 9.0, 14.0, 20.0, 23.0, 33.0, 71.0, 96.0, 144.0, 217.0, 339.0, 538.0, 831.0, 1447.0, 2512.0, 4424.0, 7740.0, 14163.0, 28252.0, 59541.0, 140278.0, 415498.0, 2391915.0, 744813.0, 213457.0, 85198.0, 39023.0, 19512.0, 10225.0, 5690.0, 3234.0, 1896.0, 1195.0, 700.0, 461.0, 275.0, 165.0, 114.0, 72.0, 51.0, 32.0, 22.0, 11.0, 10.0, 8.0, 5.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01555633544921875, -0.015107989311218262, -0.014659643173217773, -0.014211297035217285, -0.013762950897216797, -0.013314604759216309, -0.01286625862121582, -0.012417912483215332, -0.011969566345214844, -0.011521220207214355, -0.011072874069213867, -0.010624527931213379, -0.01017618179321289, -0.009727835655212402, -0.009279489517211914, -0.008831143379211426, -0.008382797241210938, -0.00793445110321045, -0.007486104965209961, -0.007037758827209473, -0.006589412689208984, -0.006141066551208496, -0.005692720413208008, -0.0052443742752075195, -0.004796028137207031, -0.004347681999206543, -0.0038993358612060547, -0.0034509897232055664, -0.003002643585205078, -0.00255429744720459, -0.0021059513092041016, -0.0016576051712036133, -0.001209259033203125, -0.0007609128952026367, -0.00031256675720214844, 0.00013577938079833984, 0.0005841255187988281, 0.0010324716567993164, 0.0014808177947998047, 0.001929163932800293, 0.0023775100708007812, 0.0028258562088012695, 0.003274202346801758, 0.003722548484802246, 0.004170894622802734, 0.004619240760803223, 0.005067586898803711, 0.005515933036804199, 0.0059642791748046875, 0.006412625312805176, 0.006860971450805664, 0.007309317588806152, 0.007757663726806641, 0.008206009864807129, 0.008654356002807617, 0.009102702140808105, 0.009551048278808594, 0.009999394416809082, 0.01044774055480957, 0.010896086692810059, 0.011344432830810547, 0.011792778968811035, 0.012241125106811523, 0.012689471244812012, 0.0131378173828125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 4.0, 6.0, 6.0, 7.0, 10.0, 14.0, 26.0, 42.0, 36.0, 50.0, 54.0, 69.0, 84.0, 99.0, 122.0, 142.0, 210.0, 262.0, 288.0, 476.0, 450.0, 260.0, 232.0, 182.0, 167.0, 147.0, 129.0, 92.0, 95.0, 64.0, 52.0, 43.0, 34.0, 32.0, 22.0, 23.0, 7.0, 13.0, 7.0, 9.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0137481689453125, -0.013237953186035156, -0.012727737426757812, -0.012217521667480469, -0.011707305908203125, -0.011197090148925781, -0.010686874389648438, -0.010176658630371094, -0.00966644287109375, -0.009156227111816406, -0.008646011352539062, -0.008135795593261719, -0.007625579833984375, -0.007115364074707031, -0.0066051483154296875, -0.006094932556152344, -0.005584716796875, -0.005074501037597656, -0.0045642852783203125, -0.004054069519042969, -0.003543853759765625, -0.0030336380004882812, -0.0025234222412109375, -0.0020132064819335938, -0.00150299072265625, -0.0009927749633789062, -0.0004825592041015625, 2.765655517578125e-05, 0.000537872314453125, 0.0010480880737304688, 0.0015583038330078125, 0.0020685195922851562, 0.0025787353515625, 0.0030889511108398438, 0.0035991668701171875, 0.004109382629394531, 0.004619598388671875, 0.005129814147949219, 0.0056400299072265625, 0.006150245666503906, 0.00666046142578125, 0.007170677185058594, 0.0076808929443359375, 0.008191108703613281, 0.008701324462890625, 0.009211540222167969, 0.009721755981445312, 0.010231971740722656, 0.0107421875, 0.011252403259277344, 0.011762619018554688, 0.012272834777832031, 0.012783050537109375, 0.013293266296386719, 0.013803482055664062, 0.014313697814941406, 0.01482391357421875, 0.015334129333496094, 0.015844345092773438, 0.01635456085205078, 0.016864776611328125, 0.01737499237060547, 0.017885208129882812, 0.018395423889160156, 0.0189056396484375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 12.0, 22.0, 27.0, 76.0, 130.0, 238.0, 128.0, 75.0, 68.0, 61.0, 39.0, 29.0, 15.0, 22.0, 5.0, 9.0, 7.0, 6.0, 6.0, 6.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29051944613456726, -0.2802116572856903, -0.26990389823913574, -0.2595961093902588, -0.24928833544254303, -0.23898056149482727, -0.22867277264595032, -0.21836499869823456, -0.2080572247505188, -0.19774945080280304, -0.1874416619539261, -0.17713388800621033, -0.16682611405849457, -0.1565183401107788, -0.14621055126190186, -0.1359027773141861, -0.12559498846530914, -0.11528720706701279, -0.10497943311929703, -0.09467165172100067, -0.08436387777328491, -0.07405609637498856, -0.0637483149766922, -0.05344054102897644, -0.043132759630680084, -0.032824981957674026, -0.02251720242202282, -0.012209422886371613, -0.0019016452133655548, 0.008406132459640503, 0.01871391385793686, 0.02902168780565262, 0.039329469203948975, 0.04963724687695503, 0.05994502454996109, 0.07025280594825745, 0.0805605798959732, 0.09086836129426956, 0.10117614269256592, 0.11148391664028168, 0.12179169803857803, 0.1320994794368744, 0.14240725338459015, 0.1527150273323059, 0.16302281618118286, 0.17333059012889862, 0.18363836407661438, 0.19394615292549133, 0.2042539268732071, 0.21456170082092285, 0.2248694896697998, 0.23517726361751556, 0.24548503756523132, 0.2557928264141083, 0.26610058546066284, 0.2764083743095398, 0.28671616315841675, 0.2970239520072937, 0.30733171105384827, 0.3176394999027252, 0.3279472887516022, 0.33825504779815674, 0.3485628366470337, 0.35887062549591064, 0.3691783845424652]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 9.0, 6.0, 13.0, 13.0, 14.0, 13.0, 11.0, 14.0, 26.0, 25.0, 30.0, 42.0, 32.0, 51.0, 40.0, 58.0, 33.0, 49.0, 38.0, 38.0, 28.0, 29.0, 44.0, 32.0, 30.0, 40.0, 17.0, 28.0, 32.0, 24.0, 21.0, 12.0, 15.0, 18.0, 8.0, 14.0, 7.0, 12.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.14641225337982178, -0.14178502559661865, -0.13715781271457672, -0.1325305998325348, -0.12790337204933167, -0.12327615171670914, -0.11864893138408661, -0.11402171105146408, -0.10939449071884155, -0.10476727038621902, -0.1001400500535965, -0.09551282972097397, -0.09088560938835144, -0.08625838905572891, -0.08163116872310638, -0.07700394839048386, -0.07237672805786133, -0.0677495077252388, -0.06312228739261627, -0.058495067059993744, -0.053867846727371216, -0.04924062639474869, -0.04461340606212616, -0.03998618572950363, -0.035358965396881104, -0.030731745064258575, -0.026104524731636047, -0.02147730439901352, -0.01685008406639099, -0.012222863733768463, -0.007595643401145935, -0.002968423068523407, 0.001658797264099121, 0.006286017596721649, 0.010913237929344177, 0.015540458261966705, 0.020167678594589233, 0.02479489892721176, 0.02942211925983429, 0.03404933959245682, 0.038676559925079346, 0.043303780257701874, 0.0479310005903244, 0.05255822092294693, 0.05718544125556946, 0.061812661588191986, 0.06643988192081451, 0.07106710225343704, 0.07569432258605957, 0.0803215429186821, 0.08494876325130463, 0.08957598358392715, 0.09420320391654968, 0.09883042424917221, 0.10345764458179474, 0.10808486491441727, 0.1127120852470398, 0.11733930557966232, 0.12196652591228485, 0.12659373879432678, 0.1312209665775299, 0.13584819436073303, 0.14047540724277496, 0.1451026201248169, 0.14972984790802002]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 6.0, 9.0, 8.0, 7.0, 11.0, 14.0, 27.0, 37.0, 43.0, 74.0, 162.0, 304.0, 517.0, 1212.0, 2905.0, 8628.0, 29832.0, 137025.0, 683987.0, 139587.0, 30023.0, 8651.0, 3103.0, 1135.0, 519.0, 282.0, 149.0, 91.0, 56.0, 36.0, 21.0, 17.0, 17.0, 14.0, 12.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0361328125, -0.034716129302978516, -0.03329944610595703, -0.03188276290893555, -0.030466079711914062, -0.029049396514892578, -0.027632713317871094, -0.02621603012084961, -0.024799346923828125, -0.02338266372680664, -0.021965980529785156, -0.020549297332763672, -0.019132614135742188, -0.017715930938720703, -0.01629924774169922, -0.014882564544677734, -0.01346588134765625, -0.012049198150634766, -0.010632514953613281, -0.009215831756591797, -0.0077991485595703125, -0.006382465362548828, -0.004965782165527344, -0.0035490989685058594, -0.002132415771484375, -0.0007157325744628906, 0.0007009506225585938, 0.002117633819580078, 0.0035343170166015625, 0.004951000213623047, 0.006367683410644531, 0.007784366607666016, 0.0092010498046875, 0.010617733001708984, 0.012034416198730469, 0.013451099395751953, 0.014867782592773438, 0.016284465789794922, 0.017701148986816406, 0.01911783218383789, 0.020534515380859375, 0.02195119857788086, 0.023367881774902344, 0.024784564971923828, 0.026201248168945312, 0.027617931365966797, 0.02903461456298828, 0.030451297760009766, 0.03186798095703125, 0.033284664154052734, 0.03470134735107422, 0.0361180305480957, 0.03753471374511719, 0.03895139694213867, 0.040368080139160156, 0.04178476333618164, 0.043201446533203125, 0.04461812973022461, 0.046034812927246094, 0.04745149612426758, 0.04886817932128906, 0.05028486251831055, 0.05170154571533203, 0.053118228912353516, 0.054534912109375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 11.0, 16.0, 36.0, 35.0, 67.0, 78.0, 81.0, 87.0, 107.0, 93.0, 104.0, 71.0, 60.0, 51.0, 28.0, 22.0, 25.0, 7.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0117340087890625, -0.011465132236480713, -0.011196255683898926, -0.010927379131317139, -0.010658502578735352, -0.010389626026153564, -0.010120749473571777, -0.00985187292098999, -0.009582996368408203, -0.009314119815826416, -0.009045243263244629, -0.008776366710662842, -0.008507490158081055, -0.008238613605499268, -0.00796973705291748, -0.007700860500335693, -0.007431983947753906, -0.007163107395172119, -0.006894230842590332, -0.006625354290008545, -0.006356477737426758, -0.006087601184844971, -0.005818724632263184, -0.0055498480796813965, -0.005280971527099609, -0.005012094974517822, -0.004743218421936035, -0.004474341869354248, -0.004205465316772461, -0.003936588764190674, -0.0036677122116088867, -0.0033988356590270996, -0.0031299591064453125, -0.0028610825538635254, -0.0025922060012817383, -0.002323329448699951, -0.002054452896118164, -0.001785576343536377, -0.0015166997909545898, -0.0012478232383728027, -0.0009789466857910156, -0.0007100701332092285, -0.0004411935806274414, -0.0001723170280456543, 9.655952453613281e-05, 0.0003654360771179199, 0.000634312629699707, 0.0009031891822814941, 0.0011720657348632812, 0.0014409422874450684, 0.0017098188400268555, 0.0019786953926086426, 0.0022475719451904297, 0.002516448497772217, 0.002785325050354004, 0.003054201602935791, 0.003323078155517578, 0.0035919547080993652, 0.0038608312606811523, 0.0041297078132629395, 0.0043985843658447266, 0.004667460918426514, 0.004936337471008301, 0.005205214023590088, 0.005474090576171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 3.0, 16.0, 21.0, 29.0, 40.0, 56.0, 87.0, 126.0, 187.0, 268.0, 396.0, 608.0, 966.0, 1577.0, 2525.0, 4453.0, 7843.0, 15500.0, 33622.0, 85363.0, 537667.0, 233521.0, 67091.0, 27000.0, 12937.0, 6776.0, 3768.0, 2177.0, 1344.0, 875.0, 539.0, 361.0, 260.0, 181.0, 111.0, 71.0, 61.0, 38.0, 28.0, 23.0, 7.0, 8.0, 3.0, 6.0, 7.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.018524169921875, -0.017834901809692383, -0.017145633697509766, -0.01645636558532715, -0.01576709747314453, -0.015077829360961914, -0.014388561248779297, -0.01369929313659668, -0.013010025024414062, -0.012320756912231445, -0.011631488800048828, -0.010942220687866211, -0.010252952575683594, -0.009563684463500977, -0.00887441635131836, -0.008185148239135742, -0.007495880126953125, -0.006806612014770508, -0.006117343902587891, -0.0054280757904052734, -0.004738807678222656, -0.004049539566040039, -0.003360271453857422, -0.0026710033416748047, -0.0019817352294921875, -0.0012924671173095703, -0.0006031990051269531, 8.606910705566406e-05, 0.0007753372192382812, 0.0014646053314208984, 0.0021538734436035156, 0.002843141555786133, 0.00353240966796875, 0.004221677780151367, 0.004910945892333984, 0.0056002140045166016, 0.006289482116699219, 0.006978750228881836, 0.007668018341064453, 0.00835728645324707, 0.009046554565429688, 0.009735822677612305, 0.010425090789794922, 0.011114358901977539, 0.011803627014160156, 0.012492895126342773, 0.01318216323852539, 0.013871431350708008, 0.014560699462890625, 0.015249967575073242, 0.01593923568725586, 0.016628503799438477, 0.017317771911621094, 0.01800704002380371, 0.018696308135986328, 0.019385576248168945, 0.020074844360351562, 0.02076411247253418, 0.021453380584716797, 0.022142648696899414, 0.02283191680908203, 0.02352118492126465, 0.024210453033447266, 0.024899721145629883, 0.0255889892578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 7.0, 8.0, 7.0, 12.0, 23.0, 18.0, 25.0, 28.0, 34.0, 46.0, 55.0, 36.0, 56.0, 50.0, 61.0, 48.0, 56.0, 44.0, 44.0, 46.0, 45.0, 47.0, 29.0, 31.0, 24.0, 15.0, 15.0, 19.0, 13.0, 11.0, 9.0, 2.0, 9.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017791748046875, -0.017177343368530273, -0.016562938690185547, -0.01594853401184082, -0.015334129333496094, -0.014719724655151367, -0.01410531997680664, -0.013490915298461914, -0.012876510620117188, -0.012262105941772461, -0.011647701263427734, -0.011033296585083008, -0.010418891906738281, -0.009804487228393555, -0.009190082550048828, -0.008575677871704102, -0.007961273193359375, -0.0073468685150146484, -0.006732463836669922, -0.006118059158325195, -0.005503654479980469, -0.004889249801635742, -0.004274845123291016, -0.003660440444946289, -0.0030460357666015625, -0.002431631088256836, -0.0018172264099121094, -0.0012028217315673828, -0.0005884170532226562, 2.5987625122070312e-05, 0.0006403923034667969, 0.0012547969818115234, 0.00186920166015625, 0.0024836063385009766, 0.003098011016845703, 0.0037124156951904297, 0.004326820373535156, 0.004941225051879883, 0.005555629730224609, 0.006170034408569336, 0.0067844390869140625, 0.007398843765258789, 0.008013248443603516, 0.008627653121948242, 0.009242057800292969, 0.009856462478637695, 0.010470867156982422, 0.011085271835327148, 0.011699676513671875, 0.012314081192016602, 0.012928485870361328, 0.013542890548706055, 0.014157295227050781, 0.014771699905395508, 0.015386104583740234, 0.01600050926208496, 0.016614913940429688, 0.017229318618774414, 0.01784372329711914, 0.018458127975463867, 0.019072532653808594, 0.01968693733215332, 0.020301342010498047, 0.020915746688842773, 0.0215301513671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 11.0, 17.0, 20.0, 27.0, 36.0, 77.0, 96.0, 152.0, 324.0, 490.0, 863.0, 1658.0, 3172.0, 6699.0, 15956.0, 48091.0, 250540.0, 619127.0, 64962.0, 20167.0, 7999.0, 3621.0, 1904.0, 1026.0, 566.0, 394.0, 191.0, 120.0, 79.0, 53.0, 34.0, 23.0, 15.0, 11.0, 9.0, 5.0, 7.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013227462768554688, -0.0012839734554290771, -0.0012452006340026855, -0.001206427812576294, -0.0011676549911499023, -0.0011288821697235107, -0.0010901093482971191, -0.0010513365268707275, -0.001012563705444336, -0.0009737908840179443, -0.0009350180625915527, -0.0008962452411651611, -0.0008574724197387695, -0.0008186995983123779, -0.0007799267768859863, -0.0007411539554595947, -0.0007023811340332031, -0.0006636083126068115, -0.0006248354911804199, -0.0005860626697540283, -0.0005472898483276367, -0.0005085170269012451, -0.0004697442054748535, -0.0004309713840484619, -0.0003921985626220703, -0.0003534257411956787, -0.0003146529197692871, -0.0002758800983428955, -0.0002371072769165039, -0.0001983344554901123, -0.0001595616340637207, -0.0001207888126373291, -8.20159912109375e-05, -4.32431697845459e-05, -4.470348358154297e-06, 3.4302473068237305e-05, 7.30752944946289e-05, 0.00011184811592102051, 0.0001506209373474121, 0.0001893937587738037, 0.0002281665802001953, 0.0002669394016265869, 0.0003057122230529785, 0.0003444850444793701, 0.0003832578659057617, 0.0004220306873321533, 0.0004608035087585449, 0.0004995763301849365, 0.0005383491516113281, 0.0005771219730377197, 0.0006158947944641113, 0.0006546676158905029, 0.0006934404373168945, 0.0007322132587432861, 0.0007709860801696777, 0.0008097589015960693, 0.0008485317230224609, 0.0008873045444488525, 0.0009260773658752441, 0.0009648501873016357, 0.0010036230087280273, 0.001042395830154419, 0.0010811686515808105, 0.0011199414730072021, 0.0011587142944335938]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 5.0, 5.0, 10.0, 14.0, 15.0, 19.0, 15.0, 21.0, 41.0, 34.0, 57.0, 83.0, 146.0, 127.0, 120.0, 70.0, 44.0, 33.0, 34.0, 25.0, 22.0, 16.0, 6.0, 13.0, 5.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7583370208740234e-05, -1.6963109374046326e-05, -1.6342848539352417e-05, -1.5722587704658508e-05, -1.51023268699646e-05, -1.4482066035270691e-05, -1.3861805200576782e-05, -1.3241544365882874e-05, -1.2621283531188965e-05, -1.2001022696495056e-05, -1.1380761861801147e-05, -1.0760501027107239e-05, -1.014024019241333e-05, -9.519979357719421e-06, -8.899718523025513e-06, -8.279457688331604e-06, -7.659196853637695e-06, -7.038936018943787e-06, -6.418675184249878e-06, -5.798414349555969e-06, -5.1781535148620605e-06, -4.557892680168152e-06, -3.937631845474243e-06, -3.3173710107803345e-06, -2.6971101760864258e-06, -2.076849341392517e-06, -1.4565885066986084e-06, -8.363276720046997e-07, -2.1606683731079102e-07, 4.041939973831177e-07, 1.0244548320770264e-06, 1.644715666770935e-06, 2.2649765014648438e-06, 2.8852373361587524e-06, 3.505498170852661e-06, 4.12575900554657e-06, 4.7460198402404785e-06, 5.366280674934387e-06, 5.986541509628296e-06, 6.606802344322205e-06, 7.227063179016113e-06, 7.847324013710022e-06, 8.46758484840393e-06, 9.08784568309784e-06, 9.708106517791748e-06, 1.0328367352485657e-05, 1.0948628187179565e-05, 1.1568889021873474e-05, 1.2189149856567383e-05, 1.2809410691261292e-05, 1.34296715259552e-05, 1.4049932360649109e-05, 1.4670193195343018e-05, 1.5290454030036926e-05, 1.5910714864730835e-05, 1.6530975699424744e-05, 1.7151236534118652e-05, 1.777149736881256e-05, 1.839175820350647e-05, 1.901201903820038e-05, 1.9632279872894287e-05, 2.0252540707588196e-05, 2.0872801542282104e-05, 2.1493062376976013e-05, 2.2113323211669922e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 7.0, 11.0, 13.0, 22.0, 21.0, 31.0, 47.0, 59.0, 85.0, 116.0, 161.0, 206.0, 260.0, 362.0, 542.0, 835.0, 1085.0, 1715.0, 2925.0, 4833.0, 8534.0, 16129.0, 37564.0, 114727.0, 642011.0, 134266.0, 41517.0, 17741.0, 9028.0, 4789.0, 3039.0, 1862.0, 1199.0, 847.0, 537.0, 395.0, 233.0, 185.0, 166.0, 121.0, 69.0, 57.0, 45.0, 33.0, 29.0, 26.0, 21.0, 13.0, 8.0, 11.0, 4.0, 5.0, 4.0, 2.0], "bins": [-0.0009531974792480469, -0.0009256079792976379, -0.000898018479347229, -0.0008704289793968201, -0.0008428394794464111, -0.0008152499794960022, -0.0007876604795455933, -0.0007600709795951843, -0.0007324814796447754, -0.0007048919796943665, -0.0006773024797439575, -0.0006497129797935486, -0.0006221234798431396, -0.0005945339798927307, -0.0005669444799423218, -0.0005393549799919128, -0.0005117654800415039, -0.00048417598009109497, -0.00045658648014068604, -0.0004289969801902771, -0.00040140748023986816, -0.00037381798028945923, -0.0003462284803390503, -0.00031863898038864136, -0.0002910494804382324, -0.0002634599804878235, -0.00023587048053741455, -0.00020828098058700562, -0.00018069148063659668, -0.00015310198068618774, -0.0001255124807357788, -9.792298078536987e-05, -7.033348083496094e-05, -4.2743980884552e-05, -1.5154480934143066e-05, 1.2435019016265869e-05, 4.0024518966674805e-05, 6.761401891708374e-05, 9.520351886749268e-05, 0.0001227930188179016, 0.00015038251876831055, 0.00017797201871871948, 0.00020556151866912842, 0.00023315101861953735, 0.0002607405185699463, 0.0002883300185203552, 0.00031591951847076416, 0.0003435090184211731, 0.00037109851837158203, 0.00039868801832199097, 0.0004262775182723999, 0.00045386701822280884, 0.0004814565181732178, 0.0005090460181236267, 0.0005366355180740356, 0.0005642250180244446, 0.0005918145179748535, 0.0006194040179252625, 0.0006469935178756714, 0.0006745830178260803, 0.0007021725177764893, 0.0007297620177268982, 0.0007573515176773071, 0.0007849410176277161, 0.000812530517578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 4.0, 4.0, 7.0, 8.0, 7.0, 6.0, 13.0, 18.0, 21.0, 31.0, 34.0, 45.0, 53.0, 55.0, 63.0, 81.0, 82.0, 78.0, 68.0, 68.0, 41.0, 36.0, 39.0, 19.0, 25.0, 15.0, 18.0, 7.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0], "bins": [-0.0009312629699707031, -0.000904373824596405, -0.0008774846792221069, -0.0008505955338478088, -0.0008237063884735107, -0.0007968172430992126, -0.0007699280977249146, -0.0007430389523506165, -0.0007161498069763184, -0.0006892606616020203, -0.0006623715162277222, -0.0006354823708534241, -0.000608593225479126, -0.0005817040801048279, -0.0005548149347305298, -0.0005279257893562317, -0.0005010366439819336, -0.0004741474986076355, -0.0004472583532333374, -0.0004203692078590393, -0.0003934800624847412, -0.0003665909171104431, -0.000339701771736145, -0.0003128126263618469, -0.00028592348098754883, -0.00025903433561325073, -0.00023214519023895264, -0.00020525604486465454, -0.00017836689949035645, -0.00015147775411605835, -0.00012458860874176025, -9.769946336746216e-05, -7.081031799316406e-05, -4.392117261886597e-05, -1.703202724456787e-05, 9.857118129730225e-06, 3.674626350402832e-05, 6.363540887832642e-05, 9.052455425262451e-05, 0.00011741369962692261, 0.0001443028450012207, 0.0001711919903755188, 0.0001980811357498169, 0.000224970281124115, 0.0002518594264984131, 0.0002787485718727112, 0.0003056377172470093, 0.0003325268626213074, 0.00035941600799560547, 0.00038630515336990356, 0.00041319429874420166, 0.00044008344411849976, 0.00046697258949279785, 0.000493861734867096, 0.000520750880241394, 0.0005476400256156921, 0.0005745291709899902, 0.0006014183163642883, 0.0006283074617385864, 0.0006551966071128845, 0.0006820857524871826, 0.0007089748978614807, 0.0007358640432357788, 0.0007627531886100769, 0.000789642333984375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 3.0, 4.0, 7.0, 12.0, 1.0, 16.0, 20.0, 21.0, 19.0, 23.0, 23.0, 43.0, 48.0, 71.0, 177.0, 236.0, 79.0, 55.0, 36.0, 23.0, 17.0, 9.0, 11.0, 7.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1368698924779892, -0.1337774097919464, -0.13068494200706482, -0.12759245932102203, -0.12449998408555984, -0.12140750885009766, -0.11831503361463547, -0.11522255837917328, -0.1121300756931305, -0.1090376004576683, -0.10594512522220612, -0.10285264253616333, -0.09976016730070114, -0.09666769206523895, -0.09357521682977676, -0.09048274159431458, -0.08739026635885239, -0.0842977911233902, -0.08120531588792801, -0.07811284065246582, -0.07502035796642303, -0.07192788273096085, -0.06883540749549866, -0.06574293226003647, -0.06265045702457428, -0.05955798178911209, -0.056465502828359604, -0.053373027592897415, -0.05028054863214493, -0.04718807339668274, -0.04409559816122055, -0.04100312292575836, -0.03791063651442528, -0.03481816127896309, -0.0317256823182106, -0.028633207082748413, -0.025540729984641075, -0.022448252886533737, -0.01935577765107155, -0.01626330055296421, -0.013170823454856873, -0.010078346356749535, -0.006985870189964771, -0.003893394023180008, -0.00080091692507267, 0.002291560173034668, 0.005384035408496857, 0.008476512506604195, 0.011568989604711533, 0.01466146670281887, 0.01775394380092621, 0.020846419036388397, 0.023938896134495735, 0.027031373232603073, 0.030123848468065262, 0.03321632742881775, 0.03630880266427994, 0.039401277899742126, 0.042493756860494614, 0.0455862320959568, 0.04867871105670929, 0.05177118629217148, 0.05486366152763367, 0.057956136763095856, 0.06104861572384834]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 7.0, 3.0, 8.0, 7.0, 9.0, 15.0, 17.0, 14.0, 17.0, 15.0, 24.0, 28.0, 37.0, 39.0, 63.0, 52.0, 79.0, 90.0, 98.0, 57.0, 46.0, 36.0, 29.0, 29.0, 33.0, 28.0, 25.0, 27.0, 17.0, 14.0, 7.0, 8.0, 5.0, 8.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06350511312484741, -0.06090283393859863, -0.058300554752349854, -0.05569827929139137, -0.05309600010514259, -0.050493720918893814, -0.04789144545793533, -0.045289166271686554, -0.042686887085437775, -0.040084607899188995, -0.037482328712940216, -0.034880053251981735, -0.032277774065732956, -0.029675494879484177, -0.027073217555880547, -0.024470940232276917, -0.021868661046028137, -0.019266381859779358, -0.016664104536175728, -0.014061826281249523, -0.011459548026323318, -0.008857269771397114, -0.006254991516470909, -0.003652714192867279, -0.0010504350066184998, 0.001551843248307705, 0.00415412150323391, 0.006756399758160114, 0.009358678013086319, 0.011960956268012524, 0.014563234522938728, 0.01716551184654236, 0.019767791032791138, 0.022370070219039917, 0.024972347542643547, 0.027574624866247177, 0.030176904052495956, 0.032779183238744736, 0.03538145869970322, 0.037983737885951996, 0.040586017072200775, 0.043188296258449554, 0.045790575444698334, 0.048392850905656815, 0.050995130091905594, 0.05359740927815437, 0.056199684739112854, 0.05880196392536163, 0.06140424311161041, 0.06400652229785919, 0.06660880148410797, 0.06921108067035675, 0.07181335985660553, 0.07441563159227371, 0.07701791077852249, 0.07962018996477127, 0.08222246915102005, 0.08482474833726883, 0.08742702752351761, 0.09002930670976639, 0.09263157844543457, 0.09523385763168335, 0.09783613681793213, 0.10043841600418091, 0.10304069519042969]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 12.0, 10.0, 11.0, 18.0, 17.0, 27.0, 58.0, 73.0, 109.0, 198.0, 357.0, 609.0, 1467.0, 5523.0, 52320.0, 4075666.0, 49762.0, 5284.0, 1410.0, 563.0, 283.0, 194.0, 118.0, 88.0, 45.0, 13.0, 11.0, 4.0, 10.0, 7.0, 4.0, 5.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0], "bins": [-0.10009765625, -0.09768486022949219, -0.09527206420898438, -0.09285926818847656, -0.09044647216796875, -0.08803367614746094, -0.08562088012695312, -0.08320808410644531, -0.0807952880859375, -0.07838249206542969, -0.07596969604492188, -0.07355690002441406, -0.07114410400390625, -0.06873130798339844, -0.06631851196289062, -0.06390571594238281, -0.061492919921875, -0.05908012390136719, -0.056667327880859375, -0.05425453186035156, -0.05184173583984375, -0.04942893981933594, -0.047016143798828125, -0.04460334777832031, -0.0421905517578125, -0.03977775573730469, -0.037364959716796875, -0.03495216369628906, -0.03253936767578125, -0.030126571655273438, -0.027713775634765625, -0.025300979614257812, -0.02288818359375, -0.020475387573242188, -0.018062591552734375, -0.015649795532226562, -0.01323699951171875, -0.010824203491210938, -0.008411407470703125, -0.0059986114501953125, -0.0035858154296875, -0.0011730194091796875, 0.001239776611328125, 0.0036525726318359375, 0.00606536865234375, 0.008478164672851562, 0.010890960693359375, 0.013303756713867188, 0.015716552734375, 0.018129348754882812, 0.020542144775390625, 0.022954940795898438, 0.02536773681640625, 0.027780532836914062, 0.030193328857421875, 0.03260612487792969, 0.0350189208984375, 0.03743171691894531, 0.039844512939453125, 0.04225730895996094, 0.04467010498046875, 0.04708290100097656, 0.049495697021484375, 0.05190849304199219, 0.0543212890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 11.0, 9.0, 14.0, 24.0, 43.0, 43.0, 62.0, 89.0, 85.0, 98.0, 92.0, 89.0, 85.0, 80.0, 50.0, 34.0, 32.0, 19.0, 17.0, 15.0, 5.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00975799560546875, -0.009521186351776123, -0.009284377098083496, -0.00904756784439087, -0.008810758590698242, -0.008573949337005615, -0.008337140083312988, -0.008100330829620361, -0.007863521575927734, -0.007626712322235107, -0.0073899030685424805, -0.0071530938148498535, -0.0069162845611572266, -0.0066794753074646, -0.006442666053771973, -0.006205856800079346, -0.005969047546386719, -0.005732238292694092, -0.005495429039001465, -0.005258619785308838, -0.005021810531616211, -0.004785001277923584, -0.004548192024230957, -0.00431138277053833, -0.004074573516845703, -0.003837764263153076, -0.0036009550094604492, -0.0033641457557678223, -0.0031273365020751953, -0.0028905272483825684, -0.0026537179946899414, -0.0024169087409973145, -0.0021800994873046875, -0.0019432902336120605, -0.0017064809799194336, -0.0014696717262268066, -0.0012328624725341797, -0.0009960532188415527, -0.0007592439651489258, -0.0005224347114562988, -0.0002856254577636719, -4.881620407104492e-05, 0.00018799304962158203, 0.000424802303314209, 0.0006616115570068359, 0.0008984208106994629, 0.0011352300643920898, 0.0013720393180847168, 0.0016088485717773438, 0.0018456578254699707, 0.0020824670791625977, 0.0023192763328552246, 0.0025560855865478516, 0.0027928948402404785, 0.0030297040939331055, 0.0032665133476257324, 0.0035033226013183594, 0.0037401318550109863, 0.003976941108703613, 0.00421375036239624, 0.004450559616088867, 0.004687368869781494, 0.004924178123474121, 0.005160987377166748, 0.005397796630859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 13.0, 14.0, 29.0, 50.0, 79.0, 101.0, 150.0, 240.0, 470.0, 927.0, 2627.0, 10008.0, 59898.0, 3487424.0, 585848.0, 35985.0, 6716.0, 1866.0, 720.0, 422.0, 234.0, 150.0, 99.0, 59.0, 49.0, 24.0, 29.0, 18.0, 14.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0], "bins": [-0.04779052734375, -0.046675920486450195, -0.04556131362915039, -0.044446706771850586, -0.04333209991455078, -0.04221749305725098, -0.04110288619995117, -0.03998827934265137, -0.03887367248535156, -0.03775906562805176, -0.03664445877075195, -0.03552985191345215, -0.034415245056152344, -0.03330063819885254, -0.032186031341552734, -0.03107142448425293, -0.029956817626953125, -0.02884221076965332, -0.027727603912353516, -0.02661299705505371, -0.025498390197753906, -0.0243837833404541, -0.023269176483154297, -0.022154569625854492, -0.021039962768554688, -0.019925355911254883, -0.018810749053955078, -0.017696142196655273, -0.01658153533935547, -0.015466928482055664, -0.01435232162475586, -0.013237714767456055, -0.01212310791015625, -0.011008501052856445, -0.00989389419555664, -0.008779287338256836, -0.007664680480957031, -0.0065500736236572266, -0.005435466766357422, -0.004320859909057617, -0.0032062530517578125, -0.002091646194458008, -0.0009770393371582031, 0.00013756752014160156, 0.0012521743774414062, 0.002366781234741211, 0.0034813880920410156, 0.00459599494934082, 0.005710601806640625, 0.00682520866394043, 0.007939815521240234, 0.009054422378540039, 0.010169029235839844, 0.011283636093139648, 0.012398242950439453, 0.013512849807739258, 0.014627456665039062, 0.015742063522338867, 0.016856670379638672, 0.017971277236938477, 0.01908588409423828, 0.020200490951538086, 0.02131509780883789, 0.022429704666137695, 0.0235443115234375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 4.0, 7.0, 11.0, 6.0, 19.0, 22.0, 42.0, 46.0, 60.0, 119.0, 149.0, 288.0, 1108.0, 1519.0, 279.0, 139.0, 88.0, 53.0, 41.0, 20.0, 18.0, 19.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.019744873046875, -0.018808364868164062, -0.017871856689453125, -0.016935348510742188, -0.01599884033203125, -0.015062332153320312, -0.014125823974609375, -0.013189315795898438, -0.0122528076171875, -0.011316299438476562, -0.010379791259765625, -0.009443283081054688, -0.00850677490234375, -0.0075702667236328125, -0.006633758544921875, -0.0056972503662109375, -0.0047607421875, -0.0038242340087890625, -0.002887725830078125, -0.0019512176513671875, -0.00101470947265625, -7.82012939453125e-05, 0.000858306884765625, 0.0017948150634765625, 0.0027313232421875, 0.0036678314208984375, 0.004604339599609375, 0.0055408477783203125, 0.00647735595703125, 0.0074138641357421875, 0.008350372314453125, 0.009286880493164062, 0.010223388671875, 0.011159896850585938, 0.012096405029296875, 0.013032913208007812, 0.01396942138671875, 0.014905929565429688, 0.015842437744140625, 0.016778945922851562, 0.0177154541015625, 0.018651962280273438, 0.019588470458984375, 0.020524978637695312, 0.02146148681640625, 0.022397994995117188, 0.023334503173828125, 0.024271011352539062, 0.02520751953125, 0.026144027709960938, 0.027080535888671875, 0.028017044067382812, 0.02895355224609375, 0.029890060424804688, 0.030826568603515625, 0.03176307678222656, 0.0326995849609375, 0.03363609313964844, 0.034572601318359375, 0.03550910949707031, 0.03644561767578125, 0.03738212585449219, 0.038318634033203125, 0.03925514221191406, 0.040191650390625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 8.0, 8.0, 13.0, 18.0, 14.0, 25.0, 45.0, 88.0, 150.0, 225.0, 150.0, 92.0, 50.0, 36.0, 24.0, 17.0, 10.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2947234511375427, -0.2876898944377899, -0.2806563377380371, -0.2736227810382843, -0.2665892541408539, -0.2595556974411011, -0.25252214074134827, -0.24548858404159546, -0.23845502734184265, -0.23142147064208984, -0.22438792884349823, -0.21735437214374542, -0.21032081544399261, -0.203287273645401, -0.1962537169456482, -0.18922016024589539, -0.18218660354614258, -0.17515304684638977, -0.16811950504779816, -0.16108594834804535, -0.15405239164829254, -0.14701884984970093, -0.13998529314994812, -0.1329517364501953, -0.1259181946516037, -0.11888464540243149, -0.11185108870267868, -0.10481753945350647, -0.09778398275375366, -0.09075043350458145, -0.08371688425540924, -0.07668332755565643, -0.06964977085590363, -0.06261622160673141, -0.05558266490697861, -0.048549115657806396, -0.04151555895805359, -0.03448200970888138, -0.02744845673441887, -0.02041490375995636, -0.01338135078549385, -0.006347798276692629, 0.000685754232108593, 0.0077193062752485275, 0.014752859249711037, 0.021786410361528397, 0.028819963335990906, 0.035853516310453415, 0.042887069284915924, 0.04992062225937843, 0.05695417523384094, 0.06398772448301315, 0.07102128118276596, 0.07805483043193817, 0.08508838713169098, 0.09212193638086319, 0.0991554856300354, 0.10618903487920761, 0.11322259157896042, 0.12025614082813263, 0.12728969752788544, 0.13432323932647705, 0.14135679602622986, 0.14839035272598267, 0.15542390942573547]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 7.0, 8.0, 10.0, 15.0, 28.0, 28.0, 33.0, 45.0, 43.0, 43.0, 48.0, 52.0, 57.0, 72.0, 55.0, 72.0, 62.0, 68.0, 57.0, 47.0, 37.0, 31.0, 22.0, 16.0, 14.0, 14.0, 10.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12745237350463867, -0.12164591997861862, -0.11583946645259857, -0.11003301292657852, -0.10422655940055847, -0.09842010587453842, -0.09261365234851837, -0.08680719882249832, -0.08100074529647827, -0.07519429177045822, -0.06938783824443817, -0.06358138471841812, -0.05777493119239807, -0.05196847766637802, -0.04616202414035797, -0.04035557061433792, -0.03454911708831787, -0.02874266356229782, -0.02293621003627777, -0.01712975651025772, -0.011323302984237671, -0.005516849458217621, 0.0002896040678024292, 0.006096057593822479, 0.01190251111984253, 0.01770896464586258, 0.02351541817188263, 0.02932187169790268, 0.03512832522392273, 0.04093477874994278, 0.04674123227596283, 0.05254768580198288, 0.05835413932800293, 0.06416059285402298, 0.06996704638004303, 0.07577349990606308, 0.08157995343208313, 0.08738640695810318, 0.09319286048412323, 0.09899931401014328, 0.10480576753616333, 0.11061222106218338, 0.11641867458820343, 0.12222512811422348, 0.12803158164024353, 0.13383802771568298, 0.13964448869228363, 0.14545094966888428, 0.15125739574432373, 0.15706384181976318, 0.16287030279636383, 0.16867676377296448, 0.17448320984840393, 0.18028965592384338, 0.18609611690044403, 0.19190257787704468, 0.19770902395248413, 0.20351547002792358, 0.20932193100452423, 0.21512839198112488, 0.22093483805656433, 0.22674128413200378, 0.23254774510860443, 0.23835420608520508, 0.24416065216064453]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 2.0, 1.0, 13.0, 20.0, 26.0, 19.0, 31.0, 58.0, 95.0, 193.0, 393.0, 591.0, 1080.0, 2171.0, 4353.0, 9138.0, 22222.0, 60503.0, 230221.0, 542679.0, 111568.0, 36184.0, 14255.0, 6350.0, 2955.0, 1526.0, 826.0, 413.0, 220.0, 168.0, 110.0, 62.0, 38.0, 19.0, 12.0, 9.0, 5.0, 10.0, 5.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0213470458984375, -0.02059149742126465, -0.019835948944091797, -0.019080400466918945, -0.018324851989746094, -0.017569303512573242, -0.01681375503540039, -0.01605820655822754, -0.015302658081054688, -0.014547109603881836, -0.013791561126708984, -0.013036012649536133, -0.012280464172363281, -0.01152491569519043, -0.010769367218017578, -0.010013818740844727, -0.009258270263671875, -0.008502721786499023, -0.007747173309326172, -0.00699162483215332, -0.006236076354980469, -0.005480527877807617, -0.004724979400634766, -0.003969430923461914, -0.0032138824462890625, -0.002458333969116211, -0.0017027854919433594, -0.0009472370147705078, -0.00019168853759765625, 0.0005638599395751953, 0.0013194084167480469, 0.0020749568939208984, 0.00283050537109375, 0.0035860538482666016, 0.004341602325439453, 0.005097150802612305, 0.005852699279785156, 0.006608247756958008, 0.007363796234130859, 0.008119344711303711, 0.008874893188476562, 0.009630441665649414, 0.010385990142822266, 0.011141538619995117, 0.011897087097167969, 0.01265263557434082, 0.013408184051513672, 0.014163732528686523, 0.014919281005859375, 0.015674829483032227, 0.016430377960205078, 0.01718592643737793, 0.01794147491455078, 0.018697023391723633, 0.019452571868896484, 0.020208120346069336, 0.020963668823242188, 0.02171921730041504, 0.02247476577758789, 0.023230314254760742, 0.023985862731933594, 0.024741411209106445, 0.025496959686279297, 0.02625250816345215, 0.027008056640625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 14.0, 10.0, 14.0, 17.0, 25.0, 36.0, 31.0, 42.0, 55.0, 66.0, 61.0, 58.0, 88.0, 86.0, 66.0, 71.0, 54.0, 43.0, 37.0, 30.0, 19.0, 19.0, 13.0, 7.0, 10.0, 7.0, 4.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01108551025390625, -0.010790646076202393, -0.010495781898498535, -0.010200917720794678, -0.00990605354309082, -0.009611189365386963, -0.009316325187683105, -0.009021461009979248, -0.00872659683227539, -0.008431732654571533, -0.008136868476867676, -0.007842004299163818, -0.007547140121459961, -0.0072522759437561035, -0.006957411766052246, -0.006662547588348389, -0.006367683410644531, -0.006072819232940674, -0.005777955055236816, -0.005483090877532959, -0.0051882266998291016, -0.004893362522125244, -0.004598498344421387, -0.004303634166717529, -0.004008769989013672, -0.0037139058113098145, -0.003419041633605957, -0.0031241774559020996, -0.002829313278198242, -0.0025344491004943848, -0.0022395849227905273, -0.00194472074508667, -0.0016498565673828125, -0.001354992389678955, -0.0010601282119750977, -0.0007652640342712402, -0.0004703998565673828, -0.0001755356788635254, 0.00011932849884033203, 0.00041419267654418945, 0.0007090568542480469, 0.0010039210319519043, 0.0012987852096557617, 0.0015936493873596191, 0.0018885135650634766, 0.002183377742767334, 0.0024782419204711914, 0.002773106098175049, 0.0030679702758789062, 0.0033628344535827637, 0.003657698631286621, 0.0039525628089904785, 0.004247426986694336, 0.004542291164398193, 0.004837155342102051, 0.005132019519805908, 0.005426883697509766, 0.005721747875213623, 0.0060166120529174805, 0.006311476230621338, 0.006606340408325195, 0.006901204586029053, 0.00719606876373291, 0.007490932941436768, 0.007785797119140625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 15.0, 17.0, 31.0, 43.0, 47.0, 100.0, 132.0, 229.0, 313.0, 472.0, 877.0, 1559.0, 2823.0, 5536.0, 11562.0, 25252.0, 66575.0, 274916.0, 526088.0, 77063.0, 28633.0, 12629.0, 6333.0, 3145.0, 1635.0, 983.0, 553.0, 345.0, 210.0, 131.0, 87.0, 66.0, 46.0, 30.0, 22.0, 16.0, 13.0, 6.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0], "bins": [-0.022705078125, -0.02210867404937744, -0.021512269973754883, -0.020915865898132324, -0.020319461822509766, -0.019723057746887207, -0.01912665367126465, -0.01853024959564209, -0.01793384552001953, -0.017337441444396973, -0.016741037368774414, -0.016144633293151855, -0.015548229217529297, -0.014951825141906738, -0.01435542106628418, -0.013759016990661621, -0.013162612915039062, -0.012566208839416504, -0.011969804763793945, -0.011373400688171387, -0.010776996612548828, -0.01018059253692627, -0.009584188461303711, -0.008987784385681152, -0.008391380310058594, -0.007794976234436035, -0.0071985721588134766, -0.006602168083190918, -0.006005764007568359, -0.005409359931945801, -0.004812955856323242, -0.004216551780700684, -0.003620147705078125, -0.0030237436294555664, -0.002427339553833008, -0.0018309354782104492, -0.0012345314025878906, -0.000638127326965332, -4.172325134277344e-05, 0.0005546808242797852, 0.0011510848999023438, 0.0017474889755249023, 0.002343893051147461, 0.0029402971267700195, 0.003536701202392578, 0.004133105278015137, 0.004729509353637695, 0.005325913429260254, 0.0059223175048828125, 0.006518721580505371, 0.00711512565612793, 0.007711529731750488, 0.008307933807373047, 0.008904337882995605, 0.009500741958618164, 0.010097146034240723, 0.010693550109863281, 0.01128995418548584, 0.011886358261108398, 0.012482762336730957, 0.013079166412353516, 0.013675570487976074, 0.014271974563598633, 0.014868378639221191, 0.01546478271484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 14.0, 13.0, 8.0, 12.0, 8.0, 15.0, 21.0, 28.0, 19.0, 36.0, 28.0, 52.0, 42.0, 59.0, 56.0, 68.0, 37.0, 55.0, 42.0, 35.0, 35.0, 55.0, 45.0, 35.0, 27.0, 28.0, 20.0, 13.0, 22.0, 12.0, 6.0, 7.0, 11.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.0335693359375, -0.03267979621887207, -0.03179025650024414, -0.03090071678161621, -0.03001117706298828, -0.02912163734436035, -0.028232097625732422, -0.027342557907104492, -0.026453018188476562, -0.025563478469848633, -0.024673938751220703, -0.023784399032592773, -0.022894859313964844, -0.022005319595336914, -0.021115779876708984, -0.020226240158081055, -0.019336700439453125, -0.018447160720825195, -0.017557621002197266, -0.016668081283569336, -0.015778541564941406, -0.014889001846313477, -0.013999462127685547, -0.013109922409057617, -0.012220382690429688, -0.011330842971801758, -0.010441303253173828, -0.009551763534545898, -0.008662223815917969, -0.007772684097290039, -0.006883144378662109, -0.00599360466003418, -0.00510406494140625, -0.00421452522277832, -0.0033249855041503906, -0.002435445785522461, -0.0015459060668945312, -0.0006563663482666016, 0.00023317337036132812, 0.0011227130889892578, 0.0020122528076171875, 0.002901792526245117, 0.003791332244873047, 0.0046808719635009766, 0.005570411682128906, 0.006459951400756836, 0.007349491119384766, 0.008239030838012695, 0.009128570556640625, 0.010018110275268555, 0.010907649993896484, 0.011797189712524414, 0.012686729431152344, 0.013576269149780273, 0.014465808868408203, 0.015355348587036133, 0.016244888305664062, 0.017134428024291992, 0.018023967742919922, 0.01891350746154785, 0.01980304718017578, 0.02069258689880371, 0.02158212661743164, 0.02247166633605957, 0.0233612060546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 8.0, 15.0, 14.0, 22.0, 47.0, 57.0, 101.0, 143.0, 234.0, 389.0, 687.0, 1304.0, 2465.0, 5213.0, 12442.0, 38914.0, 301589.0, 616301.0, 43550.0, 13733.0, 5468.0, 2597.0, 1397.0, 731.0, 405.0, 282.0, 148.0, 92.0, 72.0, 53.0, 21.0, 18.0, 11.0, 10.0, 4.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.006641387939453125, -0.00646209716796875, -0.006282806396484375, -0.006103515625, -0.005924224853515625, -0.00574493408203125, -0.005565643310546875, -0.0053863525390625, -0.005207061767578125, -0.00502777099609375, -0.004848480224609375, -0.004669189453125, -0.004489898681640625, -0.00431060791015625, -0.004131317138671875, -0.0039520263671875, -0.003772735595703125, -0.00359344482421875, -0.003414154052734375, -0.00323486328125, -0.003055572509765625, -0.00287628173828125, -0.002696990966796875, -0.0025177001953125, -0.002338409423828125, -0.00215911865234375, -0.001979827880859375, -0.001800537109375, -0.001621246337890625, -0.00144195556640625, -0.001262664794921875, -0.0010833740234375, -0.000904083251953125, -0.00072479248046875, -0.000545501708984375, -0.0003662109375, -0.000186920166015625, -7.62939453125e-06, 0.000171661376953125, 0.0003509521484375, 0.000530242919921875, 0.00070953369140625, 0.000888824462890625, 0.001068115234375, 0.001247406005859375, 0.00142669677734375, 0.001605987548828125, 0.0017852783203125, 0.001964569091796875, 0.00214385986328125, 0.002323150634765625, 0.00250244140625, 0.002681732177734375, 0.00286102294921875, 0.003040313720703125, 0.0032196044921875, 0.003398895263671875, 0.00357818603515625, 0.003757476806640625, 0.003936767578125, 0.004116058349609375, 0.00429534912109375, 0.004474639892578125, 0.0046539306640625, 0.004833221435546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 11.0, 13.0, 16.0, 15.0, 36.0, 33.0, 59.0, 72.0, 98.0, 100.0, 115.0, 88.0, 87.0, 77.0, 61.0, 45.0, 23.0, 20.0, 20.0, 7.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.927417755126953e-06, -7.65826553106308e-06, -7.3891133069992065e-06, -7.119961082935333e-06, -6.85080885887146e-06, -6.581656634807587e-06, -6.312504410743713e-06, -6.04335218667984e-06, -5.774199962615967e-06, -5.5050477385520935e-06, -5.23589551448822e-06, -4.966743290424347e-06, -4.697591066360474e-06, -4.4284388422966e-06, -4.159286618232727e-06, -3.890134394168854e-06, -3.6209821701049805e-06, -3.351829946041107e-06, -3.082677721977234e-06, -2.8135254979133606e-06, -2.5443732738494873e-06, -2.275221049785614e-06, -2.0060688257217407e-06, -1.7369166016578674e-06, -1.4677643775939941e-06, -1.1986121535301208e-06, -9.294599294662476e-07, -6.603077054023743e-07, -3.91155481338501e-07, -1.2200325727462769e-07, 1.471489667892456e-07, 4.163011908531189e-07, 6.854534149169922e-07, 9.546056389808655e-07, 1.2237578630447388e-06, 1.492910087108612e-06, 1.7620623111724854e-06, 2.0312145352363586e-06, 2.300366759300232e-06, 2.5695189833641052e-06, 2.8386712074279785e-06, 3.107823431491852e-06, 3.376975655555725e-06, 3.6461278796195984e-06, 3.915280103683472e-06, 4.184432327747345e-06, 4.453584551811218e-06, 4.7227367758750916e-06, 4.991888999938965e-06, 5.261041224002838e-06, 5.5301934480667114e-06, 5.799345672130585e-06, 6.068497896194458e-06, 6.337650120258331e-06, 6.606802344322205e-06, 6.875954568386078e-06, 7.145106792449951e-06, 7.4142590165138245e-06, 7.683411240577698e-06, 7.952563464641571e-06, 8.221715688705444e-06, 8.490867912769318e-06, 8.760020136833191e-06, 9.029172360897064e-06, 9.298324584960938e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 2.0, 8.0, 21.0, 17.0, 25.0, 31.0, 36.0, 82.0, 97.0, 133.0, 222.0, 411.0, 589.0, 1026.0, 1686.0, 3006.0, 5609.0, 11718.0, 27525.0, 83032.0, 693249.0, 149611.0, 38714.0, 15665.0, 7146.0, 3687.0, 1979.0, 1155.0, 693.0, 473.0, 273.0, 204.0, 138.0, 84.0, 67.0, 33.0, 28.0, 19.0, 17.0, 11.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00420379638671875, -0.004078984260559082, -0.003954172134399414, -0.003829360008239746, -0.003704547882080078, -0.00357973575592041, -0.003454923629760742, -0.0033301115036010742, -0.0032052993774414062, -0.0030804872512817383, -0.0029556751251220703, -0.0028308629989624023, -0.0027060508728027344, -0.0025812387466430664, -0.0024564266204833984, -0.0023316144943237305, -0.0022068023681640625, -0.0020819902420043945, -0.0019571781158447266, -0.0018323659896850586, -0.0017075538635253906, -0.0015827417373657227, -0.0014579296112060547, -0.0013331174850463867, -0.0012083053588867188, -0.0010834932327270508, -0.0009586811065673828, -0.0008338689804077148, -0.0007090568542480469, -0.0005842447280883789, -0.00045943260192871094, -0.00033462047576904297, -0.000209808349609375, -8.499622344970703e-05, 3.981590270996094e-05, 0.0001646280288696289, 0.0002894401550292969, 0.00041425228118896484, 0.0005390644073486328, 0.0006638765335083008, 0.0007886886596679688, 0.0009135007858276367, 0.0010383129119873047, 0.0011631250381469727, 0.0012879371643066406, 0.0014127492904663086, 0.0015375614166259766, 0.0016623735427856445, 0.0017871856689453125, 0.0019119977951049805, 0.0020368099212646484, 0.0021616220474243164, 0.0022864341735839844, 0.0024112462997436523, 0.0025360584259033203, 0.0026608705520629883, 0.0027856826782226562, 0.0029104948043823242, 0.003035306930541992, 0.00316011905670166, 0.003284931182861328, 0.003409743309020996, 0.003534555435180664, 0.003659367561340332, 0.0037841796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 6.0, 4.0, 6.0, 4.0, 16.0, 15.0, 18.0, 21.0, 29.0, 25.0, 38.0, 38.0, 61.0, 91.0, 117.0, 110.0, 73.0, 51.0, 50.0, 32.0, 34.0, 21.0, 21.0, 23.0, 15.0, 20.0, 9.0, 8.0, 8.0, 7.0, 5.0, 3.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.005954742431640625, -0.005779385566711426, -0.0056040287017822266, -0.005428671836853027, -0.005253314971923828, -0.005077958106994629, -0.00490260124206543, -0.0047272443771362305, -0.004551887512207031, -0.004376530647277832, -0.004201173782348633, -0.004025816917419434, -0.0038504600524902344, -0.003675103187561035, -0.003499746322631836, -0.0033243894577026367, -0.0031490325927734375, -0.0029736757278442383, -0.002798318862915039, -0.00262296199798584, -0.0024476051330566406, -0.0022722482681274414, -0.002096891403198242, -0.001921534538269043, -0.0017461776733398438, -0.0015708208084106445, -0.0013954639434814453, -0.001220107078552246, -0.0010447502136230469, -0.0008693933486938477, -0.0006940364837646484, -0.0005186796188354492, -0.00034332275390625, -0.00016796588897705078, 7.3909759521484375e-06, 0.00018274784088134766, 0.0003581047058105469, 0.0005334615707397461, 0.0007088184356689453, 0.0008841753005981445, 0.0010595321655273438, 0.001234889030456543, 0.0014102458953857422, 0.0015856027603149414, 0.0017609596252441406, 0.0019363164901733398, 0.002111673355102539, 0.0022870302200317383, 0.0024623870849609375, 0.0026377439498901367, 0.002813100814819336, 0.002988457679748535, 0.0031638145446777344, 0.0033391714096069336, 0.003514528274536133, 0.003689885139465332, 0.0038652420043945312, 0.0040405988693237305, 0.00421595573425293, 0.004391312599182129, 0.004566669464111328, 0.004742026329040527, 0.0049173831939697266, 0.005092740058898926, 0.005268096923828125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 11.0, 6.0, 14.0, 28.0, 52.0, 104.0, 289.0, 194.0, 97.0, 75.0, 40.0, 19.0, 23.0, 10.0, 10.0, 4.0, 9.0, 1.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2167155146598816, -0.21127481758594513, -0.20583412051200867, -0.200393408536911, -0.19495271146297455, -0.18951201438903809, -0.18407130241394043, -0.17863060534000397, -0.1731899082660675, -0.16774921119213104, -0.16230851411819458, -0.15686780214309692, -0.15142710506916046, -0.145986407995224, -0.14054569602012634, -0.13510499894618988, -0.12966430187225342, -0.12422360479831696, -0.1187829002737999, -0.11334219574928284, -0.10790149867534637, -0.10246080160140991, -0.09702009707689285, -0.0915793925523758, -0.08613869547843933, -0.08069799840450287, -0.07525729387998581, -0.06981658935546875, -0.06437589228153229, -0.05893519148230553, -0.053494490683078766, -0.048053789883852005, -0.04261307418346405, -0.03717237338423729, -0.03173167258501053, -0.026290971785783768, -0.020850270986557007, -0.015409570187330246, -0.009968869388103485, -0.004528168588876724, 0.0009125322103500366, 0.0063532330095767975, 0.011793933808803558, 0.01723463460803032, 0.02267533540725708, 0.02811603620648384, 0.0335567370057106, 0.03899743780493736, 0.044438138604164124, 0.049878839403390884, 0.055319540202617645, 0.060760241001844406, 0.06620094180107117, 0.07164163887500763, 0.07708234339952469, 0.08252304792404175, 0.08796374499797821, 0.09340444207191467, 0.09884514659643173, 0.10428585112094879, 0.10972654819488525, 0.11516724526882172, 0.12060794979333878, 0.12604865431785583, 0.1314893513917923]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 7.0, 7.0, 7.0, 9.0, 13.0, 12.0, 16.0, 15.0, 16.0, 31.0, 34.0, 34.0, 37.0, 53.0, 66.0, 96.0, 101.0, 82.0, 43.0, 40.0, 36.0, 33.0, 33.0, 24.0, 27.0, 24.0, 18.0, 20.0, 11.0, 8.0, 7.0, 4.0, 8.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.1530930995941162, -0.14896145462989807, -0.14482980966567993, -0.14069817960262299, -0.13656653463840485, -0.1324348896741867, -0.12830324470996857, -0.12417159974575043, -0.12003996223211288, -0.11590831726789474, -0.1117766797542572, -0.10764503479003906, -0.10351338982582092, -0.09938175231218338, -0.09525010734796524, -0.0911184698343277, -0.08698682487010956, -0.08285517990589142, -0.07872354239225388, -0.07459189742803574, -0.0704602599143982, -0.06632861495018005, -0.062196969985961914, -0.05806532874703407, -0.05393368750810623, -0.04980204626917839, -0.04567040503025055, -0.04153876006603241, -0.03740711882710457, -0.03327547758817673, -0.029143834486603737, -0.025012191385030746, -0.020880550146102905, -0.016748908907175064, -0.012617265805602074, -0.008485623635351658, -0.004353981465101242, -0.00022234022617340088, 0.0039093028753995895, 0.00804094597697258, 0.012172587215900421, 0.016304228454828262, 0.020435871556401253, 0.024567514657974243, 0.028699155896902084, 0.032830797135829926, 0.036962442100048065, 0.041094083338975906, 0.04522572457790375, 0.04935736581683159, 0.05348900705575943, 0.05762065201997757, 0.06175229325890541, 0.06588393449783325, 0.07001557946205139, 0.07414722442626953, 0.07827886193990707, 0.08241050690412521, 0.08654214441776276, 0.0906737893819809, 0.09480543434619904, 0.09893707185983658, 0.10306871682405472, 0.10720035433769226, 0.1113319993019104]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 12.0, 12.0, 10.0, 22.0, 18.0, 26.0, 35.0, 47.0, 57.0, 101.0, 139.0, 236.0, 351.0, 675.0, 1690.0, 15671.0, 949522.0, 3110162.0, 107553.0, 5195.0, 1356.0, 545.0, 290.0, 185.0, 124.0, 69.0, 46.0, 39.0, 22.0, 19.0, 14.0, 8.0, 9.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0165557861328125, -0.016133666038513184, -0.015711545944213867, -0.01528942584991455, -0.014867305755615234, -0.014445185661315918, -0.014023065567016602, -0.013600945472717285, -0.013178825378417969, -0.012756705284118652, -0.012334585189819336, -0.01191246509552002, -0.011490345001220703, -0.011068224906921387, -0.01064610481262207, -0.010223984718322754, -0.009801864624023438, -0.009379744529724121, -0.008957624435424805, -0.008535504341125488, -0.008113384246826172, -0.0076912641525268555, -0.007269144058227539, -0.006847023963928223, -0.006424903869628906, -0.00600278377532959, -0.0055806636810302734, -0.005158543586730957, -0.004736423492431641, -0.004314303398132324, -0.003892183303833008, -0.0034700632095336914, -0.003047943115234375, -0.0026258230209350586, -0.002203702926635742, -0.0017815828323364258, -0.0013594627380371094, -0.000937342643737793, -0.0005152225494384766, -9.310245513916016e-05, 0.00032901763916015625, 0.0007511377334594727, 0.001173257827758789, 0.0015953779220581055, 0.002017498016357422, 0.0024396181106567383, 0.0028617382049560547, 0.003283858299255371, 0.0037059783935546875, 0.004128098487854004, 0.00455021858215332, 0.004972338676452637, 0.005394458770751953, 0.0058165788650512695, 0.006238698959350586, 0.006660819053649902, 0.007082939147949219, 0.007505059242248535, 0.007927179336547852, 0.008349299430847168, 0.008771419525146484, 0.0091935396194458, 0.009615659713745117, 0.010037779808044434, 0.01045989990234375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 4.0, 10.0, 10.0, 12.0, 20.0, 17.0, 20.0, 18.0, 36.0, 37.0, 43.0, 31.0, 48.0, 45.0, 45.0, 59.0, 60.0, 55.0, 42.0, 67.0, 44.0, 48.0, 34.0, 37.0, 34.0, 24.0, 23.0, 16.0, 9.0, 8.0, 17.0, 4.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00839996337890625, -0.008180379867553711, -0.007960796356201172, -0.007741212844848633, -0.007521629333496094, -0.007302045822143555, -0.007082462310791016, -0.0068628787994384766, -0.0066432952880859375, -0.0064237117767333984, -0.006204128265380859, -0.00598454475402832, -0.005764961242675781, -0.005545377731323242, -0.005325794219970703, -0.005106210708618164, -0.004886627197265625, -0.004667043685913086, -0.004447460174560547, -0.004227876663208008, -0.004008293151855469, -0.0037887096405029297, -0.0035691261291503906, -0.0033495426177978516, -0.0031299591064453125, -0.0029103755950927734, -0.0026907920837402344, -0.0024712085723876953, -0.0022516250610351562, -0.002032041549682617, -0.0018124580383300781, -0.001592874526977539, -0.001373291015625, -0.001153707504272461, -0.0009341239929199219, -0.0007145404815673828, -0.0004949569702148438, -0.0002753734588623047, -5.5789947509765625e-05, 0.00016379356384277344, 0.0003833770751953125, 0.0006029605865478516, 0.0008225440979003906, 0.0010421276092529297, 0.0012617111206054688, 0.0014812946319580078, 0.0017008781433105469, 0.001920461654663086, 0.002140045166015625, 0.002359628677368164, 0.002579212188720703, 0.002798795700073242, 0.0030183792114257812, 0.0032379627227783203, 0.0034575462341308594, 0.0036771297454833984, 0.0038967132568359375, 0.0041162967681884766, 0.004335880279541016, 0.004555463790893555, 0.004775047302246094, 0.004994630813598633, 0.005214214324951172, 0.005433797836303711, 0.00565338134765625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 14.0, 29.0, 54.0, 121.0, 244.0, 631.0, 1724.0, 8791.0, 1956783.0, 2213537.0, 9393.0, 1798.0, 651.0, 251.0, 113.0, 62.0, 34.0, 13.0, 7.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0292205810546875, -0.028430938720703125, -0.02764129638671875, -0.026851654052734375, -0.02606201171875, -0.025272369384765625, -0.02448272705078125, -0.023693084716796875, -0.0229034423828125, -0.022113800048828125, -0.02132415771484375, -0.020534515380859375, -0.019744873046875, -0.018955230712890625, -0.01816558837890625, -0.017375946044921875, -0.0165863037109375, -0.015796661376953125, -0.01500701904296875, -0.014217376708984375, -0.013427734375, -0.012638092041015625, -0.01184844970703125, -0.011058807373046875, -0.0102691650390625, -0.009479522705078125, -0.00868988037109375, -0.007900238037109375, -0.007110595703125, -0.006320953369140625, -0.00553131103515625, -0.004741668701171875, -0.0039520263671875, -0.003162384033203125, -0.00237274169921875, -0.001583099365234375, -0.00079345703125, -3.814697265625e-06, 0.00078582763671875, 0.001575469970703125, 0.0023651123046875, 0.003154754638671875, 0.00394439697265625, 0.004734039306640625, 0.005523681640625, 0.006313323974609375, 0.00710296630859375, 0.007892608642578125, 0.0086822509765625, 0.009471893310546875, 0.01026153564453125, 0.011051177978515625, 0.0118408203125, 0.012630462646484375, 0.01342010498046875, 0.014209747314453125, 0.0149993896484375, 0.015789031982421875, 0.01657867431640625, 0.017368316650390625, 0.018157958984375, 0.018947601318359375, 0.01973724365234375, 0.020526885986328125, 0.0213165283203125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 12.0, 23.0, 47.0, 117.0, 425.0, 1082.0, 1265.0, 620.0, 246.0, 99.0, 47.0, 21.0, 16.0, 14.0, 11.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0165863037109375, -0.016056060791015625, -0.01552581787109375, -0.014995574951171875, -0.01446533203125, -0.013935089111328125, -0.01340484619140625, -0.012874603271484375, -0.0123443603515625, -0.011814117431640625, -0.01128387451171875, -0.010753631591796875, -0.010223388671875, -0.009693145751953125, -0.00916290283203125, -0.008632659912109375, -0.0081024169921875, -0.007572174072265625, -0.00704193115234375, -0.006511688232421875, -0.0059814453125, -0.005451202392578125, -0.00492095947265625, -0.004390716552734375, -0.0038604736328125, -0.003330230712890625, -0.00279998779296875, -0.002269744873046875, -0.001739501953125, -0.001209259033203125, -0.00067901611328125, -0.000148773193359375, 0.0003814697265625, 0.000911712646484375, 0.00144195556640625, 0.001972198486328125, 0.00250244140625, 0.003032684326171875, 0.00356292724609375, 0.004093170166015625, 0.0046234130859375, 0.005153656005859375, 0.00568389892578125, 0.006214141845703125, 0.006744384765625, 0.007274627685546875, 0.00780487060546875, 0.008335113525390625, 0.0088653564453125, 0.009395599365234375, 0.00992584228515625, 0.010456085205078125, 0.010986328125, 0.011516571044921875, 0.01204681396484375, 0.012577056884765625, 0.0131072998046875, 0.013637542724609375, 0.01416778564453125, 0.014698028564453125, 0.015228271484375, 0.015758514404296875, 0.01628875732421875, 0.016819000244140625, 0.0173492431640625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 6.0, 5.0, 7.0, 24.0, 43.0, 64.0, 113.0, 181.0, 194.0, 131.0, 79.0, 65.0, 32.0, 14.0, 11.0, 8.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027537288144230843, -0.024989455938339233, -0.022441623732447624, -0.019893791526556015, -0.017345959320664406, -0.014798127114772797, -0.012250294908881187, -0.009702462702989578, -0.007154630497097969, -0.00460679829120636, -0.0020589660853147507, 0.0004888661205768585, 0.0030366983264684677, 0.005584530532360077, 0.008132362738251686, 0.010680194944143295, 0.013228027150034904, 0.015775859355926514, 0.018323691561818123, 0.020871523767709732, 0.02341935597360134, 0.02596718817949295, 0.02851502038538456, 0.03106285259127617, 0.03361068665981293, 0.03615851700305939, 0.038706351071596146, 0.041254185140132904, 0.043802015483379364, 0.046349845826625824, 0.04889767989516258, 0.05144551396369934, 0.0539933443069458, 0.05654117465019226, 0.05908900871872902, 0.06163684278726578, 0.06418467313051224, 0.0667325034737587, 0.06928034126758575, 0.07182817161083221, 0.07437600195407867, 0.07692383229732513, 0.0794716626405716, 0.08201950043439865, 0.08456733077764511, 0.08711516112089157, 0.08966299891471863, 0.09221082925796509, 0.09475865960121155, 0.09730648994445801, 0.09985432028770447, 0.10240215808153152, 0.10494998842477798, 0.10749781876802444, 0.1100456565618515, 0.11259348690509796, 0.11514131724834442, 0.11768914759159088, 0.12023697793483734, 0.1227848157286644, 0.12533265352249146, 0.12788048386573792, 0.13042831420898438, 0.13297614455223083, 0.1355239748954773]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 8.0, 2.0, 7.0, 9.0, 18.0, 16.0, 17.0, 21.0, 29.0, 27.0, 38.0, 24.0, 36.0, 45.0, 77.0, 55.0, 45.0, 55.0, 60.0, 63.0, 66.0, 43.0, 40.0, 35.0, 23.0, 36.0, 14.0, 16.0, 20.0, 11.0, 9.0, 10.0, 9.0, 5.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05511254072189331, -0.05345321074128151, -0.05179388076066971, -0.05013454705476761, -0.04847521707415581, -0.046815887093544006, -0.04515655338764191, -0.043497223407030106, -0.041837893426418304, -0.0401785634458065, -0.0385192334651947, -0.0368598997592926, -0.0352005697786808, -0.033541239798069, -0.0318819060921669, -0.0302225761115551, -0.0285632461309433, -0.026903916150331497, -0.025244584307074547, -0.023585252463817596, -0.021925922483205795, -0.020266592502593994, -0.018607260659337044, -0.016947928816080093, -0.015288598835468292, -0.013629267923533916, -0.01196993701159954, -0.010310606099665165, -0.00865127518773079, -0.006991944275796413, -0.005332613363862038, -0.003673282451927662, -0.002013951539993286, -0.00035462062805891037, 0.0013047102838754654, 0.002964041195809841, 0.004623372107744217, 0.006282703019678593, 0.007942033931612968, 0.009601364843547344, 0.01126069575548172, 0.012920026667416096, 0.014579357579350471, 0.016238689422607422, 0.017898019403219223, 0.019557349383831024, 0.021216681227087975, 0.022876013070344925, 0.024535343050956726, 0.026194673031568527, 0.027854004874825478, 0.029513336718082428, 0.03117266669869423, 0.03283199667930603, 0.03449133038520813, 0.03615066036581993, 0.03780999034643173, 0.03946932032704353, 0.041128650307655334, 0.042787984013557434, 0.044447313994169235, 0.046106643974781036, 0.047765977680683136, 0.04942530766129494, 0.05108463764190674]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 6.0, 3.0, 2.0, 9.0, 4.0, 16.0, 22.0, 25.0, 39.0, 50.0, 81.0, 108.0, 243.0, 361.0, 618.0, 1065.0, 1912.0, 3487.0, 7133.0, 15811.0, 41133.0, 142995.0, 560142.0, 187298.0, 50402.0, 18457.0, 8199.0, 3963.0, 2127.0, 1174.0, 666.0, 372.0, 229.0, 141.0, 79.0, 68.0, 32.0, 28.0, 15.0, 13.0, 14.0, 6.0, 2.0, 2.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01082611083984375, -0.010403037071228027, -0.009979963302612305, -0.009556889533996582, -0.00913381576538086, -0.008710741996765137, -0.008287668228149414, -0.007864594459533691, -0.007441520690917969, -0.007018446922302246, -0.0065953731536865234, -0.006172299385070801, -0.005749225616455078, -0.0053261518478393555, -0.004903078079223633, -0.00448000431060791, -0.0040569305419921875, -0.003633856773376465, -0.003210783004760742, -0.0027877092361450195, -0.002364635467529297, -0.0019415616989135742, -0.0015184879302978516, -0.001095414161682129, -0.0006723403930664062, -0.0002492666244506836, 0.00017380714416503906, 0.0005968809127807617, 0.0010199546813964844, 0.001443028450012207, 0.0018661022186279297, 0.0022891759872436523, 0.002712249755859375, 0.0031353235244750977, 0.0035583972930908203, 0.003981471061706543, 0.004404544830322266, 0.004827618598937988, 0.005250692367553711, 0.005673766136169434, 0.006096839904785156, 0.006519913673400879, 0.0069429874420166016, 0.007366061210632324, 0.007789134979248047, 0.00821220874786377, 0.008635282516479492, 0.009058356285095215, 0.009481430053710938, 0.00990450382232666, 0.010327577590942383, 0.010750651359558105, 0.011173725128173828, 0.01159679889678955, 0.012019872665405273, 0.012442946434020996, 0.012866020202636719, 0.013289093971252441, 0.013712167739868164, 0.014135241508483887, 0.01455831527709961, 0.014981389045715332, 0.015404462814331055, 0.015827536582946777, 0.0162506103515625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 5.0, 4.0, 8.0, 5.0, 13.0, 13.0, 15.0, 8.0, 16.0, 22.0, 28.0, 35.0, 37.0, 32.0, 44.0, 42.0, 48.0, 77.0, 46.0, 57.0, 38.0, 53.0, 60.0, 47.0, 36.0, 33.0, 28.0, 29.0, 31.0, 14.0, 21.0, 9.0, 14.0, 7.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.00836181640625, -0.008147239685058594, -0.007932662963867188, -0.007718086242675781, -0.007503509521484375, -0.007288932800292969, -0.0070743560791015625, -0.006859779357910156, -0.00664520263671875, -0.006430625915527344, -0.0062160491943359375, -0.006001472473144531, -0.005786895751953125, -0.005572319030761719, -0.0053577423095703125, -0.005143165588378906, -0.0049285888671875, -0.004714012145996094, -0.0044994354248046875, -0.004284858703613281, -0.004070281982421875, -0.0038557052612304688, -0.0036411285400390625, -0.0034265518188476562, -0.00321197509765625, -0.0029973983764648438, -0.0027828216552734375, -0.0025682449340820312, -0.002353668212890625, -0.0021390914916992188, -0.0019245147705078125, -0.0017099380493164062, -0.001495361328125, -0.0012807846069335938, -0.0010662078857421875, -0.0008516311645507812, -0.000637054443359375, -0.00042247772216796875, -0.0002079010009765625, 6.67572021484375e-06, 0.00022125244140625, 0.00043582916259765625, 0.0006504058837890625, 0.0008649826049804688, 0.001079559326171875, 0.0012941360473632812, 0.0015087127685546875, 0.0017232894897460938, 0.0019378662109375, 0.0021524429321289062, 0.0023670196533203125, 0.0025815963745117188, 0.002796173095703125, 0.0030107498168945312, 0.0032253265380859375, 0.0034399032592773438, 0.00365447998046875, 0.0038690567016601562, 0.0040836334228515625, 0.004298210144042969, 0.004512786865234375, 0.004727363586425781, 0.0049419403076171875, 0.005156517028808594, 0.00537109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 7.0, 2.0, 12.0, 16.0, 11.0, 21.0, 22.0, 26.0, 43.0, 57.0, 66.0, 89.0, 111.0, 214.0, 288.0, 510.0, 846.0, 1838.0, 4786.0, 16964.0, 109973.0, 831234.0, 62410.0, 11792.0, 3667.0, 1468.0, 706.0, 437.0, 268.0, 179.0, 138.0, 100.0, 55.0, 42.0, 43.0, 21.0, 17.0, 23.0, 14.0, 18.0, 4.0, 4.0, 6.0, 4.0, 1.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0213470458984375, -0.020620346069335938, -0.019893646240234375, -0.019166946411132812, -0.01844024658203125, -0.017713546752929688, -0.016986846923828125, -0.016260147094726562, -0.015533447265625, -0.014806747436523438, -0.014080047607421875, -0.013353347778320312, -0.01262664794921875, -0.011899948120117188, -0.011173248291015625, -0.010446548461914062, -0.0097198486328125, -0.008993148803710938, -0.008266448974609375, -0.0075397491455078125, -0.00681304931640625, -0.0060863494873046875, -0.005359649658203125, -0.0046329498291015625, -0.00390625, -0.0031795501708984375, -0.002452850341796875, -0.0017261505126953125, -0.00099945068359375, -0.0002727508544921875, 0.000453948974609375, 0.0011806488037109375, 0.0019073486328125, 0.0026340484619140625, 0.003360748291015625, 0.0040874481201171875, 0.00481414794921875, 0.0055408477783203125, 0.006267547607421875, 0.0069942474365234375, 0.007720947265625, 0.008447647094726562, 0.009174346923828125, 0.009901046752929688, 0.01062774658203125, 0.011354446411132812, 0.012081146240234375, 0.012807846069335938, 0.0135345458984375, 0.014261245727539062, 0.014987945556640625, 0.015714645385742188, 0.01644134521484375, 0.017168045043945312, 0.017894744873046875, 0.018621444702148438, 0.01934814453125, 0.020074844360351562, 0.020801544189453125, 0.021528244018554688, 0.02225494384765625, 0.022981643676757812, 0.023708343505859375, 0.024435043334960938, 0.0251617431640625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 4.0, 6.0, 4.0, 7.0, 10.0, 7.0, 15.0, 9.0, 13.0, 27.0, 30.0, 33.0, 44.0, 40.0, 61.0, 49.0, 58.0, 71.0, 65.0, 62.0, 57.0, 57.0, 37.0, 44.0, 31.0, 25.0, 32.0, 17.0, 13.0, 13.0, 15.0, 5.0, 8.0, 1.0, 6.0, 5.0, 7.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0277862548828125, -0.02688884735107422, -0.025991439819335938, -0.025094032287597656, -0.024196624755859375, -0.023299217224121094, -0.022401809692382812, -0.02150440216064453, -0.02060699462890625, -0.01970958709716797, -0.018812179565429688, -0.017914772033691406, -0.017017364501953125, -0.016119956970214844, -0.015222549438476562, -0.014325141906738281, -0.013427734375, -0.012530326843261719, -0.011632919311523438, -0.010735511779785156, -0.009838104248046875, -0.008940696716308594, -0.008043289184570312, -0.007145881652832031, -0.00624847412109375, -0.005351066589355469, -0.0044536590576171875, -0.0035562515258789062, -0.002658843994140625, -0.0017614364624023438, -0.0008640289306640625, 3.337860107421875e-05, 0.0009307861328125, 0.0018281936645507812, 0.0027256011962890625, 0.0036230087280273438, 0.004520416259765625, 0.005417823791503906, 0.0063152313232421875, 0.007212638854980469, 0.00811004638671875, 0.009007453918457031, 0.009904861450195312, 0.010802268981933594, 0.011699676513671875, 0.012597084045410156, 0.013494491577148438, 0.014391899108886719, 0.015289306640625, 0.01618671417236328, 0.017084121704101562, 0.017981529235839844, 0.018878936767578125, 0.019776344299316406, 0.020673751831054688, 0.02157115936279297, 0.02246856689453125, 0.02336597442626953, 0.024263381958007812, 0.025160789489746094, 0.026058197021484375, 0.026955604553222656, 0.027853012084960938, 0.02875041961669922, 0.0296478271484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 5.0, 6.0, 16.0, 15.0, 30.0, 28.0, 44.0, 76.0, 129.0, 228.0, 434.0, 922.0, 2631.0, 10050.0, 97971.0, 891277.0, 35532.0, 5895.0, 1779.0, 666.0, 335.0, 168.0, 106.0, 71.0, 43.0, 30.0, 16.0, 9.0, 12.0, 4.0, 9.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0038604736328125, -0.003728806972503662, -0.0035971403121948242, -0.0034654736518859863, -0.0033338069915771484, -0.0032021403312683105, -0.0030704736709594727, -0.0029388070106506348, -0.002807140350341797, -0.002675473690032959, -0.002543807029724121, -0.002412140369415283, -0.0022804737091064453, -0.0021488070487976074, -0.0020171403884887695, -0.0018854737281799316, -0.0017538070678710938, -0.0016221404075622559, -0.001490473747253418, -0.00135880708694458, -0.0012271404266357422, -0.0010954737663269043, -0.0009638071060180664, -0.0008321404457092285, -0.0007004737854003906, -0.0005688071250915527, -0.00043714046478271484, -0.00030547380447387695, -0.00017380714416503906, -4.214048385620117e-05, 8.952617645263672e-05, 0.0002211928367614746, 0.0003528594970703125, 0.0004845261573791504, 0.0006161928176879883, 0.0007478594779968262, 0.0008795261383056641, 0.001011192798614502, 0.0011428594589233398, 0.0012745261192321777, 0.0014061927795410156, 0.0015378594398498535, 0.0016695261001586914, 0.0018011927604675293, 0.0019328594207763672, 0.002064526081085205, 0.002196192741394043, 0.002327859401702881, 0.0024595260620117188, 0.0025911927223205566, 0.0027228593826293945, 0.0028545260429382324, 0.0029861927032470703, 0.003117859363555908, 0.003249526023864746, 0.003381192684173584, 0.003512859344482422, 0.0036445260047912598, 0.0037761926651000977, 0.0039078593254089355, 0.0040395259857177734, 0.004171192646026611, 0.004302859306335449, 0.004434525966644287, 0.004566192626953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 7.0, 5.0, 5.0, 10.0, 18.0, 31.0, 39.0, 56.0, 59.0, 78.0, 114.0, 124.0, 111.0, 85.0, 71.0, 54.0, 43.0, 30.0, 11.0, 11.0, 10.0, 6.0, 4.0, 6.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0609626770019531e-05, -1.0263174772262573e-05, -9.916722774505615e-06, -9.570270776748657e-06, -9.2238187789917e-06, -8.877366781234741e-06, -8.530914783477783e-06, -8.184462785720825e-06, -7.838010787963867e-06, -7.491558790206909e-06, -7.145106792449951e-06, -6.798654794692993e-06, -6.452202796936035e-06, -6.105750799179077e-06, -5.759298801422119e-06, -5.412846803665161e-06, -5.066394805908203e-06, -4.719942808151245e-06, -4.373490810394287e-06, -4.027038812637329e-06, -3.680586814880371e-06, -3.334134817123413e-06, -2.987682819366455e-06, -2.641230821609497e-06, -2.294778823852539e-06, -1.948326826095581e-06, -1.601874828338623e-06, -1.255422830581665e-06, -9.08970832824707e-07, -5.62518835067749e-07, -2.1606683731079102e-07, 1.30385160446167e-07, 4.76837158203125e-07, 8.23289155960083e-07, 1.169741153717041e-06, 1.516193151473999e-06, 1.862645149230957e-06, 2.209097146987915e-06, 2.555549144744873e-06, 2.902001142501831e-06, 3.248453140258789e-06, 3.594905138015747e-06, 3.941357135772705e-06, 4.287809133529663e-06, 4.634261131286621e-06, 4.980713129043579e-06, 5.327165126800537e-06, 5.673617124557495e-06, 6.020069122314453e-06, 6.366521120071411e-06, 6.712973117828369e-06, 7.059425115585327e-06, 7.405877113342285e-06, 7.752329111099243e-06, 8.098781108856201e-06, 8.44523310661316e-06, 8.791685104370117e-06, 9.138137102127075e-06, 9.484589099884033e-06, 9.831041097640991e-06, 1.017749309539795e-05, 1.0523945093154907e-05, 1.0870397090911865e-05, 1.1216849088668823e-05, 1.1563301086425781e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 11.0, 14.0, 17.0, 28.0, 37.0, 51.0, 74.0, 124.0, 223.0, 447.0, 1030.0, 2806.0, 10114.0, 99083.0, 888324.0, 36391.0, 6136.0, 1950.0, 806.0, 355.0, 172.0, 113.0, 74.0, 42.0, 28.0, 23.0, 17.0, 16.0, 7.0, 9.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004917144775390625, -0.004781782627105713, -0.004646420478820801, -0.004511058330535889, -0.0043756961822509766, -0.0042403340339660645, -0.004104971885681152, -0.00396960973739624, -0.003834247589111328, -0.003698885440826416, -0.003563523292541504, -0.003428161144256592, -0.0032927989959716797, -0.0031574368476867676, -0.0030220746994018555, -0.0028867125511169434, -0.0027513504028320312, -0.002615988254547119, -0.002480626106262207, -0.002345263957977295, -0.002209901809692383, -0.0020745396614074707, -0.0019391775131225586, -0.0018038153648376465, -0.0016684532165527344, -0.0015330910682678223, -0.0013977289199829102, -0.001262366771697998, -0.001127004623413086, -0.0009916424751281738, -0.0008562803268432617, -0.0007209181785583496, -0.0005855560302734375, -0.0004501938819885254, -0.0003148317337036133, -0.00017946958541870117, -4.410743713378906e-05, 9.125471115112305e-05, 0.00022661685943603516, 0.00036197900772094727, 0.0004973411560058594, 0.0006327033042907715, 0.0007680654525756836, 0.0009034276008605957, 0.0010387897491455078, 0.00117415189743042, 0.001309514045715332, 0.0014448761940002441, 0.0015802383422851562, 0.0017156004905700684, 0.0018509626388549805, 0.0019863247871398926, 0.0021216869354248047, 0.002257049083709717, 0.002392411231994629, 0.002527773380279541, 0.002663135528564453, 0.0027984976768493652, 0.0029338598251342773, 0.0030692219734191895, 0.0032045841217041016, 0.0033399462699890137, 0.0034753084182739258, 0.003610670566558838, 0.00374603271484375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 0.0, 5.0, 8.0, 6.0, 8.0, 6.0, 18.0, 19.0, 50.0, 57.0, 84.0, 111.0, 161.0, 147.0, 88.0, 69.0, 47.0, 36.0, 30.0, 14.0, 13.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00667572021484375, -0.0065155029296875, -0.00635528564453125, -0.006195068359375, -0.00603485107421875, -0.0058746337890625, -0.00571441650390625, -0.00555419921875, -0.00539398193359375, -0.0052337646484375, -0.00507354736328125, -0.004913330078125, -0.00475311279296875, -0.0045928955078125, -0.00443267822265625, -0.0042724609375, -0.00411224365234375, -0.0039520263671875, -0.00379180908203125, -0.003631591796875, -0.00347137451171875, -0.0033111572265625, -0.00315093994140625, -0.00299072265625, -0.00283050537109375, -0.0026702880859375, -0.00251007080078125, -0.002349853515625, -0.00218963623046875, -0.0020294189453125, -0.00186920166015625, -0.001708984375, -0.00154876708984375, -0.0013885498046875, -0.00122833251953125, -0.001068115234375, -0.00090789794921875, -0.0007476806640625, -0.00058746337890625, -0.00042724609375, -0.00026702880859375, -0.0001068115234375, 5.340576171875e-05, 0.000213623046875, 0.00037384033203125, 0.0005340576171875, 0.00069427490234375, 0.0008544921875, 0.00101470947265625, 0.0011749267578125, 0.00133514404296875, 0.001495361328125, 0.00165557861328125, 0.0018157958984375, 0.00197601318359375, 0.00213623046875, 0.00229644775390625, 0.0024566650390625, 0.00261688232421875, 0.002777099609375, 0.00293731689453125, 0.0030975341796875, 0.00325775146484375, 0.00341796875, 0.00357818603515625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 8.0, 18.0, 50.0, 110.0, 535.0, 168.0, 56.0, 26.0, 18.0, 7.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18286588788032532, -0.17570938169956207, -0.16855286061763763, -0.1613963544368744, -0.15423984825611115, -0.1470833271741867, -0.13992682099342346, -0.13277029991149902, -0.12561379373073578, -0.11845728009939194, -0.11130077391862869, -0.10414426028728485, -0.09698774665594101, -0.08983123302459717, -0.08267472684383392, -0.07551821321249008, -0.06836170703172684, -0.061205197125673294, -0.05404868349432945, -0.04689217358827591, -0.03973565995693207, -0.032579150050878525, -0.02542264014482498, -0.01826612651348114, -0.011109616607427597, -0.003953105304390192, 0.003203405998647213, 0.01035991683602333, 0.017516428604722023, 0.024672940373420715, 0.03182945027947426, 0.0389859639108181, 0.04614247381687164, 0.053298983722925186, 0.06045549735426903, 0.06761200726032257, 0.07476852089166641, 0.08192503452301025, 0.0890815407037735, 0.09623805433511734, 0.10339456796646118, 0.11055108159780502, 0.11770758777856827, 0.12486410140991211, 0.13202060759067535, 0.1391771286725998, 0.14633363485336304, 0.15349015593528748, 0.16064664721488953, 0.16780315339565277, 0.1749596744775772, 0.18211618065834045, 0.1892726868391037, 0.19642920792102814, 0.20358571410179138, 0.21074223518371582, 0.21789874136447906, 0.2250552475452423, 0.23221176862716675, 0.23936827480793, 0.24652478098869324, 0.2536813020706177, 0.2608377933502197, 0.26799431443214417, 0.2751508355140686]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 3.0, 5.0, 6.0, 9.0, 8.0, 16.0, 17.0, 17.0, 21.0, 17.0, 29.0, 31.0, 32.0, 28.0, 48.0, 64.0, 139.0, 135.0, 67.0, 43.0, 29.0, 34.0, 41.0, 37.0, 22.0, 16.0, 18.0, 14.0, 9.0, 14.0, 4.0, 10.0, 7.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10062956809997559, -0.09644424915313721, -0.09225893020629883, -0.08807360380887985, -0.08388828486204147, -0.0797029659152031, -0.07551763951778412, -0.07133232057094574, -0.06714700162410736, -0.06296168267726898, -0.058776360005140305, -0.05459103733301163, -0.05040571838617325, -0.04622039943933487, -0.04203507676720619, -0.037849754095077515, -0.033664435148239136, -0.029479114338755608, -0.02529379352927208, -0.02110847271978855, -0.016923151910305023, -0.012737831100821495, -0.008552510291337967, -0.004367189481854439, -0.00018186867237091064, 0.0040034521371126175, 0.008188772946596146, 0.012374093756079674, 0.016559414565563202, 0.02074473537504673, 0.024930056184530258, 0.029115376994013786, 0.033300697803497314, 0.03748601675033569, 0.04167133942246437, 0.04585666209459305, 0.05004198104143143, 0.054227299988269806, 0.05841262266039848, 0.06259794533252716, 0.06678326427936554, 0.07096858322620392, 0.0751539021730423, 0.07933922857046127, 0.08352454751729965, 0.08770986646413803, 0.091895192861557, 0.09608051180839539, 0.10026583075523376, 0.10445114970207214, 0.10863646864891052, 0.1128217950463295, 0.11700711399316788, 0.12119243294000626, 0.12537775933742523, 0.1295630782842636, 0.133748397231102, 0.13793371617794037, 0.14211903512477875, 0.14630435407161713, 0.1504896879196167, 0.15467500686645508, 0.15886032581329346, 0.16304564476013184, 0.16723096370697021]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 10.0, 6.0, 7.0, 23.0, 27.0, 38.0, 46.0, 53.0, 81.0, 84.0, 146.0, 207.0, 257.0, 466.0, 686.0, 1222.0, 2895.0, 13627.0, 80651.0, 514790.0, 1881935.0, 1344911.0, 284094.0, 52130.0, 9792.0, 2541.0, 1372.0, 770.0, 469.0, 292.0, 202.0, 128.0, 91.0, 60.0, 52.0, 31.0, 24.0, 18.0, 13.0, 11.0, 7.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0074005126953125, -0.007204949855804443, -0.007009387016296387, -0.00681382417678833, -0.0066182613372802734, -0.006422698497772217, -0.00622713565826416, -0.0060315728187561035, -0.005836009979248047, -0.00564044713973999, -0.005444884300231934, -0.005249321460723877, -0.00505375862121582, -0.004858195781707764, -0.004662632942199707, -0.00446707010269165, -0.004271507263183594, -0.004075944423675537, -0.0038803815841674805, -0.003684818744659424, -0.003489255905151367, -0.0032936930656433105, -0.003098130226135254, -0.0029025673866271973, -0.0027070045471191406, -0.002511441707611084, -0.0023158788681030273, -0.0021203160285949707, -0.001924753189086914, -0.0017291903495788574, -0.0015336275100708008, -0.0013380646705627441, -0.0011425018310546875, -0.0009469389915466309, -0.0007513761520385742, -0.0005558133125305176, -0.00036025047302246094, -0.0001646876335144043, 3.0875205993652344e-05, 0.00022643804550170898, 0.0004220008850097656, 0.0006175637245178223, 0.0008131265640258789, 0.0010086894035339355, 0.0012042522430419922, 0.0013998150825500488, 0.0015953779220581055, 0.0017909407615661621, 0.0019865036010742188, 0.0021820664405822754, 0.002377629280090332, 0.0025731921195983887, 0.0027687549591064453, 0.002964317798614502, 0.0031598806381225586, 0.0033554434776306152, 0.003551006317138672, 0.0037465691566467285, 0.003942131996154785, 0.004137694835662842, 0.0043332576751708984, 0.004528820514678955, 0.004724383354187012, 0.004919946193695068, 0.005115509033203125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 5.0, 6.0, 4.0, 10.0, 5.0, 7.0, 11.0, 13.0, 16.0, 21.0, 27.0, 28.0, 33.0, 38.0, 33.0, 49.0, 47.0, 53.0, 44.0, 59.0, 53.0, 48.0, 47.0, 35.0, 47.0, 38.0, 37.0, 26.0, 27.0, 32.0, 31.0, 19.0, 10.0, 11.0, 6.0, 7.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.007171630859375, -0.006976902484893799, -0.006782174110412598, -0.0065874457359313965, -0.006392717361450195, -0.006197988986968994, -0.006003260612487793, -0.005808532238006592, -0.005613803863525391, -0.0054190754890441895, -0.005224347114562988, -0.005029618740081787, -0.004834890365600586, -0.004640161991119385, -0.004445433616638184, -0.004250705242156982, -0.004055976867675781, -0.00386124849319458, -0.003666520118713379, -0.0034717917442321777, -0.0032770633697509766, -0.0030823349952697754, -0.0028876066207885742, -0.002692878246307373, -0.002498149871826172, -0.0023034214973449707, -0.0021086931228637695, -0.0019139647483825684, -0.0017192363739013672, -0.001524507999420166, -0.0013297796249389648, -0.0011350512504577637, -0.0009403228759765625, -0.0007455945014953613, -0.0005508661270141602, -0.000356137752532959, -0.0001614093780517578, 3.331899642944336e-05, 0.00022804737091064453, 0.0004227757453918457, 0.0006175041198730469, 0.000812232494354248, 0.0010069608688354492, 0.0012016892433166504, 0.0013964176177978516, 0.0015911459922790527, 0.001785874366760254, 0.001980602741241455, 0.0021753311157226562, 0.0023700594902038574, 0.0025647878646850586, 0.0027595162391662598, 0.002954244613647461, 0.003148972988128662, 0.0033437013626098633, 0.0035384297370910645, 0.0037331581115722656, 0.003927886486053467, 0.004122614860534668, 0.004317343235015869, 0.00451207160949707, 0.0047067999839782715, 0.004901528358459473, 0.005096256732940674, 0.005290985107421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 10.0, 14.0, 31.0, 47.0, 118.0, 278.0, 670.0, 2669.0, 46313.0, 4121568.0, 19607.0, 1905.0, 563.0, 213.0, 122.0, 57.0, 35.0, 18.0, 16.0, 7.0, 11.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.031494140625, -0.0305788516998291, -0.029663562774658203, -0.028748273849487305, -0.027832984924316406, -0.026917695999145508, -0.02600240707397461, -0.02508711814880371, -0.024171829223632812, -0.023256540298461914, -0.022341251373291016, -0.021425962448120117, -0.02051067352294922, -0.01959538459777832, -0.018680095672607422, -0.017764806747436523, -0.016849517822265625, -0.015934228897094727, -0.015018939971923828, -0.01410365104675293, -0.013188362121582031, -0.012273073196411133, -0.011357784271240234, -0.010442495346069336, -0.009527206420898438, -0.008611917495727539, -0.007696628570556641, -0.006781339645385742, -0.005866050720214844, -0.004950761795043945, -0.004035472869873047, -0.0031201839447021484, -0.00220489501953125, -0.0012896060943603516, -0.0003743171691894531, 0.0005409717559814453, 0.0014562606811523438, 0.002371549606323242, 0.0032868385314941406, 0.004202127456665039, 0.0051174163818359375, 0.006032705307006836, 0.006947994232177734, 0.007863283157348633, 0.008778572082519531, 0.00969386100769043, 0.010609149932861328, 0.011524438858032227, 0.012439727783203125, 0.013355016708374023, 0.014270305633544922, 0.01518559455871582, 0.01610088348388672, 0.017016172409057617, 0.017931461334228516, 0.018846750259399414, 0.019762039184570312, 0.02067732810974121, 0.02159261703491211, 0.022507905960083008, 0.023423194885253906, 0.024338483810424805, 0.025253772735595703, 0.0261690616607666, 0.0270843505859375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 12.0, 18.0, 29.0, 34.0, 61.0, 100.0, 194.0, 403.0, 993.0, 1107.0, 599.0, 251.0, 120.0, 64.0, 30.0, 19.0, 10.0, 9.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0120849609375, -0.01148843765258789, -0.010891914367675781, -0.010295391082763672, -0.009698867797851562, -0.009102344512939453, -0.008505821228027344, -0.007909297943115234, -0.007312774658203125, -0.006716251373291016, -0.006119728088378906, -0.005523204803466797, -0.0049266815185546875, -0.004330158233642578, -0.0037336349487304688, -0.0031371116638183594, -0.00254058837890625, -0.0019440650939941406, -0.0013475418090820312, -0.0007510185241699219, -0.0001544952392578125, 0.0004420280456542969, 0.0010385513305664062, 0.0016350746154785156, 0.002231597900390625, 0.0028281211853027344, 0.0034246444702148438, 0.004021167755126953, 0.0046176910400390625, 0.005214214324951172, 0.005810737609863281, 0.006407260894775391, 0.0070037841796875, 0.007600307464599609, 0.008196830749511719, 0.008793354034423828, 0.009389877319335938, 0.009986400604248047, 0.010582923889160156, 0.011179447174072266, 0.011775970458984375, 0.012372493743896484, 0.012969017028808594, 0.013565540313720703, 0.014162063598632812, 0.014758586883544922, 0.015355110168457031, 0.01595163345336914, 0.01654815673828125, 0.01714468002319336, 0.01774120330810547, 0.018337726593017578, 0.018934249877929688, 0.019530773162841797, 0.020127296447753906, 0.020723819732666016, 0.021320343017578125, 0.021916866302490234, 0.022513389587402344, 0.023109912872314453, 0.023706436157226562, 0.024302959442138672, 0.02489948272705078, 0.02549600601196289, 0.026092529296875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 3.0, 5.0, 6.0, 20.0, 39.0, 67.0, 120.0, 222.0, 238.0, 136.0, 68.0, 27.0, 19.0, 11.0, 4.0, 2.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12647980451583862, -0.12232302129268646, -0.1181662380695343, -0.11400945484638214, -0.10985267162322998, -0.10569588840007782, -0.10153909772634506, -0.0973823145031929, -0.09322553128004074, -0.08906874805688858, -0.08491196483373642, -0.08075518161058426, -0.0765983909368515, -0.07244160771369934, -0.06828482449054718, -0.06412804126739502, -0.05997125804424286, -0.0558144748210907, -0.05165769159793854, -0.04750090464949608, -0.04334412142634392, -0.03918733820319176, -0.0350305512547493, -0.030873768031597137, -0.026716984808444977, -0.022560201585292816, -0.018403416499495506, -0.014246632345020771, -0.010089848190546036, -0.005933064967393875, -0.0017762798815965652, 0.0023805052042007446, 0.006537273526191711, 0.010694057680666447, 0.014850841835141182, 0.019007626920938492, 0.023164410144090652, 0.027321193367242813, 0.03147798031568527, 0.03563476353883743, 0.039791546761989594, 0.043948329985141754, 0.048105113208293915, 0.052261900156736374, 0.056418683379888535, 0.060575466603040695, 0.06473225355148315, 0.06888903677463531, 0.07304581999778748, 0.07720260322093964, 0.0813593864440918, 0.08551616966724396, 0.08967295289039612, 0.09382973611354828, 0.09798652678728104, 0.1021433100104332, 0.10630009323358536, 0.11045687645673752, 0.11461365967988968, 0.11877044290304184, 0.1229272335767746, 0.12708401679992676, 0.13124080002307892, 0.13539758324623108, 0.13955436646938324]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 10.0, 11.0, 14.0, 15.0, 23.0, 18.0, 25.0, 42.0, 34.0, 38.0, 41.0, 44.0, 50.0, 71.0, 80.0, 58.0, 62.0, 51.0, 34.0, 43.0, 41.0, 45.0, 24.0, 25.0, 17.0, 24.0, 10.0, 8.0, 10.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07072579860687256, -0.06849884241819382, -0.06627188622951508, -0.06404492259025574, -0.061817966401576996, -0.059591010212898254, -0.057364050298929214, -0.055137090384960175, -0.05291013419628143, -0.05068317800760269, -0.04845621809363365, -0.04622925817966461, -0.04400230199098587, -0.04177534580230713, -0.03954838588833809, -0.03732142597436905, -0.03509446978569031, -0.032867513597011566, -0.030640553683042526, -0.028413595631718636, -0.026186637580394745, -0.023959679529070854, -0.021732721477746964, -0.019505763426423073, -0.017278805375099182, -0.015051847323775291, -0.0128248892724514, -0.01059793122112751, -0.00837097316980362, -0.006144015118479729, -0.003917057067155838, -0.0016900990158319473, 0.0005368590354919434, 0.002763817086815834, 0.004990775138139725, 0.007217733189463615, 0.009444691240787506, 0.011671649292111397, 0.013898607343435287, 0.016125565394759178, 0.01835252344608307, 0.02057948149740696, 0.02280643954873085, 0.02503339760005474, 0.02726035565137863, 0.029487313702702522, 0.03171427175402641, 0.03394123166799545, 0.036168187856674194, 0.038395144045352936, 0.040622103959321976, 0.042849063873291016, 0.04507602006196976, 0.0473029762506485, 0.04952993616461754, 0.05175689607858658, 0.05398385226726532, 0.05621080845594406, 0.0584377683699131, 0.06066472828388214, 0.06289168447256088, 0.06511864066123962, 0.06734560430049896, 0.0695725604891777, 0.07179951667785645]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 4.0, 4.0, 9.0, 16.0, 17.0, 23.0, 44.0, 74.0, 86.0, 127.0, 192.0, 319.0, 524.0, 841.0, 1498.0, 2751.0, 5316.0, 11827.0, 30395.0, 101223.0, 619051.0, 195815.0, 46289.0, 16701.0, 7284.0, 3505.0, 1872.0, 1072.0, 551.0, 384.0, 263.0, 154.0, 92.0, 67.0, 47.0, 35.0, 28.0, 16.0, 12.0, 7.0, 6.0, 11.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0091400146484375, -0.00885164737701416, -0.00856328010559082, -0.00827491283416748, -0.00798654556274414, -0.007698178291320801, -0.007409811019897461, -0.007121443748474121, -0.006833076477050781, -0.006544709205627441, -0.0062563419342041016, -0.005967974662780762, -0.005679607391357422, -0.005391240119934082, -0.005102872848510742, -0.004814505577087402, -0.0045261383056640625, -0.004237771034240723, -0.003949403762817383, -0.003661036491394043, -0.003372669219970703, -0.0030843019485473633, -0.0027959346771240234, -0.0025075674057006836, -0.0022192001342773438, -0.001930832862854004, -0.001642465591430664, -0.0013540983200073242, -0.0010657310485839844, -0.0007773637771606445, -0.0004889965057373047, -0.00020062923431396484, 8.7738037109375e-05, 0.00037610530853271484, 0.0006644725799560547, 0.0009528398513793945, 0.0012412071228027344, 0.0015295743942260742, 0.001817941665649414, 0.002106308937072754, 0.0023946762084960938, 0.0026830434799194336, 0.0029714107513427734, 0.0032597780227661133, 0.003548145294189453, 0.003836512565612793, 0.004124879837036133, 0.004413247108459473, 0.0047016143798828125, 0.004989981651306152, 0.005278348922729492, 0.005566716194152832, 0.005855083465576172, 0.006143450736999512, 0.0064318180084228516, 0.006720185279846191, 0.007008552551269531, 0.007296919822692871, 0.007585287094116211, 0.00787365436553955, 0.00816202163696289, 0.00845038890838623, 0.00873875617980957, 0.00902712345123291, 0.00931549072265625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 13.0, 6.0, 10.0, 15.0, 18.0, 32.0, 28.0, 43.0, 39.0, 60.0, 48.0, 63.0, 51.0, 69.0, 84.0, 61.0, 41.0, 55.0, 41.0, 42.0, 33.0, 36.0, 25.0, 19.0, 14.0, 7.0, 16.0, 6.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00765228271484375, -0.007403135299682617, -0.007153987884521484, -0.0069048404693603516, -0.006655693054199219, -0.006406545639038086, -0.006157398223876953, -0.00590825080871582, -0.0056591033935546875, -0.005409955978393555, -0.005160808563232422, -0.004911661148071289, -0.004662513732910156, -0.0044133663177490234, -0.004164218902587891, -0.003915071487426758, -0.003665924072265625, -0.003416776657104492, -0.0031676292419433594, -0.0029184818267822266, -0.0026693344116210938, -0.002420186996459961, -0.002171039581298828, -0.0019218921661376953, -0.0016727447509765625, -0.0014235973358154297, -0.0011744499206542969, -0.0009253025054931641, -0.0006761550903320312, -0.00042700767517089844, -0.00017786026000976562, 7.128715515136719e-05, 0.0003204345703125, 0.0005695819854736328, 0.0008187294006347656, 0.0010678768157958984, 0.0013170242309570312, 0.001566171646118164, 0.0018153190612792969, 0.0020644664764404297, 0.0023136138916015625, 0.0025627613067626953, 0.002811908721923828, 0.003061056137084961, 0.0033102035522460938, 0.0035593509674072266, 0.0038084983825683594, 0.004057645797729492, 0.004306793212890625, 0.004555940628051758, 0.004805088043212891, 0.0050542354583740234, 0.005303382873535156, 0.005552530288696289, 0.005801677703857422, 0.006050825119018555, 0.0062999725341796875, 0.00654911994934082, 0.006798267364501953, 0.007047414779663086, 0.007296562194824219, 0.0075457096099853516, 0.007794857025146484, 0.008044004440307617, 0.00829315185546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 8.0, 7.0, 12.0, 25.0, 28.0, 40.0, 38.0, 63.0, 90.0, 149.0, 227.0, 340.0, 701.0, 1327.0, 3380.0, 11558.0, 70911.0, 898600.0, 47286.0, 8767.0, 2640.0, 1074.0, 512.0, 277.0, 160.0, 119.0, 61.0, 38.0, 34.0, 21.0, 16.0, 9.0, 8.0, 9.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01036834716796875, -0.009960293769836426, -0.009552240371704102, -0.009144186973571777, -0.008736133575439453, -0.008328080177307129, -0.007920026779174805, -0.0075119733810424805, -0.007103919982910156, -0.006695866584777832, -0.006287813186645508, -0.005879759788513184, -0.005471706390380859, -0.005063652992248535, -0.004655599594116211, -0.004247546195983887, -0.0038394927978515625, -0.0034314393997192383, -0.003023386001586914, -0.00261533260345459, -0.0022072792053222656, -0.0017992258071899414, -0.0013911724090576172, -0.000983119010925293, -0.0005750656127929688, -0.00016701221466064453, 0.0002410411834716797, 0.0006490945816040039, 0.0010571479797363281, 0.0014652013778686523, 0.0018732547760009766, 0.0022813081741333008, 0.002689361572265625, 0.0030974149703979492, 0.0035054683685302734, 0.003913521766662598, 0.004321575164794922, 0.004729628562927246, 0.00513768196105957, 0.0055457353591918945, 0.005953788757324219, 0.006361842155456543, 0.006769895553588867, 0.007177948951721191, 0.007586002349853516, 0.00799405574798584, 0.008402109146118164, 0.008810162544250488, 0.009218215942382812, 0.009626269340515137, 0.010034322738647461, 0.010442376136779785, 0.01085042953491211, 0.011258482933044434, 0.011666536331176758, 0.012074589729309082, 0.012482643127441406, 0.01289069652557373, 0.013298749923706055, 0.013706803321838379, 0.014114856719970703, 0.014522910118103027, 0.014930963516235352, 0.015339016914367676, 0.0157470703125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 12.0, 14.0, 18.0, 22.0, 30.0, 25.0, 34.0, 38.0, 49.0, 85.0, 91.0, 105.0, 96.0, 76.0, 79.0, 44.0, 36.0, 26.0, 26.0, 22.0, 14.0, 13.0, 15.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027374267578125, -0.026322364807128906, -0.025270462036132812, -0.02421855926513672, -0.023166656494140625, -0.02211475372314453, -0.021062850952148438, -0.020010948181152344, -0.01895904541015625, -0.017907142639160156, -0.016855239868164062, -0.01580333709716797, -0.014751434326171875, -0.013699531555175781, -0.012647628784179688, -0.011595726013183594, -0.0105438232421875, -0.009491920471191406, -0.008440017700195312, -0.007388114929199219, -0.006336212158203125, -0.005284309387207031, -0.0042324066162109375, -0.0031805038452148438, -0.00212860107421875, -0.0010766983032226562, -2.47955322265625e-05, 0.0010271072387695312, 0.002079010009765625, 0.0031309127807617188, 0.0041828155517578125, 0.005234718322753906, 0.00628662109375, 0.007338523864746094, 0.008390426635742188, 0.009442329406738281, 0.010494232177734375, 0.011546134948730469, 0.012598037719726562, 0.013649940490722656, 0.01470184326171875, 0.015753746032714844, 0.016805648803710938, 0.01785755157470703, 0.018909454345703125, 0.01996135711669922, 0.021013259887695312, 0.022065162658691406, 0.0231170654296875, 0.024168968200683594, 0.025220870971679688, 0.02627277374267578, 0.027324676513671875, 0.02837657928466797, 0.029428482055664062, 0.030480384826660156, 0.03153228759765625, 0.032584190368652344, 0.03363609313964844, 0.03468799591064453, 0.035739898681640625, 0.03679180145263672, 0.03784370422363281, 0.038895606994628906, 0.039947509765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 8.0, 3.0, 7.0, 2.0, 3.0, 7.0, 9.0, 11.0, 14.0, 20.0, 19.0, 26.0, 34.0, 68.0, 73.0, 116.0, 207.0, 308.0, 632.0, 1370.0, 3756.0, 18401.0, 913850.0, 95960.0, 8909.0, 2542.0, 914.0, 495.0, 258.0, 172.0, 89.0, 70.0, 45.0, 39.0, 20.0, 18.0, 16.0, 16.0, 10.0, 6.0, 4.0, 4.0, 4.0, 4.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0038471221923828125, -0.0037261545658111572, -0.003605186939239502, -0.0034842193126678467, -0.0033632516860961914, -0.003242284059524536, -0.003121316432952881, -0.0030003488063812256, -0.0028793811798095703, -0.002758413553237915, -0.0026374459266662598, -0.0025164783000946045, -0.0023955106735229492, -0.002274543046951294, -0.0021535754203796387, -0.0020326077938079834, -0.0019116401672363281, -0.0017906725406646729, -0.0016697049140930176, -0.0015487372875213623, -0.001427769660949707, -0.0013068020343780518, -0.0011858344078063965, -0.0010648667812347412, -0.0009438991546630859, -0.0008229315280914307, -0.0007019639015197754, -0.0005809962749481201, -0.00046002864837646484, -0.00033906102180480957, -0.0002180933952331543, -9.712576866149902e-05, 2.384185791015625e-05, 0.00014480948448181152, 0.0002657771110534668, 0.00038674473762512207, 0.0005077123641967773, 0.0006286799907684326, 0.0007496476173400879, 0.0008706152439117432, 0.0009915828704833984, 0.0011125504970550537, 0.001233518123626709, 0.0013544857501983643, 0.0014754533767700195, 0.0015964210033416748, 0.00171738862991333, 0.0018383562564849854, 0.0019593238830566406, 0.002080291509628296, 0.002201259136199951, 0.0023222267627716064, 0.0024431943893432617, 0.002564162015914917, 0.0026851296424865723, 0.0028060972690582275, 0.002927064895629883, 0.003048032522201538, 0.0031690001487731934, 0.0032899677753448486, 0.003410935401916504, 0.003531903028488159, 0.0036528706550598145, 0.0037738382816314697, 0.003894805908203125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 4.0, 6.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 12.0, 6.0, 13.0, 8.0, 9.0, 16.0, 24.0, 30.0, 42.0, 34.0, 49.0, 72.0, 83.0, 97.0, 86.0, 82.0, 52.0, 49.0, 37.0, 27.0, 22.0, 19.0, 11.0, 11.0, 12.0, 7.0, 7.0, 5.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.1742115020751953e-05, -1.1382624506950378e-05, -1.1023133993148804e-05, -1.0663643479347229e-05, -1.0304152965545654e-05, -9.94466245174408e-06, -9.585171937942505e-06, -9.22568142414093e-06, -8.866190910339355e-06, -8.50670039653778e-06, -8.147209882736206e-06, -7.787719368934631e-06, -7.428228855133057e-06, -7.068738341331482e-06, -6.709247827529907e-06, -6.3497573137283325e-06, -5.990266799926758e-06, -5.630776286125183e-06, -5.271285772323608e-06, -4.911795258522034e-06, -4.552304744720459e-06, -4.192814230918884e-06, -3.8333237171173096e-06, -3.473833203315735e-06, -3.11434268951416e-06, -2.7548521757125854e-06, -2.3953616619110107e-06, -2.035871148109436e-06, -1.6763806343078613e-06, -1.3168901205062866e-06, -9.57399606704712e-07, -5.979090929031372e-07, -2.384185791015625e-07, 1.210719347000122e-07, 4.805624485015869e-07, 8.400529623031616e-07, 1.1995434761047363e-06, 1.559033989906311e-06, 1.9185245037078857e-06, 2.2780150175094604e-06, 2.637505531311035e-06, 2.99699604511261e-06, 3.3564865589141846e-06, 3.7159770727157593e-06, 4.075467586517334e-06, 4.434958100318909e-06, 4.794448614120483e-06, 5.153939127922058e-06, 5.513429641723633e-06, 5.8729201555252075e-06, 6.232410669326782e-06, 6.591901183128357e-06, 6.951391696929932e-06, 7.310882210731506e-06, 7.670372724533081e-06, 8.029863238334656e-06, 8.38935375213623e-06, 8.748844265937805e-06, 9.10833477973938e-06, 9.467825293540955e-06, 9.82731580734253e-06, 1.0186806321144104e-05, 1.0546296834945679e-05, 1.0905787348747253e-05, 1.1265277862548828e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 5.0, 11.0, 14.0, 11.0, 27.0, 24.0, 27.0, 49.0, 65.0, 112.0, 174.0, 269.0, 509.0, 916.0, 1764.0, 4011.0, 10164.0, 34974.0, 264190.0, 672020.0, 39512.0, 11240.0, 4305.0, 1855.0, 919.0, 527.0, 288.0, 179.0, 112.0, 84.0, 46.0, 34.0, 29.0, 23.0, 7.0, 17.0, 10.0, 10.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0011920928955078125, -0.0011570751667022705, -0.0011220574378967285, -0.0010870397090911865, -0.0010520219802856445, -0.0010170042514801025, -0.0009819865226745605, -0.0009469687938690186, -0.0009119510650634766, -0.0008769333362579346, -0.0008419156074523926, -0.0008068978786468506, -0.0007718801498413086, -0.0007368624210357666, -0.0007018446922302246, -0.0006668269634246826, -0.0006318092346191406, -0.0005967915058135986, -0.0005617737770080566, -0.0005267560482025146, -0.0004917383193969727, -0.00045672059059143066, -0.00042170286178588867, -0.0003866851329803467, -0.0003516674041748047, -0.0003166496753692627, -0.0002816319465637207, -0.0002466142177581787, -0.00021159648895263672, -0.00017657876014709473, -0.00014156103134155273, -0.00010654330253601074, -7.152557373046875e-05, -3.650784492492676e-05, -1.4901161193847656e-06, 3.3527612686157227e-05, 6.854534149169922e-05, 0.00010356307029724121, 0.0001385807991027832, 0.0001735985279083252, 0.0002086162567138672, 0.00024363398551940918, 0.00027865171432495117, 0.00031366944313049316, 0.00034868717193603516, 0.00038370490074157715, 0.00041872262954711914, 0.00045374035835266113, 0.0004887580871582031, 0.0005237758159637451, 0.0005587935447692871, 0.0005938112735748291, 0.0006288290023803711, 0.0006638467311859131, 0.0006988644599914551, 0.0007338821887969971, 0.0007688999176025391, 0.0008039176464080811, 0.000838935375213623, 0.000873953104019165, 0.000908970832824707, 0.000943988561630249, 0.000979006290435791, 0.001014024019241333, 0.001049041748046875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 7.0, 7.0, 11.0, 15.0, 29.0, 39.0, 48.0, 66.0, 108.0, 180.0, 192.0, 97.0, 54.0, 39.0, 29.0, 22.0, 12.0, 10.0, 11.0, 3.0, 5.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004425048828125, -0.004294693470001221, -0.004164338111877441, -0.004033982753753662, -0.003903627395629883, -0.0037732720375061035, -0.0036429166793823242, -0.003512561321258545, -0.0033822059631347656, -0.0032518506050109863, -0.003121495246887207, -0.0029911398887634277, -0.0028607845306396484, -0.002730429172515869, -0.00260007381439209, -0.0024697184562683105, -0.0023393630981445312, -0.002209007740020752, -0.0020786523818969727, -0.0019482970237731934, -0.001817941665649414, -0.0016875863075256348, -0.0015572309494018555, -0.0014268755912780762, -0.0012965202331542969, -0.0011661648750305176, -0.0010358095169067383, -0.000905454158782959, -0.0007750988006591797, -0.0006447434425354004, -0.0005143880844116211, -0.0003840327262878418, -0.0002536773681640625, -0.0001233220100402832, 7.033348083496094e-06, 0.0001373887062072754, 0.0002677440643310547, 0.000398099422454834, 0.0005284547805786133, 0.0006588101387023926, 0.0007891654968261719, 0.0009195208549499512, 0.0010498762130737305, 0.0011802315711975098, 0.001310586929321289, 0.0014409422874450684, 0.0015712976455688477, 0.001701653003692627, 0.0018320083618164062, 0.0019623637199401855, 0.002092719078063965, 0.002223074436187744, 0.0023534297943115234, 0.0024837851524353027, 0.002614140510559082, 0.0027444958686828613, 0.0028748512268066406, 0.00300520658493042, 0.0031355619430541992, 0.0032659173011779785, 0.003396272659301758, 0.003526628017425537, 0.0036569833755493164, 0.0037873387336730957, 0.003917694091796875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 5.0, 1.0, 5.0, 6.0, 19.0, 33.0, 81.0, 489.0, 248.0, 63.0, 26.0, 15.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10401590168476105, -0.09946416318416595, -0.09491242468357086, -0.09036068618297577, -0.08580894768238068, -0.08125720918178558, -0.0767054632306099, -0.0721537247300148, -0.06760198622941971, -0.06305024772882462, -0.05849850922822952, -0.05394676700234413, -0.04939502850174904, -0.044843290001153946, -0.040291547775268555, -0.03573980927467346, -0.03118807077407837, -0.026636332273483276, -0.022084591910243034, -0.017532851547002792, -0.0129811130464077, -0.008429374545812607, -0.003877634182572365, 0.0006741061806678772, 0.00522584468126297, 0.009777584113180637, 0.014329323545098305, 0.018881063908338547, 0.02343280240893364, 0.027984540909528732, 0.032536283135414124, 0.037088021636009216, 0.0416397750377655, 0.046191513538360596, 0.05074325203895569, 0.05529499426484108, 0.05984673276543617, 0.06439846754074097, 0.06895021349191666, 0.07350195199251175, 0.07805369049310684, 0.08260542899370193, 0.08715716749429703, 0.09170890599489212, 0.09626065194606781, 0.1008123904466629, 0.105364128947258, 0.10991586744785309, 0.11446760594844818, 0.11901934444904327, 0.12357108294963837, 0.12812282145023346, 0.13267455995082855, 0.13722629845142365, 0.14177803695201874, 0.14632979035377502, 0.15088152885437012, 0.1554332673549652, 0.1599850058555603, 0.1645367443561554, 0.1690884828567505, 0.17364022135734558, 0.17819195985794067, 0.18274369835853577, 0.18729543685913086]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 3.0, 16.0, 10.0, 10.0, 11.0, 18.0, 19.0, 23.0, 24.0, 18.0, 33.0, 39.0, 90.0, 187.0, 191.0, 78.0, 34.0, 23.0, 31.0, 30.0, 15.0, 18.0, 10.0, 10.0, 14.0, 19.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07081735134124756, -0.06819088757038116, -0.06556441634893417, -0.06293795257806778, -0.06031148508191109, -0.057685017585754395, -0.055058553814888, -0.05243208631873131, -0.049805618822574615, -0.04717915132641792, -0.04455268383026123, -0.041926220059394836, -0.039299752563238144, -0.03667328506708145, -0.03404682129621506, -0.031420353800058365, -0.028793886303901672, -0.02616741880774498, -0.023540953174233437, -0.020914487540721893, -0.0182880200445652, -0.01566155254840851, -0.013035086914896965, -0.010408621281385422, -0.007782153785228729, -0.005155687220394611, -0.0025292206555604935, 9.724590927362442e-05, 0.0027237124741077423, 0.00535017903894186, 0.007976645603775978, 0.010603111237287521, 0.013229578733444214, 0.015856046229600906, 0.01848251186311245, 0.021108977496623993, 0.023735444992780685, 0.026361912488937378, 0.02898837812244892, 0.031614843755960464, 0.03424131125211716, 0.03686777874827385, 0.03949424624443054, 0.042120710015296936, 0.04474717751145363, 0.04737364500761032, 0.050000108778476715, 0.05262657627463341, 0.0552530437707901, 0.05787951126694679, 0.060505978763103485, 0.06313244253396988, 0.06575891375541687, 0.06838537752628326, 0.07101184129714966, 0.07363830506801605, 0.07626477628946304, 0.07889124006032944, 0.08151771128177643, 0.08414417505264282, 0.08677063882350922, 0.08939711004495621, 0.0920235738158226, 0.09465004503726959, 0.09727650880813599]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 1.0, 4.0, 3.0, 10.0, 9.0, 12.0, 9.0, 17.0, 16.0, 19.0, 27.0, 23.0, 28.0, 32.0, 46.0, 74.0, 153.0, 204.0, 77.0, 44.0, 28.0, 31.0, 28.0, 18.0, 14.0, 11.0, 7.0, 7.0, 9.0, 7.0, 7.0, 3.0, 6.0, 7.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.005344390869140625, -0.005177795886993408, -0.005011200904846191, -0.004844605922698975, -0.004678010940551758, -0.004511415958404541, -0.004344820976257324, -0.004178225994110107, -0.004011631011962891, -0.003845036029815674, -0.003678441047668457, -0.0035118460655212402, -0.0033452510833740234, -0.0031786561012268066, -0.00301206111907959, -0.002845466136932373, -0.0026788711547851562, -0.0025122761726379395, -0.0023456811904907227, -0.002179086208343506, -0.002012491226196289, -0.0018458962440490723, -0.0016793012619018555, -0.0015127062797546387, -0.0013461112976074219, -0.001179516315460205, -0.0010129213333129883, -0.0008463263511657715, -0.0006797313690185547, -0.0005131363868713379, -0.0003465414047241211, -0.0001799464225769043, -1.33514404296875e-05, 0.0001532435417175293, 0.0003198385238647461, 0.0004864335060119629, 0.0006530284881591797, 0.0008196234703063965, 0.0009862184524536133, 0.00115281343460083, 0.0013194084167480469, 0.0014860033988952637, 0.0016525983810424805, 0.0018191933631896973, 0.001985788345336914, 0.002152383327484131, 0.0023189783096313477, 0.0024855732917785645, 0.0026521682739257812, 0.002818763256072998, 0.002985358238220215, 0.0031519532203674316, 0.0033185482025146484, 0.0034851431846618652, 0.003651738166809082, 0.003818333148956299, 0.003984928131103516, 0.004151523113250732, 0.004318118095397949, 0.004484713077545166, 0.004651308059692383, 0.0048179030418396, 0.004984498023986816, 0.005151093006134033, 0.00531768798828125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 8.0, 19.0, 21.0, 20.0, 33.0, 42.0, 40.0, 91.0, 193.0, 544.0, 2096.0, 16875.0, 8357129.0, 9252.0, 1361.0, 379.0, 179.0, 56.0, 78.0, 39.0, 27.0, 13.0, 11.0, 5.0, 3.0, 1.0, 6.0, 4.0, 2.0, 2.0, 10.0, 5.0, 3.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.04955712705850601, -0.04811601713299751, -0.046674903482198715, -0.045233793556690216, -0.04379267990589142, -0.04235156998038292, -0.04091046005487442, -0.03946934640407562, -0.03802823647856712, -0.036587126553058624, -0.03514601290225983, -0.03370490297675133, -0.03226379305124283, -0.03082267940044403, -0.02938156947493553, -0.027940457686781883, -0.026499345898628235, -0.025058234110474586, -0.023617122322320938, -0.02217601239681244, -0.02073490060865879, -0.019293788820505142, -0.017852678894996643, -0.016411567106842995, -0.014970455318689346, -0.013529343530535698, -0.012088232673704624, -0.01064712181687355, -0.009206010028719902, -0.007764898706227541, -0.00632378738373518, -0.004882676526904106, -0.0034415684640407562, -0.002000457141548395, -0.0005593458190560341, 0.000881765503436327, 0.002322876825928688, 0.003763988148421049, 0.00520509947091341, 0.006646210327744484, 0.008087322115898132, 0.00952843390405178, 0.010969544760882854, 0.012410655617713928, 0.013851767405867577, 0.015292879194021225, 0.016733989119529724, 0.018175100907683372, 0.01961621269583702, 0.02105732448399067, 0.022498436272144318, 0.023939546197652817, 0.025380657985806465, 0.026821769773960114, 0.028262879699468613, 0.02970399148762226, 0.03114510327577591, 0.03258621320128441, 0.034027326852083206, 0.035468436777591705, 0.0369095504283905, 0.038350660353899, 0.0397917702794075, 0.0412328839302063, 0.0426739938557148]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 3.0, 6.0, 4.0, 0.0, 2.0, 6.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 7.0, 4.0, 3.0, 3.0, 8.0, 7.0, 6.0, 1.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013770464807748795, -0.013081957586109638, -0.012393450364470482, -0.0117049440741539, -0.011016436852514744, -0.010327929630875587, -0.009639423340559006, -0.00895091611891985, -0.008262408897280693, -0.007573901675641537, -0.006885394919663668, -0.006196888163685799, -0.005508380942046642, -0.004819873720407486, -0.004131366964429617, -0.003442860208451748, -0.0027543529868125916, -0.002065845998004079, -0.0013773390091955662, -0.0006888320203870535, -3.25031578540802e-07, 0.0006881819572299719, 0.0013766889460384846, 0.0020651957020163536, 0.00275370292365551, 0.0034422099124640226, 0.004130716901272535, 0.004819223657250404, 0.005507730878889561, 0.006196238100528717, 0.006884744856506586, 0.007573251612484455, 0.008261756971478462, 0.008950264193117619, 0.009638771414756775, 0.010327277705073357, 0.011015784926712513, 0.01170429214835167, 0.012392798438668251, 0.013081305660307407, 0.013769812881946564, 0.01445832010358572, 0.015146827325224876, 0.015835333615541458, 0.01652384176850319, 0.01721234805881977, 0.017900854349136353, 0.018589362502098083, 0.019277868792414665, 0.019966375082731247, 0.020654883235692978, 0.02134338952600956, 0.02203189581632614, 0.022720403969287872, 0.023408910259604454, 0.024097416549921036, 0.024785924702882767, 0.02547443099319935, 0.02616293914616108, 0.02685144543647766, 0.027539953589439392, 0.028228459879755974, 0.028916966170072556, 0.029605474323034286, 0.030293980613350868]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 9.0, 9.0, 7.0, 22.0, 25.0, 39.0, 48.0, 62.0, 135.0, 190.0, 345.0, 718.0, 1259.0, 2547.0, 5973.0, 17263.0, 64874.0, 224668.0, 148850.0, 37303.0, 11351.0, 4367.0, 1953.0, 947.0, 541.0, 281.0, 157.0, 102.0, 70.0, 54.0, 33.0, 18.0, 11.0, 11.0, 4.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03369140625, -0.03275012969970703, -0.03180885314941406, -0.030867576599121094, -0.029926300048828125, -0.028985023498535156, -0.028043746948242188, -0.02710247039794922, -0.02616119384765625, -0.02521991729736328, -0.024278640747070312, -0.023337364196777344, -0.022396087646484375, -0.021454811096191406, -0.020513534545898438, -0.01957225799560547, -0.0186309814453125, -0.01768970489501953, -0.016748428344726562, -0.015807151794433594, -0.014865875244140625, -0.013924598693847656, -0.012983322143554688, -0.012042045593261719, -0.01110076904296875, -0.010159492492675781, -0.009218215942382812, -0.008276939392089844, -0.007335662841796875, -0.006394386291503906, -0.0054531097412109375, -0.004511833190917969, -0.003570556640625, -0.0026292800903320312, -0.0016880035400390625, -0.0007467269897460938, 0.000194549560546875, 0.0011358261108398438, 0.0020771026611328125, 0.0030183792114257812, 0.00395965576171875, 0.004900932312011719, 0.0058422088623046875, 0.006783485412597656, 0.007724761962890625, 0.008666038513183594, 0.009607315063476562, 0.010548591613769531, 0.0114898681640625, 0.012431144714355469, 0.013372421264648438, 0.014313697814941406, 0.015254974365234375, 0.016196250915527344, 0.017137527465820312, 0.01807880401611328, 0.01902008056640625, 0.01996135711669922, 0.020902633666992188, 0.021843910217285156, 0.022785186767578125, 0.023726463317871094, 0.024667739868164062, 0.02560901641845703, 0.02655029296875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 6.0, 15.0, 7.0, 13.0, 14.0, 14.0, 15.0, 24.0, 29.0, 32.0, 52.0, 41.0, 61.0, 51.0, 71.0, 64.0, 49.0, 72.0, 43.0, 47.0, 31.0, 46.0, 37.0, 31.0, 27.0, 26.0, 6.0, 11.0, 18.0, 5.0, 8.0, 5.0, 7.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0062255859375, -0.006035566329956055, -0.005845546722412109, -0.005655527114868164, -0.005465507507324219, -0.0052754878997802734, -0.005085468292236328, -0.004895448684692383, -0.0047054290771484375, -0.004515409469604492, -0.004325389862060547, -0.0041353702545166016, -0.003945350646972656, -0.003755331039428711, -0.0035653114318847656, -0.0033752918243408203, -0.003185272216796875, -0.0029952526092529297, -0.0028052330017089844, -0.002615213394165039, -0.0024251937866210938, -0.0022351741790771484, -0.002045154571533203, -0.0018551349639892578, -0.0016651153564453125, -0.0014750957489013672, -0.0012850761413574219, -0.0010950565338134766, -0.0009050369262695312, -0.0007150173187255859, -0.0005249977111816406, -0.0003349781036376953, -0.00014495849609375, 4.506111145019531e-05, 0.00023508071899414062, 0.00042510032653808594, 0.0006151199340820312, 0.0008051395416259766, 0.0009951591491699219, 0.0011851787567138672, 0.0013751983642578125, 0.0015652179718017578, 0.0017552375793457031, 0.0019452571868896484, 0.0021352767944335938, 0.002325296401977539, 0.0025153160095214844, 0.0027053356170654297, 0.002895355224609375, 0.0030853748321533203, 0.0032753944396972656, 0.003465414047241211, 0.0036554336547851562, 0.0038454532623291016, 0.004035472869873047, 0.004225492477416992, 0.0044155120849609375, 0.004605531692504883, 0.004795551300048828, 0.0049855709075927734, 0.005175590515136719, 0.005365610122680664, 0.005555629730224609, 0.005745649337768555, 0.0059356689453125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 7.0, 12.0, 19.0, 69.0, 191.0, 121.0, 27.0, 13.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09296739846467972, -0.0908062532544136, -0.0886451005935669, -0.08648395538330078, -0.08432281017303467, -0.08216165751218796, -0.08000051230192184, -0.07783936709165573, -0.07567821443080902, -0.07351706922054291, -0.0713559165596962, -0.06919477134943008, -0.06703362613916397, -0.06487247347831726, -0.06271132826805115, -0.060550179332494736, -0.05838903412222862, -0.05622788518667221, -0.0540667399764061, -0.051905591040849686, -0.049744442105293274, -0.04758329689502716, -0.04542214795947075, -0.04326099902391434, -0.041099853813648224, -0.03893870487809181, -0.0367775596678257, -0.03461641073226929, -0.032455261796712875, -0.030294114723801613, -0.02813296765089035, -0.02597181871533394, -0.023810673505067825, -0.021649526432156563, -0.01948837749660015, -0.01732723042368889, -0.015166082419455051, -0.013004934415221214, -0.010843787342309952, -0.008682639338076115, -0.0065214913338422775, -0.00436034332960844, -0.0021991957910358906, -3.804825246334076e-05, 0.0021230997517704964, 0.0042842477560043335, 0.006445394828915596, 0.008606542833149433, 0.01076769083738327, 0.012928838841617107, 0.015089986845850945, 0.017251133918762207, 0.01941228285431862, 0.02157342992722988, 0.023734577000141144, 0.025895725935697556, 0.028056873008608818, 0.03021802008152008, 0.03237916901707649, 0.034540317952632904, 0.03670146316289902, 0.03886261209845543, 0.04102376103401184, 0.043184906244277954, 0.045346055179834366]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 6.0, 6.0, 6.0, 16.0, 40.0, 103.0, 152.0, 73.0, 27.0, 11.0, 9.0, 5.0, 8.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040926337242126465, -0.03939737379550934, -0.03786841034889221, -0.036339450627565384, -0.03481048718094826, -0.03328152373433113, -0.0317525640130043, -0.030223600566387177, -0.02869463711977005, -0.027165673673152924, -0.025636712089180946, -0.02410775050520897, -0.022578787058591843, -0.021049823611974716, -0.01952086202800274, -0.01799190044403076, -0.016462936997413635, -0.014933974482119083, -0.013405011966824532, -0.01187604945152998, -0.010347086936235428, -0.008818124420940876, -0.007289161905646324, -0.005760199390351772, -0.0042312368750572205, -0.0027022743597626686, -0.0011733118444681168, 0.0003556506708264351, 0.001884613186120987, 0.003413575701415539, 0.004942538216710091, 0.0064715007320046425, 0.008000463247299194, 0.009529425762593746, 0.011058388277888298, 0.01258735079318285, 0.014116313308477402, 0.015645276755094528, 0.017174238339066505, 0.018703199923038483, 0.02023216336965561, 0.021761126816272736, 0.023290088400244713, 0.02481904998421669, 0.026348013430833817, 0.027876976877450943, 0.02940593846142292, 0.030934900045394897, 0.032463863492012024, 0.03399282693862915, 0.03552179038524628, 0.037050750106573105, 0.03857971355319023, 0.04010867699980736, 0.041637636721134186, 0.04316660016775131, 0.04469556361436844, 0.046224527060985565, 0.04775349050760269, 0.04928245022892952, 0.050811413675546646, 0.05234037712216377, 0.0538693368434906, 0.05539830029010773, 0.056927263736724854]}, "_wandb": {"runtime": 2401}}