{"train/loss": 4.346, "train/learning_rate": 9.960000000000001e-05, "train/epoch": 0.84, "train/global_step": 500, "_runtime": 4786, "_timestamp": 1646192170, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 29.0, 215.0, 461.0, 265.0, 39.0, 5.0, 0.0, 1.0], "bins": [-525.2379760742188, -516.2647094726562, -507.29144287109375, -498.31817626953125, -489.34490966796875, -480.3716735839844, -471.3984069824219, -462.4251403808594, -453.4518737792969, -444.4786071777344, -435.5053405761719, -426.5320739746094, -417.558837890625, -408.5855712890625, -399.6123046875, -390.6390380859375, -381.665771484375, -372.6925048828125, -363.71923828125, -354.7459716796875, -345.772705078125, -336.7994689941406, -327.8262023925781, -318.8529357910156, -309.8796691894531, -300.9064025878906, -291.9331359863281, -282.9598693847656, -273.98663330078125, -265.01336669921875, -256.04010009765625, -247.06683349609375, -238.0935821533203, -229.1203155517578, -220.14706420898438, -211.17379760742188, -202.20053100585938, -193.22726440429688, -184.25399780273438, -175.28074645996094, -166.30747985839844, -157.33421325683594, -148.3609619140625, -139.3876953125, -130.4144287109375, -121.441162109375, -112.46790313720703, -103.49464416503906, -94.52137756347656, -85.54811096191406, -76.5748519897461, -67.60159301757812, -58.628326416015625, -49.65506362915039, -40.681800842285156, -31.708538055419922, -22.735271453857422, -13.762008666992188, -4.788745880126953, 4.184516906738281, 13.157779693603516, 22.13104248046875, 31.104305267333984, 40.07756805419922, 49.05083084106445]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 4.0, 9.0, 12.0, 12.0, 13.0, 17.0, 21.0, 22.0, 29.0, 37.0, 39.0, 46.0, 47.0, 45.0, 63.0, 41.0, 64.0, 61.0, 54.0, 54.0, 37.0, 29.0, 31.0, 39.0, 31.0, 31.0, 18.0, 19.0, 13.0, 14.0, 12.0, 10.0, 9.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-154.08673095703125, -149.73098754882812, -145.37522888183594, -141.0194854736328, -136.6637420654297, -132.3079833984375, -127.95223999023438, -123.59649658203125, -119.2407455444336, -114.88499450683594, -110.52925109863281, -106.17350006103516, -101.8177490234375, -97.46200561523438, -93.10625457763672, -88.75050354003906, -84.39476013183594, -80.03900909423828, -75.68326568603516, -71.3275146484375, -66.97177124023438, -62.61602020263672, -58.26026916503906, -53.90452194213867, -49.54877471923828, -45.19302749633789, -40.8372802734375, -36.481529235839844, -32.12578201293945, -27.770034790039062, -23.41428565979004, -19.058536529541016, -14.702789306640625, -10.347041130065918, -5.991292953491211, -1.635544776916504, 2.720203399658203, 7.075950622558594, 11.431699752807617, 15.78744888305664, 20.14319610595703, 24.498943328857422, 28.854692459106445, 33.21044158935547, 37.56618881225586, 41.92193603515625, 46.277687072753906, 50.6334342956543, 54.98918151855469, 59.34492874145508, 63.70067596435547, 68.05642700195312, 72.41217041015625, 76.7679214477539, 81.12367248535156, 85.47941589355469, 89.83516693115234, 94.19091796875, 98.54666137695312, 102.90241241455078, 107.25816345214844, 111.61390686035156, 115.96965789794922, 120.32540893554688, 124.68115234375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 4.0, 4.0, 6.0, 4.0, 13.0, 9.0, 11.0, 12.0, 16.0, 21.0, 20.0, 24.0, 32.0, 28.0, 47.0, 43.0, 47.0, 50.0, 58.0, 57.0, 52.0, 66.0, 50.0, 45.0, 36.0, 35.0, 36.0, 26.0, 27.0, 25.0, 25.0, 16.0, 21.0, 14.0, 11.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.82421875, -6.643798828125, -6.46337890625, -6.282958984375, -6.1025390625, -5.922119140625, -5.74169921875, -5.561279296875, -5.380859375, -5.200439453125, -5.02001953125, -4.839599609375, -4.6591796875, -4.478759765625, -4.29833984375, -4.117919921875, -3.9375, -3.757080078125, -3.57666015625, -3.396240234375, -3.2158203125, -3.035400390625, -2.85498046875, -2.674560546875, -2.494140625, -2.313720703125, -2.13330078125, -1.952880859375, -1.7724609375, -1.592041015625, -1.41162109375, -1.231201171875, -1.05078125, -0.870361328125, -0.68994140625, -0.509521484375, -0.3291015625, -0.148681640625, 0.03173828125, 0.212158203125, 0.392578125, 0.572998046875, 0.75341796875, 0.933837890625, 1.1142578125, 1.294677734375, 1.47509765625, 1.655517578125, 1.8359375, 2.016357421875, 2.19677734375, 2.377197265625, 2.5576171875, 2.738037109375, 2.91845703125, 3.098876953125, 3.279296875, 3.459716796875, 3.64013671875, 3.820556640625, 4.0009765625, 4.181396484375, 4.36181640625, 4.542236328125, 4.72265625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 15.0, 11.0, 8.0, 12.0, 14.0, 30.0, 25.0, 31.0, 49.0, 72.0, 113.0, 142.0, 200.0, 254.0, 415.0, 635.0, 1044.0, 1811.0, 3659.0, 9326.0, 32244.0, 193371.0, 2494652.0, 1311466.0, 109015.0, 21595.0, 6902.0, 2990.0, 1538.0, 920.0, 548.0, 349.0, 239.0, 180.0, 108.0, 84.0, 58.0, 45.0, 31.0, 20.0, 24.0, 15.0, 6.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-26.28125, -25.54833984375, -24.8154296875, -24.08251953125, -23.349609375, -22.61669921875, -21.8837890625, -21.15087890625, -20.41796875, -19.68505859375, -18.9521484375, -18.21923828125, -17.486328125, -16.75341796875, -16.0205078125, -15.28759765625, -14.5546875, -13.82177734375, -13.0888671875, -12.35595703125, -11.623046875, -10.89013671875, -10.1572265625, -9.42431640625, -8.69140625, -7.95849609375, -7.2255859375, -6.49267578125, -5.759765625, -5.02685546875, -4.2939453125, -3.56103515625, -2.828125, -2.09521484375, -1.3623046875, -0.62939453125, 0.103515625, 0.83642578125, 1.5693359375, 2.30224609375, 3.03515625, 3.76806640625, 4.5009765625, 5.23388671875, 5.966796875, 6.69970703125, 7.4326171875, 8.16552734375, 8.8984375, 9.63134765625, 10.3642578125, 11.09716796875, 11.830078125, 12.56298828125, 13.2958984375, 14.02880859375, 14.76171875, 15.49462890625, 16.2275390625, 16.96044921875, 17.693359375, 18.42626953125, 19.1591796875, 19.89208984375, 20.625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 8.0, 2.0, 3.0, 4.0, 6.0, 24.0, 29.0, 46.0, 68.0, 107.0, 172.0, 315.0, 425.0, 633.0, 746.0, 509.0, 367.0, 249.0, 135.0, 91.0, 63.0, 32.0, 18.0, 10.0, 8.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.21875, -38.313720703125, -37.40869140625, -36.503662109375, -35.5986328125, -34.693603515625, -33.78857421875, -32.883544921875, -31.978515625, -31.073486328125, -30.16845703125, -29.263427734375, -28.3583984375, -27.453369140625, -26.54833984375, -25.643310546875, -24.73828125, -23.833251953125, -22.92822265625, -22.023193359375, -21.1181640625, -20.213134765625, -19.30810546875, -18.403076171875, -17.498046875, -16.593017578125, -15.68798828125, -14.782958984375, -13.8779296875, -12.972900390625, -12.06787109375, -11.162841796875, -10.2578125, -9.352783203125, -8.44775390625, -7.542724609375, -6.6376953125, -5.732666015625, -4.82763671875, -3.922607421875, -3.017578125, -2.112548828125, -1.20751953125, -0.302490234375, 0.6025390625, 1.507568359375, 2.41259765625, 3.317626953125, 4.22265625, 5.127685546875, 6.03271484375, 6.937744140625, 7.8427734375, 8.747802734375, 9.65283203125, 10.557861328125, 11.462890625, 12.367919921875, 13.27294921875, 14.177978515625, 15.0830078125, 15.988037109375, 16.89306640625, 17.798095703125, 18.703125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 8.0, 16.0, 14.0, 29.0, 37.0, 107.0, 187.0, 403.0, 903.0, 2777.0, 83299.0, 4070220.0, 32627.0, 2195.0, 767.0, 351.0, 172.0, 81.0, 40.0, 21.0, 14.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.8125, -114.1787109375, -110.544921875, -106.9111328125, -103.27734375, -99.6435546875, -96.009765625, -92.3759765625, -88.7421875, -85.1083984375, -81.474609375, -77.8408203125, -74.20703125, -70.5732421875, -66.939453125, -63.3056640625, -59.671875, -56.0380859375, -52.404296875, -48.7705078125, -45.13671875, -41.5029296875, -37.869140625, -34.2353515625, -30.6015625, -26.9677734375, -23.333984375, -19.7001953125, -16.06640625, -12.4326171875, -8.798828125, -5.1650390625, -1.53125, 2.1025390625, 5.736328125, 9.3701171875, 13.00390625, 16.6376953125, 20.271484375, 23.9052734375, 27.5390625, 31.1728515625, 34.806640625, 38.4404296875, 42.07421875, 45.7080078125, 49.341796875, 52.9755859375, 56.609375, 60.2431640625, 63.876953125, 67.5107421875, 71.14453125, 74.7783203125, 78.412109375, 82.0458984375, 85.6796875, 89.3134765625, 92.947265625, 96.5810546875, 100.21484375, 103.8486328125, 107.482421875, 111.1162109375, 114.75]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 19.0, 76.0, 319.0, 407.0, 154.0, 38.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-65.82325744628906, -58.74569320678711, -51.668128967285156, -44.59056091308594, -37.512996673583984, -30.43543243408203, -23.357864379882812, -16.28030014038086, -9.202735900878906, -2.1251707077026367, 4.952394485473633, 12.029960632324219, 19.107524871826172, 26.185089111328125, 33.262657165527344, 40.3402214050293, 47.41778564453125, 54.4953498840332, 61.572914123535156, 68.65048217773438, 75.72804260253906, 82.80561065673828, 89.8831787109375, 96.96073913574219, 104.0383071899414, 111.11587524414062, 118.19343566894531, 125.27100372314453, 132.34857177734375, 139.42613220214844, 146.50369262695312, 153.58126831054688, 160.6588134765625, 167.7363739013672, 174.81394958496094, 181.89151000976562, 188.9690704345703, 196.046630859375, 203.12420654296875, 210.20176696777344, 217.27932739257812, 224.3568878173828, 231.43446350097656, 238.51202392578125, 245.58958435058594, 252.66714477539062, 259.7447204589844, 266.8222961425781, 273.89984130859375, 280.9774169921875, 288.0549621582031, 295.1325378417969, 302.2101135253906, 309.28765869140625, 316.365234375, 323.44281005859375, 330.5203857421875, 337.59796142578125, 344.6755065917969, 351.7530822753906, 358.8306579589844, 365.908203125, 372.98577880859375, 380.0633544921875, 387.1408996582031]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 9.0, 15.0, 7.0, 14.0, 13.0, 27.0, 20.0, 21.0, 26.0, 39.0, 41.0, 38.0, 37.0, 49.0, 50.0, 43.0, 54.0, 43.0, 49.0, 36.0, 45.0, 36.0, 43.0, 35.0, 23.0, 28.0, 24.0, 26.0, 18.0, 18.0, 16.0, 12.0, 11.0, 11.0, 7.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.03872680664062, -73.7930908203125, -71.54745483398438, -69.30182647705078, -67.05619049072266, -64.81055450439453, -62.564918518066406, -60.31928253173828, -58.07365036010742, -55.8280143737793, -53.58238220214844, -51.33674621582031, -49.09111022949219, -46.84547805786133, -44.5998420715332, -42.354209899902344, -40.10857391357422, -37.862937927246094, -35.617305755615234, -33.37166976928711, -31.126035690307617, -28.880401611328125, -26.634765625, -24.389131546020508, -22.143497467041016, -19.897863388061523, -17.65222930908203, -15.406593322753906, -13.160959243774414, -10.915325164794922, -8.669690132141113, -6.424055099487305, -4.1784210205078125, -1.932786464691162, 0.3128480911254883, 2.5584826469421387, 4.804117202758789, 7.049751281738281, 9.29538631439209, 11.541021347045898, 13.78665542602539, 16.032289505004883, 18.277923583984375, 20.5235595703125, 22.769193649291992, 25.014827728271484, 27.26046371459961, 29.5060977935791, 31.751731872558594, 33.99736785888672, 36.24300003051758, 38.4886360168457, 40.73426818847656, 42.97990417480469, 45.22554016113281, 47.47117614746094, 49.7168083190918, 51.96244430541992, 54.20807647705078, 56.453712463378906, 58.69934844970703, 60.94498062133789, 63.190616607666016, 65.43624877929688, 67.681884765625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 4.0, 9.0, 7.0, 16.0, 10.0, 11.0, 29.0, 24.0, 21.0, 21.0, 29.0, 38.0, 35.0, 41.0, 35.0, 52.0, 48.0, 52.0, 53.0, 48.0, 40.0, 46.0, 34.0, 34.0, 39.0, 35.0, 32.0, 24.0, 22.0, 16.0, 18.0, 19.0, 9.0, 12.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.69921875, -5.52685546875, -5.3544921875, -5.18212890625, -5.009765625, -4.83740234375, -4.6650390625, -4.49267578125, -4.3203125, -4.14794921875, -3.9755859375, -3.80322265625, -3.630859375, -3.45849609375, -3.2861328125, -3.11376953125, -2.94140625, -2.76904296875, -2.5966796875, -2.42431640625, -2.251953125, -2.07958984375, -1.9072265625, -1.73486328125, -1.5625, -1.39013671875, -1.2177734375, -1.04541015625, -0.873046875, -0.70068359375, -0.5283203125, -0.35595703125, -0.18359375, -0.01123046875, 0.1611328125, 0.33349609375, 0.505859375, 0.67822265625, 0.8505859375, 1.02294921875, 1.1953125, 1.36767578125, 1.5400390625, 1.71240234375, 1.884765625, 2.05712890625, 2.2294921875, 2.40185546875, 2.57421875, 2.74658203125, 2.9189453125, 3.09130859375, 3.263671875, 3.43603515625, 3.6083984375, 3.78076171875, 3.953125, 4.12548828125, 4.2978515625, 4.47021484375, 4.642578125, 4.81494140625, 4.9873046875, 5.15966796875, 5.33203125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 8.0, 8.0, 9.0, 21.0, 22.0, 36.0, 59.0, 80.0, 139.0, 224.0, 347.0, 526.0, 870.0, 1516.0, 2338.0, 3793.0, 6292.0, 10531.0, 17589.0, 30956.0, 56415.0, 107633.0, 207828.0, 265526.0, 155024.0, 79371.0, 42186.0, 23847.0, 13788.0, 8517.0, 5000.0, 3027.0, 1886.0, 1175.0, 714.0, 450.0, 303.0, 179.0, 104.0, 77.0, 63.0, 29.0, 25.0, 10.0, 5.0, 8.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.84814453125, -0.8218612670898438, -0.7955780029296875, -0.7692947387695312, -0.743011474609375, -0.7167282104492188, -0.6904449462890625, -0.6641616821289062, -0.63787841796875, -0.6115951538085938, -0.5853118896484375, -0.5590286254882812, -0.532745361328125, -0.5064620971679688, -0.4801788330078125, -0.45389556884765625, -0.4276123046875, -0.40132904052734375, -0.3750457763671875, -0.34876251220703125, -0.322479248046875, -0.29619598388671875, -0.2699127197265625, -0.24362945556640625, -0.21734619140625, -0.19106292724609375, -0.1647796630859375, -0.13849639892578125, -0.112213134765625, -0.08592987060546875, -0.0596466064453125, -0.03336334228515625, -0.007080078125, 0.01920318603515625, 0.0454864501953125, 0.07176971435546875, 0.098052978515625, 0.12433624267578125, 0.1506195068359375, 0.17690277099609375, 0.20318603515625, 0.22946929931640625, 0.2557525634765625, 0.28203582763671875, 0.308319091796875, 0.33460235595703125, 0.3608856201171875, 0.38716888427734375, 0.4134521484375, 0.43973541259765625, 0.4660186767578125, 0.49230194091796875, 0.518585205078125, 0.5448684692382812, 0.5711517333984375, 0.5974349975585938, 0.62371826171875, 0.6500015258789062, 0.6762847900390625, 0.7025680541992188, 0.728851318359375, 0.7551345825195312, 0.7814178466796875, 0.8077011108398438, 0.833984375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 1.0, 5.0, 8.0, 8.0, 12.0, 13.0, 13.0, 15.0, 22.0, 16.0, 18.0, 29.0, 34.0, 31.0, 38.0, 30.0, 43.0, 42.0, 37.0, 35.0, 1062.0, 47.0, 41.0, 43.0, 40.0, 40.0, 34.0, 31.0, 21.0, 36.0, 27.0, 18.0, 22.0, 20.0, 13.0, 9.0, 13.0, 11.0, 13.0, 9.0, 5.0, 3.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.046875, -2.95404052734375, -2.8612060546875, -2.76837158203125, -2.675537109375, -2.58270263671875, -2.4898681640625, -2.39703369140625, -2.30419921875, -2.21136474609375, -2.1185302734375, -2.02569580078125, -1.932861328125, -1.84002685546875, -1.7471923828125, -1.65435791015625, -1.5615234375, -1.46868896484375, -1.3758544921875, -1.28302001953125, -1.190185546875, -1.09735107421875, -1.0045166015625, -0.91168212890625, -0.81884765625, -0.72601318359375, -0.6331787109375, -0.54034423828125, -0.447509765625, -0.35467529296875, -0.2618408203125, -0.16900634765625, -0.076171875, 0.01666259765625, 0.1094970703125, 0.20233154296875, 0.295166015625, 0.38800048828125, 0.4808349609375, 0.57366943359375, 0.66650390625, 0.75933837890625, 0.8521728515625, 0.94500732421875, 1.037841796875, 1.13067626953125, 1.2235107421875, 1.31634521484375, 1.4091796875, 1.50201416015625, 1.5948486328125, 1.68768310546875, 1.780517578125, 1.87335205078125, 1.9661865234375, 2.05902099609375, 2.15185546875, 2.24468994140625, 2.3375244140625, 2.43035888671875, 2.523193359375, 2.61602783203125, 2.7088623046875, 2.80169677734375, 2.89453125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 12.0, 20.0, 5.0, 23.0, 35.0, 48.0, 76.0, 118.0, 191.0, 302.0, 468.0, 697.0, 1094.0, 1744.0, 2656.0, 4147.0, 6836.0, 11058.0, 18394.0, 30924.0, 53800.0, 92689.0, 150625.0, 1238732.0, 188697.0, 119784.0, 71244.0, 41271.0, 23630.0, 14274.0, 8888.0, 5369.0, 3350.0, 2135.0, 1337.0, 910.0, 566.0, 314.0, 238.0, 141.0, 94.0, 59.0, 47.0, 31.0, 23.0, 10.0, 16.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.421875, -0.4076957702636719, -0.39351654052734375, -0.3793373107910156, -0.3651580810546875, -0.3509788513183594, -0.33679962158203125, -0.3226203918457031, -0.308441162109375, -0.2942619323730469, -0.28008270263671875, -0.2659034729003906, -0.2517242431640625, -0.23754501342773438, -0.22336578369140625, -0.20918655395507812, -0.19500732421875, -0.18082809448242188, -0.16664886474609375, -0.15246963500976562, -0.1382904052734375, -0.12411117553710938, -0.10993194580078125, -0.09575271606445312, -0.081573486328125, -0.06739425659179688, -0.05321502685546875, -0.039035797119140625, -0.0248565673828125, -0.010677337646484375, 0.00350189208984375, 0.017681121826171875, 0.0318603515625, 0.046039581298828125, 0.06021881103515625, 0.07439804077148438, 0.0885772705078125, 0.10275650024414062, 0.11693572998046875, 0.13111495971679688, 0.145294189453125, 0.15947341918945312, 0.17365264892578125, 0.18783187866210938, 0.2020111083984375, 0.21619033813476562, 0.23036956787109375, 0.24454879760742188, 0.25872802734375, 0.2729072570800781, 0.28708648681640625, 0.3012657165527344, 0.3154449462890625, 0.3296241760253906, 0.34380340576171875, 0.3579826354980469, 0.372161865234375, 0.3863410949707031, 0.40052032470703125, 0.4146995544433594, 0.4288787841796875, 0.4430580139160156, 0.45723724365234375, 0.4714164733886719, 0.485595703125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 9.0, 7.0, 10.0, 13.0, 11.0, 19.0, 32.0, 34.0, 53.0, 49.0, 64.0, 68.0, 76.0, 89.0, 91.0, 66.0, 56.0, 40.0, 51.0, 24.0, 19.0, 26.0, 18.0, 15.0, 14.0, 7.0, 8.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0090484619140625, -0.008799135684967041, -0.008549809455871582, -0.008300483226776123, -0.008051156997680664, -0.007801830768585205, -0.007552504539489746, -0.007303178310394287, -0.007053852081298828, -0.006804525852203369, -0.00655519962310791, -0.006305873394012451, -0.006056547164916992, -0.005807220935821533, -0.005557894706726074, -0.005308568477630615, -0.005059242248535156, -0.004809916019439697, -0.004560589790344238, -0.004311263561248779, -0.00406193733215332, -0.0038126111030578613, -0.0035632848739624023, -0.0033139586448669434, -0.0030646324157714844, -0.0028153061866760254, -0.0025659799575805664, -0.0023166537284851074, -0.0020673274993896484, -0.0018180012702941895, -0.0015686750411987305, -0.0013193488121032715, -0.0010700225830078125, -0.0008206963539123535, -0.0005713701248168945, -0.00032204389572143555, -7.271766662597656e-05, 0.00017660856246948242, 0.0004259347915649414, 0.0006752610206604004, 0.0009245872497558594, 0.0011739134788513184, 0.0014232397079467773, 0.0016725659370422363, 0.0019218921661376953, 0.0021712183952331543, 0.0024205446243286133, 0.0026698708534240723, 0.0029191970825195312, 0.0031685233116149902, 0.0034178495407104492, 0.003667175769805908, 0.003916501998901367, 0.004165828227996826, 0.004415154457092285, 0.004664480686187744, 0.004913806915283203, 0.005163133144378662, 0.005412459373474121, 0.00566178560256958, 0.005911111831665039, 0.006160438060760498, 0.006409764289855957, 0.006659090518951416, 0.006908416748046875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 6.0, 10.0, 13.0, 14.0, 16.0, 19.0, 22.0, 38.0, 53.0, 60.0, 72.0, 108.0, 165.0, 242.0, 352.0, 797.0, 57495.0, 986304.0, 1265.0, 493.0, 295.0, 166.0, 131.0, 109.0, 67.0, 37.0, 45.0, 43.0, 22.0, 25.0, 15.0, 12.0, 12.0, 3.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1494140625, -0.14490890502929688, -0.14040374755859375, -0.13589859008789062, -0.1313934326171875, -0.12688827514648438, -0.12238311767578125, -0.11787796020507812, -0.113372802734375, -0.10886764526367188, -0.10436248779296875, -0.09985733032226562, -0.0953521728515625, -0.09084701538085938, -0.08634185791015625, -0.08183670043945312, -0.07733154296875, -0.07282638549804688, -0.06832122802734375, -0.06381607055664062, -0.0593109130859375, -0.054805755615234375, -0.05030059814453125, -0.045795440673828125, -0.041290283203125, -0.036785125732421875, -0.03227996826171875, -0.027774810791015625, -0.0232696533203125, -0.018764495849609375, -0.01425933837890625, -0.009754180908203125, -0.0052490234375, -0.000743865966796875, 0.00376129150390625, 0.008266448974609375, 0.0127716064453125, 0.017276763916015625, 0.02178192138671875, 0.026287078857421875, 0.030792236328125, 0.035297393798828125, 0.03980255126953125, 0.044307708740234375, 0.0488128662109375, 0.053318023681640625, 0.05782318115234375, 0.062328338623046875, 0.06683349609375, 0.07133865356445312, 0.07584381103515625, 0.08034896850585938, 0.0848541259765625, 0.08935928344726562, 0.09386444091796875, 0.09836959838867188, 0.102874755859375, 0.10737991333007812, 0.11188507080078125, 0.11639022827148438, 0.1208953857421875, 0.12540054321289062, 0.12990570068359375, 0.13441085815429688, 0.138916015625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 11.0, 1002.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11226686835289001, -0.10927265882492065, -0.1062784492969513, -0.10328423976898193, -0.10029003024101257, -0.09729582071304321, -0.09430161118507385, -0.09130740165710449, -0.08831319212913513, -0.08531898260116577, -0.08232477307319641, -0.07933056354522705, -0.07633635401725769, -0.07334214448928833, -0.07034793496131897, -0.06735372543334961, -0.06435952335596085, -0.061365313827991486, -0.058371104300022125, -0.055376894772052765, -0.052382685244083405, -0.049388475716114044, -0.04639426991343498, -0.04340006038546562, -0.04040585085749626, -0.0374116413295269, -0.03441743180155754, -0.03142322599887848, -0.02842901460826397, -0.02543480508029461, -0.022440597414970398, -0.019446387887001038, -0.01645217090845108, -0.01345796138048172, -0.010463752783834934, -0.0074695441871881485, -0.004475334659218788, -0.0014811251312494278, 0.0015130825340747833, 0.004507292062044144, 0.007501501590013504, 0.010495711117982864, 0.01348991971462965, 0.016484128311276436, 0.019478337839245796, 0.022472547367215157, 0.025466755032539368, 0.028460964560508728, 0.03145517408847809, 0.03444938361644745, 0.03744359314441681, 0.04043780267238617, 0.04343201220035553, 0.04642622172832489, 0.04942042753100395, 0.05241463705897331, 0.05540884658694267, 0.05840305611491203, 0.06139726564288139, 0.06439147144556046, 0.06738568097352982, 0.07037989050149918, 0.07337410002946854, 0.0763683095574379, 0.07936251908540726]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 14.0, 10.0, 13.0, 15.0, 21.0, 31.0, 33.0, 31.0, 52.0, 54.0, 51.0, 73.0, 45.0, 54.0, 63.0, 50.0, 56.0, 53.0, 51.0, 37.0, 44.0, 38.0, 21.0, 27.0, 20.0, 9.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008620798587799072, -0.008395712822675705, -0.008170627057552338, -0.00794554129242897, -0.007720455527305603, -0.007495369762182236, -0.007270283997058868, -0.007045198231935501, -0.006820112466812134, -0.0065950267016887665, -0.006369940936565399, -0.006144855171442032, -0.0059197694063186646, -0.005694683641195297, -0.00546959787607193, -0.005244512110948563, -0.005019426345825195, -0.004794340580701828, -0.004569254815578461, -0.004344169050455093, -0.004119083285331726, -0.0038939975202083588, -0.0036689117550849915, -0.003443825989961624, -0.003218740224838257, -0.0029936544597148895, -0.002768568694591522, -0.002543482929468155, -0.0023183971643447876, -0.0020933113992214203, -0.001868225634098053, -0.0016431398689746857, -0.0014180541038513184, -0.001192968338727951, -0.0009678825736045837, -0.0007427968084812164, -0.0005177110433578491, -0.0002926252782344818, -6.75395131111145e-05, 0.0001575462520122528, 0.0003826320171356201, 0.0006077177822589874, 0.0008328035473823547, 0.001057889312505722, 0.0012829750776290894, 0.0015080608427524567, 0.001733146607875824, 0.0019582323729991913, 0.0021833181381225586, 0.002408403903245926, 0.002633489668369293, 0.0028585754334926605, 0.003083661198616028, 0.003308746963739395, 0.0035338327288627625, 0.0037589184939861298, 0.003984004259109497, 0.004209090024232864, 0.004434175789356232, 0.004659261554479599, 0.004884347319602966, 0.005109433084726334, 0.005334518849849701, 0.005559604614973068, 0.0057846903800964355]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 4.0, 9.0, 7.0, 16.0, 10.0, 11.0, 29.0, 24.0, 21.0, 21.0, 29.0, 38.0, 35.0, 41.0, 35.0, 52.0, 48.0, 52.0, 53.0, 48.0, 40.0, 46.0, 34.0, 34.0, 39.0, 35.0, 32.0, 24.0, 22.0, 16.0, 18.0, 19.0, 9.0, 12.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.69921875, -5.52685546875, -5.3544921875, -5.18212890625, -5.009765625, -4.83740234375, -4.6650390625, -4.49267578125, -4.3203125, -4.14794921875, -3.9755859375, -3.80322265625, -3.630859375, -3.45849609375, -3.2861328125, -3.11376953125, -2.94140625, -2.76904296875, -2.5966796875, -2.42431640625, -2.251953125, -2.07958984375, -1.9072265625, -1.73486328125, -1.5625, -1.39013671875, -1.2177734375, -1.04541015625, -0.873046875, -0.70068359375, -0.5283203125, -0.35595703125, -0.18359375, -0.01123046875, 0.1611328125, 0.33349609375, 0.505859375, 0.67822265625, 0.8505859375, 1.02294921875, 1.1953125, 1.36767578125, 1.5400390625, 1.71240234375, 1.884765625, 2.05712890625, 2.2294921875, 2.40185546875, 2.57421875, 2.74658203125, 2.9189453125, 3.09130859375, 3.263671875, 3.43603515625, 3.6083984375, 3.78076171875, 3.953125, 4.12548828125, 4.2978515625, 4.47021484375, 4.642578125, 4.81494140625, 4.9873046875, 5.15966796875, 5.33203125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 2.0, 8.0, 12.0, 4.0, 18.0, 31.0, 38.0, 60.0, 58.0, 84.0, 150.0, 188.0, 246.0, 393.0, 503.0, 711.0, 958.0, 1418.0, 2043.0, 3047.0, 4476.0, 7408.0, 12693.0, 27574.0, 81385.0, 407033.0, 363775.0, 74668.0, 26086.0, 12381.0, 6974.0, 4431.0, 2899.0, 1954.0, 1423.0, 991.0, 689.0, 497.0, 362.0, 253.0, 159.0, 135.0, 96.0, 65.0, 49.0, 38.0, 25.0, 23.0, 16.0, 9.0, 2.0, 11.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-15.7109375, -15.234375, -14.7578125, -14.28125, -13.8046875, -13.328125, -12.8515625, -12.375, -11.8984375, -11.421875, -10.9453125, -10.46875, -9.9921875, -9.515625, -9.0390625, -8.5625, -8.0859375, -7.609375, -7.1328125, -6.65625, -6.1796875, -5.703125, -5.2265625, -4.75, -4.2734375, -3.796875, -3.3203125, -2.84375, -2.3671875, -1.890625, -1.4140625, -0.9375, -0.4609375, 0.015625, 0.4921875, 0.96875, 1.4453125, 1.921875, 2.3984375, 2.875, 3.3515625, 3.828125, 4.3046875, 4.78125, 5.2578125, 5.734375, 6.2109375, 6.6875, 7.1640625, 7.640625, 8.1171875, 8.59375, 9.0703125, 9.546875, 10.0234375, 10.5, 10.9765625, 11.453125, 11.9296875, 12.40625, 12.8828125, 13.359375, 13.8359375, 14.3125, 14.7890625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 7.0, 14.0, 9.0, 19.0, 23.0, 18.0, 27.0, 31.0, 37.0, 47.0, 38.0, 59.0, 69.0, 81.0, 149.0, 1489.0, 352.0, 105.0, 67.0, 79.0, 56.0, 45.0, 33.0, 45.0, 36.0, 15.0, 20.0, 12.0, 19.0, 11.0, 6.0, 6.0, 6.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-23.828125, -23.215576171875, -22.60302734375, -21.990478515625, -21.3779296875, -20.765380859375, -20.15283203125, -19.540283203125, -18.927734375, -18.315185546875, -17.70263671875, -17.090087890625, -16.4775390625, -15.864990234375, -15.25244140625, -14.639892578125, -14.02734375, -13.414794921875, -12.80224609375, -12.189697265625, -11.5771484375, -10.964599609375, -10.35205078125, -9.739501953125, -9.126953125, -8.514404296875, -7.90185546875, -7.289306640625, -6.6767578125, -6.064208984375, -5.45166015625, -4.839111328125, -4.2265625, -3.614013671875, -3.00146484375, -2.388916015625, -1.7763671875, -1.163818359375, -0.55126953125, 0.061279296875, 0.673828125, 1.286376953125, 1.89892578125, 2.511474609375, 3.1240234375, 3.736572265625, 4.34912109375, 4.961669921875, 5.57421875, 6.186767578125, 6.79931640625, 7.411865234375, 8.0244140625, 8.636962890625, 9.24951171875, 9.862060546875, 10.474609375, 11.087158203125, 11.69970703125, 12.312255859375, 12.9248046875, 13.537353515625, 14.14990234375, 14.762451171875, 15.375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 3.0, 10.0, 13.0, 8.0, 13.0, 17.0, 26.0, 35.0, 29.0, 49.0, 58.0, 108.0, 213.0, 797.0, 20860.0, 3115962.0, 6312.0, 594.0, 216.0, 87.0, 52.0, 45.0, 32.0, 25.0, 28.0, 20.0, 20.0, 20.0, 9.0, 11.0, 7.0, 4.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.0625, -69.2255859375, -66.388671875, -63.5517578125, -60.71484375, -57.8779296875, -55.041015625, -52.2041015625, -49.3671875, -46.5302734375, -43.693359375, -40.8564453125, -38.01953125, -35.1826171875, -32.345703125, -29.5087890625, -26.671875, -23.8349609375, -20.998046875, -18.1611328125, -15.32421875, -12.4873046875, -9.650390625, -6.8134765625, -3.9765625, -1.1396484375, 1.697265625, 4.5341796875, 7.37109375, 10.2080078125, 13.044921875, 15.8818359375, 18.71875, 21.5556640625, 24.392578125, 27.2294921875, 30.06640625, 32.9033203125, 35.740234375, 38.5771484375, 41.4140625, 44.2509765625, 47.087890625, 49.9248046875, 52.76171875, 55.5986328125, 58.435546875, 61.2724609375, 64.109375, 66.9462890625, 69.783203125, 72.6201171875, 75.45703125, 78.2939453125, 81.130859375, 83.9677734375, 86.8046875, 89.6416015625, 92.478515625, 95.3154296875, 98.15234375, 100.9892578125, 103.826171875, 106.6630859375, 109.5]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 135.0, 794.0, 75.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.062835693359375, -45.86117935180664, -39.659523010253906, -33.457862854003906, -27.256208419799805, -21.05455207824707, -14.852893829345703, -8.651237487792969, -2.4495811462402344, 3.752075672149658, 9.95373249053955, 16.1553897857666, 22.357046127319336, 28.55870246887207, 34.76036071777344, 40.96201705932617, 47.163673400878906, 53.36532974243164, 59.566986083984375, 65.76864624023438, 71.97029876708984, 78.17195892333984, 84.37361145019531, 90.57527160644531, 96.77693176269531, 102.97859191894531, 109.18024444580078, 115.38190460205078, 121.58355712890625, 127.78521728515625, 133.98687744140625, 140.18853759765625, 146.3901824951172, 152.5918426513672, 158.7935028076172, 164.99514770507812, 171.19680786132812, 177.39846801757812, 183.60012817382812, 189.80178833007812, 196.00343322753906, 202.20509338378906, 208.40675354003906, 214.6083984375, 220.81005859375, 227.01171875, 233.21337890625, 239.4150390625, 245.61669921875, 251.818359375, 258.02001953125, 264.2216796875, 270.42333984375, 276.6249694824219, 282.8266296386719, 289.0282897949219, 295.2299499511719, 301.4316101074219, 307.6332702636719, 313.8349304199219, 320.0365905761719, 326.23822021484375, 332.43988037109375, 338.64154052734375, 344.84320068359375]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 9.0, 6.0, 8.0, 17.0, 12.0, 16.0, 14.0, 9.0, 12.0, 21.0, 26.0, 24.0, 31.0, 41.0, 27.0, 34.0, 34.0, 42.0, 35.0, 41.0, 45.0, 37.0, 36.0, 34.0, 34.0, 26.0, 25.0, 32.0, 38.0, 25.0, 21.0, 33.0, 18.0, 26.0, 24.0, 17.0, 13.0, 10.0, 8.0, 10.0, 6.0, 1.0, 7.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-46.61278533935547, -45.103759765625, -43.5947380065918, -42.08571243286133, -40.576690673828125, -39.067665100097656, -37.55864334106445, -36.049617767333984, -34.54059600830078, -33.03157043457031, -31.52254867553711, -30.013525009155273, -28.504501342773438, -26.9954776763916, -25.486454010009766, -23.977428436279297, -22.46840476989746, -20.959381103515625, -19.45035743713379, -17.941333770751953, -16.432310104370117, -14.923286437988281, -13.414261817932129, -11.905238151550293, -10.396214485168457, -8.887190818786621, -7.378167152404785, -5.869143009185791, -4.360119342803955, -2.851095676422119, -1.342071533203125, 0.16695213317871094, 1.6759757995605469, 3.184999465942383, 4.694023132324219, 6.203047275543213, 7.712070941925049, 9.221094131469727, 10.730118751525879, 12.239142417907715, 13.74816608428955, 15.257189750671387, 16.76621437072754, 18.275238037109375, 19.78426170349121, 21.293285369873047, 22.802309036254883, 24.31133270263672, 25.820356369018555, 27.32938003540039, 28.838403701782227, 30.347427368164062, 31.8564510345459, 33.365474700927734, 34.8745002746582, 36.383522033691406, 37.892547607421875, 39.401573181152344, 40.91059494018555, 42.419620513916016, 43.92864227294922, 45.43766784667969, 46.94668960571289, 48.45571517944336, 49.96473693847656]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 6.0, 2.0, 4.0, 8.0, 10.0, 12.0, 17.0, 12.0, 26.0, 26.0, 22.0, 24.0, 21.0, 32.0, 39.0, 29.0, 37.0, 34.0, 51.0, 47.0, 39.0, 57.0, 46.0, 36.0, 39.0, 31.0, 29.0, 43.0, 38.0, 21.0, 20.0, 18.0, 20.0, 20.0, 18.0, 14.0, 13.0, 10.0, 2.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.54296875, -5.37347412109375, -5.2039794921875, -5.03448486328125, -4.864990234375, -4.69549560546875, -4.5260009765625, -4.35650634765625, -4.18701171875, -4.01751708984375, -3.8480224609375, -3.67852783203125, -3.509033203125, -3.33953857421875, -3.1700439453125, -3.00054931640625, -2.8310546875, -2.66156005859375, -2.4920654296875, -2.32257080078125, -2.153076171875, -1.98358154296875, -1.8140869140625, -1.64459228515625, -1.47509765625, -1.30560302734375, -1.1361083984375, -0.96661376953125, -0.797119140625, -0.62762451171875, -0.4581298828125, -0.28863525390625, -0.119140625, 0.05035400390625, 0.2198486328125, 0.38934326171875, 0.558837890625, 0.72833251953125, 0.8978271484375, 1.06732177734375, 1.23681640625, 1.40631103515625, 1.5758056640625, 1.74530029296875, 1.914794921875, 2.08428955078125, 2.2537841796875, 2.42327880859375, 2.5927734375, 2.76226806640625, 2.9317626953125, 3.10125732421875, 3.270751953125, 3.44024658203125, 3.6097412109375, 3.77923583984375, 3.94873046875, 4.11822509765625, 4.2877197265625, 4.45721435546875, 4.626708984375, 4.79620361328125, 4.9656982421875, 5.13519287109375, 5.3046875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 8.0, 3.0, 7.0, 7.0, 15.0, 17.0, 15.0, 23.0, 30.0, 40.0, 51.0, 87.0, 102.0, 118.0, 194.0, 297.0, 412.0, 811.0, 1849.0, 5868.0, 25619.0, 185216.0, 2662572.0, 1199887.0, 88994.0, 14833.0, 3906.0, 1407.0, 640.0, 390.0, 226.0, 158.0, 127.0, 88.0, 60.0, 51.0, 44.0, 29.0, 20.0, 22.0, 12.0, 10.0, 7.0, 3.0, 5.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.734375, -25.89453125, -25.0546875, -24.21484375, -23.375, -22.53515625, -21.6953125, -20.85546875, -20.015625, -19.17578125, -18.3359375, -17.49609375, -16.65625, -15.81640625, -14.9765625, -14.13671875, -13.296875, -12.45703125, -11.6171875, -10.77734375, -9.9375, -9.09765625, -8.2578125, -7.41796875, -6.578125, -5.73828125, -4.8984375, -4.05859375, -3.21875, -2.37890625, -1.5390625, -0.69921875, 0.140625, 0.98046875, 1.8203125, 2.66015625, 3.5, 4.33984375, 5.1796875, 6.01953125, 6.859375, 7.69921875, 8.5390625, 9.37890625, 10.21875, 11.05859375, 11.8984375, 12.73828125, 13.578125, 14.41796875, 15.2578125, 16.09765625, 16.9375, 17.77734375, 18.6171875, 19.45703125, 20.296875, 21.13671875, 21.9765625, 22.81640625, 23.65625, 24.49609375, 25.3359375, 26.17578125, 27.015625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 3.0, 0.0, 6.0, 8.0, 9.0, 15.0, 15.0, 21.0, 46.0, 58.0, 96.0, 109.0, 133.0, 215.0, 238.0, 334.0, 398.0, 491.0, 444.0, 351.0, 297.0, 240.0, 156.0, 99.0, 85.0, 63.0, 40.0, 30.0, 21.0, 17.0, 9.0, 12.0, 4.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-24.453125, -23.819580078125, -23.18603515625, -22.552490234375, -21.9189453125, -21.285400390625, -20.65185546875, -20.018310546875, -19.384765625, -18.751220703125, -18.11767578125, -17.484130859375, -16.8505859375, -16.217041015625, -15.58349609375, -14.949951171875, -14.31640625, -13.682861328125, -13.04931640625, -12.415771484375, -11.7822265625, -11.148681640625, -10.51513671875, -9.881591796875, -9.248046875, -8.614501953125, -7.98095703125, -7.347412109375, -6.7138671875, -6.080322265625, -5.44677734375, -4.813232421875, -4.1796875, -3.546142578125, -2.91259765625, -2.279052734375, -1.6455078125, -1.011962890625, -0.37841796875, 0.255126953125, 0.888671875, 1.522216796875, 2.15576171875, 2.789306640625, 3.4228515625, 4.056396484375, 4.68994140625, 5.323486328125, 5.95703125, 6.590576171875, 7.22412109375, 7.857666015625, 8.4912109375, 9.124755859375, 9.75830078125, 10.391845703125, 11.025390625, 11.658935546875, 12.29248046875, 12.926025390625, 13.5595703125, 14.193115234375, 14.82666015625, 15.460205078125, 16.09375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 11.0, 10.0, 19.0, 42.0, 63.0, 84.0, 215.0, 521.0, 2087.0, 23776.0, 2144667.0, 1996869.0, 22929.0, 2011.0, 525.0, 208.0, 100.0, 49.0, 32.0, 21.0, 13.0, 4.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.3125, -55.7763671875, -53.240234375, -50.7041015625, -48.16796875, -45.6318359375, -43.095703125, -40.5595703125, -38.0234375, -35.4873046875, -32.951171875, -30.4150390625, -27.87890625, -25.3427734375, -22.806640625, -20.2705078125, -17.734375, -15.1982421875, -12.662109375, -10.1259765625, -7.58984375, -5.0537109375, -2.517578125, 0.0185546875, 2.5546875, 5.0908203125, 7.626953125, 10.1630859375, 12.69921875, 15.2353515625, 17.771484375, 20.3076171875, 22.84375, 25.3798828125, 27.916015625, 30.4521484375, 32.98828125, 35.5244140625, 38.060546875, 40.5966796875, 43.1328125, 45.6689453125, 48.205078125, 50.7412109375, 53.27734375, 55.8134765625, 58.349609375, 60.8857421875, 63.421875, 65.9580078125, 68.494140625, 71.0302734375, 73.56640625, 76.1025390625, 78.638671875, 81.1748046875, 83.7109375, 86.2470703125, 88.783203125, 91.3193359375, 93.85546875, 96.3916015625, 98.927734375, 101.4638671875, 104.0]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 15.0, 117.0, 377.0, 381.0, 105.0, 16.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.77667236328125, -77.08786010742188, -67.3990478515625, -57.71023941040039, -48.021427154541016, -38.33261489868164, -28.64380645751953, -18.954994201660156, -9.266181945800781, 0.42262935638427734, 10.111440658569336, 19.800251007080078, 29.489063262939453, 39.17787551879883, 48.86668395996094, 58.55549621582031, 68.24430847167969, 77.93312072753906, 87.62193298339844, 97.31074523925781, 106.99955749511719, 116.68836975097656, 126.3771743774414, 136.06597900390625, 145.75479125976562, 155.443603515625, 165.13241577148438, 174.82122802734375, 184.51004028320312, 194.1988525390625, 203.88766479492188, 213.57647705078125, 223.26528930664062, 232.9541015625, 242.64291381835938, 252.33172607421875, 262.0205383300781, 271.7093505859375, 281.3981628417969, 291.08697509765625, 300.7757873535156, 310.464599609375, 320.1534118652344, 329.84222412109375, 339.5310363769531, 349.2198486328125, 358.9086608886719, 368.59747314453125, 378.2862548828125, 387.9750671386719, 397.66387939453125, 407.3526916503906, 417.04150390625, 426.7303161621094, 436.41912841796875, 446.1079406738281, 455.7967529296875, 465.4855651855469, 475.17437744140625, 484.8631896972656, 494.552001953125, 504.2408142089844, 513.9296264648438, 523.618408203125, 533.3072509765625]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 6.0, 4.0, 3.0, 5.0, 7.0, 10.0, 6.0, 11.0, 12.0, 14.0, 13.0, 17.0, 16.0, 20.0, 21.0, 27.0, 26.0, 20.0, 38.0, 24.0, 29.0, 32.0, 37.0, 38.0, 33.0, 42.0, 47.0, 39.0, 39.0, 42.0, 33.0, 30.0, 30.0, 34.0, 28.0, 30.0, 18.0, 17.0, 17.0, 21.0, 16.0, 9.0, 8.0, 14.0, 10.0, 4.0, 2.0, 0.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.096397399902344, -50.28776168823242, -48.4791259765625, -46.67048645019531, -44.86185073852539, -43.05321502685547, -41.24457931518555, -39.435943603515625, -37.62730407714844, -35.818668365478516, -34.010032653808594, -32.201393127441406, -30.392757415771484, -28.584121704101562, -26.77548599243164, -24.966848373413086, -23.158212661743164, -21.349576950073242, -19.540939331054688, -17.732303619384766, -15.923666000366211, -14.115030288696289, -12.30639362335205, -10.497756958007812, -8.689120292663574, -6.880483627319336, -5.071846961975098, -3.2632107734680176, -1.4545741081237793, 0.3540620803833008, 2.162698745727539, 3.9713354110717773, 5.779972076416016, 7.588608741760254, 9.397245407104492, 11.205881118774414, 13.014518737792969, 14.82315444946289, 16.631790161132812, 18.440427780151367, 20.249065399169922, 22.057701110839844, 23.8663387298584, 25.67497444152832, 27.483612060546875, 29.292247772216797, 31.10088348388672, 32.909523010253906, 34.71815490722656, 36.526790618896484, 38.335426330566406, 40.144065856933594, 41.952701568603516, 43.76133728027344, 45.56997299194336, 47.37860870361328, 49.18724822998047, 50.99588394165039, 52.80451965332031, 54.6131591796875, 56.42179489135742, 58.230430603027344, 60.039066314697266, 61.84770202636719, 63.656341552734375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 5.0, 7.0, 5.0, 5.0, 7.0, 11.0, 19.0, 16.0, 22.0, 23.0, 26.0, 26.0, 22.0, 40.0, 28.0, 40.0, 50.0, 35.0, 45.0, 42.0, 37.0, 49.0, 38.0, 50.0, 36.0, 37.0, 36.0, 32.0, 31.0, 36.0, 27.0, 18.0, 22.0, 16.0, 15.0, 8.0, 6.0, 7.0, 7.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.98046875, -5.79681396484375, -5.6131591796875, -5.42950439453125, -5.245849609375, -5.06219482421875, -4.8785400390625, -4.69488525390625, -4.51123046875, -4.32757568359375, -4.1439208984375, -3.96026611328125, -3.776611328125, -3.59295654296875, -3.4093017578125, -3.22564697265625, -3.0419921875, -2.85833740234375, -2.6746826171875, -2.49102783203125, -2.307373046875, -2.12371826171875, -1.9400634765625, -1.75640869140625, -1.57275390625, -1.38909912109375, -1.2054443359375, -1.02178955078125, -0.838134765625, -0.65447998046875, -0.4708251953125, -0.28717041015625, -0.103515625, 0.08013916015625, 0.2637939453125, 0.44744873046875, 0.631103515625, 0.81475830078125, 0.9984130859375, 1.18206787109375, 1.36572265625, 1.54937744140625, 1.7330322265625, 1.91668701171875, 2.100341796875, 2.28399658203125, 2.4676513671875, 2.65130615234375, 2.8349609375, 3.01861572265625, 3.2022705078125, 3.38592529296875, 3.569580078125, 3.75323486328125, 3.9368896484375, 4.12054443359375, 4.30419921875, 4.48785400390625, 4.6715087890625, 4.85516357421875, 5.038818359375, 5.22247314453125, 5.4061279296875, 5.58978271484375, 5.7734375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 10.0, 18.0, 16.0, 27.0, 48.0, 68.0, 98.0, 172.0, 227.0, 342.0, 581.0, 909.0, 1434.0, 2321.0, 3550.0, 5903.0, 9838.0, 15715.0, 26152.0, 44905.0, 79685.0, 146801.0, 233214.0, 203592.0, 116856.0, 63638.0, 36395.0, 21777.0, 12996.0, 8018.0, 4901.0, 3103.0, 1973.0, 1223.0, 747.0, 474.0, 277.0, 202.0, 118.0, 59.0, 58.0, 32.0, 31.0, 16.0, 10.0, 8.0, 8.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.85986328125, -0.8336563110351562, -0.8074493408203125, -0.7812423706054688, -0.755035400390625, -0.7288284301757812, -0.7026214599609375, -0.6764144897460938, -0.65020751953125, -0.6240005493164062, -0.5977935791015625, -0.5715866088867188, -0.545379638671875, -0.5191726684570312, -0.4929656982421875, -0.46675872802734375, -0.4405517578125, -0.41434478759765625, -0.3881378173828125, -0.36193084716796875, -0.335723876953125, -0.30951690673828125, -0.2833099365234375, -0.25710296630859375, -0.23089599609375, -0.20468902587890625, -0.1784820556640625, -0.15227508544921875, -0.126068115234375, -0.09986114501953125, -0.0736541748046875, -0.04744720458984375, -0.021240234375, 0.00496673583984375, 0.0311737060546875, 0.05738067626953125, 0.083587646484375, 0.10979461669921875, 0.1360015869140625, 0.16220855712890625, 0.18841552734375, 0.21462249755859375, 0.2408294677734375, 0.26703643798828125, 0.293243408203125, 0.31945037841796875, 0.3456573486328125, 0.37186431884765625, 0.3980712890625, 0.42427825927734375, 0.4504852294921875, 0.47669219970703125, 0.502899169921875, 0.5291061401367188, 0.5553131103515625, 0.5815200805664062, 0.60772705078125, 0.6339340209960938, 0.6601409912109375, 0.6863479614257812, 0.712554931640625, 0.7387619018554688, 0.7649688720703125, 0.7911758422851562, 0.8173828125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 9.0, 7.0, 10.0, 11.0, 10.0, 13.0, 13.0, 17.0, 19.0, 20.0, 25.0, 15.0, 34.0, 34.0, 32.0, 33.0, 44.0, 50.0, 40.0, 42.0, 27.0, 1060.0, 37.0, 48.0, 47.0, 25.0, 40.0, 19.0, 24.0, 31.0, 26.0, 15.0, 27.0, 15.0, 13.0, 17.0, 7.0, 11.0, 6.0, 12.0, 9.0, 5.0, 4.0, 2.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1484375, -3.043548583984375, -2.93865966796875, -2.833770751953125, -2.7288818359375, -2.623992919921875, -2.51910400390625, -2.414215087890625, -2.309326171875, -2.204437255859375, -2.09954833984375, -1.994659423828125, -1.8897705078125, -1.784881591796875, -1.67999267578125, -1.575103759765625, -1.47021484375, -1.365325927734375, -1.26043701171875, -1.155548095703125, -1.0506591796875, -0.945770263671875, -0.84088134765625, -0.735992431640625, -0.631103515625, -0.526214599609375, -0.42132568359375, -0.316436767578125, -0.2115478515625, -0.106658935546875, -0.00177001953125, 0.103118896484375, 0.2080078125, 0.312896728515625, 0.41778564453125, 0.522674560546875, 0.6275634765625, 0.732452392578125, 0.83734130859375, 0.942230224609375, 1.047119140625, 1.152008056640625, 1.25689697265625, 1.361785888671875, 1.4666748046875, 1.571563720703125, 1.67645263671875, 1.781341552734375, 1.88623046875, 1.991119384765625, 2.09600830078125, 2.200897216796875, 2.3057861328125, 2.410675048828125, 2.51556396484375, 2.620452880859375, 2.725341796875, 2.830230712890625, 2.93511962890625, 3.040008544921875, 3.1448974609375, 3.249786376953125, 3.35467529296875, 3.459564208984375, 3.564453125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 12.0, 10.0, 10.0, 29.0, 31.0, 69.0, 91.0, 122.0, 207.0, 276.0, 420.0, 665.0, 1042.0, 1562.0, 2331.0, 3753.0, 5847.0, 9143.0, 15214.0, 25218.0, 42311.0, 70851.0, 115866.0, 172660.0, 1234233.0, 150801.0, 97103.0, 58284.0, 34258.0, 20379.0, 12414.0, 7787.0, 4918.0, 3180.0, 2040.0, 1375.0, 853.0, 578.0, 413.0, 221.0, 205.0, 110.0, 75.0, 58.0, 32.0, 18.0, 17.0, 15.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.465087890625, -0.4506950378417969, -0.43630218505859375, -0.4219093322753906, -0.4075164794921875, -0.3931236267089844, -0.37873077392578125, -0.3643379211425781, -0.349945068359375, -0.3355522155761719, -0.32115936279296875, -0.3067665100097656, -0.2923736572265625, -0.2779808044433594, -0.26358795166015625, -0.24919509887695312, -0.23480224609375, -0.22040939331054688, -0.20601654052734375, -0.19162368774414062, -0.1772308349609375, -0.16283798217773438, -0.14844512939453125, -0.13405227661132812, -0.119659423828125, -0.10526657104492188, -0.09087371826171875, -0.07648086547851562, -0.0620880126953125, -0.047695159912109375, -0.03330230712890625, -0.018909454345703125, -0.0045166015625, 0.009876251220703125, 0.02426910400390625, 0.038661956787109375, 0.0530548095703125, 0.06744766235351562, 0.08184051513671875, 0.09623336791992188, 0.110626220703125, 0.12501907348632812, 0.13941192626953125, 0.15380477905273438, 0.1681976318359375, 0.18259048461914062, 0.19698333740234375, 0.21137619018554688, 0.22576904296875, 0.24016189575195312, 0.25455474853515625, 0.2689476013183594, 0.2833404541015625, 0.2977333068847656, 0.31212615966796875, 0.3265190124511719, 0.340911865234375, 0.3553047180175781, 0.36969757080078125, 0.3840904235839844, 0.3984832763671875, 0.4128761291503906, 0.42726898193359375, 0.4416618347167969, 0.4560546875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 4.0, 9.0, 4.0, 13.0, 9.0, 15.0, 9.0, 21.0, 28.0, 32.0, 24.0, 32.0, 51.0, 60.0, 85.0, 94.0, 60.0, 83.0, 62.0, 49.0, 44.0, 38.0, 27.0, 28.0, 26.0, 13.0, 19.0, 11.0, 13.0, 5.0, 6.0, 4.0, 2.0, 3.0, 5.0, 1.0, 6.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00826263427734375, -0.008008003234863281, -0.0077533721923828125, -0.007498741149902344, -0.007244110107421875, -0.006989479064941406, -0.0067348480224609375, -0.006480216979980469, -0.0062255859375, -0.005970954895019531, -0.0057163238525390625, -0.005461692810058594, -0.005207061767578125, -0.004952430725097656, -0.0046977996826171875, -0.004443168640136719, -0.00418853759765625, -0.003933906555175781, -0.0036792755126953125, -0.0034246444702148438, -0.003170013427734375, -0.0029153823852539062, -0.0026607513427734375, -0.0024061203002929688, -0.0021514892578125, -0.0018968582153320312, -0.0016422271728515625, -0.0013875961303710938, -0.001132965087890625, -0.0008783340454101562, -0.0006237030029296875, -0.00036907196044921875, -0.00011444091796875, 0.00014019012451171875, 0.0003948211669921875, 0.0006494522094726562, 0.000904083251953125, 0.0011587142944335938, 0.0014133453369140625, 0.0016679763793945312, 0.001922607421875, 0.0021772384643554688, 0.0024318695068359375, 0.0026865005493164062, 0.002941131591796875, 0.0031957626342773438, 0.0034503936767578125, 0.0037050247192382812, 0.00395965576171875, 0.004214286804199219, 0.0044689178466796875, 0.004723548889160156, 0.004978179931640625, 0.005232810974121094, 0.0054874420166015625, 0.005742073059082031, 0.0059967041015625, 0.006251335144042969, 0.0065059661865234375, 0.006760597229003906, 0.007015228271484375, 0.007269859313964844, 0.0075244903564453125, 0.007779121398925781, 0.00803375244140625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 10.0, 11.0, 23.0, 16.0, 28.0, 38.0, 40.0, 47.0, 79.0, 126.0, 157.0, 306.0, 588.0, 4530.0, 997222.0, 43324.0, 939.0, 370.0, 191.0, 127.0, 94.0, 67.0, 46.0, 39.0, 25.0, 16.0, 13.0, 16.0, 8.0, 14.0, 5.0, 9.0, 5.0, 5.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0], "bins": [-0.2037353515625, -0.1984710693359375, -0.193206787109375, -0.1879425048828125, -0.18267822265625, -0.1774139404296875, -0.172149658203125, -0.1668853759765625, -0.16162109375, -0.1563568115234375, -0.151092529296875, -0.1458282470703125, -0.14056396484375, -0.1352996826171875, -0.130035400390625, -0.1247711181640625, -0.1195068359375, -0.1142425537109375, -0.108978271484375, -0.1037139892578125, -0.09844970703125, -0.0931854248046875, -0.087921142578125, -0.0826568603515625, -0.077392578125, -0.0721282958984375, -0.066864013671875, -0.0615997314453125, -0.05633544921875, -0.0510711669921875, -0.045806884765625, -0.0405426025390625, -0.0352783203125, -0.0300140380859375, -0.024749755859375, -0.0194854736328125, -0.01422119140625, -0.0089569091796875, -0.003692626953125, 0.0015716552734375, 0.0068359375, 0.0121002197265625, 0.017364501953125, 0.0226287841796875, 0.02789306640625, 0.0331573486328125, 0.038421630859375, 0.0436859130859375, 0.0489501953125, 0.0542144775390625, 0.059478759765625, 0.0647430419921875, 0.07000732421875, 0.0752716064453125, 0.080535888671875, 0.0858001708984375, 0.091064453125, 0.0963287353515625, 0.101593017578125, 0.1068572998046875, 0.11212158203125, 0.1173858642578125, 0.122650146484375, 0.1279144287109375, 0.1331787109375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 59.0, 950.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12076413631439209, -0.11665929853916168, -0.11255446076393127, -0.10844962298870087, -0.10434478521347046, -0.10023994743824005, -0.09613510221242905, -0.09203026443719864, -0.08792542666196823, -0.08382058888673782, -0.07971575111150742, -0.07561091333627701, -0.071506068110466, -0.0674012303352356, -0.06329639256000519, -0.05919155478477478, -0.05508671700954437, -0.050981879234313965, -0.04687704145908356, -0.04277219995856285, -0.03866736218333244, -0.034562524408102036, -0.03045768477022648, -0.02635284513235092, -0.022248007357120514, -0.018143169581890106, -0.01403832994401455, -0.009933491237461567, -0.005828652530908585, -0.0017238147556781769, 0.00238102488219738, 0.006485864520072937, 0.010590702295303345, 0.014695541001856327, 0.01880037970840931, 0.022905219346284866, 0.027010057121515274, 0.031114894896745682, 0.03521973639726639, 0.039324574172496796, 0.0434294119477272, 0.04753424972295761, 0.05163908749818802, 0.055743928998708725, 0.05984876677393913, 0.06395360827445984, 0.06805844604969025, 0.07216328382492065, 0.07626812160015106, 0.08037295937538147, 0.08447779715061188, 0.08858263492584229, 0.09268747270107269, 0.0967923104763031, 0.1008971557021141, 0.10500199347734451, 0.10910683125257492, 0.11321166902780533, 0.11731650680303574, 0.12142134457826614, 0.12552618980407715, 0.12963102757930756, 0.13373586535453796, 0.13784070312976837, 0.14194554090499878]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 0.0, 1.0, 4.0, 6.0, 9.0, 9.0, 25.0, 15.0, 25.0, 28.0, 25.0, 21.0, 43.0, 43.0, 45.0, 50.0, 47.0, 58.0, 73.0, 59.0, 61.0, 62.0, 44.0, 45.0, 38.0, 31.0, 29.0, 21.0, 24.0, 18.0, 14.0, 11.0, 8.0, 9.0, 7.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.01170361042022705, -0.011418513022363186, -0.011133415624499321, -0.010848318226635456, -0.010563220828771591, -0.010278123430907726, -0.009993026033043861, -0.009707928635179996, -0.009422831237316132, -0.009137733839452267, -0.008852636441588402, -0.008567539043724537, -0.008282441645860672, -0.007997344247996807, -0.007712246850132942, -0.007427149452269077, -0.007142052054405212, -0.0068569546565413475, -0.006571857258677483, -0.006286759860813618, -0.006001662462949753, -0.005716565065085888, -0.005431467667222023, -0.005146370269358158, -0.004861272871494293, -0.004576175473630428, -0.004291078075766563, -0.0040059806779026985, -0.0037208832800388336, -0.0034357858821749687, -0.003150688484311104, -0.002865591086447239, -0.002580493688583374, -0.002295396290719509, -0.0020102988928556442, -0.0017252014949917793, -0.0014401040971279144, -0.0011550066992640495, -0.0008699093014001846, -0.0005848119035363197, -0.00029971450567245483, -1.4617107808589935e-05, 0.00027048029005527496, 0.0005555776879191399, 0.0008406750857830048, 0.0011257724836468697, 0.0014108698815107346, 0.0016959672793745995, 0.0019810646772384644, 0.0022661620751023293, 0.002551259472966194, 0.002836356870830059, 0.003121454268693924, 0.003406551666557789, 0.0036916490644216537, 0.003976746462285519, 0.0042618438601493835, 0.0045469412580132484, 0.004832038655877113, 0.005117136053740978, 0.005402233451604843, 0.005687330849468708, 0.005972428247332573, 0.006257525645196438, 0.006542623043060303]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 5.0, 7.0, 5.0, 5.0, 7.0, 11.0, 19.0, 16.0, 22.0, 23.0, 26.0, 25.0, 23.0, 40.0, 28.0, 40.0, 50.0, 35.0, 45.0, 42.0, 37.0, 49.0, 38.0, 50.0, 36.0, 38.0, 35.0, 32.0, 31.0, 36.0, 27.0, 18.0, 22.0, 16.0, 15.0, 8.0, 6.0, 7.0, 7.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.98046875, -5.79681396484375, -5.6131591796875, -5.42950439453125, -5.245849609375, -5.06219482421875, -4.8785400390625, -4.69488525390625, -4.51123046875, -4.32757568359375, -4.1439208984375, -3.96026611328125, -3.776611328125, -3.59295654296875, -3.4093017578125, -3.22564697265625, -3.0419921875, -2.85833740234375, -2.6746826171875, -2.49102783203125, -2.307373046875, -2.12371826171875, -1.9400634765625, -1.75640869140625, -1.57275390625, -1.38909912109375, -1.2054443359375, -1.02178955078125, -0.838134765625, -0.65447998046875, -0.4708251953125, -0.28717041015625, -0.103515625, 0.08013916015625, 0.2637939453125, 0.44744873046875, 0.631103515625, 0.81475830078125, 0.9984130859375, 1.18206787109375, 1.36572265625, 1.54937744140625, 1.7330322265625, 1.91668701171875, 2.100341796875, 2.28399658203125, 2.4676513671875, 2.65130615234375, 2.8349609375, 3.01861572265625, 3.2022705078125, 3.38592529296875, 3.569580078125, 3.75323486328125, 3.9368896484375, 4.12054443359375, 4.30419921875, 4.48785400390625, 4.6715087890625, 4.85516357421875, 5.038818359375, 5.22247314453125, 5.4061279296875, 5.58978271484375, 5.7734375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 7.0, 4.0, 2.0, 13.0, 16.0, 10.0, 14.0, 32.0, 37.0, 59.0, 72.0, 83.0, 131.0, 198.0, 267.0, 388.0, 660.0, 1187.0, 2345.0, 5826.0, 15772.0, 49696.0, 165623.0, 447873.0, 247814.0, 72467.0, 23156.0, 7989.0, 3059.0, 1471.0, 806.0, 471.0, 276.0, 202.0, 141.0, 103.0, 83.0, 58.0, 35.0, 30.0, 19.0, 15.0, 27.0, 5.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.86328125, -5.68377685546875, -5.5042724609375, -5.32476806640625, -5.145263671875, -4.96575927734375, -4.7862548828125, -4.60675048828125, -4.42724609375, -4.24774169921875, -4.0682373046875, -3.88873291015625, -3.709228515625, -3.52972412109375, -3.3502197265625, -3.17071533203125, -2.9912109375, -2.81170654296875, -2.6322021484375, -2.45269775390625, -2.273193359375, -2.09368896484375, -1.9141845703125, -1.73468017578125, -1.55517578125, -1.37567138671875, -1.1961669921875, -1.01666259765625, -0.837158203125, -0.65765380859375, -0.4781494140625, -0.29864501953125, -0.119140625, 0.06036376953125, 0.2398681640625, 0.41937255859375, 0.598876953125, 0.77838134765625, 0.9578857421875, 1.13739013671875, 1.31689453125, 1.49639892578125, 1.6759033203125, 1.85540771484375, 2.034912109375, 2.21441650390625, 2.3939208984375, 2.57342529296875, 2.7529296875, 2.93243408203125, 3.1119384765625, 3.29144287109375, 3.470947265625, 3.65045166015625, 3.8299560546875, 4.00946044921875, 4.18896484375, 4.36846923828125, 4.5479736328125, 4.72747802734375, 4.906982421875, 5.08648681640625, 5.2659912109375, 5.44549560546875, 5.625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 4.0, 8.0, 12.0, 8.0, 15.0, 16.0, 25.0, 15.0, 20.0, 28.0, 28.0, 38.0, 45.0, 43.0, 44.0, 62.0, 111.0, 1669.0, 375.0, 83.0, 46.0, 41.0, 48.0, 32.0, 39.0, 31.0, 32.0, 26.0, 29.0, 27.0, 12.0, 12.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.421875, -25.6845703125, -24.947265625, -24.2099609375, -23.47265625, -22.7353515625, -21.998046875, -21.2607421875, -20.5234375, -19.7861328125, -19.048828125, -18.3115234375, -17.57421875, -16.8369140625, -16.099609375, -15.3623046875, -14.625, -13.8876953125, -13.150390625, -12.4130859375, -11.67578125, -10.9384765625, -10.201171875, -9.4638671875, -8.7265625, -7.9892578125, -7.251953125, -6.5146484375, -5.77734375, -5.0400390625, -4.302734375, -3.5654296875, -2.828125, -2.0908203125, -1.353515625, -0.6162109375, 0.12109375, 0.8583984375, 1.595703125, 2.3330078125, 3.0703125, 3.8076171875, 4.544921875, 5.2822265625, 6.01953125, 6.7568359375, 7.494140625, 8.2314453125, 8.96875, 9.7060546875, 10.443359375, 11.1806640625, 11.91796875, 12.6552734375, 13.392578125, 14.1298828125, 14.8671875, 15.6044921875, 16.341796875, 17.0791015625, 17.81640625, 18.5537109375, 19.291015625, 20.0283203125, 20.765625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 7.0, 11.0, 7.0, 32.0, 28.0, 26.0, 30.0, 44.0, 46.0, 62.0, 105.0, 164.0, 398.0, 1564.0, 441523.0, 2698410.0, 2136.0, 449.0, 199.0, 108.0, 76.0, 66.0, 35.0, 31.0, 23.0, 20.0, 21.0, 16.0, 15.0, 8.0, 11.0, 8.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.71875, -45.0546875, -43.390625, -41.7265625, -40.0625, -38.3984375, -36.734375, -35.0703125, -33.40625, -31.7421875, -30.078125, -28.4140625, -26.75, -25.0859375, -23.421875, -21.7578125, -20.09375, -18.4296875, -16.765625, -15.1015625, -13.4375, -11.7734375, -10.109375, -8.4453125, -6.78125, -5.1171875, -3.453125, -1.7890625, -0.125, 1.5390625, 3.203125, 4.8671875, 6.53125, 8.1953125, 9.859375, 11.5234375, 13.1875, 14.8515625, 16.515625, 18.1796875, 19.84375, 21.5078125, 23.171875, 24.8359375, 26.5, 28.1640625, 29.828125, 31.4921875, 33.15625, 34.8203125, 36.484375, 38.1484375, 39.8125, 41.4765625, 43.140625, 44.8046875, 46.46875, 48.1328125, 49.796875, 51.4609375, 53.125, 54.7890625, 56.453125, 58.1171875, 59.78125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 29.0, 896.0, 92.0], "bins": [-323.5816345214844, -318.41217041015625, -313.2427062988281, -308.0732421875, -302.9037780761719, -297.73431396484375, -292.5648498535156, -287.3953857421875, -282.2259216308594, -277.05645751953125, -271.8869934082031, -266.717529296875, -261.5480651855469, -256.37860107421875, -251.20913696289062, -246.03968811035156, -240.8702392578125, -235.70077514648438, -230.53131103515625, -225.36184692382812, -220.1923828125, -215.02291870117188, -209.85345458984375, -204.6840057373047, -199.5145263671875, -194.34506225585938, -189.17559814453125, -184.00613403320312, -178.836669921875, -173.66720581054688, -168.49774169921875, -163.3282928466797, -158.15882873535156, -152.98936462402344, -147.8199005126953, -142.6504364013672, -137.48097229003906, -132.3115234375, -127.14205169677734, -121.97259521484375, -116.80313110351562, -111.6336669921875, -106.46420288085938, -101.29473876953125, -96.12528228759766, -90.95581817626953, -85.7863540649414, -80.61689758300781, -75.44742584228516, -70.27796173095703, -65.1084976196289, -59.93903732299805, -54.76957702636719, -49.60011291503906, -44.43064880371094, -39.26118850708008, -34.09172439575195, -28.92226219177246, -23.75279998779297, -18.583335876464844, -13.413873672485352, -8.24441146850586, -3.0749473571777344, 2.094512939453125, 7.26397705078125]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 8.0, 11.0, 2.0, 15.0, 19.0, 13.0, 15.0, 21.0, 29.0, 24.0, 26.0, 33.0, 42.0, 34.0, 34.0, 33.0, 46.0, 54.0, 42.0, 39.0, 39.0, 49.0, 41.0, 35.0, 24.0, 23.0, 38.0, 28.0, 26.0, 19.0, 9.0, 21.0, 21.0, 13.0, 13.0, 14.0, 9.0, 9.0, 7.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-65.44229888916016, -63.547157287597656, -61.652015686035156, -59.756874084472656, -57.861732482910156, -55.966590881347656, -54.071449279785156, -52.176307678222656, -50.281166076660156, -48.386024475097656, -46.490882873535156, -44.595741271972656, -42.700599670410156, -40.805458068847656, -38.910316467285156, -37.015174865722656, -35.12003707885742, -33.22489547729492, -31.329753875732422, -29.434612274169922, -27.539470672607422, -25.644329071044922, -23.749189376831055, -21.854047775268555, -19.958906173706055, -18.063764572143555, -16.168622970581055, -14.273482322692871, -12.378340721130371, -10.483199119567871, -8.588058471679688, -6.6929168701171875, -4.7977752685546875, -2.9026339054107666, -1.0074925422668457, 0.8876485824584961, 2.782790184020996, 4.677931785583496, 6.57307243347168, 8.46821403503418, 10.36335563659668, 12.25849723815918, 14.15363883972168, 16.048778533935547, 17.943920135498047, 19.839061737060547, 21.734203338623047, 23.629344940185547, 25.524486541748047, 27.419628143310547, 29.314769744873047, 31.209911346435547, 33.10505294799805, 35.00019454956055, 36.89533233642578, 38.79047393798828, 40.68561553955078, 42.58075714111328, 44.47589874267578, 46.37104034423828, 48.26618194580078, 50.16132354736328, 52.05646514892578, 53.95160675048828, 55.84674835205078]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 7.0, 10.0, 7.0, 9.0, 19.0, 20.0, 18.0, 28.0, 27.0, 21.0, 40.0, 29.0, 40.0, 35.0, 41.0, 36.0, 37.0, 53.0, 45.0, 46.0, 47.0, 38.0, 38.0, 38.0, 26.0, 42.0, 36.0, 33.0, 23.0, 14.0, 15.0, 17.0, 15.0, 7.0, 3.0, 7.0, 8.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.1015625, -5.91156005859375, -5.7215576171875, -5.53155517578125, -5.341552734375, -5.15155029296875, -4.9615478515625, -4.77154541015625, -4.58154296875, -4.39154052734375, -4.2015380859375, -4.01153564453125, -3.821533203125, -3.63153076171875, -3.4415283203125, -3.25152587890625, -3.0615234375, -2.87152099609375, -2.6815185546875, -2.49151611328125, -2.301513671875, -2.11151123046875, -1.9215087890625, -1.73150634765625, -1.54150390625, -1.35150146484375, -1.1614990234375, -0.97149658203125, -0.781494140625, -0.59149169921875, -0.4014892578125, -0.21148681640625, -0.021484375, 0.16851806640625, 0.3585205078125, 0.54852294921875, 0.738525390625, 0.92852783203125, 1.1185302734375, 1.30853271484375, 1.49853515625, 1.68853759765625, 1.8785400390625, 2.06854248046875, 2.258544921875, 2.44854736328125, 2.6385498046875, 2.82855224609375, 3.0185546875, 3.20855712890625, 3.3985595703125, 3.58856201171875, 3.778564453125, 3.96856689453125, 4.1585693359375, 4.34857177734375, 4.53857421875, 4.72857666015625, 4.9185791015625, 5.10858154296875, 5.298583984375, 5.48858642578125, 5.6785888671875, 5.86859130859375, 6.05859375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 3.0, 8.0, 10.0, 12.0, 10.0, 13.0, 14.0, 18.0, 42.0, 39.0, 45.0, 50.0, 75.0, 65.0, 74.0, 149.0, 258.0, 568.0, 1528.0, 6012.0, 28091.0, 191980.0, 2250141.0, 1556265.0, 130755.0, 20910.0, 4494.0, 1326.0, 495.0, 209.0, 130.0, 112.0, 73.0, 61.0, 43.0, 35.0, 30.0, 31.0, 25.0, 24.0, 14.0, 11.0, 9.0, 3.0, 6.0, 7.0, 3.0, 2.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.078125, -21.38623046875, -20.6943359375, -20.00244140625, -19.310546875, -18.61865234375, -17.9267578125, -17.23486328125, -16.54296875, -15.85107421875, -15.1591796875, -14.46728515625, -13.775390625, -13.08349609375, -12.3916015625, -11.69970703125, -11.0078125, -10.31591796875, -9.6240234375, -8.93212890625, -8.240234375, -7.54833984375, -6.8564453125, -6.16455078125, -5.47265625, -4.78076171875, -4.0888671875, -3.39697265625, -2.705078125, -2.01318359375, -1.3212890625, -0.62939453125, 0.0625, 0.75439453125, 1.4462890625, 2.13818359375, 2.830078125, 3.52197265625, 4.2138671875, 4.90576171875, 5.59765625, 6.28955078125, 6.9814453125, 7.67333984375, 8.365234375, 9.05712890625, 9.7490234375, 10.44091796875, 11.1328125, 11.82470703125, 12.5166015625, 13.20849609375, 13.900390625, 14.59228515625, 15.2841796875, 15.97607421875, 16.66796875, 17.35986328125, 18.0517578125, 18.74365234375, 19.435546875, 20.12744140625, 20.8193359375, 21.51123046875, 22.203125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 15.0, 10.0, 20.0, 17.0, 29.0, 42.0, 67.0, 77.0, 117.0, 162.0, 225.0, 303.0, 377.0, 501.0, 499.0, 412.0, 351.0, 244.0, 174.0, 110.0, 100.0, 55.0, 44.0, 37.0, 28.0, 16.0, 10.0, 10.0, 2.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.015625, -23.351318359375, -22.68701171875, -22.022705078125, -21.3583984375, -20.694091796875, -20.02978515625, -19.365478515625, -18.701171875, -18.036865234375, -17.37255859375, -16.708251953125, -16.0439453125, -15.379638671875, -14.71533203125, -14.051025390625, -13.38671875, -12.722412109375, -12.05810546875, -11.393798828125, -10.7294921875, -10.065185546875, -9.40087890625, -8.736572265625, -8.072265625, -7.407958984375, -6.74365234375, -6.079345703125, -5.4150390625, -4.750732421875, -4.08642578125, -3.422119140625, -2.7578125, -2.093505859375, -1.42919921875, -0.764892578125, -0.1005859375, 0.563720703125, 1.22802734375, 1.892333984375, 2.556640625, 3.220947265625, 3.88525390625, 4.549560546875, 5.2138671875, 5.878173828125, 6.54248046875, 7.206787109375, 7.87109375, 8.535400390625, 9.19970703125, 9.864013671875, 10.5283203125, 11.192626953125, 11.85693359375, 12.521240234375, 13.185546875, 13.849853515625, 14.51416015625, 15.178466796875, 15.8427734375, 16.507080078125, 17.17138671875, 17.835693359375, 18.5]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 11.0, 5.0, 15.0, 26.0, 56.0, 84.0, 149.0, 287.0, 708.0, 2295.0, 11174.0, 94408.0, 1540540.0, 2383258.0, 141485.0, 15270.0, 2927.0, 840.0, 355.0, 172.0, 88.0, 55.0, 24.0, 10.0, 9.0, 12.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.28125, -30.8193359375, -29.357421875, -27.8955078125, -26.43359375, -24.9716796875, -23.509765625, -22.0478515625, -20.5859375, -19.1240234375, -17.662109375, -16.2001953125, -14.73828125, -13.2763671875, -11.814453125, -10.3525390625, -8.890625, -7.4287109375, -5.966796875, -4.5048828125, -3.04296875, -1.5810546875, -0.119140625, 1.3427734375, 2.8046875, 4.2666015625, 5.728515625, 7.1904296875, 8.65234375, 10.1142578125, 11.576171875, 13.0380859375, 14.5, 15.9619140625, 17.423828125, 18.8857421875, 20.34765625, 21.8095703125, 23.271484375, 24.7333984375, 26.1953125, 27.6572265625, 29.119140625, 30.5810546875, 32.04296875, 33.5048828125, 34.966796875, 36.4287109375, 37.890625, 39.3525390625, 40.814453125, 42.2763671875, 43.73828125, 45.2001953125, 46.662109375, 48.1240234375, 49.5859375, 51.0478515625, 52.509765625, 53.9716796875, 55.43359375, 56.8955078125, 58.357421875, 59.8193359375, 61.28125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 23.0, 89.0, 249.0, 310.0, 232.0, 88.0, 14.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.79596710205078, -91.80632781982422, -83.81668090820312, -75.82704162597656, -67.83740234375, -59.84775924682617, -51.858116149902344, -43.86847686767578, -35.87883377075195, -27.889192581176758, -19.899551391601562, -11.909908294677734, -3.920267105102539, 4.069374084472656, 12.059017181396484, 20.048656463623047, 28.038299560546875, 36.0279426574707, 44.017581939697266, 52.007225036621094, 59.996864318847656, 67.98651123046875, 75.97615051269531, 83.96578979492188, 91.95542907714844, 99.945068359375, 107.9347152709961, 115.92435455322266, 123.91399383544922, 131.9036407470703, 139.89328002929688, 147.88291931152344, 155.87257385253906, 163.86221313476562, 171.8518524169922, 179.84149169921875, 187.83114624023438, 195.82078552246094, 203.8104248046875, 211.80006408691406, 219.78970336914062, 227.7793426513672, 235.76898193359375, 243.75863647460938, 251.74827575683594, 259.7379150390625, 267.7275390625, 275.7171936035156, 283.70684814453125, 291.6965026855469, 299.6861267089844, 307.67578125, 315.6654052734375, 323.6550598144531, 331.64471435546875, 339.63433837890625, 347.62396240234375, 355.6136169433594, 363.6032409667969, 371.5928955078125, 379.58251953125, 387.5721740722656, 395.56182861328125, 403.55145263671875, 411.5411071777344]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 9.0, 5.0, 5.0, 9.0, 13.0, 14.0, 11.0, 18.0, 17.0, 23.0, 26.0, 25.0, 41.0, 34.0, 44.0, 38.0, 46.0, 32.0, 34.0, 36.0, 42.0, 41.0, 41.0, 31.0, 43.0, 35.0, 37.0, 36.0, 29.0, 28.0, 24.0, 25.0, 16.0, 14.0, 10.0, 9.0, 10.0, 15.0, 12.0, 8.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-61.21125793457031, -59.26491928100586, -57.318580627441406, -55.37224197387695, -53.4259033203125, -51.47956466674805, -49.533226013183594, -47.586883544921875, -45.64054870605469, -43.694210052490234, -41.74787139892578, -39.80153274536133, -37.855194091796875, -35.90885543823242, -33.96251678466797, -32.01617431640625, -30.069835662841797, -28.123497009277344, -26.17715835571289, -24.230819702148438, -22.284481048583984, -20.33814239501953, -18.391801834106445, -16.445463180541992, -14.499124526977539, -12.552785873413086, -10.606447219848633, -8.660107612609863, -6.71376895904541, -4.767430305480957, -2.8210906982421875, -0.8747520446777344, 1.0715866088867188, 3.017925500869751, 4.964264392852783, 6.9106035232543945, 8.856942176818848, 10.8032808303833, 12.74962043762207, 14.695959091186523, 16.642297744750977, 18.58863639831543, 20.534975051879883, 22.48131561279297, 24.427654266357422, 26.373992919921875, 28.320331573486328, 30.26667022705078, 32.213008880615234, 34.15934753417969, 36.10568618774414, 38.052024841308594, 39.99836349487305, 41.9447021484375, 43.89104461669922, 45.837379455566406, 47.783721923828125, 49.73006057739258, 51.67639923095703, 53.622737884521484, 55.56907653808594, 57.51541519165039, 59.461753845214844, 61.40809631347656, 63.35443115234375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 10.0, 10.0, 6.0, 8.0, 16.0, 28.0, 24.0, 24.0, 26.0, 31.0, 32.0, 36.0, 40.0, 45.0, 31.0, 37.0, 49.0, 46.0, 50.0, 46.0, 43.0, 42.0, 49.0, 32.0, 18.0, 28.0, 36.0, 24.0, 17.0, 15.0, 13.0, 11.0, 16.0, 10.0, 9.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.9296875, -5.734130859375, -5.53857421875, -5.343017578125, -5.1474609375, -4.951904296875, -4.75634765625, -4.560791015625, -4.365234375, -4.169677734375, -3.97412109375, -3.778564453125, -3.5830078125, -3.387451171875, -3.19189453125, -2.996337890625, -2.80078125, -2.605224609375, -2.40966796875, -2.214111328125, -2.0185546875, -1.822998046875, -1.62744140625, -1.431884765625, -1.236328125, -1.040771484375, -0.84521484375, -0.649658203125, -0.4541015625, -0.258544921875, -0.06298828125, 0.132568359375, 0.328125, 0.523681640625, 0.71923828125, 0.914794921875, 1.1103515625, 1.305908203125, 1.50146484375, 1.697021484375, 1.892578125, 2.088134765625, 2.28369140625, 2.479248046875, 2.6748046875, 2.870361328125, 3.06591796875, 3.261474609375, 3.45703125, 3.652587890625, 3.84814453125, 4.043701171875, 4.2392578125, 4.434814453125, 4.63037109375, 4.825927734375, 5.021484375, 5.217041015625, 5.41259765625, 5.608154296875, 5.8037109375, 5.999267578125, 6.19482421875, 6.390380859375, 6.5859375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 8.0, 7.0, 7.0, 17.0, 20.0, 31.0, 38.0, 58.0, 93.0, 152.0, 251.0, 315.0, 494.0, 746.0, 1175.0, 1764.0, 2783.0, 4167.0, 6571.0, 9982.0, 15996.0, 25849.0, 42648.0, 73364.0, 130091.0, 214428.0, 209454.0, 126485.0, 71226.0, 41400.0, 25134.0, 15691.0, 9912.0, 6468.0, 4137.0, 2627.0, 1678.0, 1120.0, 739.0, 487.0, 304.0, 208.0, 127.0, 95.0, 61.0, 51.0, 31.0, 25.0, 14.0, 11.0, 11.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.8828125, -0.8552017211914062, -0.8275909423828125, -0.7999801635742188, -0.772369384765625, -0.7447586059570312, -0.7171478271484375, -0.6895370483398438, -0.66192626953125, -0.6343154907226562, -0.6067047119140625, -0.5790939331054688, -0.551483154296875, -0.5238723754882812, -0.4962615966796875, -0.46865081787109375, -0.4410400390625, -0.41342926025390625, -0.3858184814453125, -0.35820770263671875, -0.330596923828125, -0.30298614501953125, -0.2753753662109375, -0.24776458740234375, -0.22015380859375, -0.19254302978515625, -0.1649322509765625, -0.13732147216796875, -0.109710693359375, -0.08209991455078125, -0.0544891357421875, -0.02687835693359375, 0.000732421875, 0.02834320068359375, 0.0559539794921875, 0.08356475830078125, 0.111175537109375, 0.13878631591796875, 0.1663970947265625, 0.19400787353515625, 0.22161865234375, 0.24922943115234375, 0.2768402099609375, 0.30445098876953125, 0.332061767578125, 0.35967254638671875, 0.3872833251953125, 0.41489410400390625, 0.4425048828125, 0.47011566162109375, 0.4977264404296875, 0.5253372192382812, 0.552947998046875, 0.5805587768554688, 0.6081695556640625, 0.6357803344726562, 0.66339111328125, 0.6910018920898438, 0.7186126708984375, 0.7462234497070312, 0.773834228515625, 0.8014450073242188, 0.8290557861328125, 0.8566665649414062, 0.88427734375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 4.0, 6.0, 6.0, 8.0, 6.0, 10.0, 13.0, 19.0, 15.0, 13.0, 21.0, 27.0, 23.0, 28.0, 22.0, 31.0, 32.0, 40.0, 38.0, 45.0, 32.0, 1066.0, 41.0, 45.0, 41.0, 39.0, 37.0, 24.0, 34.0, 28.0, 39.0, 21.0, 35.0, 25.0, 20.0, 19.0, 16.0, 9.0, 3.0, 2.0, 5.0, 6.0, 6.0, 5.0, 5.0, 1.0, 4.0, 6.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-3.53125, -3.4168701171875, -3.302490234375, -3.1881103515625, -3.07373046875, -2.9593505859375, -2.844970703125, -2.7305908203125, -2.6162109375, -2.5018310546875, -2.387451171875, -2.2730712890625, -2.15869140625, -2.0443115234375, -1.929931640625, -1.8155517578125, -1.701171875, -1.5867919921875, -1.472412109375, -1.3580322265625, -1.24365234375, -1.1292724609375, -1.014892578125, -0.9005126953125, -0.7861328125, -0.6717529296875, -0.557373046875, -0.4429931640625, -0.32861328125, -0.2142333984375, -0.099853515625, 0.0145263671875, 0.12890625, 0.2432861328125, 0.357666015625, 0.4720458984375, 0.58642578125, 0.7008056640625, 0.815185546875, 0.9295654296875, 1.0439453125, 1.1583251953125, 1.272705078125, 1.3870849609375, 1.50146484375, 1.6158447265625, 1.730224609375, 1.8446044921875, 1.958984375, 2.0733642578125, 2.187744140625, 2.3021240234375, 2.41650390625, 2.5308837890625, 2.645263671875, 2.7596435546875, 2.8740234375, 2.9884033203125, 3.102783203125, 3.2171630859375, 3.33154296875, 3.4459228515625, 3.560302734375, 3.6746826171875, 3.7890625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 10.0, 11.0, 24.0, 24.0, 30.0, 48.0, 72.0, 95.0, 185.0, 282.0, 403.0, 620.0, 978.0, 1492.0, 2380.0, 3691.0, 5856.0, 9285.0, 14980.0, 24812.0, 41488.0, 70601.0, 117299.0, 176493.0, 1241200.0, 149466.0, 94103.0, 55589.0, 33239.0, 19645.0, 12119.0, 7642.0, 4713.0, 2952.0, 1896.0, 1190.0, 780.0, 514.0, 305.0, 217.0, 120.0, 105.0, 58.0, 39.0, 36.0, 19.0, 13.0, 9.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.505859375, -0.4891510009765625, -0.472442626953125, -0.4557342529296875, -0.43902587890625, -0.4223175048828125, -0.405609130859375, -0.3889007568359375, -0.3721923828125, -0.3554840087890625, -0.338775634765625, -0.3220672607421875, -0.30535888671875, -0.2886505126953125, -0.271942138671875, -0.2552337646484375, -0.238525390625, -0.2218170166015625, -0.205108642578125, -0.1884002685546875, -0.17169189453125, -0.1549835205078125, -0.138275146484375, -0.1215667724609375, -0.1048583984375, -0.0881500244140625, -0.071441650390625, -0.0547332763671875, -0.03802490234375, -0.0213165283203125, -0.004608154296875, 0.0121002197265625, 0.02880859375, 0.0455169677734375, 0.062225341796875, 0.0789337158203125, 0.09564208984375, 0.1123504638671875, 0.129058837890625, 0.1457672119140625, 0.1624755859375, 0.1791839599609375, 0.195892333984375, 0.2126007080078125, 0.22930908203125, 0.2460174560546875, 0.262725830078125, 0.2794342041015625, 0.296142578125, 0.3128509521484375, 0.329559326171875, 0.3462677001953125, 0.36297607421875, 0.3796844482421875, 0.396392822265625, 0.4131011962890625, 0.4298095703125, 0.4465179443359375, 0.463226318359375, 0.4799346923828125, 0.49664306640625, 0.5133514404296875, 0.530059814453125, 0.5467681884765625, 0.5634765625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 5.0, 8.0, 9.0, 5.0, 10.0, 17.0, 20.0, 30.0, 18.0, 29.0, 44.0, 50.0, 58.0, 70.0, 73.0, 71.0, 85.0, 65.0, 67.0, 43.0, 51.0, 42.0, 31.0, 26.0, 19.0, 17.0, 17.0, 7.0, 1.0, 3.0, 2.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00783538818359375, -0.0075953006744384766, -0.007355213165283203, -0.00711512565612793, -0.006875038146972656, -0.006634950637817383, -0.006394863128662109, -0.006154775619506836, -0.0059146881103515625, -0.005674600601196289, -0.005434513092041016, -0.005194425582885742, -0.004954338073730469, -0.004714250564575195, -0.004474163055419922, -0.0042340755462646484, -0.003993988037109375, -0.0037539005279541016, -0.003513813018798828, -0.0032737255096435547, -0.0030336380004882812, -0.002793550491333008, -0.0025534629821777344, -0.002313375473022461, -0.0020732879638671875, -0.001833200454711914, -0.0015931129455566406, -0.0013530254364013672, -0.0011129379272460938, -0.0008728504180908203, -0.0006327629089355469, -0.00039267539978027344, -0.000152587890625, 8.749961853027344e-05, 0.0003275871276855469, 0.0005676746368408203, 0.0008077621459960938, 0.0010478496551513672, 0.0012879371643066406, 0.001528024673461914, 0.0017681121826171875, 0.002008199691772461, 0.0022482872009277344, 0.002488374710083008, 0.0027284622192382812, 0.0029685497283935547, 0.003208637237548828, 0.0034487247467041016, 0.003688812255859375, 0.0039288997650146484, 0.004168987274169922, 0.004409074783325195, 0.004649162292480469, 0.004889249801635742, 0.005129337310791016, 0.005369424819946289, 0.0056095123291015625, 0.005849599838256836, 0.006089687347412109, 0.006329774856567383, 0.006569862365722656, 0.00680994987487793, 0.007050037384033203, 0.0072901248931884766, 0.00753021240234375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 3.0, 18.0, 23.0, 22.0, 40.0, 61.0, 102.0, 127.0, 203.0, 351.0, 1136.0, 32946.0, 983283.0, 28190.0, 1079.0, 348.0, 182.0, 133.0, 76.0, 58.0, 48.0, 38.0, 16.0, 12.0, 11.0, 10.0, 5.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1522216796875, -0.1473865509033203, -0.14255142211914062, -0.13771629333496094, -0.13288116455078125, -0.12804603576660156, -0.12321090698242188, -0.11837577819824219, -0.1135406494140625, -0.10870552062988281, -0.10387039184570312, -0.09903526306152344, -0.09420013427734375, -0.08936500549316406, -0.08452987670898438, -0.07969474792480469, -0.074859619140625, -0.07002449035644531, -0.06518936157226562, -0.06035423278808594, -0.05551910400390625, -0.05068397521972656, -0.045848846435546875, -0.04101371765136719, -0.0361785888671875, -0.03134346008300781, -0.026508331298828125, -0.021673202514648438, -0.01683807373046875, -0.012002944946289062, -0.007167816162109375, -0.0023326873779296875, 0.00250244140625, 0.0073375701904296875, 0.012172698974609375, 0.017007827758789062, 0.02184295654296875, 0.026678085327148438, 0.031513214111328125, 0.03634834289550781, 0.0411834716796875, 0.04601860046386719, 0.050853729248046875, 0.05568885803222656, 0.06052398681640625, 0.06535911560058594, 0.07019424438476562, 0.07502937316894531, 0.079864501953125, 0.08469963073730469, 0.08953475952148438, 0.09436988830566406, 0.09920501708984375, 0.10404014587402344, 0.10887527465820312, 0.11371040344238281, 0.1185455322265625, 0.12338066101074219, 0.12821578979492188, 0.13305091857910156, 0.13788604736328125, 0.14272117614746094, 0.14755630493164062, 0.1523914337158203, 0.1572265625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 24.0, 171.0, 697.0, 111.0, 8.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021026788279414177, -0.018813423812389374, -0.01660006120800972, -0.014386697672307491, -0.012173334136605263, -0.009959970600903034, -0.007746607065200806, -0.005533243529498577, -0.0033198799937963486, -0.00110651645809412, 0.0011068470776081085, 0.003320210613310337, 0.005533574149012566, 0.007746937684714794, 0.009960301220417023, 0.012173664756119251, 0.01438702829182148, 0.016600392758846283, 0.018813755363225937, 0.02102711796760559, 0.023240482434630394, 0.025453846901655197, 0.02766720950603485, 0.029880572110414505, 0.03209393471479416, 0.03430729731917381, 0.03652065992355347, 0.03873402625322342, 0.04094738885760307, 0.04316075146198273, 0.04537411779165268, 0.04758748039603233, 0.04980084300041199, 0.05201420560479164, 0.054227568209171295, 0.05644093453884125, 0.0586542971432209, 0.060867659747600555, 0.06308102607727051, 0.06529438495635986, 0.06750775128602982, 0.06972111761569977, 0.07193447649478912, 0.07414784282445908, 0.07636120915412903, 0.07857456803321838, 0.08078793436288834, 0.08300129324197769, 0.08521465957164764, 0.0874280259013176, 0.08964138478040695, 0.0918547511100769, 0.09406810998916626, 0.09628147631883621, 0.09849484264850616, 0.10070820152759552, 0.10292156785726547, 0.10513493418693542, 0.10734829306602478, 0.10956165939569473, 0.11177502572536469, 0.11398838460445404, 0.11620175093412399, 0.11841510981321335, 0.1206284761428833]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 8.0, 11.0, 8.0, 6.0, 16.0, 27.0, 20.0, 24.0, 30.0, 34.0, 34.0, 35.0, 52.0, 38.0, 43.0, 47.0, 57.0, 44.0, 42.0, 47.0, 49.0, 41.0, 39.0, 33.0, 30.0, 36.0, 35.0, 29.0, 16.0, 15.0, 15.0, 13.0, 4.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0061585307121276855, -0.005986126139760017, -0.005813721567392349, -0.005641316995024681, -0.005468912422657013, -0.005296507850289345, -0.005124103277921677, -0.0049516987055540085, -0.00477929413318634, -0.004606889560818672, -0.004434484988451004, -0.004262080416083336, -0.004089675843715668, -0.003917271271348, -0.0037448666989803314, -0.0035724621266126633, -0.003400057554244995, -0.003227652981877327, -0.003055248409509659, -0.0028828438371419907, -0.0027104392647743225, -0.0025380346924066544, -0.002365630120038986, -0.002193225547671318, -0.00202082097530365, -0.0018484164029359818, -0.0016760118305683136, -0.0015036072582006454, -0.0013312026858329773, -0.0011587981134653091, -0.000986393541097641, -0.0008139889687299728, -0.0006415843963623047, -0.00046917982399463654, -0.0002967752516269684, -0.00012437067925930023, 4.803389310836792e-05, 0.00022043846547603607, 0.0003928430378437042, 0.0005652476102113724, 0.0007376521825790405, 0.0009100567549467087, 0.0010824613273143768, 0.001254865899682045, 0.0014272704720497131, 0.0015996750444173813, 0.0017720796167850494, 0.0019444841891527176, 0.0021168887615203857, 0.002289293333888054, 0.002461697906255722, 0.00263410247862339, 0.0028065070509910583, 0.0029789116233587265, 0.0031513161957263947, 0.003323720768094063, 0.003496125340461731, 0.003668529912829399, 0.0038409344851970673, 0.004013339057564735, 0.0041857436299324036, 0.004358148202300072, 0.00453055277466774, 0.004702957347035408, 0.004875361919403076]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 10.0, 10.0, 6.0, 8.0, 16.0, 28.0, 24.0, 24.0, 26.0, 31.0, 32.0, 36.0, 40.0, 45.0, 31.0, 37.0, 49.0, 46.0, 50.0, 46.0, 43.0, 42.0, 49.0, 32.0, 18.0, 28.0, 36.0, 24.0, 17.0, 15.0, 13.0, 11.0, 16.0, 10.0, 9.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.9296875, -5.734130859375, -5.53857421875, -5.343017578125, -5.1474609375, -4.951904296875, -4.75634765625, -4.560791015625, -4.365234375, -4.169677734375, -3.97412109375, -3.778564453125, -3.5830078125, -3.387451171875, -3.19189453125, -2.996337890625, -2.80078125, -2.605224609375, -2.40966796875, -2.214111328125, -2.0185546875, -1.822998046875, -1.62744140625, -1.431884765625, -1.236328125, -1.040771484375, -0.84521484375, -0.649658203125, -0.4541015625, -0.258544921875, -0.06298828125, 0.132568359375, 0.328125, 0.523681640625, 0.71923828125, 0.914794921875, 1.1103515625, 1.305908203125, 1.50146484375, 1.697021484375, 1.892578125, 2.088134765625, 2.28369140625, 2.479248046875, 2.6748046875, 2.870361328125, 3.06591796875, 3.261474609375, 3.45703125, 3.652587890625, 3.84814453125, 4.043701171875, 4.2392578125, 4.434814453125, 4.63037109375, 4.825927734375, 5.021484375, 5.217041015625, 5.41259765625, 5.608154296875, 5.8037109375, 5.999267578125, 6.19482421875, 6.390380859375, 6.5859375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 5.0, 10.0, 15.0, 11.0, 20.0, 34.0, 44.0, 56.0, 67.0, 100.0, 177.0, 273.0, 361.0, 566.0, 757.0, 1029.0, 1665.0, 2554.0, 3996.0, 6580.0, 11145.0, 20771.0, 41888.0, 99152.0, 290551.0, 345409.0, 117679.0, 48424.0, 22989.0, 12458.0, 7087.0, 4250.0, 2816.0, 1829.0, 1153.0, 799.0, 549.0, 411.0, 276.0, 167.0, 132.0, 88.0, 70.0, 41.0, 24.0, 28.0, 15.0, 8.0, 6.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-4.1640625, -4.0382080078125, -3.912353515625, -3.7864990234375, -3.66064453125, -3.5347900390625, -3.408935546875, -3.2830810546875, -3.1572265625, -3.0313720703125, -2.905517578125, -2.7796630859375, -2.65380859375, -2.5279541015625, -2.402099609375, -2.2762451171875, -2.150390625, -2.0245361328125, -1.898681640625, -1.7728271484375, -1.64697265625, -1.5211181640625, -1.395263671875, -1.2694091796875, -1.1435546875, -1.0177001953125, -0.891845703125, -0.7659912109375, -0.64013671875, -0.5142822265625, -0.388427734375, -0.2625732421875, -0.13671875, -0.0108642578125, 0.114990234375, 0.2408447265625, 0.36669921875, 0.4925537109375, 0.618408203125, 0.7442626953125, 0.8701171875, 0.9959716796875, 1.121826171875, 1.2476806640625, 1.37353515625, 1.4993896484375, 1.625244140625, 1.7510986328125, 1.876953125, 2.0028076171875, 2.128662109375, 2.2545166015625, 2.38037109375, 2.5062255859375, 2.632080078125, 2.7579345703125, 2.8837890625, 3.0096435546875, 3.135498046875, 3.2613525390625, 3.38720703125, 3.5130615234375, 3.638916015625, 3.7647705078125, 3.890625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 10.0, 6.0, 7.0, 9.0, 16.0, 15.0, 13.0, 11.0, 26.0, 17.0, 27.0, 34.0, 36.0, 24.0, 42.0, 38.0, 55.0, 64.0, 153.0, 1765.0, 183.0, 66.0, 44.0, 51.0, 40.0, 38.0, 37.0, 22.0, 23.0, 18.0, 29.0, 19.0, 17.0, 17.0, 15.0, 10.0, 8.0, 10.0, 3.0, 3.0, 3.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-21.984375, -21.31005859375, -20.6357421875, -19.96142578125, -19.287109375, -18.61279296875, -17.9384765625, -17.26416015625, -16.58984375, -15.91552734375, -15.2412109375, -14.56689453125, -13.892578125, -13.21826171875, -12.5439453125, -11.86962890625, -11.1953125, -10.52099609375, -9.8466796875, -9.17236328125, -8.498046875, -7.82373046875, -7.1494140625, -6.47509765625, -5.80078125, -5.12646484375, -4.4521484375, -3.77783203125, -3.103515625, -2.42919921875, -1.7548828125, -1.08056640625, -0.40625, 0.26806640625, 0.9423828125, 1.61669921875, 2.291015625, 2.96533203125, 3.6396484375, 4.31396484375, 4.98828125, 5.66259765625, 6.3369140625, 7.01123046875, 7.685546875, 8.35986328125, 9.0341796875, 9.70849609375, 10.3828125, 11.05712890625, 11.7314453125, 12.40576171875, 13.080078125, 13.75439453125, 14.4287109375, 15.10302734375, 15.77734375, 16.45166015625, 17.1259765625, 17.80029296875, 18.474609375, 19.14892578125, 19.8232421875, 20.49755859375, 21.171875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 3.0, 2.0, 4.0, 8.0, 7.0, 10.0, 8.0, 19.0, 18.0, 17.0, 35.0, 29.0, 37.0, 48.0, 87.0, 114.0, 206.0, 360.0, 879.0, 2694.0, 23366.0, 2931217.0, 177152.0, 6652.0, 1384.0, 527.0, 282.0, 153.0, 95.0, 56.0, 53.0, 31.0, 29.0, 16.0, 14.0, 19.0, 12.0, 12.0, 8.0, 9.0, 10.0, 7.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-35.28125, -34.169921875, -33.05859375, -31.947265625, -30.8359375, -29.724609375, -28.61328125, -27.501953125, -26.390625, -25.279296875, -24.16796875, -23.056640625, -21.9453125, -20.833984375, -19.72265625, -18.611328125, -17.5, -16.388671875, -15.27734375, -14.166015625, -13.0546875, -11.943359375, -10.83203125, -9.720703125, -8.609375, -7.498046875, -6.38671875, -5.275390625, -4.1640625, -3.052734375, -1.94140625, -0.830078125, 0.28125, 1.392578125, 2.50390625, 3.615234375, 4.7265625, 5.837890625, 6.94921875, 8.060546875, 9.171875, 10.283203125, 11.39453125, 12.505859375, 13.6171875, 14.728515625, 15.83984375, 16.951171875, 18.0625, 19.173828125, 20.28515625, 21.396484375, 22.5078125, 23.619140625, 24.73046875, 25.841796875, 26.953125, 28.064453125, 29.17578125, 30.287109375, 31.3984375, 32.509765625, 33.62109375, 34.732421875, 35.84375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 24.0, 73.0, 186.0, 307.0, 256.0, 117.0, 35.0, 6.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.40267562866211, -33.3916015625, -31.380529403686523, -29.369457244873047, -27.358383178710938, -25.347309112548828, -23.33623695373535, -21.325164794921875, -19.314090728759766, -17.303016662597656, -15.29194450378418, -13.280871391296387, -11.269798278808594, -9.2587251663208, -7.247652053833008, -5.236578941345215, -3.225505828857422, -1.214432716369629, 0.7966403961181641, 2.807713508605957, 4.81878662109375, 6.829859733581543, 8.840932846069336, 10.852005958557129, 12.863079071044922, 14.874152183532715, 16.885225296020508, 18.896297454833984, 20.907371520996094, 22.918445587158203, 24.92951774597168, 26.940589904785156, 28.95166015625, 30.96273422241211, 32.97380828857422, 34.98487854003906, 36.99595260620117, 39.00702667236328, 41.018096923828125, 43.029170989990234, 45.040245056152344, 47.05131912231445, 49.06239318847656, 51.073463439941406, 53.084537506103516, 55.095611572265625, 57.10668182373047, 59.11775588989258, 61.12882995605469, 63.1399040222168, 65.1509780883789, 67.16204833984375, 69.17312622070312, 71.18419647216797, 73.19526672363281, 75.20634460449219, 77.21741485595703, 79.22848510742188, 81.23956298828125, 83.2506332397461, 85.26170349121094, 87.27278137207031, 89.28385162353516, 91.29492950439453, 93.30599975585938]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 7.0, 8.0, 10.0, 17.0, 12.0, 22.0, 9.0, 21.0, 22.0, 27.0, 28.0, 29.0, 27.0, 31.0, 32.0, 43.0, 47.0, 35.0, 40.0, 41.0, 33.0, 34.0, 44.0, 38.0, 42.0, 33.0, 31.0, 27.0, 23.0, 24.0, 28.0, 24.0, 21.0, 8.0, 9.0, 15.0, 11.0, 7.0, 5.0, 8.0, 4.0, 1.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-69.46064758300781, -67.31611633300781, -65.17157745361328, -63.02704620361328, -60.882511138916016, -58.73797607421875, -56.59344482421875, -54.448909759521484, -52.30437469482422, -50.15983963012695, -48.01530456542969, -45.87077331542969, -43.72623825073242, -41.581703186035156, -39.437171936035156, -37.29263687133789, -35.148101806640625, -33.00356674194336, -30.859033584594727, -28.714500427246094, -26.569965362548828, -24.425430297851562, -22.28089714050293, -20.136363983154297, -17.99182891845703, -15.847294807434082, -13.702760696411133, -11.558226585388184, -9.413692474365234, -7.269158363342285, -5.124624252319336, -2.9800901412963867, -0.8355636596679688, 1.3089704513549805, 3.4535045623779297, 5.598038673400879, 7.742572784423828, 9.887106895446777, 12.031641006469727, 14.176175117492676, 16.320709228515625, 18.46524429321289, 20.609777450561523, 22.754310607910156, 24.898845672607422, 27.043380737304688, 29.18791389465332, 31.332447052001953, 33.47698211669922, 35.621517181396484, 37.76605224609375, 39.91058349609375, 42.055118560791016, 44.19965362548828, 46.34418487548828, 48.48871994018555, 50.63325500488281, 52.77779006958008, 54.922325134277344, 57.066856384277344, 59.21139144897461, 61.355926513671875, 63.500457763671875, 65.6449966430664, 67.7895278930664]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 7.0, 12.0, 7.0, 9.0, 8.0, 15.0, 16.0, 31.0, 22.0, 25.0, 36.0, 33.0, 42.0, 37.0, 35.0, 33.0, 42.0, 43.0, 45.0, 62.0, 45.0, 45.0, 36.0, 47.0, 31.0, 28.0, 23.0, 33.0, 24.0, 18.0, 18.0, 17.0, 13.0, 10.0, 16.0, 9.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.4609375, -6.255615234375, -6.05029296875, -5.844970703125, -5.6396484375, -5.434326171875, -5.22900390625, -5.023681640625, -4.818359375, -4.613037109375, -4.40771484375, -4.202392578125, -3.9970703125, -3.791748046875, -3.58642578125, -3.381103515625, -3.17578125, -2.970458984375, -2.76513671875, -2.559814453125, -2.3544921875, -2.149169921875, -1.94384765625, -1.738525390625, -1.533203125, -1.327880859375, -1.12255859375, -0.917236328125, -0.7119140625, -0.506591796875, -0.30126953125, -0.095947265625, 0.109375, 0.314697265625, 0.52001953125, 0.725341796875, 0.9306640625, 1.135986328125, 1.34130859375, 1.546630859375, 1.751953125, 1.957275390625, 2.16259765625, 2.367919921875, 2.5732421875, 2.778564453125, 2.98388671875, 3.189208984375, 3.39453125, 3.599853515625, 3.80517578125, 4.010498046875, 4.2158203125, 4.421142578125, 4.62646484375, 4.831787109375, 5.037109375, 5.242431640625, 5.44775390625, 5.653076171875, 5.8583984375, 6.063720703125, 6.26904296875, 6.474365234375, 6.6796875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 2.0, 4.0, 2.0, 4.0, 11.0, 5.0, 14.0, 13.0, 13.0, 23.0, 20.0, 34.0, 27.0, 48.0, 63.0, 85.0, 148.0, 351.0, 1143.0, 5600.0, 40349.0, 557856.0, 3264050.0, 292966.0, 25949.0, 3906.0, 846.0, 280.0, 125.0, 76.0, 59.0, 42.0, 27.0, 24.0, 22.0, 19.0, 16.0, 9.0, 15.0, 12.0, 6.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.65625, -26.775390625, -25.89453125, -25.013671875, -24.1328125, -23.251953125, -22.37109375, -21.490234375, -20.609375, -19.728515625, -18.84765625, -17.966796875, -17.0859375, -16.205078125, -15.32421875, -14.443359375, -13.5625, -12.681640625, -11.80078125, -10.919921875, -10.0390625, -9.158203125, -8.27734375, -7.396484375, -6.515625, -5.634765625, -4.75390625, -3.873046875, -2.9921875, -2.111328125, -1.23046875, -0.349609375, 0.53125, 1.412109375, 2.29296875, 3.173828125, 4.0546875, 4.935546875, 5.81640625, 6.697265625, 7.578125, 8.458984375, 9.33984375, 10.220703125, 11.1015625, 11.982421875, 12.86328125, 13.744140625, 14.625, 15.505859375, 16.38671875, 17.267578125, 18.1484375, 19.029296875, 19.91015625, 20.791015625, 21.671875, 22.552734375, 23.43359375, 24.314453125, 25.1953125, 26.076171875, 26.95703125, 27.837890625, 28.71875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 16.0, 13.0, 18.0, 47.0, 89.0, 131.0, 217.0, 366.0, 594.0, 755.0, 696.0, 469.0, 265.0, 169.0, 103.0, 53.0, 32.0, 19.0, 11.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.09375, -36.107666015625, -35.12158203125, -34.135498046875, -33.1494140625, -32.163330078125, -31.17724609375, -30.191162109375, -29.205078125, -28.218994140625, -27.23291015625, -26.246826171875, -25.2607421875, -24.274658203125, -23.28857421875, -22.302490234375, -21.31640625, -20.330322265625, -19.34423828125, -18.358154296875, -17.3720703125, -16.385986328125, -15.39990234375, -14.413818359375, -13.427734375, -12.441650390625, -11.45556640625, -10.469482421875, -9.4833984375, -8.497314453125, -7.51123046875, -6.525146484375, -5.5390625, -4.552978515625, -3.56689453125, -2.580810546875, -1.5947265625, -0.608642578125, 0.37744140625, 1.363525390625, 2.349609375, 3.335693359375, 4.32177734375, 5.307861328125, 6.2939453125, 7.280029296875, 8.26611328125, 9.252197265625, 10.23828125, 11.224365234375, 12.21044921875, 13.196533203125, 14.1826171875, 15.168701171875, 16.15478515625, 17.140869140625, 18.126953125, 19.113037109375, 20.09912109375, 21.085205078125, 22.0712890625, 23.057373046875, 24.04345703125, 25.029541015625, 26.015625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 12.0, 9.0, 36.0, 48.0, 89.0, 167.0, 324.0, 703.0, 2292.0, 21573.0, 753249.0, 3320879.0, 87545.0, 5391.0, 1073.0, 421.0, 211.0, 110.0, 69.0, 36.0, 20.0, 16.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.65625, -47.51806640625, -45.3798828125, -43.24169921875, -41.103515625, -38.96533203125, -36.8271484375, -34.68896484375, -32.55078125, -30.41259765625, -28.2744140625, -26.13623046875, -23.998046875, -21.85986328125, -19.7216796875, -17.58349609375, -15.4453125, -13.30712890625, -11.1689453125, -9.03076171875, -6.892578125, -4.75439453125, -2.6162109375, -0.47802734375, 1.66015625, 3.79833984375, 5.9365234375, 8.07470703125, 10.212890625, 12.35107421875, 14.4892578125, 16.62744140625, 18.765625, 20.90380859375, 23.0419921875, 25.18017578125, 27.318359375, 29.45654296875, 31.5947265625, 33.73291015625, 35.87109375, 38.00927734375, 40.1474609375, 42.28564453125, 44.423828125, 46.56201171875, 48.7001953125, 50.83837890625, 52.9765625, 55.11474609375, 57.2529296875, 59.39111328125, 61.529296875, 63.66748046875, 65.8056640625, 67.94384765625, 70.08203125, 72.22021484375, 74.3583984375, 76.49658203125, 78.634765625, 80.77294921875, 82.9111328125, 85.04931640625, 87.1875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 11.0, 37.0, 94.0, 136.0, 192.0, 189.0, 167.0, 105.0, 52.0, 18.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-222.65126037597656, -216.95010375976562, -211.2489471435547, -205.54779052734375, -199.84664916992188, -194.14549255371094, -188.4443359375, -182.74317932128906, -177.04202270507812, -171.3408660888672, -165.63970947265625, -159.93856811523438, -154.23741149902344, -148.5362548828125, -142.83509826660156, -137.13394165039062, -131.43280029296875, -125.73164367675781, -120.0304946899414, -114.32933807373047, -108.62818908691406, -102.92703247070312, -97.22587585449219, -91.52471923828125, -85.82357025146484, -80.1224136352539, -74.4212646484375, -68.72010803222656, -63.01895523071289, -57.31780242919922, -51.61664581298828, -45.91549301147461, -40.21434020996094, -34.513187408447266, -28.81203269958496, -23.110877990722656, -17.409725189208984, -11.708572387695312, -6.007415771484375, -0.3062629699707031, 5.394889831542969, 11.096043586730957, 16.797197341918945, 22.49835205078125, 28.199504852294922, 33.900657653808594, 39.60181427001953, 45.3029670715332, 51.004119873046875, 56.70527267456055, 62.40642547607422, 68.10758209228516, 73.80873107910156, 79.5098876953125, 85.21104431152344, 90.91220092773438, 96.61334991455078, 102.31450653076172, 108.01565551757812, 113.71681213378906, 119.41796875, 125.1191177368164, 130.82028198242188, 136.52142333984375, 142.2225799560547]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 11.0, 4.0, 14.0, 9.0, 14.0, 15.0, 12.0, 18.0, 21.0, 24.0, 21.0, 25.0, 31.0, 30.0, 35.0, 42.0, 36.0, 32.0, 39.0, 37.0, 44.0, 29.0, 41.0, 34.0, 37.0, 40.0, 29.0, 23.0, 27.0, 43.0, 27.0, 29.0, 23.0, 23.0, 12.0, 10.0, 11.0, 4.0, 8.0, 7.0, 5.0, 7.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0], "bins": [-71.04208374023438, -69.0881576538086, -67.13423156738281, -65.18030548095703, -63.226375579833984, -61.2724494934082, -59.318519592285156, -57.364593505859375, -55.410667419433594, -53.45674133300781, -51.50281524658203, -49.548885345458984, -47.5949592590332, -45.64103317260742, -43.687103271484375, -41.733177185058594, -39.77925109863281, -37.82532501220703, -35.87139892578125, -33.9174690246582, -31.963542938232422, -30.00961685180664, -28.055688858032227, -26.101760864257812, -24.14783477783203, -22.19390869140625, -20.239980697631836, -18.286052703857422, -16.33212661743164, -14.378199577331543, -12.424272537231445, -10.470345497131348, -8.51641845703125, -6.562491416931152, -4.608564376831055, -2.654637336730957, -0.7007102966308594, 1.2532167434692383, 3.207143783569336, 5.161070823669434, 7.114997863769531, 9.068924903869629, 11.022851943969727, 12.976778984069824, 14.930706024169922, 16.884632110595703, 18.838560104370117, 20.79248809814453, 22.746414184570312, 24.700340270996094, 26.654268264770508, 28.608196258544922, 30.562122344970703, 32.516048431396484, 34.46997833251953, 36.42390441894531, 38.377830505371094, 40.331756591796875, 42.285682678222656, 44.2396125793457, 46.193538665771484, 48.147464752197266, 50.10139465332031, 52.055320739746094, 54.009246826171875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 1.0, 4.0, 9.0, 9.0, 11.0, 18.0, 18.0, 20.0, 19.0, 20.0, 24.0, 31.0, 38.0, 44.0, 38.0, 45.0, 47.0, 51.0, 54.0, 31.0, 40.0, 43.0, 48.0, 44.0, 30.0, 35.0, 34.0, 23.0, 22.0, 31.0, 23.0, 20.0, 16.0, 11.0, 9.0, 11.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.16412353515625, -5.9454345703125, -5.72674560546875, -5.508056640625, -5.28936767578125, -5.0706787109375, -4.85198974609375, -4.63330078125, -4.41461181640625, -4.1959228515625, -3.97723388671875, -3.758544921875, -3.53985595703125, -3.3211669921875, -3.10247802734375, -2.8837890625, -2.66510009765625, -2.4464111328125, -2.22772216796875, -2.009033203125, -1.79034423828125, -1.5716552734375, -1.35296630859375, -1.13427734375, -0.91558837890625, -0.6968994140625, -0.47821044921875, -0.259521484375, -0.04083251953125, 0.1778564453125, 0.39654541015625, 0.615234375, 0.83392333984375, 1.0526123046875, 1.27130126953125, 1.489990234375, 1.70867919921875, 1.9273681640625, 2.14605712890625, 2.36474609375, 2.58343505859375, 2.8021240234375, 3.02081298828125, 3.239501953125, 3.45819091796875, 3.6768798828125, 3.89556884765625, 4.1142578125, 4.33294677734375, 4.5516357421875, 4.77032470703125, 4.989013671875, 5.20770263671875, 5.4263916015625, 5.64508056640625, 5.86376953125, 6.08245849609375, 6.3011474609375, 6.51983642578125, 6.738525390625, 6.95721435546875, 7.1759033203125, 7.39459228515625, 7.61328125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 6.0, 18.0, 17.0, 32.0, 50.0, 84.0, 100.0, 154.0, 228.0, 389.0, 609.0, 969.0, 1475.0, 2398.0, 3671.0, 5868.0, 9528.0, 15543.0, 26189.0, 45421.0, 80345.0, 144002.0, 229772.0, 202664.0, 119063.0, 65630.0, 37266.0, 21901.0, 13190.0, 8058.0, 5113.0, 3171.0, 2012.0, 1312.0, 846.0, 509.0, 318.0, 215.0, 140.0, 88.0, 60.0, 34.0, 34.0, 22.0, 8.0, 10.0, 8.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.96142578125, -0.9312210083007812, -0.9010162353515625, -0.8708114624023438, -0.840606689453125, -0.8104019165039062, -0.7801971435546875, -0.7499923706054688, -0.71978759765625, -0.6895828247070312, -0.6593780517578125, -0.6291732788085938, -0.598968505859375, -0.5687637329101562, -0.5385589599609375, -0.5083541870117188, -0.4781494140625, -0.44794464111328125, -0.4177398681640625, -0.38753509521484375, -0.357330322265625, -0.32712554931640625, -0.2969207763671875, -0.26671600341796875, -0.23651123046875, -0.20630645751953125, -0.1761016845703125, -0.14589691162109375, -0.115692138671875, -0.08548736572265625, -0.0552825927734375, -0.02507781982421875, 0.005126953125, 0.03533172607421875, 0.0655364990234375, 0.09574127197265625, 0.125946044921875, 0.15615081787109375, 0.1863555908203125, 0.21656036376953125, 0.24676513671875, 0.27696990966796875, 0.3071746826171875, 0.33737945556640625, 0.367584228515625, 0.39778900146484375, 0.4279937744140625, 0.45819854736328125, 0.4884033203125, 0.5186080932617188, 0.5488128662109375, 0.5790176391601562, 0.609222412109375, 0.6394271850585938, 0.6696319580078125, 0.6998367309570312, 0.73004150390625, 0.7602462768554688, 0.7904510498046875, 0.8206558227539062, 0.850860595703125, 0.8810653686523438, 0.9112701416015625, 0.9414749145507812, 0.9716796875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 7.0, 8.0, 6.0, 4.0, 13.0, 11.0, 22.0, 18.0, 28.0, 27.0, 20.0, 25.0, 40.0, 47.0, 40.0, 42.0, 41.0, 36.0, 43.0, 1071.0, 41.0, 46.0, 38.0, 39.0, 26.0, 32.0, 26.0, 40.0, 33.0, 21.0, 22.0, 19.0, 14.0, 12.0, 13.0, 10.0, 6.0, 12.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5078125, -4.37164306640625, -4.2354736328125, -4.09930419921875, -3.963134765625, -3.82696533203125, -3.6907958984375, -3.55462646484375, -3.41845703125, -3.28228759765625, -3.1461181640625, -3.00994873046875, -2.873779296875, -2.73760986328125, -2.6014404296875, -2.46527099609375, -2.3291015625, -2.19293212890625, -2.0567626953125, -1.92059326171875, -1.784423828125, -1.64825439453125, -1.5120849609375, -1.37591552734375, -1.23974609375, -1.10357666015625, -0.9674072265625, -0.83123779296875, -0.695068359375, -0.55889892578125, -0.4227294921875, -0.28656005859375, -0.150390625, -0.01422119140625, 0.1219482421875, 0.25811767578125, 0.394287109375, 0.53045654296875, 0.6666259765625, 0.80279541015625, 0.93896484375, 1.07513427734375, 1.2113037109375, 1.34747314453125, 1.483642578125, 1.61981201171875, 1.7559814453125, 1.89215087890625, 2.0283203125, 2.16448974609375, 2.3006591796875, 2.43682861328125, 2.572998046875, 2.70916748046875, 2.8453369140625, 2.98150634765625, 3.11767578125, 3.25384521484375, 3.3900146484375, 3.52618408203125, 3.662353515625, 3.79852294921875, 3.9346923828125, 4.07086181640625, 4.20703125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 5.0, 20.0, 22.0, 21.0, 40.0, 66.0, 92.0, 117.0, 182.0, 256.0, 358.0, 584.0, 784.0, 1173.0, 1913.0, 2785.0, 4219.0, 6639.0, 10140.0, 16564.0, 26857.0, 44537.0, 72718.0, 114717.0, 166893.0, 1221640.0, 145531.0, 98116.0, 60964.0, 37428.0, 22761.0, 13994.0, 8748.0, 5584.0, 3579.0, 2341.0, 1511.0, 1074.0, 659.0, 429.0, 352.0, 230.0, 144.0, 113.0, 66.0, 39.0, 35.0, 32.0, 19.0, 12.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.5205078125, -0.5044021606445312, -0.4882965087890625, -0.47219085693359375, -0.456085205078125, -0.43997955322265625, -0.4238739013671875, -0.40776824951171875, -0.39166259765625, -0.37555694580078125, -0.3594512939453125, -0.34334564208984375, -0.327239990234375, -0.31113433837890625, -0.2950286865234375, -0.27892303466796875, -0.2628173828125, -0.24671173095703125, -0.2306060791015625, -0.21450042724609375, -0.198394775390625, -0.18228912353515625, -0.1661834716796875, -0.15007781982421875, -0.13397216796875, -0.11786651611328125, -0.1017608642578125, -0.08565521240234375, -0.069549560546875, -0.05344390869140625, -0.0373382568359375, -0.02123260498046875, -0.005126953125, 0.01097869873046875, 0.0270843505859375, 0.04319000244140625, 0.059295654296875, 0.07540130615234375, 0.0915069580078125, 0.10761260986328125, 0.12371826171875, 0.13982391357421875, 0.1559295654296875, 0.17203521728515625, 0.188140869140625, 0.20424652099609375, 0.2203521728515625, 0.23645782470703125, 0.2525634765625, 0.26866912841796875, 0.2847747802734375, 0.30088043212890625, 0.316986083984375, 0.33309173583984375, 0.3491973876953125, 0.36530303955078125, 0.38140869140625, 0.39751434326171875, 0.4136199951171875, 0.42972564697265625, 0.445831298828125, 0.46193695068359375, 0.4780426025390625, 0.49414825439453125, 0.51025390625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 6.0, 8.0, 12.0, 9.0, 13.0, 19.0, 29.0, 62.0, 62.0, 108.0, 170.0, 182.0, 110.0, 64.0, 47.0, 28.0, 22.0, 8.0, 9.0, 17.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016876220703125, -0.016201257705688477, -0.015526294708251953, -0.01485133171081543, -0.014176368713378906, -0.013501405715942383, -0.01282644271850586, -0.012151479721069336, -0.011476516723632812, -0.010801553726196289, -0.010126590728759766, -0.009451627731323242, -0.008776664733886719, -0.008101701736450195, -0.007426738739013672, -0.0067517757415771484, -0.006076812744140625, -0.0054018497467041016, -0.004726886749267578, -0.004051923751831055, -0.0033769607543945312, -0.002701997756958008, -0.0020270347595214844, -0.001352071762084961, -0.0006771087646484375, -2.1457672119140625e-06, 0.0006728172302246094, 0.0013477802276611328, 0.0020227432250976562, 0.0026977062225341797, 0.003372669219970703, 0.0040476322174072266, 0.00472259521484375, 0.0053975582122802734, 0.006072521209716797, 0.00674748420715332, 0.007422447204589844, 0.008097410202026367, 0.00877237319946289, 0.009447336196899414, 0.010122299194335938, 0.010797262191772461, 0.011472225189208984, 0.012147188186645508, 0.012822151184082031, 0.013497114181518555, 0.014172077178955078, 0.014847040176391602, 0.015522003173828125, 0.01619696617126465, 0.016871929168701172, 0.017546892166137695, 0.01822185516357422, 0.018896818161010742, 0.019571781158447266, 0.02024674415588379, 0.020921707153320312, 0.021596670150756836, 0.02227163314819336, 0.022946596145629883, 0.023621559143066406, 0.02429652214050293, 0.024971485137939453, 0.025646448135375977, 0.0263214111328125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 6.0, 10.0, 15.0, 11.0, 18.0, 27.0, 44.0, 81.0, 145.0, 300.0, 1325.0, 584151.0, 460475.0, 1272.0, 292.0, 142.0, 61.0, 62.0, 36.0, 19.0, 13.0, 11.0, 9.0, 2.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.4482421875, -0.4364433288574219, -0.42464447021484375, -0.4128456115722656, -0.4010467529296875, -0.3892478942871094, -0.37744903564453125, -0.3656501770019531, -0.353851318359375, -0.3420524597167969, -0.33025360107421875, -0.3184547424316406, -0.3066558837890625, -0.2948570251464844, -0.28305816650390625, -0.2712593078613281, -0.25946044921875, -0.24766159057617188, -0.23586273193359375, -0.22406387329101562, -0.2122650146484375, -0.20046615600585938, -0.18866729736328125, -0.17686843872070312, -0.165069580078125, -0.15327072143554688, -0.14147186279296875, -0.12967300415039062, -0.1178741455078125, -0.10607528686523438, -0.09427642822265625, -0.08247756958007812, -0.0706787109375, -0.058879852294921875, -0.04708099365234375, -0.035282135009765625, -0.0234832763671875, -0.011684417724609375, 0.00011444091796875, 0.011913299560546875, 0.023712158203125, 0.035511016845703125, 0.04730987548828125, 0.059108734130859375, 0.0709075927734375, 0.08270645141601562, 0.09450531005859375, 0.10630416870117188, 0.11810302734375, 0.12990188598632812, 0.14170074462890625, 0.15349960327148438, 0.1652984619140625, 0.17709732055664062, 0.18889617919921875, 0.20069503784179688, 0.212493896484375, 0.22429275512695312, 0.23609161376953125, 0.24789047241210938, 0.2596893310546875, 0.2714881896972656, 0.28328704833984375, 0.2950859069824219, 0.306884765625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 61.0, 841.0, 104.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10077457129955292, -0.09508166462182999, -0.08938875049352646, -0.08369584381580353, -0.0780029296875, -0.07231002300977707, -0.06661711633205414, -0.06092420592904091, -0.05523129552602768, -0.04953838512301445, -0.04384547472000122, -0.03815256804227829, -0.03245965763926506, -0.02676674723625183, -0.0210738405585289, -0.01538093015551567, -0.009688019752502441, -0.003995110280811787, 0.001697799190878868, 0.007390707731246948, 0.013083618134260178, 0.018776528537273407, 0.024469435214996338, 0.030162345618009567, 0.0358552560210228, 0.041548166424036026, 0.047241076827049255, 0.052933983504772186, 0.058626893907785416, 0.06431980431079865, 0.07001271098852158, 0.0757056176662445, 0.08139854669570923, 0.08709145337343216, 0.09278436750173569, 0.09847727417945862, 0.10417018830776215, 0.10986309498548508, 0.11555600166320801, 0.12124891579151154, 0.12694182991981506, 0.1326347440481186, 0.13832764327526093, 0.14402055740356445, 0.14971347153186798, 0.1554063856601715, 0.16109928488731384, 0.16679219901561737, 0.1724850982427597, 0.17817801237106323, 0.18387091159820557, 0.1895638257265091, 0.19525673985481262, 0.20094963908195496, 0.20664255321025848, 0.212335467338562, 0.21802836656570435, 0.22372128069400787, 0.2294141799211502, 0.23510709404945374, 0.24080000817775726, 0.2464929223060608, 0.2521858215332031, 0.25787872076034546, 0.2635716497898102]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 0.0, 2.0, 5.0, 8.0, 13.0, 9.0, 12.0, 17.0, 12.0, 28.0, 26.0, 21.0, 28.0, 25.0, 33.0, 35.0, 41.0, 39.0, 44.0, 51.0, 49.0, 48.0, 44.0, 44.0, 57.0, 28.0, 28.0, 42.0, 32.0, 27.0, 27.0, 20.0, 16.0, 13.0, 20.0, 11.0, 14.0, 6.0, 6.0, 7.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01444321870803833, -0.014026072807610035, -0.01360892690718174, -0.013191781006753445, -0.01277463510632515, -0.012357489205896854, -0.01194034330546856, -0.011523197405040264, -0.011106051504611969, -0.010688905604183674, -0.010271759703755379, -0.009854613803327084, -0.009437467902898788, -0.009020322002470493, -0.008603176102042198, -0.008186030201613903, -0.007768884301185608, -0.007351738400757313, -0.006934592500329018, -0.0065174465999007225, -0.006100300699472427, -0.005683154799044132, -0.005266008898615837, -0.004848862998187542, -0.004431717097759247, -0.004014571197330952, -0.0035974252969026566, -0.0031802793964743614, -0.0027631334960460663, -0.002345987595617771, -0.001928841695189476, -0.0015116957947611809, -0.0010945498943328857, -0.0006774039939045906, -0.00026025809347629547, 0.00015688780695199966, 0.0005740337073802948, 0.00099117960780859, 0.001408325508236885, 0.0018254714086651802, 0.0022426173090934753, 0.0026597632095217705, 0.0030769091099500656, 0.0034940550103783607, 0.003911200910806656, 0.004328346811234951, 0.004745492711663246, 0.005162638612091541, 0.005579784512519836, 0.0059969304129481316, 0.006414076313376427, 0.006831222213804722, 0.007248368114233017, 0.007665514014661312, 0.008082659915089607, 0.008499805815517902, 0.008916951715946198, 0.009334097616374493, 0.009751243516802788, 0.010168389417231083, 0.010585535317659378, 0.011002681218087673, 0.011419827118515968, 0.011836973018944263, 0.012254118919372559]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 1.0, 4.0, 9.0, 9.0, 11.0, 18.0, 18.0, 20.0, 19.0, 20.0, 24.0, 31.0, 38.0, 44.0, 38.0, 45.0, 47.0, 51.0, 54.0, 31.0, 40.0, 43.0, 48.0, 44.0, 30.0, 35.0, 34.0, 23.0, 22.0, 31.0, 23.0, 20.0, 16.0, 11.0, 9.0, 11.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.16412353515625, -5.9454345703125, -5.72674560546875, -5.508056640625, -5.28936767578125, -5.0706787109375, -4.85198974609375, -4.63330078125, -4.41461181640625, -4.1959228515625, -3.97723388671875, -3.758544921875, -3.53985595703125, -3.3211669921875, -3.10247802734375, -2.8837890625, -2.66510009765625, -2.4464111328125, -2.22772216796875, -2.009033203125, -1.79034423828125, -1.5716552734375, -1.35296630859375, -1.13427734375, -0.91558837890625, -0.6968994140625, -0.47821044921875, -0.259521484375, -0.04083251953125, 0.1778564453125, 0.39654541015625, 0.615234375, 0.83392333984375, 1.0526123046875, 1.27130126953125, 1.489990234375, 1.70867919921875, 1.9273681640625, 2.14605712890625, 2.36474609375, 2.58343505859375, 2.8021240234375, 3.02081298828125, 3.239501953125, 3.45819091796875, 3.6768798828125, 3.89556884765625, 4.1142578125, 4.33294677734375, 4.5516357421875, 4.77032470703125, 4.989013671875, 5.20770263671875, 5.4263916015625, 5.64508056640625, 5.86376953125, 6.08245849609375, 6.3011474609375, 6.51983642578125, 6.738525390625, 6.95721435546875, 7.1759033203125, 7.39459228515625, 7.61328125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 3.0, 11.0, 9.0, 22.0, 23.0, 32.0, 49.0, 79.0, 68.0, 130.0, 208.0, 351.0, 598.0, 959.0, 1813.0, 3355.0, 6224.0, 12964.0, 27925.0, 69690.0, 211225.0, 441843.0, 166471.0, 57129.0, 23737.0, 11313.0, 5497.0, 2893.0, 1571.0, 907.0, 562.0, 261.0, 209.0, 136.0, 84.0, 68.0, 39.0, 29.0, 21.0, 17.0, 10.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.51953125, -4.388153076171875, -4.25677490234375, -4.125396728515625, -3.9940185546875, -3.862640380859375, -3.73126220703125, -3.599884033203125, -3.468505859375, -3.337127685546875, -3.20574951171875, -3.074371337890625, -2.9429931640625, -2.811614990234375, -2.68023681640625, -2.548858642578125, -2.41748046875, -2.286102294921875, -2.15472412109375, -2.023345947265625, -1.8919677734375, -1.760589599609375, -1.62921142578125, -1.497833251953125, -1.366455078125, -1.235076904296875, -1.10369873046875, -0.972320556640625, -0.8409423828125, -0.709564208984375, -0.57818603515625, -0.446807861328125, -0.3154296875, -0.184051513671875, -0.05267333984375, 0.078704833984375, 0.2100830078125, 0.341461181640625, 0.47283935546875, 0.604217529296875, 0.735595703125, 0.866973876953125, 0.99835205078125, 1.129730224609375, 1.2611083984375, 1.392486572265625, 1.52386474609375, 1.655242919921875, 1.78662109375, 1.917999267578125, 2.04937744140625, 2.180755615234375, 2.3121337890625, 2.443511962890625, 2.57489013671875, 2.706268310546875, 2.837646484375, 2.969024658203125, 3.10040283203125, 3.231781005859375, 3.3631591796875, 3.494537353515625, 3.62591552734375, 3.757293701171875, 3.888671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 9.0, 10.0, 9.0, 12.0, 14.0, 16.0, 14.0, 16.0, 19.0, 33.0, 28.0, 22.0, 31.0, 39.0, 37.0, 40.0, 52.0, 80.0, 184.0, 1762.0, 145.0, 60.0, 52.0, 41.0, 32.0, 37.0, 30.0, 28.0, 32.0, 22.0, 21.0, 16.0, 14.0, 20.0, 15.0, 9.0, 13.0, 8.0, 11.0, 3.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-24.625, -23.908935546875, -23.19287109375, -22.476806640625, -21.7607421875, -21.044677734375, -20.32861328125, -19.612548828125, -18.896484375, -18.180419921875, -17.46435546875, -16.748291015625, -16.0322265625, -15.316162109375, -14.60009765625, -13.884033203125, -13.16796875, -12.451904296875, -11.73583984375, -11.019775390625, -10.3037109375, -9.587646484375, -8.87158203125, -8.155517578125, -7.439453125, -6.723388671875, -6.00732421875, -5.291259765625, -4.5751953125, -3.859130859375, -3.14306640625, -2.427001953125, -1.7109375, -0.994873046875, -0.27880859375, 0.437255859375, 1.1533203125, 1.869384765625, 2.58544921875, 3.301513671875, 4.017578125, 4.733642578125, 5.44970703125, 6.165771484375, 6.8818359375, 7.597900390625, 8.31396484375, 9.030029296875, 9.74609375, 10.462158203125, 11.17822265625, 11.894287109375, 12.6103515625, 13.326416015625, 14.04248046875, 14.758544921875, 15.474609375, 16.190673828125, 16.90673828125, 17.622802734375, 18.3388671875, 19.054931640625, 19.77099609375, 20.487060546875, 21.203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 4.0, 6.0, 10.0, 8.0, 13.0, 9.0, 17.0, 20.0, 10.0, 21.0, 23.0, 28.0, 49.0, 52.0, 83.0, 120.0, 150.0, 267.0, 567.0, 1448.0, 18242.0, 3052714.0, 67950.0, 2299.0, 601.0, 318.0, 193.0, 148.0, 73.0, 42.0, 38.0, 34.0, 35.0, 16.0, 17.0, 13.0, 15.0, 9.0, 16.0, 8.0, 9.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.40625, -35.25537109375, -34.1044921875, -32.95361328125, -31.802734375, -30.65185546875, -29.5009765625, -28.35009765625, -27.19921875, -26.04833984375, -24.8974609375, -23.74658203125, -22.595703125, -21.44482421875, -20.2939453125, -19.14306640625, -17.9921875, -16.84130859375, -15.6904296875, -14.53955078125, -13.388671875, -12.23779296875, -11.0869140625, -9.93603515625, -8.78515625, -7.63427734375, -6.4833984375, -5.33251953125, -4.181640625, -3.03076171875, -1.8798828125, -0.72900390625, 0.421875, 1.57275390625, 2.7236328125, 3.87451171875, 5.025390625, 6.17626953125, 7.3271484375, 8.47802734375, 9.62890625, 10.77978515625, 11.9306640625, 13.08154296875, 14.232421875, 15.38330078125, 16.5341796875, 17.68505859375, 18.8359375, 19.98681640625, 21.1376953125, 22.28857421875, 23.439453125, 24.59033203125, 25.7412109375, 26.89208984375, 28.04296875, 29.19384765625, 30.3447265625, 31.49560546875, 32.646484375, 33.79736328125, 34.9482421875, 36.09912109375, 37.25]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 13.0, 109.0, 420.0, 393.0, 77.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.21961498260498, -8.356374740600586, -5.493134021759033, -2.6298933029174805, 0.23334693908691406, 3.0965871810913086, 5.9598283767700195, 8.823067665100098, 11.686308860778809, 14.549549102783203, 17.412790298461914, 20.276031494140625, 23.139270782470703, 26.00251007080078, 28.865753173828125, 31.728992462158203, 34.59223175048828, 37.45547103881836, 40.3187141418457, 43.18195343017578, 46.04519271850586, 48.90843200683594, 51.77167510986328, 54.63491439819336, 57.4981575012207, 60.36139678955078, 63.224639892578125, 66.08787536621094, 68.95111846923828, 71.81436157226562, 74.67759704589844, 77.54084014892578, 80.4040756225586, 83.26731872558594, 86.13055419921875, 88.9937973022461, 91.85704040527344, 94.72027587890625, 97.5835189819336, 100.44676208496094, 103.30999755859375, 106.1732406616211, 109.0364761352539, 111.89971923828125, 114.7629623413086, 117.6261978149414, 120.48944091796875, 123.35267639160156, 126.21592712402344, 129.07916259765625, 131.94241333007812, 134.80564880371094, 137.66888427734375, 140.53213500976562, 143.39537048339844, 146.25860595703125, 149.12184143066406, 151.98507690429688, 154.84832763671875, 157.71156311035156, 160.57479858398438, 163.43804931640625, 166.30128479003906, 169.16452026367188, 172.02777099609375]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 9.0, 2.0, 5.0, 9.0, 17.0, 5.0, 16.0, 13.0, 19.0, 20.0, 26.0, 23.0, 43.0, 41.0, 34.0, 37.0, 39.0, 48.0, 48.0, 47.0, 53.0, 39.0, 47.0, 38.0, 54.0, 30.0, 30.0, 28.0, 22.0, 26.0, 24.0, 17.0, 22.0, 14.0, 10.0, 8.0, 8.0, 4.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.22504425048828, -80.7425308227539, -78.26002502441406, -75.77751159667969, -73.29499816894531, -70.81249237060547, -68.3299789428711, -65.84747314453125, -63.364959716796875, -60.882450103759766, -58.399940490722656, -55.91742706298828, -53.43491744995117, -50.95240783691406, -48.46989440917969, -45.98738479614258, -43.50487518310547, -41.02236557006836, -38.53985595703125, -36.057342529296875, -33.574832916259766, -31.092323303222656, -28.609811782836914, -26.127300262451172, -23.644790649414062, -21.162281036376953, -18.67976951599121, -16.19725799560547, -13.71474838256836, -11.232237815856934, -8.749727249145508, -6.267215728759766, -3.784698486328125, -1.3021879196166992, 1.1803226470947266, 3.6628332138061523, 6.145343780517578, 8.627854347229004, 11.11036491394043, 13.592876434326172, 16.07538604736328, 18.55789566040039, 21.040407180786133, 23.522918701171875, 26.005428314208984, 28.487937927246094, 30.970449447631836, 33.45296096801758, 35.93547058105469, 38.4179801940918, 40.900489807128906, 43.38300323486328, 45.86551284790039, 48.3480224609375, 50.830535888671875, 53.313045501708984, 55.795555114746094, 58.2780647277832, 60.76057434082031, 63.24308776855469, 65.72560119628906, 68.2081069946289, 70.69062042236328, 73.17312622070312, 75.6556396484375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 4.0, 8.0, 9.0, 9.0, 15.0, 19.0, 22.0, 16.0, 24.0, 26.0, 28.0, 38.0, 44.0, 38.0, 50.0, 55.0, 45.0, 53.0, 44.0, 39.0, 40.0, 47.0, 33.0, 45.0, 34.0, 27.0, 32.0, 22.0, 25.0, 18.0, 24.0, 14.0, 10.0, 6.0, 13.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.83203125, -6.604248046875, -6.37646484375, -6.148681640625, -5.9208984375, -5.693115234375, -5.46533203125, -5.237548828125, -5.009765625, -4.781982421875, -4.55419921875, -4.326416015625, -4.0986328125, -3.870849609375, -3.64306640625, -3.415283203125, -3.1875, -2.959716796875, -2.73193359375, -2.504150390625, -2.2763671875, -2.048583984375, -1.82080078125, -1.593017578125, -1.365234375, -1.137451171875, -0.90966796875, -0.681884765625, -0.4541015625, -0.226318359375, 0.00146484375, 0.229248046875, 0.45703125, 0.684814453125, 0.91259765625, 1.140380859375, 1.3681640625, 1.595947265625, 1.82373046875, 2.051513671875, 2.279296875, 2.507080078125, 2.73486328125, 2.962646484375, 3.1904296875, 3.418212890625, 3.64599609375, 3.873779296875, 4.1015625, 4.329345703125, 4.55712890625, 4.784912109375, 5.0126953125, 5.240478515625, 5.46826171875, 5.696044921875, 5.923828125, 6.151611328125, 6.37939453125, 6.607177734375, 6.8349609375, 7.062744140625, 7.29052734375, 7.518310546875, 7.74609375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 10.0, 4.0, 12.0, 8.0, 19.0, 17.0, 38.0, 53.0, 81.0, 159.0, 312.0, 689.0, 1658.0, 4368.0, 13419.0, 46153.0, 192002.0, 1174809.0, 2190002.0, 445525.0, 89395.0, 23851.0, 7409.0, 2428.0, 919.0, 412.0, 221.0, 109.0, 55.0, 29.0, 26.0, 22.0, 18.0, 8.0, 7.0, 3.0, 5.0, 8.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.46875, -14.9736328125, -14.478515625, -13.9833984375, -13.48828125, -12.9931640625, -12.498046875, -12.0029296875, -11.5078125, -11.0126953125, -10.517578125, -10.0224609375, -9.52734375, -9.0322265625, -8.537109375, -8.0419921875, -7.546875, -7.0517578125, -6.556640625, -6.0615234375, -5.56640625, -5.0712890625, -4.576171875, -4.0810546875, -3.5859375, -3.0908203125, -2.595703125, -2.1005859375, -1.60546875, -1.1103515625, -0.615234375, -0.1201171875, 0.375, 0.8701171875, 1.365234375, 1.8603515625, 2.35546875, 2.8505859375, 3.345703125, 3.8408203125, 4.3359375, 4.8310546875, 5.326171875, 5.8212890625, 6.31640625, 6.8115234375, 7.306640625, 7.8017578125, 8.296875, 8.7919921875, 9.287109375, 9.7822265625, 10.27734375, 10.7724609375, 11.267578125, 11.7626953125, 12.2578125, 12.7529296875, 13.248046875, 13.7431640625, 14.23828125, 14.7333984375, 15.228515625, 15.7236328125, 16.21875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 5.0, 12.0, 14.0, 18.0, 15.0, 30.0, 29.0, 39.0, 50.0, 70.0, 97.0, 102.0, 153.0, 187.0, 250.0, 298.0, 383.0, 399.0, 390.0, 299.0, 258.0, 216.0, 159.0, 139.0, 97.0, 89.0, 73.0, 45.0, 37.0, 16.0, 26.0, 20.0, 12.0, 10.0, 7.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.21875, -14.723388671875, -14.22802734375, -13.732666015625, -13.2373046875, -12.741943359375, -12.24658203125, -11.751220703125, -11.255859375, -10.760498046875, -10.26513671875, -9.769775390625, -9.2744140625, -8.779052734375, -8.28369140625, -7.788330078125, -7.29296875, -6.797607421875, -6.30224609375, -5.806884765625, -5.3115234375, -4.816162109375, -4.32080078125, -3.825439453125, -3.330078125, -2.834716796875, -2.33935546875, -1.843994140625, -1.3486328125, -0.853271484375, -0.35791015625, 0.137451171875, 0.6328125, 1.128173828125, 1.62353515625, 2.118896484375, 2.6142578125, 3.109619140625, 3.60498046875, 4.100341796875, 4.595703125, 5.091064453125, 5.58642578125, 6.081787109375, 6.5771484375, 7.072509765625, 7.56787109375, 8.063232421875, 8.55859375, 9.053955078125, 9.54931640625, 10.044677734375, 10.5400390625, 11.035400390625, 11.53076171875, 12.026123046875, 12.521484375, 13.016845703125, 13.51220703125, 14.007568359375, 14.5029296875, 14.998291015625, 15.49365234375, 15.989013671875, 16.484375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 1.0, 9.0, 12.0, 17.0, 18.0, 32.0, 41.0, 63.0, 111.0, 155.0, 274.0, 631.0, 1542.0, 5510.0, 27388.0, 194616.0, 2028073.0, 1736428.0, 167516.0, 24269.0, 4907.0, 1409.0, 536.0, 279.0, 148.0, 89.0, 51.0, 45.0, 27.0, 27.0, 13.0, 5.0, 10.0, 10.0, 4.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.359375, -27.223388671875, -26.08740234375, -24.951416015625, -23.8154296875, -22.679443359375, -21.54345703125, -20.407470703125, -19.271484375, -18.135498046875, -16.99951171875, -15.863525390625, -14.7275390625, -13.591552734375, -12.45556640625, -11.319580078125, -10.18359375, -9.047607421875, -7.91162109375, -6.775634765625, -5.6396484375, -4.503662109375, -3.36767578125, -2.231689453125, -1.095703125, 0.040283203125, 1.17626953125, 2.312255859375, 3.4482421875, 4.584228515625, 5.72021484375, 6.856201171875, 7.9921875, 9.128173828125, 10.26416015625, 11.400146484375, 12.5361328125, 13.672119140625, 14.80810546875, 15.944091796875, 17.080078125, 18.216064453125, 19.35205078125, 20.488037109375, 21.6240234375, 22.760009765625, 23.89599609375, 25.031982421875, 26.16796875, 27.303955078125, 28.43994140625, 29.575927734375, 30.7119140625, 31.847900390625, 32.98388671875, 34.119873046875, 35.255859375, 36.391845703125, 37.52783203125, 38.663818359375, 39.7998046875, 40.935791015625, 42.07177734375, 43.207763671875, 44.34375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [2.0, 3.0, 19.0, 49.0, 136.0, 233.0, 246.0, 189.0, 95.0, 26.0, 17.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.7142219543457, -35.017738342285156, -28.32125473022461, -21.62476921081543, -14.928285598754883, -8.231800079345703, -1.5353164672851562, 5.161167144775391, 11.857650756835938, 18.554134368896484, 25.25061798095703, 31.94710350036621, 38.643585205078125, 45.34007263183594, 52.036556243896484, 58.73303985595703, 65.42951965332031, 72.12600708007812, 78.8224868774414, 85.51897430419922, 92.2154541015625, 98.91194152832031, 105.60842895507812, 112.3049087524414, 119.00139617919922, 125.69788360595703, 132.3943634033203, 139.09085083007812, 145.78733825683594, 152.48382568359375, 159.1802978515625, 165.8767852783203, 172.57325744628906, 179.26974487304688, 185.9662322998047, 192.66270446777344, 199.35919189453125, 206.05567932128906, 212.75216674804688, 219.44863891601562, 226.14512634277344, 232.84161376953125, 239.53810119628906, 246.2345733642578, 252.93106079101562, 259.6275634765625, 266.32403564453125, 273.0205078125, 279.7170104980469, 286.4134826660156, 293.1099853515625, 299.80645751953125, 306.5029602050781, 313.1994323730469, 319.8959045410156, 326.5924072265625, 333.28887939453125, 339.9853515625, 346.6818542480469, 353.3783264160156, 360.0748291015625, 366.77130126953125, 373.4677734375, 380.1642761230469, 386.8607482910156]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 3.0, 5.0, 7.0, 12.0, 7.0, 16.0, 18.0, 27.0, 19.0, 23.0, 25.0, 31.0, 33.0, 39.0, 28.0, 36.0, 39.0, 44.0, 33.0, 47.0, 50.0, 39.0, 42.0, 36.0, 32.0, 41.0, 34.0, 28.0, 25.0, 27.0, 32.0, 28.0, 24.0, 12.0, 7.0, 10.0, 6.0, 4.0, 7.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-63.13417053222656, -61.20676803588867, -59.27936935424805, -57.351966857910156, -55.424564361572266, -53.497161865234375, -51.56976318359375, -49.64236068725586, -47.71495819091797, -45.78755569458008, -43.86015701293945, -41.93275451660156, -40.00535202026367, -38.07794952392578, -36.150550842285156, -34.223148345947266, -32.29574966430664, -30.368349075317383, -28.440946578979492, -26.513545989990234, -24.586143493652344, -22.658742904663086, -20.731342315673828, -18.803939819335938, -16.87653923034668, -14.949137687683105, -13.021736145019531, -11.094335556030273, -9.1669340133667, -7.239532470703125, -5.312131881713867, -3.384730339050293, -1.4573287963867188, 0.47007250785827637, 2.3974738121032715, 4.3248748779296875, 6.252276420593262, 8.179677963256836, 10.107078552246094, 12.034480094909668, 13.961881637573242, 15.889283180236816, 17.81668472290039, 19.74408531188965, 21.671485900878906, 23.598888397216797, 25.526288986206055, 27.453689575195312, 29.381092071533203, 31.30849266052246, 33.23589324951172, 35.16329574584961, 37.0906982421875, 39.018096923828125, 40.945499420166016, 42.872901916503906, 44.80030059814453, 46.72770309448242, 48.65510177612305, 50.58250427246094, 52.50990676879883, 54.43730926513672, 56.364707946777344, 58.292110443115234, 60.219512939453125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 7.0, 6.0, 3.0, 6.0, 10.0, 7.0, 19.0, 9.0, 18.0, 27.0, 24.0, 29.0, 26.0, 33.0, 46.0, 51.0, 43.0, 41.0, 47.0, 45.0, 46.0, 37.0, 42.0, 40.0, 36.0, 42.0, 36.0, 34.0, 24.0, 19.0, 20.0, 19.0, 26.0, 19.0, 14.0, 10.0, 10.0, 12.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2890625, -7.0626220703125, -6.836181640625, -6.6097412109375, -6.38330078125, -6.1568603515625, -5.930419921875, -5.7039794921875, -5.4775390625, -5.2510986328125, -5.024658203125, -4.7982177734375, -4.57177734375, -4.3453369140625, -4.118896484375, -3.8924560546875, -3.666015625, -3.4395751953125, -3.213134765625, -2.9866943359375, -2.76025390625, -2.5338134765625, -2.307373046875, -2.0809326171875, -1.8544921875, -1.6280517578125, -1.401611328125, -1.1751708984375, -0.94873046875, -0.7222900390625, -0.495849609375, -0.2694091796875, -0.04296875, 0.1834716796875, 0.409912109375, 0.6363525390625, 0.86279296875, 1.0892333984375, 1.315673828125, 1.5421142578125, 1.7685546875, 1.9949951171875, 2.221435546875, 2.4478759765625, 2.67431640625, 2.9007568359375, 3.127197265625, 3.3536376953125, 3.580078125, 3.8065185546875, 4.032958984375, 4.2593994140625, 4.48583984375, 4.7122802734375, 4.938720703125, 5.1651611328125, 5.3916015625, 5.6180419921875, 5.844482421875, 6.0709228515625, 6.29736328125, 6.5238037109375, 6.750244140625, 6.9766845703125, 7.203125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 7.0, 15.0, 7.0, 12.0, 25.0, 31.0, 47.0, 66.0, 128.0, 187.0, 289.0, 433.0, 633.0, 978.0, 1516.0, 2326.0, 3842.0, 6050.0, 9938.0, 16630.0, 28606.0, 50714.0, 95793.0, 184277.0, 253487.0, 179554.0, 93944.0, 49148.0, 27674.0, 16058.0, 9702.0, 5973.0, 3781.0, 2457.0, 1436.0, 966.0, 680.0, 403.0, 265.0, 171.0, 105.0, 74.0, 44.0, 25.0, 23.0, 10.0, 6.0, 5.0, 9.0, 8.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0615234375, -1.028839111328125, -0.99615478515625, -0.963470458984375, -0.9307861328125, -0.898101806640625, -0.86541748046875, -0.832733154296875, -0.800048828125, -0.767364501953125, -0.73468017578125, -0.701995849609375, -0.6693115234375, -0.636627197265625, -0.60394287109375, -0.571258544921875, -0.53857421875, -0.505889892578125, -0.47320556640625, -0.440521240234375, -0.4078369140625, -0.375152587890625, -0.34246826171875, -0.309783935546875, -0.277099609375, -0.244415283203125, -0.21173095703125, -0.179046630859375, -0.1463623046875, -0.113677978515625, -0.08099365234375, -0.048309326171875, -0.015625, 0.017059326171875, 0.04974365234375, 0.082427978515625, 0.1151123046875, 0.147796630859375, 0.18048095703125, 0.213165283203125, 0.245849609375, 0.278533935546875, 0.31121826171875, 0.343902587890625, 0.3765869140625, 0.409271240234375, 0.44195556640625, 0.474639892578125, 0.50732421875, 0.540008544921875, 0.57269287109375, 0.605377197265625, 0.6380615234375, 0.670745849609375, 0.70343017578125, 0.736114501953125, 0.768798828125, 0.801483154296875, 0.83416748046875, 0.866851806640625, 0.8995361328125, 0.932220458984375, 0.96490478515625, 0.997589111328125, 1.0302734375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 10.0, 5.0, 11.0, 11.0, 17.0, 17.0, 23.0, 21.0, 26.0, 31.0, 29.0, 36.0, 22.0, 25.0, 40.0, 43.0, 40.0, 29.0, 42.0, 1064.0, 33.0, 51.0, 33.0, 34.0, 41.0, 31.0, 45.0, 33.0, 25.0, 18.0, 19.0, 18.0, 17.0, 18.0, 12.0, 11.0, 7.0, 6.0, 5.0, 4.0, 6.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1640625, -4.0267333984375, -3.889404296875, -3.7520751953125, -3.61474609375, -3.4774169921875, -3.340087890625, -3.2027587890625, -3.0654296875, -2.9281005859375, -2.790771484375, -2.6534423828125, -2.51611328125, -2.3787841796875, -2.241455078125, -2.1041259765625, -1.966796875, -1.8294677734375, -1.692138671875, -1.5548095703125, -1.41748046875, -1.2801513671875, -1.142822265625, -1.0054931640625, -0.8681640625, -0.7308349609375, -0.593505859375, -0.4561767578125, -0.31884765625, -0.1815185546875, -0.044189453125, 0.0931396484375, 0.23046875, 0.3677978515625, 0.505126953125, 0.6424560546875, 0.77978515625, 0.9171142578125, 1.054443359375, 1.1917724609375, 1.3291015625, 1.4664306640625, 1.603759765625, 1.7410888671875, 1.87841796875, 2.0157470703125, 2.153076171875, 2.2904052734375, 2.427734375, 2.5650634765625, 2.702392578125, 2.8397216796875, 2.97705078125, 3.1143798828125, 3.251708984375, 3.3890380859375, 3.5263671875, 3.6636962890625, 3.801025390625, 3.9383544921875, 4.07568359375, 4.2130126953125, 4.350341796875, 4.4876708984375, 4.625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 8.0, 13.0, 18.0, 31.0, 38.0, 71.0, 97.0, 126.0, 164.0, 271.0, 482.0, 597.0, 971.0, 1480.0, 2325.0, 3510.0, 5616.0, 8692.0, 14300.0, 23802.0, 40172.0, 68714.0, 111944.0, 166520.0, 1237813.0, 154912.0, 101426.0, 61450.0, 35956.0, 21040.0, 12887.0, 7666.0, 4875.0, 3185.0, 2060.0, 1303.0, 866.0, 569.0, 368.0, 259.0, 176.0, 122.0, 68.0, 58.0, 41.0, 29.0, 20.0, 10.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.60009765625, -0.581573486328125, -0.56304931640625, -0.544525146484375, -0.5260009765625, -0.507476806640625, -0.48895263671875, -0.470428466796875, -0.451904296875, -0.433380126953125, -0.41485595703125, -0.396331787109375, -0.3778076171875, -0.359283447265625, -0.34075927734375, -0.322235107421875, -0.3037109375, -0.285186767578125, -0.26666259765625, -0.248138427734375, -0.2296142578125, -0.211090087890625, -0.19256591796875, -0.174041748046875, -0.155517578125, -0.136993408203125, -0.11846923828125, -0.099945068359375, -0.0814208984375, -0.062896728515625, -0.04437255859375, -0.025848388671875, -0.00732421875, 0.011199951171875, 0.02972412109375, 0.048248291015625, 0.0667724609375, 0.085296630859375, 0.10382080078125, 0.122344970703125, 0.140869140625, 0.159393310546875, 0.17791748046875, 0.196441650390625, 0.2149658203125, 0.233489990234375, 0.25201416015625, 0.270538330078125, 0.2890625, 0.307586669921875, 0.32611083984375, 0.344635009765625, 0.3631591796875, 0.381683349609375, 0.40020751953125, 0.418731689453125, 0.437255859375, 0.455780029296875, 0.47430419921875, 0.492828369140625, 0.5113525390625, 0.529876708984375, 0.54840087890625, 0.566925048828125, 0.58544921875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 10.0, 15.0, 13.0, 30.0, 34.0, 47.0, 39.0, 56.0, 65.0, 81.0, 68.0, 73.0, 76.0, 65.0, 59.0, 57.0, 28.0, 37.0, 28.0, 20.0, 15.0, 9.0, 8.0, 9.0, 3.0, 2.0, 9.0, 3.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.0100250244140625, -0.00972294807434082, -0.00942087173461914, -0.009118795394897461, -0.008816719055175781, -0.008514642715454102, -0.008212566375732422, -0.007910490036010742, -0.0076084136962890625, -0.007306337356567383, -0.007004261016845703, -0.0067021846771240234, -0.006400108337402344, -0.006098031997680664, -0.005795955657958984, -0.005493879318237305, -0.005191802978515625, -0.004889726638793945, -0.004587650299072266, -0.004285573959350586, -0.003983497619628906, -0.0036814212799072266, -0.003379344940185547, -0.003077268600463867, -0.0027751922607421875, -0.002473115921020508, -0.002171039581298828, -0.0018689632415771484, -0.0015668869018554688, -0.001264810562133789, -0.0009627342224121094, -0.0006606578826904297, -0.00035858154296875, -5.650520324707031e-05, 0.0002455711364746094, 0.0005476474761962891, 0.0008497238159179688, 0.0011518001556396484, 0.0014538764953613281, 0.0017559528350830078, 0.0020580291748046875, 0.002360105514526367, 0.002662181854248047, 0.0029642581939697266, 0.0032663345336914062, 0.003568410873413086, 0.0038704872131347656, 0.004172563552856445, 0.004474639892578125, 0.004776716232299805, 0.005078792572021484, 0.005380868911743164, 0.005682945251464844, 0.0059850215911865234, 0.006287097930908203, 0.006589174270629883, 0.0068912506103515625, 0.007193326950073242, 0.007495403289794922, 0.0077974796295166016, 0.008099555969238281, 0.008401632308959961, 0.00870370864868164, 0.00900578498840332, 0.009307861328125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 6.0, 2.0, 3.0, 4.0, 7.0, 18.0, 17.0, 29.0, 22.0, 28.0, 53.0, 67.0, 82.0, 155.0, 226.0, 453.0, 2396.0, 65992.0, 947686.0, 28853.0, 1387.0, 372.0, 176.0, 133.0, 105.0, 70.0, 46.0, 28.0, 29.0, 33.0, 22.0, 9.0, 6.0, 5.0, 6.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1795654296875, -0.17402267456054688, -0.16847991943359375, -0.16293716430664062, -0.1573944091796875, -0.15185165405273438, -0.14630889892578125, -0.14076614379882812, -0.135223388671875, -0.12968063354492188, -0.12413787841796875, -0.11859512329101562, -0.1130523681640625, -0.10750961303710938, -0.10196685791015625, -0.09642410278320312, -0.09088134765625, -0.08533859252929688, -0.07979583740234375, -0.07425308227539062, -0.0687103271484375, -0.06316757202148438, -0.05762481689453125, -0.052082061767578125, -0.046539306640625, -0.040996551513671875, -0.03545379638671875, -0.029911041259765625, -0.0243682861328125, -0.018825531005859375, -0.01328277587890625, -0.007740020751953125, -0.002197265625, 0.003345489501953125, 0.00888824462890625, 0.014430999755859375, 0.0199737548828125, 0.025516510009765625, 0.03105926513671875, 0.036602020263671875, 0.042144775390625, 0.047687530517578125, 0.05323028564453125, 0.058773040771484375, 0.0643157958984375, 0.06985855102539062, 0.07540130615234375, 0.08094406127929688, 0.08648681640625, 0.09202957153320312, 0.09757232666015625, 0.10311508178710938, 0.1086578369140625, 0.11420059204101562, 0.11974334716796875, 0.12528610229492188, 0.130828857421875, 0.13637161254882812, 0.14191436767578125, 0.14745712280273438, 0.1529998779296875, 0.15854263305664062, 0.16408538818359375, 0.16962814331054688, 0.1751708984375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 10.0, 10.0, 50.0, 218.0, 586.0, 119.0, 20.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06401921063661575, -0.061771370470523834, -0.059523530304431915, -0.057275690138339996, -0.05502784997224808, -0.05278000980615616, -0.05053216591477394, -0.04828432574868202, -0.0460364855825901, -0.043788645416498184, -0.041540805250406265, -0.039292965084314346, -0.03704512119293213, -0.03479728102684021, -0.03254944086074829, -0.030301600694656372, -0.028053760528564453, -0.025805920362472534, -0.023558080196380615, -0.021310238167643547, -0.019062398001551628, -0.01681455783545971, -0.014566716738045216, -0.012318875640630722, -0.010071035474538803, -0.007823195308446884, -0.005575354211032391, -0.0033275135792791843, -0.001079672947525978, 0.0011681672185659409, 0.0034160083159804344, 0.005663849413394928, 0.00791168212890625, 0.010159522294998169, 0.012407363392412663, 0.014655204489827156, 0.016903044655919075, 0.019150884822010994, 0.021398726850748062, 0.02364656701683998, 0.0258944071829319, 0.02814224734902382, 0.030390087515115738, 0.03263792768120766, 0.034885771572589874, 0.03713361173868179, 0.03938145190477371, 0.04162929207086563, 0.04387713223695755, 0.04612497240304947, 0.04837281256914139, 0.05062065273523331, 0.052868492901325226, 0.055116333067417145, 0.05736417695879936, 0.05961201712489128, 0.0618598572909832, 0.06410770118236542, 0.06635554134845734, 0.06860338151454926, 0.07085122168064117, 0.0730990618467331, 0.07534690201282501, 0.07759474217891693, 0.07984258234500885]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 5.0, 8.0, 8.0, 6.0, 4.0, 17.0, 17.0, 27.0, 34.0, 31.0, 33.0, 38.0, 39.0, 47.0, 44.0, 34.0, 42.0, 52.0, 54.0, 51.0, 48.0, 51.0, 47.0, 40.0, 46.0, 28.0, 25.0, 25.0, 15.0, 26.0, 12.0, 9.0, 15.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00861513614654541, -0.00834089145064354, -0.008066646754741669, -0.007792402058839798, -0.007518157362937927, -0.0072439126670360565, -0.006969667971134186, -0.006695423275232315, -0.006421178579330444, -0.006146933883428574, -0.005872689187526703, -0.005598444491624832, -0.005324199795722961, -0.005049955099821091, -0.00477571040391922, -0.004501465708017349, -0.0042272210121154785, -0.003952976316213608, -0.003678731620311737, -0.0034044869244098663, -0.0031302422285079956, -0.002855997532606125, -0.002581752836704254, -0.0023075081408023834, -0.0020332634449005127, -0.001759018748998642, -0.0014847740530967712, -0.0012105293571949005, -0.0009362846612930298, -0.0006620399653911591, -0.00038779526948928833, -0.0001135505735874176, 0.00016069412231445312, 0.00043493881821632385, 0.0007091835141181946, 0.0009834282100200653, 0.001257672905921936, 0.0015319176018238068, 0.0018061622977256775, 0.0020804069936275482, 0.002354651689529419, 0.0026288963854312897, 0.0029031410813331604, 0.003177385777235031, 0.003451630473136902, 0.0037258751690387726, 0.004000119864940643, 0.004274364560842514, 0.004548609256744385, 0.0048228539526462555, 0.005097098648548126, 0.005371343344449997, 0.005645588040351868, 0.005919832736253738, 0.006194077432155609, 0.00646832212805748, 0.006742566823959351, 0.007016811519861221, 0.007291056215763092, 0.007565300911664963, 0.007839545607566833, 0.008113790303468704, 0.008388034999370575, 0.008662279695272446, 0.008936524391174316]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 7.0, 6.0, 3.0, 6.0, 10.0, 7.0, 19.0, 9.0, 18.0, 27.0, 24.0, 29.0, 26.0, 33.0, 46.0, 51.0, 43.0, 41.0, 47.0, 45.0, 46.0, 37.0, 42.0, 40.0, 36.0, 42.0, 36.0, 34.0, 24.0, 19.0, 20.0, 19.0, 26.0, 19.0, 14.0, 10.0, 10.0, 12.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2890625, -7.0626220703125, -6.836181640625, -6.6097412109375, -6.38330078125, -6.1568603515625, -5.930419921875, -5.7039794921875, -5.4775390625, -5.2510986328125, -5.024658203125, -4.7982177734375, -4.57177734375, -4.3453369140625, -4.118896484375, -3.8924560546875, -3.666015625, -3.4395751953125, -3.213134765625, -2.9866943359375, -2.76025390625, -2.5338134765625, -2.307373046875, -2.0809326171875, -1.8544921875, -1.6280517578125, -1.401611328125, -1.1751708984375, -0.94873046875, -0.7222900390625, -0.495849609375, -0.2694091796875, -0.04296875, 0.1834716796875, 0.409912109375, 0.6363525390625, 0.86279296875, 1.0892333984375, 1.315673828125, 1.5421142578125, 1.7685546875, 1.9949951171875, 2.221435546875, 2.4478759765625, 2.67431640625, 2.9007568359375, 3.127197265625, 3.3536376953125, 3.580078125, 3.8065185546875, 4.032958984375, 4.2593994140625, 4.48583984375, 4.7122802734375, 4.938720703125, 5.1651611328125, 5.3916015625, 5.6180419921875, 5.844482421875, 6.0709228515625, 6.29736328125, 6.5238037109375, 6.750244140625, 6.9766845703125, 7.203125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 4.0, 12.0, 9.0, 17.0, 29.0, 39.0, 49.0, 83.0, 83.0, 145.0, 186.0, 212.0, 298.0, 416.0, 619.0, 781.0, 1083.0, 1508.0, 2260.0, 3271.0, 5449.0, 8762.0, 16136.0, 33893.0, 88638.0, 301354.0, 378299.0, 116489.0, 41297.0, 18814.0, 10122.0, 5922.0, 3833.0, 2480.0, 1691.0, 1146.0, 790.0, 604.0, 447.0, 339.0, 244.0, 192.0, 151.0, 94.0, 58.0, 67.0, 45.0, 30.0, 23.0, 13.0, 9.0, 13.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.83984375, -4.68914794921875, -4.5384521484375, -4.38775634765625, -4.237060546875, -4.08636474609375, -3.9356689453125, -3.78497314453125, -3.63427734375, -3.48358154296875, -3.3328857421875, -3.18218994140625, -3.031494140625, -2.88079833984375, -2.7301025390625, -2.57940673828125, -2.4287109375, -2.27801513671875, -2.1273193359375, -1.97662353515625, -1.825927734375, -1.67523193359375, -1.5245361328125, -1.37384033203125, -1.22314453125, -1.07244873046875, -0.9217529296875, -0.77105712890625, -0.620361328125, -0.46966552734375, -0.3189697265625, -0.16827392578125, -0.017578125, 0.13311767578125, 0.2838134765625, 0.43450927734375, 0.585205078125, 0.73590087890625, 0.8865966796875, 1.03729248046875, 1.18798828125, 1.33868408203125, 1.4893798828125, 1.64007568359375, 1.790771484375, 1.94146728515625, 2.0921630859375, 2.24285888671875, 2.3935546875, 2.54425048828125, 2.6949462890625, 2.84564208984375, 2.996337890625, 3.14703369140625, 3.2977294921875, 3.44842529296875, 3.59912109375, 3.74981689453125, 3.9005126953125, 4.05120849609375, 4.201904296875, 4.35260009765625, 4.5032958984375, 4.65399169921875, 4.8046875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 3.0, 7.0, 9.0, 11.0, 16.0, 19.0, 24.0, 21.0, 41.0, 34.0, 48.0, 51.0, 58.0, 69.0, 187.0, 1842.0, 144.0, 60.0, 57.0, 54.0, 42.0, 48.0, 43.0, 29.0, 31.0, 17.0, 14.0, 16.0, 12.0, 4.0, 11.0, 5.0, 7.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.796875, -24.820556640625, -23.84423828125, -22.867919921875, -21.8916015625, -20.915283203125, -19.93896484375, -18.962646484375, -17.986328125, -17.010009765625, -16.03369140625, -15.057373046875, -14.0810546875, -13.104736328125, -12.12841796875, -11.152099609375, -10.17578125, -9.199462890625, -8.22314453125, -7.246826171875, -6.2705078125, -5.294189453125, -4.31787109375, -3.341552734375, -2.365234375, -1.388916015625, -0.41259765625, 0.563720703125, 1.5400390625, 2.516357421875, 3.49267578125, 4.468994140625, 5.4453125, 6.421630859375, 7.39794921875, 8.374267578125, 9.3505859375, 10.326904296875, 11.30322265625, 12.279541015625, 13.255859375, 14.232177734375, 15.20849609375, 16.184814453125, 17.1611328125, 18.137451171875, 19.11376953125, 20.090087890625, 21.06640625, 22.042724609375, 23.01904296875, 23.995361328125, 24.9716796875, 25.947998046875, 26.92431640625, 27.900634765625, 28.876953125, 29.853271484375, 30.82958984375, 31.805908203125, 32.7822265625, 33.758544921875, 34.73486328125, 35.711181640625, 36.6875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 7.0, 6.0, 11.0, 8.0, 13.0, 14.0, 15.0, 22.0, 28.0, 41.0, 72.0, 95.0, 154.0, 208.0, 447.0, 1146.0, 20089.0, 3092006.0, 28937.0, 1278.0, 459.0, 239.0, 133.0, 70.0, 58.0, 46.0, 22.0, 20.0, 19.0, 11.0, 6.0, 7.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.09375, -59.46630859375, -57.8388671875, -56.21142578125, -54.583984375, -52.95654296875, -51.3291015625, -49.70166015625, -48.07421875, -46.44677734375, -44.8193359375, -43.19189453125, -41.564453125, -39.93701171875, -38.3095703125, -36.68212890625, -35.0546875, -33.42724609375, -31.7998046875, -30.17236328125, -28.544921875, -26.91748046875, -25.2900390625, -23.66259765625, -22.03515625, -20.40771484375, -18.7802734375, -17.15283203125, -15.525390625, -13.89794921875, -12.2705078125, -10.64306640625, -9.015625, -7.38818359375, -5.7607421875, -4.13330078125, -2.505859375, -0.87841796875, 0.7490234375, 2.37646484375, 4.00390625, 5.63134765625, 7.2587890625, 8.88623046875, 10.513671875, 12.14111328125, 13.7685546875, 15.39599609375, 17.0234375, 18.65087890625, 20.2783203125, 21.90576171875, 23.533203125, 25.16064453125, 26.7880859375, 28.41552734375, 30.04296875, 31.67041015625, 33.2978515625, 34.92529296875, 36.552734375, 38.18017578125, 39.8076171875, 41.43505859375, 43.0625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [31.0, 553.0, 403.0, 28.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.018672943115234, -5.344668388366699, 0.32933616638183594, 6.0033416748046875, 11.677345275878906, 17.351348876953125, 23.02535629272461, 28.699359893798828, 34.37336349487305, 40.047367095947266, 45.72137451171875, 51.39537811279297, 57.06938171386719, 62.743385314941406, 68.41738891601562, 74.09140014648438, 79.76539611816406, 85.43939971923828, 91.1134033203125, 96.78741455078125, 102.46141052246094, 108.13542175292969, 113.8094253540039, 119.48342895507812, 125.15744018554688, 130.83145141601562, 136.5054473876953, 142.17945861816406, 147.85345458984375, 153.5274658203125, 159.20147705078125, 164.87547302246094, 170.54946899414062, 176.22348022460938, 181.89747619628906, 187.5714874267578, 193.2454833984375, 198.91949462890625, 204.593505859375, 210.2675018310547, 215.94149780273438, 221.61550903320312, 227.2895050048828, 232.96351623535156, 238.63751220703125, 244.3115234375, 249.98553466796875, 255.65953063964844, 261.33355712890625, 267.007568359375, 272.68157958984375, 278.3555603027344, 284.0295715332031, 289.7035827636719, 295.3775939941406, 301.05157470703125, 306.7255859375, 312.39959716796875, 318.0736083984375, 323.7475891113281, 329.4216003417969, 335.0956115722656, 340.7696228027344, 346.443603515625, 352.11761474609375]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 12.0, 10.0, 7.0, 15.0, 13.0, 20.0, 23.0, 25.0, 20.0, 38.0, 21.0, 25.0, 20.0, 32.0, 25.0, 41.0, 35.0, 36.0, 38.0, 40.0, 36.0, 41.0, 37.0, 35.0, 33.0, 36.0, 31.0, 30.0, 33.0, 15.0, 30.0, 19.0, 16.0, 20.0, 19.0, 11.0, 14.0, 11.0, 6.0, 8.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-72.92232513427734, -70.63267517089844, -68.34303283691406, -66.05338287353516, -63.76373291015625, -61.474082946777344, -59.1844367980957, -56.89479064941406, -54.605140686035156, -52.31549072265625, -50.02584457397461, -47.73619842529297, -45.44654846191406, -43.156898498535156, -40.867252349853516, -38.577606201171875, -36.28795623779297, -33.99830627441406, -31.708660125732422, -29.41901206970215, -27.129364013671875, -24.8397159576416, -22.550067901611328, -20.260419845581055, -17.97077178955078, -15.681123733520508, -13.391475677490234, -11.101827621459961, -8.812179565429688, -6.522531509399414, -4.232883453369141, -1.9432353973388672, 0.3464202880859375, 2.636068344116211, 4.925716400146484, 7.215364456176758, 9.505012512207031, 11.794660568237305, 14.084308624267578, 16.37395668029785, 18.663604736328125, 20.9532527923584, 23.242900848388672, 25.532548904418945, 27.82219696044922, 30.111845016479492, 32.401493072509766, 34.691139221191406, 36.98078918457031, 39.27043914794922, 41.56008529663086, 43.8497314453125, 46.139381408691406, 48.42903137207031, 50.71867752075195, 53.008323669433594, 55.2979736328125, 57.587623596191406, 59.87726974487305, 62.16691589355469, 64.4565658569336, 66.7462158203125, 69.03585815429688, 71.32550811767578, 73.61515808105469]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 5.0, 9.0, 4.0, 4.0, 5.0, 12.0, 9.0, 12.0, 12.0, 10.0, 31.0, 23.0, 32.0, 23.0, 29.0, 49.0, 41.0, 33.0, 59.0, 42.0, 53.0, 41.0, 38.0, 48.0, 37.0, 48.0, 35.0, 34.0, 36.0, 26.0, 18.0, 18.0, 20.0, 18.0, 29.0, 16.0, 14.0, 6.0, 11.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.73046875, -7.49920654296875, -7.2679443359375, -7.03668212890625, -6.805419921875, -6.57415771484375, -6.3428955078125, -6.11163330078125, -5.88037109375, -5.64910888671875, -5.4178466796875, -5.18658447265625, -4.955322265625, -4.72406005859375, -4.4927978515625, -4.26153564453125, -4.0302734375, -3.79901123046875, -3.5677490234375, -3.33648681640625, -3.105224609375, -2.87396240234375, -2.6427001953125, -2.41143798828125, -2.18017578125, -1.94891357421875, -1.7176513671875, -1.48638916015625, -1.255126953125, -1.02386474609375, -0.7926025390625, -0.56134033203125, -0.330078125, -0.09881591796875, 0.1324462890625, 0.36370849609375, 0.594970703125, 0.82623291015625, 1.0574951171875, 1.28875732421875, 1.52001953125, 1.75128173828125, 1.9825439453125, 2.21380615234375, 2.445068359375, 2.67633056640625, 2.9075927734375, 3.13885498046875, 3.3701171875, 3.60137939453125, 3.8326416015625, 4.06390380859375, 4.295166015625, 4.52642822265625, 4.7576904296875, 4.98895263671875, 5.22021484375, 5.45147705078125, 5.6827392578125, 5.91400146484375, 6.145263671875, 6.37652587890625, 6.6077880859375, 6.83905029296875, 7.0703125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 0.0, 1.0, 2.0, 7.0, 3.0, 6.0, 4.0, 11.0, 11.0, 8.0, 22.0, 22.0, 32.0, 51.0, 57.0, 91.0, 256.0, 567.0, 1523.0, 5520.0, 23396.0, 134177.0, 1357540.0, 2352944.0, 266274.0, 39673.0, 8331.0, 2346.0, 729.0, 293.0, 115.0, 75.0, 44.0, 41.0, 23.0, 19.0, 15.0, 15.0, 11.0, 10.0, 7.0, 10.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.96875, -22.29638671875, -21.6240234375, -20.95166015625, -20.279296875, -19.60693359375, -18.9345703125, -18.26220703125, -17.58984375, -16.91748046875, -16.2451171875, -15.57275390625, -14.900390625, -14.22802734375, -13.5556640625, -12.88330078125, -12.2109375, -11.53857421875, -10.8662109375, -10.19384765625, -9.521484375, -8.84912109375, -8.1767578125, -7.50439453125, -6.83203125, -6.15966796875, -5.4873046875, -4.81494140625, -4.142578125, -3.47021484375, -2.7978515625, -2.12548828125, -1.453125, -0.78076171875, -0.1083984375, 0.56396484375, 1.236328125, 1.90869140625, 2.5810546875, 3.25341796875, 3.92578125, 4.59814453125, 5.2705078125, 5.94287109375, 6.615234375, 7.28759765625, 7.9599609375, 8.63232421875, 9.3046875, 9.97705078125, 10.6494140625, 11.32177734375, 11.994140625, 12.66650390625, 13.3388671875, 14.01123046875, 14.68359375, 15.35595703125, 16.0283203125, 16.70068359375, 17.373046875, 18.04541015625, 18.7177734375, 19.39013671875, 20.0625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 9.0, 8.0, 9.0, 5.0, 8.0, 13.0, 23.0, 20.0, 39.0, 50.0, 43.0, 82.0, 85.0, 131.0, 150.0, 198.0, 235.0, 279.0, 345.0, 392.0, 331.0, 336.0, 236.0, 213.0, 163.0, 157.0, 124.0, 91.0, 78.0, 45.0, 50.0, 29.0, 26.0, 22.0, 9.0, 7.0, 7.0, 11.0, 4.0, 9.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.109375, -16.6309814453125, -16.152587890625, -15.6741943359375, -15.19580078125, -14.7174072265625, -14.239013671875, -13.7606201171875, -13.2822265625, -12.8038330078125, -12.325439453125, -11.8470458984375, -11.36865234375, -10.8902587890625, -10.411865234375, -9.9334716796875, -9.455078125, -8.9766845703125, -8.498291015625, -8.0198974609375, -7.54150390625, -7.0631103515625, -6.584716796875, -6.1063232421875, -5.6279296875, -5.1495361328125, -4.671142578125, -4.1927490234375, -3.71435546875, -3.2359619140625, -2.757568359375, -2.2791748046875, -1.80078125, -1.3223876953125, -0.843994140625, -0.3656005859375, 0.11279296875, 0.5911865234375, 1.069580078125, 1.5479736328125, 2.0263671875, 2.5047607421875, 2.983154296875, 3.4615478515625, 3.93994140625, 4.4183349609375, 4.896728515625, 5.3751220703125, 5.853515625, 6.3319091796875, 6.810302734375, 7.2886962890625, 7.76708984375, 8.2454833984375, 8.723876953125, 9.2022705078125, 9.6806640625, 10.1590576171875, 10.637451171875, 11.1158447265625, 11.59423828125, 12.0726318359375, 12.551025390625, 13.0294189453125, 13.5078125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 12.0, 14.0, 24.0, 27.0, 40.0, 61.0, 72.0, 112.0, 226.0, 453.0, 1386.0, 6404.0, 49160.0, 574423.0, 3106072.0, 411592.0, 37050.0, 5070.0, 1128.0, 402.0, 199.0, 107.0, 68.0, 54.0, 43.0, 31.0, 16.0, 11.0, 12.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.9375, -32.65380859375, -31.3701171875, -30.08642578125, -28.802734375, -27.51904296875, -26.2353515625, -24.95166015625, -23.66796875, -22.38427734375, -21.1005859375, -19.81689453125, -18.533203125, -17.24951171875, -15.9658203125, -14.68212890625, -13.3984375, -12.11474609375, -10.8310546875, -9.54736328125, -8.263671875, -6.97998046875, -5.6962890625, -4.41259765625, -3.12890625, -1.84521484375, -0.5615234375, 0.72216796875, 2.005859375, 3.28955078125, 4.5732421875, 5.85693359375, 7.140625, 8.42431640625, 9.7080078125, 10.99169921875, 12.275390625, 13.55908203125, 14.8427734375, 16.12646484375, 17.41015625, 18.69384765625, 19.9775390625, 21.26123046875, 22.544921875, 23.82861328125, 25.1123046875, 26.39599609375, 27.6796875, 28.96337890625, 30.2470703125, 31.53076171875, 32.814453125, 34.09814453125, 35.3818359375, 36.66552734375, 37.94921875, 39.23291015625, 40.5166015625, 41.80029296875, 43.083984375, 44.36767578125, 45.6513671875, 46.93505859375, 48.21875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 8.0, 8.0, 22.0, 32.0, 67.0, 114.0, 120.0, 153.0, 150.0, 136.0, 82.0, 54.0, 35.0, 17.0, 12.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.15119171142578, -101.86615753173828, -97.58111572265625, -93.29608154296875, -89.01104736328125, -84.72601318359375, -80.44097900390625, -76.15593719482422, -71.87090301513672, -67.58586883544922, -63.30083084106445, -59.01579284667969, -54.73075866699219, -50.44572448730469, -46.16068649291992, -41.875648498535156, -37.590614318847656, -33.305580139160156, -29.02054214477539, -24.735506057739258, -20.450469970703125, -16.165433883666992, -11.88039779663086, -7.595361709594727, -3.3103256225585938, 0.9747104644775391, 5.259746551513672, 9.544782638549805, 13.829818725585938, 18.11485481262207, 22.399890899658203, 26.684926986694336, 30.969955444335938, 35.25498962402344, 39.5400276184082, 43.82506561279297, 48.11009979248047, 52.39513397216797, 56.680171966552734, 60.9652099609375, 65.250244140625, 69.5352783203125, 73.8203125, 78.10535430908203, 82.39038848876953, 86.67542266845703, 90.96046447753906, 95.24549865722656, 99.53053283691406, 103.81556701660156, 108.10060119628906, 112.3856430053711, 116.6706771850586, 120.9557113647461, 125.24075317382812, 129.52578735351562, 133.81082153320312, 138.09585571289062, 142.38088989257812, 146.66592407226562, 150.95095825195312, 155.2360076904297, 159.5210418701172, 163.8060760498047, 168.0911102294922]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 5.0, 5.0, 9.0, 10.0, 15.0, 4.0, 12.0, 13.0, 23.0, 20.0, 30.0, 19.0, 21.0, 35.0, 33.0, 45.0, 35.0, 25.0, 41.0, 33.0, 30.0, 32.0, 42.0, 46.0, 30.0, 38.0, 36.0, 23.0, 36.0, 25.0, 32.0, 24.0, 16.0, 21.0, 20.0, 16.0, 13.0, 13.0, 17.0, 8.0, 13.0, 8.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-54.22406005859375, -52.52210235595703, -50.82014846801758, -49.118194580078125, -47.416236877441406, -45.71427917480469, -44.012325286865234, -42.31037139892578, -40.60841369628906, -38.906455993652344, -37.20450210571289, -35.50254821777344, -33.80059051513672, -32.0986328125, -30.396678924560547, -28.69472312927246, -26.992767333984375, -25.29081153869629, -23.588855743408203, -21.886899948120117, -20.18494415283203, -18.482988357543945, -16.78103256225586, -15.079076766967773, -13.377120971679688, -11.675165176391602, -9.973209381103516, -8.27125358581543, -6.569297790527344, -4.867341995239258, -3.165386199951172, -1.463430404663086, 0.238525390625, 1.940481185913086, 3.642436981201172, 5.344392776489258, 7.046348571777344, 8.74830436706543, 10.450260162353516, 12.152215957641602, 13.854171752929688, 15.556127548217773, 17.25808334350586, 18.960039138793945, 20.66199493408203, 22.363950729370117, 24.065906524658203, 25.76786231994629, 27.469818115234375, 29.17177391052246, 30.873729705810547, 32.57568359375, 34.27764129638672, 35.97959899902344, 37.68155288696289, 39.383506774902344, 41.08546447753906, 42.78742218017578, 44.489376068115234, 46.19132995605469, 47.893287658691406, 49.595245361328125, 51.29719924926758, 52.99915313720703, 54.70111083984375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 3.0, 2.0, 4.0, 5.0, 7.0, 13.0, 9.0, 14.0, 16.0, 22.0, 20.0, 34.0, 24.0, 27.0, 30.0, 31.0, 36.0, 50.0, 30.0, 57.0, 43.0, 46.0, 35.0, 49.0, 38.0, 31.0, 45.0, 38.0, 23.0, 28.0, 27.0, 28.0, 20.0, 16.0, 15.0, 26.0, 8.0, 11.0, 9.0, 9.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1015625, -6.87615966796875, -6.6507568359375, -6.42535400390625, -6.199951171875, -5.97454833984375, -5.7491455078125, -5.52374267578125, -5.29833984375, -5.07293701171875, -4.8475341796875, -4.62213134765625, -4.396728515625, -4.17132568359375, -3.9459228515625, -3.72052001953125, -3.4951171875, -3.26971435546875, -3.0443115234375, -2.81890869140625, -2.593505859375, -2.36810302734375, -2.1427001953125, -1.91729736328125, -1.69189453125, -1.46649169921875, -1.2410888671875, -1.01568603515625, -0.790283203125, -0.56488037109375, -0.3394775390625, -0.11407470703125, 0.111328125, 0.33673095703125, 0.5621337890625, 0.78753662109375, 1.012939453125, 1.23834228515625, 1.4637451171875, 1.68914794921875, 1.91455078125, 2.13995361328125, 2.3653564453125, 2.59075927734375, 2.816162109375, 3.04156494140625, 3.2669677734375, 3.49237060546875, 3.7177734375, 3.94317626953125, 4.1685791015625, 4.39398193359375, 4.619384765625, 4.84478759765625, 5.0701904296875, 5.29559326171875, 5.52099609375, 5.74639892578125, 5.9718017578125, 6.19720458984375, 6.422607421875, 6.64801025390625, 6.8734130859375, 7.09881591796875, 7.32421875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 6.0, 8.0, 8.0, 17.0, 24.0, 46.0, 75.0, 117.0, 152.0, 282.0, 439.0, 752.0, 1215.0, 2228.0, 3904.0, 6723.0, 11610.0, 21279.0, 39604.0, 77772.0, 162681.0, 281387.0, 217157.0, 106498.0, 51701.0, 27691.0, 15058.0, 8436.0, 4700.0, 2830.0, 1632.0, 978.0, 566.0, 340.0, 219.0, 145.0, 88.0, 68.0, 41.0, 23.0, 12.0, 13.0, 16.0, 9.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.349609375, -1.3070526123046875, -1.264495849609375, -1.2219390869140625, -1.17938232421875, -1.1368255615234375, -1.094268798828125, -1.0517120361328125, -1.0091552734375, -0.9665985107421875, -0.924041748046875, -0.8814849853515625, -0.83892822265625, -0.7963714599609375, -0.753814697265625, -0.7112579345703125, -0.668701171875, -0.6261444091796875, -0.583587646484375, -0.5410308837890625, -0.49847412109375, -0.4559173583984375, -0.413360595703125, -0.3708038330078125, -0.3282470703125, -0.2856903076171875, -0.243133544921875, -0.2005767822265625, -0.15802001953125, -0.1154632568359375, -0.072906494140625, -0.0303497314453125, 0.01220703125, 0.0547637939453125, 0.097320556640625, 0.1398773193359375, 0.18243408203125, 0.2249908447265625, 0.267547607421875, 0.3101043701171875, 0.3526611328125, 0.3952178955078125, 0.437774658203125, 0.4803314208984375, 0.52288818359375, 0.5654449462890625, 0.608001708984375, 0.6505584716796875, 0.693115234375, 0.7356719970703125, 0.778228759765625, 0.8207855224609375, 0.86334228515625, 0.9058990478515625, 0.948455810546875, 0.9910125732421875, 1.0335693359375, 1.0761260986328125, 1.118682861328125, 1.1612396240234375, 1.20379638671875, 1.2463531494140625, 1.288909912109375, 1.3314666748046875, 1.3740234375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 10.0, 10.0, 11.0, 11.0, 22.0, 11.0, 17.0, 16.0, 25.0, 28.0, 26.0, 24.0, 22.0, 35.0, 36.0, 29.0, 37.0, 39.0, 39.0, 1074.0, 35.0, 45.0, 23.0, 39.0, 21.0, 33.0, 33.0, 26.0, 12.0, 20.0, 24.0, 21.0, 25.0, 17.0, 16.0, 22.0, 10.0, 8.0, 11.0, 9.0, 8.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-4.14453125, -4.018310546875, -3.89208984375, -3.765869140625, -3.6396484375, -3.513427734375, -3.38720703125, -3.260986328125, -3.134765625, -3.008544921875, -2.88232421875, -2.756103515625, -2.6298828125, -2.503662109375, -2.37744140625, -2.251220703125, -2.125, -1.998779296875, -1.87255859375, -1.746337890625, -1.6201171875, -1.493896484375, -1.36767578125, -1.241455078125, -1.115234375, -0.989013671875, -0.86279296875, -0.736572265625, -0.6103515625, -0.484130859375, -0.35791015625, -0.231689453125, -0.10546875, 0.020751953125, 0.14697265625, 0.273193359375, 0.3994140625, 0.525634765625, 0.65185546875, 0.778076171875, 0.904296875, 1.030517578125, 1.15673828125, 1.282958984375, 1.4091796875, 1.535400390625, 1.66162109375, 1.787841796875, 1.9140625, 2.040283203125, 2.16650390625, 2.292724609375, 2.4189453125, 2.545166015625, 2.67138671875, 2.797607421875, 2.923828125, 3.050048828125, 3.17626953125, 3.302490234375, 3.4287109375, 3.554931640625, 3.68115234375, 3.807373046875, 3.93359375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 8.0, 9.0, 25.0, 30.0, 46.0, 44.0, 110.0, 115.0, 188.0, 291.0, 446.0, 599.0, 911.0, 1440.0, 2128.0, 3490.0, 5517.0, 8834.0, 14616.0, 24721.0, 43133.0, 74782.0, 124843.0, 193284.0, 1232528.0, 145622.0, 90329.0, 52468.0, 30283.0, 17556.0, 10671.0, 6366.0, 4139.0, 2648.0, 1600.0, 1082.0, 733.0, 456.0, 332.0, 244.0, 154.0, 96.0, 75.0, 48.0, 31.0, 23.0, 20.0, 8.0, 4.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.609375, -0.5891799926757812, -0.5689849853515625, -0.5487899780273438, -0.528594970703125, -0.5083999633789062, -0.4882049560546875, -0.46800994873046875, -0.44781494140625, -0.42761993408203125, -0.4074249267578125, -0.38722991943359375, -0.367034912109375, -0.34683990478515625, -0.3266448974609375, -0.30644989013671875, -0.2862548828125, -0.26605987548828125, -0.2458648681640625, -0.22566986083984375, -0.205474853515625, -0.18527984619140625, -0.1650848388671875, -0.14488983154296875, -0.12469482421875, -0.10449981689453125, -0.0843048095703125, -0.06410980224609375, -0.043914794921875, -0.02371978759765625, -0.0035247802734375, 0.01667022705078125, 0.036865234375, 0.05706024169921875, 0.0772552490234375, 0.09745025634765625, 0.117645263671875, 0.13784027099609375, 0.1580352783203125, 0.17823028564453125, 0.19842529296875, 0.21862030029296875, 0.2388153076171875, 0.25901031494140625, 0.279205322265625, 0.29940032958984375, 0.3195953369140625, 0.33979034423828125, 0.3599853515625, 0.38018035888671875, 0.4003753662109375, 0.42057037353515625, 0.440765380859375, 0.46096038818359375, 0.4811553955078125, 0.5013504028320312, 0.52154541015625, 0.5417404174804688, 0.5619354248046875, 0.5821304321289062, 0.602325439453125, 0.6225204467773438, 0.6427154541015625, 0.6629104614257812, 0.68310546875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 12.0, 12.0, 15.0, 8.0, 16.0, 30.0, 36.0, 46.0, 68.0, 95.0, 86.0, 92.0, 86.0, 85.0, 82.0, 48.0, 28.0, 37.0, 15.0, 16.0, 21.0, 13.0, 10.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00787353515625, -0.007561683654785156, -0.0072498321533203125, -0.006937980651855469, -0.006626129150390625, -0.006314277648925781, -0.0060024261474609375, -0.005690574645996094, -0.00537872314453125, -0.005066871643066406, -0.0047550201416015625, -0.004443168640136719, -0.004131317138671875, -0.0038194656372070312, -0.0035076141357421875, -0.0031957626342773438, -0.0028839111328125, -0.0025720596313476562, -0.0022602081298828125, -0.0019483566284179688, -0.001636505126953125, -0.0013246536254882812, -0.0010128021240234375, -0.0007009506225585938, -0.00038909912109375, -7.724761962890625e-05, 0.0002346038818359375, 0.0005464553833007812, 0.000858306884765625, 0.0011701583862304688, 0.0014820098876953125, 0.0017938613891601562, 0.002105712890625, 0.0024175643920898438, 0.0027294158935546875, 0.0030412673950195312, 0.003353118896484375, 0.0036649703979492188, 0.0039768218994140625, 0.004288673400878906, 0.00460052490234375, 0.004912376403808594, 0.0052242279052734375, 0.005536079406738281, 0.005847930908203125, 0.006159782409667969, 0.0064716339111328125, 0.006783485412597656, 0.0070953369140625, 0.007407188415527344, 0.0077190399169921875, 0.008030891418457031, 0.008342742919921875, 0.008654594421386719, 0.008966445922851562, 0.009278297424316406, 0.00959014892578125, 0.009902000427246094, 0.010213851928710938, 0.010525703430175781, 0.010837554931640625, 0.011149406433105469, 0.011461257934570312, 0.011773109436035156, 0.0120849609375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 3.0, 4.0, 12.0, 9.0, 19.0, 34.0, 36.0, 47.0, 109.0, 172.0, 407.0, 1872.0, 36486.0, 948389.0, 57474.0, 2564.0, 424.0, 169.0, 122.0, 67.0, 44.0, 25.0, 14.0, 15.0, 10.0, 7.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.249755859375, -0.24327850341796875, -0.2368011474609375, -0.23032379150390625, -0.223846435546875, -0.21736907958984375, -0.2108917236328125, -0.20441436767578125, -0.19793701171875, -0.19145965576171875, -0.1849822998046875, -0.17850494384765625, -0.172027587890625, -0.16555023193359375, -0.1590728759765625, -0.15259552001953125, -0.1461181640625, -0.13964080810546875, -0.1331634521484375, -0.12668609619140625, -0.120208740234375, -0.11373138427734375, -0.1072540283203125, -0.10077667236328125, -0.09429931640625, -0.08782196044921875, -0.0813446044921875, -0.07486724853515625, -0.068389892578125, -0.06191253662109375, -0.0554351806640625, -0.04895782470703125, -0.04248046875, -0.03600311279296875, -0.0295257568359375, -0.02304840087890625, -0.016571044921875, -0.01009368896484375, -0.0036163330078125, 0.00286102294921875, 0.00933837890625, 0.01581573486328125, 0.0222930908203125, 0.02877044677734375, 0.035247802734375, 0.04172515869140625, 0.0482025146484375, 0.05467987060546875, 0.0611572265625, 0.06763458251953125, 0.0741119384765625, 0.08058929443359375, 0.087066650390625, 0.09354400634765625, 0.1000213623046875, 0.10649871826171875, 0.11297607421875, 0.11945343017578125, 0.1259307861328125, 0.13240814208984375, 0.138885498046875, 0.14536285400390625, 0.1518402099609375, 0.15831756591796875, 0.164794921875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 11.0, 28.0, 55.0, 183.0, 411.0, 225.0, 66.0, 20.0, 7.0, 2.0, 1.0, 1.0], "bins": [-0.10225333273410797, -0.1004474014043808, -0.09864147752523422, -0.09683554619550705, -0.09502961486577988, -0.0932236909866333, -0.09141775965690613, -0.08961182832717896, -0.08780590444803238, -0.0859999731183052, -0.08419404923915863, -0.08238811790943146, -0.08058218657970428, -0.07877626270055771, -0.07697033137083054, -0.07516440004110336, -0.07335846871137619, -0.07155253738164902, -0.06974661350250244, -0.06794068217277527, -0.0661347508430481, -0.06432882696390152, -0.06252289563417435, -0.060716964304447174, -0.0589110404253006, -0.057105112820863724, -0.05529918149113655, -0.053493253886699677, -0.0516873262822628, -0.04988139495253563, -0.048075467348098755, -0.04626953601837158, -0.04446360468864441, -0.042657677084207535, -0.04085174575448036, -0.03904581815004349, -0.03723989054560661, -0.03543395921587944, -0.033628031611442566, -0.03182210028171539, -0.030016176402568817, -0.028210246935486794, -0.02640431933104992, -0.024598389863967896, -0.022792460396885872, -0.02098653092980385, -0.019180603325366974, -0.01737467385828495, -0.015568744391202927, -0.013762815855443478, -0.011956886388361454, -0.010150957852602005, -0.008345028385519981, -0.006539099849760532, -0.004733171314001083, -0.0029272418469190598, -0.0011213133111596107, 0.0006846155738458037, 0.0024905444588512182, 0.004296473227441311, 0.006102402228862047, 0.007908331230282784, 0.009714259766042233, 0.011520189233124256, 0.013326117768883705]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 12.0, 14.0, 11.0, 17.0, 14.0, 17.0, 28.0, 26.0, 35.0, 28.0, 39.0, 43.0, 29.0, 48.0, 38.0, 48.0, 56.0, 42.0, 47.0, 49.0, 35.0, 40.0, 44.0, 32.0, 30.0, 36.0, 25.0, 24.0, 14.0, 17.0, 14.0, 10.0, 11.0, 5.0, 8.0, 5.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004029393196105957, -0.003883812576532364, -0.0037382319569587708, -0.0035926513373851776, -0.0034470707178115845, -0.0033014900982379913, -0.003155909478664398, -0.003010328859090805, -0.002864748239517212, -0.0027191676199436188, -0.0025735870003700256, -0.0024280063807964325, -0.0022824257612228394, -0.002136845141649246, -0.001991264522075653, -0.00184568390250206, -0.0017001032829284668, -0.0015545226633548737, -0.0014089420437812805, -0.0012633614242076874, -0.0011177808046340942, -0.0009722001850605011, -0.000826619565486908, -0.0006810389459133148, -0.0005354583263397217, -0.00038987770676612854, -0.0002442970871925354, -9.871646761894226e-05, 4.686415195465088e-05, 0.00019244477152824402, 0.00033802539110183716, 0.0004836060106754303, 0.0006291866302490234, 0.0007747672498226166, 0.0009203478693962097, 0.0010659284889698029, 0.001211509108543396, 0.0013570897281169891, 0.0015026703476905823, 0.0016482509672641754, 0.0017938315868377686, 0.0019394122064113617, 0.002084992825984955, 0.002230573445558548, 0.002376154065132141, 0.0025217346847057343, 0.0026673153042793274, 0.0028128959238529205, 0.0029584765434265137, 0.003104057163000107, 0.0032496377825737, 0.003395218402147293, 0.0035407990217208862, 0.0036863796412944794, 0.0038319602608680725, 0.003977540880441666, 0.004123121500015259, 0.004268702119588852, 0.004414282739162445, 0.004559863358736038, 0.004705443978309631, 0.0048510245978832245, 0.004996605217456818, 0.005142185837030411, 0.005287766456604004]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 3.0, 2.0, 4.0, 5.0, 7.0, 13.0, 9.0, 14.0, 16.0, 22.0, 20.0, 34.0, 24.0, 27.0, 30.0, 31.0, 36.0, 50.0, 30.0, 57.0, 43.0, 46.0, 35.0, 49.0, 38.0, 31.0, 45.0, 38.0, 23.0, 28.0, 27.0, 28.0, 20.0, 16.0, 15.0, 26.0, 8.0, 11.0, 9.0, 9.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1015625, -6.87615966796875, -6.6507568359375, -6.42535400390625, -6.199951171875, -5.97454833984375, -5.7491455078125, -5.52374267578125, -5.29833984375, -5.07293701171875, -4.8475341796875, -4.62213134765625, -4.396728515625, -4.17132568359375, -3.9459228515625, -3.72052001953125, -3.4951171875, -3.26971435546875, -3.0443115234375, -2.81890869140625, -2.593505859375, -2.36810302734375, -2.1427001953125, -1.91729736328125, -1.69189453125, -1.46649169921875, -1.2410888671875, -1.01568603515625, -0.790283203125, -0.56488037109375, -0.3394775390625, -0.11407470703125, 0.111328125, 0.33673095703125, 0.5621337890625, 0.78753662109375, 1.012939453125, 1.23834228515625, 1.4637451171875, 1.68914794921875, 1.91455078125, 2.13995361328125, 2.3653564453125, 2.59075927734375, 2.816162109375, 3.04156494140625, 3.2669677734375, 3.49237060546875, 3.7177734375, 3.94317626953125, 4.1685791015625, 4.39398193359375, 4.619384765625, 4.84478759765625, 5.0701904296875, 5.29559326171875, 5.52099609375, 5.74639892578125, 5.9718017578125, 6.19720458984375, 6.422607421875, 6.64801025390625, 6.8734130859375, 7.09881591796875, 7.32421875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 12.0, 15.0, 31.0, 34.0, 57.0, 61.0, 99.0, 129.0, 223.0, 299.0, 441.0, 607.0, 853.0, 1209.0, 1659.0, 2318.0, 3183.0, 4670.0, 7237.0, 12307.0, 24198.0, 59052.0, 191259.0, 482097.0, 152321.0, 49988.0, 21492.0, 11077.0, 6568.0, 4489.0, 3061.0, 2076.0, 1587.0, 1165.0, 807.0, 529.0, 390.0, 273.0, 237.0, 126.0, 117.0, 69.0, 40.0, 27.0, 27.0, 16.0, 13.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-6.48046875, -6.29217529296875, -6.1038818359375, -5.91558837890625, -5.727294921875, -5.53900146484375, -5.3507080078125, -5.16241455078125, -4.97412109375, -4.78582763671875, -4.5975341796875, -4.40924072265625, -4.220947265625, -4.03265380859375, -3.8443603515625, -3.65606689453125, -3.4677734375, -3.27947998046875, -3.0911865234375, -2.90289306640625, -2.714599609375, -2.52630615234375, -2.3380126953125, -2.14971923828125, -1.96142578125, -1.77313232421875, -1.5848388671875, -1.39654541015625, -1.208251953125, -1.01995849609375, -0.8316650390625, -0.64337158203125, -0.455078125, -0.26678466796875, -0.0784912109375, 0.10980224609375, 0.298095703125, 0.48638916015625, 0.6746826171875, 0.86297607421875, 1.05126953125, 1.23956298828125, 1.4278564453125, 1.61614990234375, 1.804443359375, 1.99273681640625, 2.1810302734375, 2.36932373046875, 2.5576171875, 2.74591064453125, 2.9342041015625, 3.12249755859375, 3.310791015625, 3.49908447265625, 3.6873779296875, 3.87567138671875, 4.06396484375, 4.25225830078125, 4.4405517578125, 4.62884521484375, 4.817138671875, 5.00543212890625, 5.1937255859375, 5.38201904296875, 5.5703125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 5.0, 7.0, 5.0, 7.0, 10.0, 12.0, 12.0, 19.0, 13.0, 27.0, 29.0, 20.0, 31.0, 38.0, 36.0, 42.0, 55.0, 45.0, 63.0, 152.0, 1806.0, 154.0, 74.0, 64.0, 43.0, 33.0, 25.0, 29.0, 21.0, 26.0, 26.0, 23.0, 12.0, 22.0, 17.0, 10.0, 14.0, 9.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.71875, -24.90234375, -24.0859375, -23.26953125, -22.453125, -21.63671875, -20.8203125, -20.00390625, -19.1875, -18.37109375, -17.5546875, -16.73828125, -15.921875, -15.10546875, -14.2890625, -13.47265625, -12.65625, -11.83984375, -11.0234375, -10.20703125, -9.390625, -8.57421875, -7.7578125, -6.94140625, -6.125, -5.30859375, -4.4921875, -3.67578125, -2.859375, -2.04296875, -1.2265625, -0.41015625, 0.40625, 1.22265625, 2.0390625, 2.85546875, 3.671875, 4.48828125, 5.3046875, 6.12109375, 6.9375, 7.75390625, 8.5703125, 9.38671875, 10.203125, 11.01953125, 11.8359375, 12.65234375, 13.46875, 14.28515625, 15.1015625, 15.91796875, 16.734375, 17.55078125, 18.3671875, 19.18359375, 20.0, 20.81640625, 21.6328125, 22.44921875, 23.265625, 24.08203125, 24.8984375, 25.71484375, 26.53125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 4.0, 5.0, 11.0, 18.0, 18.0, 31.0, 18.0, 34.0, 56.0, 72.0, 115.0, 162.0, 262.0, 634.0, 4303.0, 168694.0, 2955173.0, 13739.0, 1271.0, 342.0, 212.0, 160.0, 91.0, 59.0, 48.0, 39.0, 32.0, 16.0, 22.0, 11.0, 10.0, 7.0, 8.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.28125, -56.5263671875, -54.771484375, -53.0166015625, -51.26171875, -49.5068359375, -47.751953125, -45.9970703125, -44.2421875, -42.4873046875, -40.732421875, -38.9775390625, -37.22265625, -35.4677734375, -33.712890625, -31.9580078125, -30.203125, -28.4482421875, -26.693359375, -24.9384765625, -23.18359375, -21.4287109375, -19.673828125, -17.9189453125, -16.1640625, -14.4091796875, -12.654296875, -10.8994140625, -9.14453125, -7.3896484375, -5.634765625, -3.8798828125, -2.125, -0.3701171875, 1.384765625, 3.1396484375, 4.89453125, 6.6494140625, 8.404296875, 10.1591796875, 11.9140625, 13.6689453125, 15.423828125, 17.1787109375, 18.93359375, 20.6884765625, 22.443359375, 24.1982421875, 25.953125, 27.7080078125, 29.462890625, 31.2177734375, 32.97265625, 34.7275390625, 36.482421875, 38.2373046875, 39.9921875, 41.7470703125, 43.501953125, 45.2568359375, 47.01171875, 48.7666015625, 50.521484375, 52.2763671875, 54.03125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 12.0, 9.0, 27.0, 38.0, 66.0, 66.0, 90.0, 112.0, 91.0, 109.0, 106.0, 74.0, 67.0, 41.0, 39.0, 25.0, 12.0, 10.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.861297607421875, -14.018092155456543, -13.174887657165527, -12.331682205200195, -11.48847770690918, -10.645272254943848, -9.802066802978516, -8.9588623046875, -8.115656852722168, -7.272451877593994, -6.42924690246582, -5.586041450500488, -4.7428364753723145, -3.8996315002441406, -3.0564260482788086, -2.2132210731506348, -1.370016098022461, -0.5268110036849976, 0.3163940906524658, 1.1595993041992188, 2.0028042793273926, 2.8460092544555664, 3.6892147064208984, 4.532419681549072, 5.375624656677246, 6.21882963180542, 7.062034606933594, 7.905240058898926, 8.748445510864258, 9.591650009155273, 10.434855461120605, 11.278060913085938, 12.121265411376953, 12.964470863342285, 13.8076753616333, 14.650880813598633, 15.494085311889648, 16.337291717529297, 17.180496215820312, 18.023700714111328, 18.866905212402344, 19.71010971069336, 20.553316116333008, 21.396520614624023, 22.23972511291504, 23.082931518554688, 23.926136016845703, 24.76934051513672, 25.612546920776367, 26.455751419067383, 27.29895782470703, 28.142162322998047, 28.985366821289062, 29.828571319580078, 30.671777725219727, 31.514982223510742, 32.35818862915039, 33.201393127441406, 34.04459762573242, 34.88780212402344, 35.73101043701172, 36.574214935302734, 37.41741943359375, 38.260623931884766, 39.10382843017578]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 10.0, 2.0, 6.0, 8.0, 6.0, 14.0, 16.0, 18.0, 23.0, 28.0, 24.0, 31.0, 32.0, 27.0, 25.0, 34.0, 36.0, 44.0, 37.0, 44.0, 30.0, 43.0, 43.0, 42.0, 38.0, 45.0, 32.0, 30.0, 34.0, 26.0, 28.0, 24.0, 21.0, 16.0, 18.0, 7.0, 10.0, 7.0, 6.0, 7.0, 5.0, 6.0, 7.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-77.84317016601562, -75.57748413085938, -73.31179809570312, -71.04611206054688, -68.7804183959961, -66.51473236083984, -64.2490463256836, -61.983360290527344, -59.717674255371094, -57.451988220214844, -55.18629837036133, -52.92061233520508, -50.65492630004883, -48.38923645019531, -46.12355041503906, -43.85786437988281, -41.5921745300293, -39.32648849487305, -37.06079864501953, -34.79511260986328, -32.52942657470703, -30.26373863220215, -27.998050689697266, -25.732364654541016, -23.466676712036133, -21.20098876953125, -18.935302734375, -16.669614791870117, -14.40392780303955, -12.138240814208984, -9.872552871704102, -7.606865882873535, -5.341178894042969, -3.0754916667938232, -0.8098044395446777, 1.4558830261230469, 3.7215700149536133, 5.98725700378418, 8.252944946289062, 10.518631935119629, 12.784318923950195, 15.050005912780762, 17.315692901611328, 19.58138084411621, 21.847068786621094, 24.112754821777344, 26.378442764282227, 28.64413070678711, 30.90981674194336, 33.17550277709961, 35.441192626953125, 37.706878662109375, 39.972564697265625, 42.238250732421875, 44.50394058227539, 46.76962661743164, 49.035316467285156, 51.301002502441406, 53.56669235229492, 55.83237838745117, 58.09806442260742, 60.36375427246094, 62.62944030761719, 64.89512634277344, 67.16081237792969]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 3.0, 3.0, 6.0, 7.0, 9.0, 10.0, 13.0, 10.0, 20.0, 21.0, 34.0, 26.0, 21.0, 28.0, 29.0, 27.0, 45.0, 31.0, 36.0, 40.0, 64.0, 35.0, 30.0, 47.0, 41.0, 37.0, 37.0, 27.0, 34.0, 26.0, 28.0, 23.0, 24.0, 20.0, 19.0, 17.0, 11.0, 14.0, 11.0, 9.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.13671875, -6.9169921875, -6.697265625, -6.4775390625, -6.2578125, -6.0380859375, -5.818359375, -5.5986328125, -5.37890625, -5.1591796875, -4.939453125, -4.7197265625, -4.5, -4.2802734375, -4.060546875, -3.8408203125, -3.62109375, -3.4013671875, -3.181640625, -2.9619140625, -2.7421875, -2.5224609375, -2.302734375, -2.0830078125, -1.86328125, -1.6435546875, -1.423828125, -1.2041015625, -0.984375, -0.7646484375, -0.544921875, -0.3251953125, -0.10546875, 0.1142578125, 0.333984375, 0.5537109375, 0.7734375, 0.9931640625, 1.212890625, 1.4326171875, 1.65234375, 1.8720703125, 2.091796875, 2.3115234375, 2.53125, 2.7509765625, 2.970703125, 3.1904296875, 3.41015625, 3.6298828125, 3.849609375, 4.0693359375, 4.2890625, 4.5087890625, 4.728515625, 4.9482421875, 5.16796875, 5.3876953125, 5.607421875, 5.8271484375, 6.046875, 6.2666015625, 6.486328125, 6.7060546875, 6.92578125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 9.0, 3.0, 10.0, 13.0, 20.0, 25.0, 51.0, 73.0, 79.0, 136.0, 201.0, 350.0, 598.0, 927.0, 1759.0, 3284.0, 6273.0, 12562.0, 26503.0, 59965.0, 149232.0, 445942.0, 1192696.0, 1371130.0, 588285.0, 196245.0, 75001.0, 32704.0, 14862.0, 7290.0, 3575.0, 1930.0, 1007.0, 561.0, 365.0, 247.0, 113.0, 80.0, 65.0, 33.0, 26.0, 19.0, 8.0, 9.0, 6.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.296875, -8.9981689453125, -8.699462890625, -8.4007568359375, -8.10205078125, -7.8033447265625, -7.504638671875, -7.2059326171875, -6.9072265625, -6.6085205078125, -6.309814453125, -6.0111083984375, -5.71240234375, -5.4136962890625, -5.114990234375, -4.8162841796875, -4.517578125, -4.2188720703125, -3.920166015625, -3.6214599609375, -3.32275390625, -3.0240478515625, -2.725341796875, -2.4266357421875, -2.1279296875, -1.8292236328125, -1.530517578125, -1.2318115234375, -0.93310546875, -0.6343994140625, -0.335693359375, -0.0369873046875, 0.26171875, 0.5604248046875, 0.859130859375, 1.1578369140625, 1.45654296875, 1.7552490234375, 2.053955078125, 2.3526611328125, 2.6513671875, 2.9500732421875, 3.248779296875, 3.5474853515625, 3.84619140625, 4.1448974609375, 4.443603515625, 4.7423095703125, 5.041015625, 5.3397216796875, 5.638427734375, 5.9371337890625, 6.23583984375, 6.5345458984375, 6.833251953125, 7.1319580078125, 7.4306640625, 7.7293701171875, 8.028076171875, 8.3267822265625, 8.62548828125, 8.9241943359375, 9.222900390625, 9.5216064453125, 9.8203125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 4.0, 5.0, 4.0, 9.0, 13.0, 15.0, 19.0, 26.0, 37.0, 37.0, 65.0, 64.0, 94.0, 112.0, 155.0, 212.0, 270.0, 314.0, 362.0, 420.0, 332.0, 323.0, 277.0, 222.0, 172.0, 123.0, 88.0, 64.0, 54.0, 53.0, 26.0, 25.0, 18.0, 17.0, 14.0, 7.0, 6.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.8125, -18.29736328125, -17.7822265625, -17.26708984375, -16.751953125, -16.23681640625, -15.7216796875, -15.20654296875, -14.69140625, -14.17626953125, -13.6611328125, -13.14599609375, -12.630859375, -12.11572265625, -11.6005859375, -11.08544921875, -10.5703125, -10.05517578125, -9.5400390625, -9.02490234375, -8.509765625, -7.99462890625, -7.4794921875, -6.96435546875, -6.44921875, -5.93408203125, -5.4189453125, -4.90380859375, -4.388671875, -3.87353515625, -3.3583984375, -2.84326171875, -2.328125, -1.81298828125, -1.2978515625, -0.78271484375, -0.267578125, 0.24755859375, 0.7626953125, 1.27783203125, 1.79296875, 2.30810546875, 2.8232421875, 3.33837890625, 3.853515625, 4.36865234375, 4.8837890625, 5.39892578125, 5.9140625, 6.42919921875, 6.9443359375, 7.45947265625, 7.974609375, 8.48974609375, 9.0048828125, 9.52001953125, 10.03515625, 10.55029296875, 11.0654296875, 11.58056640625, 12.095703125, 12.61083984375, 13.1259765625, 13.64111328125, 14.15625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 12.0, 6.0, 15.0, 17.0, 16.0, 31.0, 37.0, 58.0, 101.0, 153.0, 284.0, 601.0, 1895.0, 8689.0, 58108.0, 600169.0, 2991753.0, 474465.0, 47598.0, 7412.0, 1658.0, 536.0, 256.0, 134.0, 72.0, 58.0, 38.0, 18.0, 25.0, 20.0, 9.0, 11.0, 11.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.21875, -32.05126953125, -30.8837890625, -29.71630859375, -28.548828125, -27.38134765625, -26.2138671875, -25.04638671875, -23.87890625, -22.71142578125, -21.5439453125, -20.37646484375, -19.208984375, -18.04150390625, -16.8740234375, -15.70654296875, -14.5390625, -13.37158203125, -12.2041015625, -11.03662109375, -9.869140625, -8.70166015625, -7.5341796875, -6.36669921875, -5.19921875, -4.03173828125, -2.8642578125, -1.69677734375, -0.529296875, 0.63818359375, 1.8056640625, 2.97314453125, 4.140625, 5.30810546875, 6.4755859375, 7.64306640625, 8.810546875, 9.97802734375, 11.1455078125, 12.31298828125, 13.48046875, 14.64794921875, 15.8154296875, 16.98291015625, 18.150390625, 19.31787109375, 20.4853515625, 21.65283203125, 22.8203125, 23.98779296875, 25.1552734375, 26.32275390625, 27.490234375, 28.65771484375, 29.8251953125, 30.99267578125, 32.16015625, 33.32763671875, 34.4951171875, 35.66259765625, 36.830078125, 37.99755859375, 39.1650390625, 40.33251953125, 41.5]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 12.0, 19.0, 37.0, 84.0, 132.0, 202.0, 172.0, 153.0, 103.0, 53.0, 21.0, 9.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.37494659423828, -81.3268051147461, -76.2786636352539, -71.23052215576172, -66.18238830566406, -61.13424301147461, -56.08610534667969, -51.0379638671875, -45.98982238769531, -40.941680908203125, -35.89353942871094, -30.845401763916016, -25.797260284423828, -20.74911880493164, -15.700979232788086, -10.652839660644531, -5.604698181152344, -0.5565576553344727, 4.491582870483398, 9.53972339630127, 14.58786392211914, 19.636005401611328, 24.684144973754883, 29.732284545898438, 34.780426025390625, 39.82856750488281, 44.876708984375, 49.92484664916992, 54.97298812866211, 60.0211296081543, 65.06926727294922, 70.1174087524414, 75.16555786132812, 80.21369934082031, 85.2618408203125, 90.30998229980469, 95.35812377929688, 100.40626525878906, 105.45439910888672, 110.5025405883789, 115.5506820678711, 120.59882354736328, 125.64696502685547, 130.69509887695312, 135.7432403564453, 140.7913818359375, 145.8395233154297, 150.88766479492188, 155.93580627441406, 160.98394775390625, 166.03208923339844, 171.08023071289062, 176.1283721923828, 181.176513671875, 186.2246551513672, 191.27279663085938, 196.3209228515625, 201.3690643310547, 206.41720581054688, 211.46534729003906, 216.51348876953125, 221.56163024902344, 226.60977172851562, 231.65789794921875, 236.7060546875]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 2.0, 2.0, 8.0, 11.0, 14.0, 14.0, 14.0, 19.0, 19.0, 25.0, 34.0, 28.0, 34.0, 36.0, 31.0, 45.0, 31.0, 42.0, 52.0, 52.0, 57.0, 38.0, 35.0, 36.0, 44.0, 33.0, 33.0, 33.0, 23.0, 35.0, 18.0, 15.0, 12.0, 13.0, 12.0, 9.0, 10.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-70.25039672851562, -68.22891235351562, -66.20742797851562, -64.18594360351562, -62.164459228515625, -60.142974853515625, -58.121490478515625, -56.100006103515625, -54.078521728515625, -52.057037353515625, -50.035552978515625, -48.014068603515625, -45.992584228515625, -43.971099853515625, -41.949615478515625, -39.928131103515625, -37.906646728515625, -35.885162353515625, -33.863677978515625, -31.842193603515625, -29.820709228515625, -27.799224853515625, -25.777740478515625, -23.756256103515625, -21.734771728515625, -19.713287353515625, -17.691802978515625, -15.670318603515625, -13.648834228515625, -11.627349853515625, -9.605865478515625, -7.584381103515625, -5.562896728515625, -3.541412353515625, -1.519927978515625, 0.501556396484375, 2.523040771484375, 4.544525146484375, 6.566009521484375, 8.587493896484375, 10.608978271484375, 12.630462646484375, 14.651947021484375, 16.673431396484375, 18.694915771484375, 20.716400146484375, 22.737884521484375, 24.759368896484375, 26.780853271484375, 28.802337646484375, 30.823822021484375, 32.845306396484375, 34.866790771484375, 36.888275146484375, 38.909759521484375, 40.931243896484375, 42.952728271484375, 44.974212646484375, 46.995697021484375, 49.017181396484375, 51.038665771484375, 53.060150146484375, 55.081634521484375, 57.103118896484375, 59.124603271484375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 7.0, 5.0, 11.0, 11.0, 11.0, 21.0, 15.0, 14.0, 19.0, 27.0, 32.0, 37.0, 29.0, 30.0, 34.0, 47.0, 34.0, 41.0, 38.0, 38.0, 45.0, 51.0, 36.0, 37.0, 34.0, 30.0, 38.0, 29.0, 28.0, 20.0, 25.0, 24.0, 17.0, 12.0, 12.0, 11.0, 11.0, 7.0, 7.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.296875, -7.06640625, -6.8359375, -6.60546875, -6.375, -6.14453125, -5.9140625, -5.68359375, -5.453125, -5.22265625, -4.9921875, -4.76171875, -4.53125, -4.30078125, -4.0703125, -3.83984375, -3.609375, -3.37890625, -3.1484375, -2.91796875, -2.6875, -2.45703125, -2.2265625, -1.99609375, -1.765625, -1.53515625, -1.3046875, -1.07421875, -0.84375, -0.61328125, -0.3828125, -0.15234375, 0.078125, 0.30859375, 0.5390625, 0.76953125, 1.0, 1.23046875, 1.4609375, 1.69140625, 1.921875, 2.15234375, 2.3828125, 2.61328125, 2.84375, 3.07421875, 3.3046875, 3.53515625, 3.765625, 3.99609375, 4.2265625, 4.45703125, 4.6875, 4.91796875, 5.1484375, 5.37890625, 5.609375, 5.83984375, 6.0703125, 6.30078125, 6.53125, 6.76171875, 6.9921875, 7.22265625, 7.453125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 14.0, 16.0, 23.0, 33.0, 43.0, 64.0, 116.0, 160.0, 213.0, 362.0, 570.0, 861.0, 1395.0, 2260.0, 3472.0, 5729.0, 9177.0, 14972.0, 25297.0, 43949.0, 82739.0, 160433.0, 253085.0, 201239.0, 107336.0, 55982.0, 31408.0, 18226.0, 11063.0, 6706.0, 4187.0, 2618.0, 1699.0, 1045.0, 728.0, 446.0, 282.0, 222.0, 124.0, 83.0, 60.0, 41.0, 26.0, 21.0, 14.0, 5.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2705078125, -1.2304229736328125, -1.190338134765625, -1.1502532958984375, -1.11016845703125, -1.0700836181640625, -1.029998779296875, -0.9899139404296875, -0.9498291015625, -0.9097442626953125, -0.869659423828125, -0.8295745849609375, -0.78948974609375, -0.7494049072265625, -0.709320068359375, -0.6692352294921875, -0.629150390625, -0.5890655517578125, -0.548980712890625, -0.5088958740234375, -0.46881103515625, -0.4287261962890625, -0.388641357421875, -0.3485565185546875, -0.3084716796875, -0.2683868408203125, -0.228302001953125, -0.1882171630859375, -0.14813232421875, -0.1080474853515625, -0.067962646484375, -0.0278778076171875, 0.01220703125, 0.0522918701171875, 0.092376708984375, 0.1324615478515625, 0.17254638671875, 0.2126312255859375, 0.252716064453125, 0.2928009033203125, 0.3328857421875, 0.3729705810546875, 0.413055419921875, 0.4531402587890625, 0.49322509765625, 0.5333099365234375, 0.573394775390625, 0.6134796142578125, 0.653564453125, 0.6936492919921875, 0.733734130859375, 0.7738189697265625, 0.81390380859375, 0.8539886474609375, 0.894073486328125, 0.9341583251953125, 0.9742431640625, 1.0143280029296875, 1.054412841796875, 1.0944976806640625, 1.13458251953125, 1.1746673583984375, 1.214752197265625, 1.2548370361328125, 1.294921875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 6.0, 10.0, 12.0, 13.0, 16.0, 15.0, 22.0, 14.0, 19.0, 21.0, 33.0, 37.0, 32.0, 35.0, 25.0, 29.0, 30.0, 34.0, 34.0, 38.0, 1062.0, 40.0, 34.0, 44.0, 44.0, 27.0, 39.0, 35.0, 26.0, 27.0, 16.0, 22.0, 20.0, 18.0, 14.0, 15.0, 11.0, 7.0, 6.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-4.62890625, -4.490966796875, -4.35302734375, -4.215087890625, -4.0771484375, -3.939208984375, -3.80126953125, -3.663330078125, -3.525390625, -3.387451171875, -3.24951171875, -3.111572265625, -2.9736328125, -2.835693359375, -2.69775390625, -2.559814453125, -2.421875, -2.283935546875, -2.14599609375, -2.008056640625, -1.8701171875, -1.732177734375, -1.59423828125, -1.456298828125, -1.318359375, -1.180419921875, -1.04248046875, -0.904541015625, -0.7666015625, -0.628662109375, -0.49072265625, -0.352783203125, -0.21484375, -0.076904296875, 0.06103515625, 0.198974609375, 0.3369140625, 0.474853515625, 0.61279296875, 0.750732421875, 0.888671875, 1.026611328125, 1.16455078125, 1.302490234375, 1.4404296875, 1.578369140625, 1.71630859375, 1.854248046875, 1.9921875, 2.130126953125, 2.26806640625, 2.406005859375, 2.5439453125, 2.681884765625, 2.81982421875, 2.957763671875, 3.095703125, 3.233642578125, 3.37158203125, 3.509521484375, 3.6474609375, 3.785400390625, 3.92333984375, 4.061279296875, 4.19921875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 16.0, 13.0, 24.0, 28.0, 59.0, 61.0, 105.0, 194.0, 292.0, 385.0, 627.0, 907.0, 1534.0, 2313.0, 3698.0, 5707.0, 9081.0, 14720.0, 24417.0, 40414.0, 68569.0, 111314.0, 163732.0, 1234168.0, 154733.0, 102473.0, 61801.0, 37018.0, 22042.0, 13485.0, 8241.0, 5273.0, 3385.0, 2185.0, 1414.0, 946.0, 610.0, 340.0, 266.0, 179.0, 124.0, 79.0, 48.0, 38.0, 31.0, 12.0, 15.0, 5.0, 8.0, 3.0, 3.0], "bins": [-0.72705078125, -0.7070846557617188, -0.6871185302734375, -0.6671524047851562, -0.647186279296875, -0.6272201538085938, -0.6072540283203125, -0.5872879028320312, -0.56732177734375, -0.5473556518554688, -0.5273895263671875, -0.5074234008789062, -0.487457275390625, -0.46749114990234375, -0.4475250244140625, -0.42755889892578125, -0.4075927734375, -0.38762664794921875, -0.3676605224609375, -0.34769439697265625, -0.327728271484375, -0.30776214599609375, -0.2877960205078125, -0.26782989501953125, -0.24786376953125, -0.22789764404296875, -0.2079315185546875, -0.18796539306640625, -0.167999267578125, -0.14803314208984375, -0.1280670166015625, -0.10810089111328125, -0.088134765625, -0.06816864013671875, -0.0482025146484375, -0.02823638916015625, -0.008270263671875, 0.01169586181640625, 0.0316619873046875, 0.05162811279296875, 0.07159423828125, 0.09156036376953125, 0.1115264892578125, 0.13149261474609375, 0.151458740234375, 0.17142486572265625, 0.1913909912109375, 0.21135711669921875, 0.2313232421875, 0.25128936767578125, 0.2712554931640625, 0.29122161865234375, 0.311187744140625, 0.33115386962890625, 0.3511199951171875, 0.37108612060546875, 0.39105224609375, 0.41101837158203125, 0.4309844970703125, 0.45095062255859375, 0.470916748046875, 0.49088287353515625, 0.5108489990234375, 0.5308151245117188, 0.55078125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 2.0, 10.0, 10.0, 7.0, 8.0, 11.0, 13.0, 10.0, 14.0, 28.0, 27.0, 31.0, 32.0, 68.0, 76.0, 77.0, 88.0, 91.0, 61.0, 47.0, 52.0, 44.0, 32.0, 32.0, 17.0, 22.0, 15.0, 15.0, 9.0, 11.0, 8.0, 10.0, 7.0, 2.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00946044921875, -0.009162425994873047, -0.008864402770996094, -0.00856637954711914, -0.008268356323242188, -0.007970333099365234, -0.007672309875488281, -0.007374286651611328, -0.007076263427734375, -0.006778240203857422, -0.006480216979980469, -0.006182193756103516, -0.0058841705322265625, -0.005586147308349609, -0.005288124084472656, -0.004990100860595703, -0.00469207763671875, -0.004394054412841797, -0.004096031188964844, -0.0037980079650878906, -0.0034999847412109375, -0.0032019615173339844, -0.0029039382934570312, -0.002605915069580078, -0.002307891845703125, -0.002009868621826172, -0.0017118453979492188, -0.0014138221740722656, -0.0011157989501953125, -0.0008177757263183594, -0.0005197525024414062, -0.00022172927856445312, 7.62939453125e-05, 0.0003743171691894531, 0.0006723403930664062, 0.0009703636169433594, 0.0012683868408203125, 0.0015664100646972656, 0.0018644332885742188, 0.002162456512451172, 0.002460479736328125, 0.002758502960205078, 0.0030565261840820312, 0.0033545494079589844, 0.0036525726318359375, 0.003950595855712891, 0.004248619079589844, 0.004546642303466797, 0.00484466552734375, 0.005142688751220703, 0.005440711975097656, 0.005738735198974609, 0.0060367584228515625, 0.006334781646728516, 0.006632804870605469, 0.006930828094482422, 0.007228851318359375, 0.007526874542236328, 0.007824897766113281, 0.008122920989990234, 0.008420944213867188, 0.00871896743774414, 0.009016990661621094, 0.009315013885498047, 0.009613037109375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 9.0, 12.0, 12.0, 20.0, 21.0, 45.0, 29.0, 67.0, 116.0, 197.0, 530.0, 2455.0, 17243.0, 269123.0, 720078.0, 32986.0, 4183.0, 843.0, 226.0, 115.0, 72.0, 39.0, 30.0, 20.0, 18.0, 15.0, 9.0, 11.0, 7.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2071533203125, -0.20070838928222656, -0.19426345825195312, -0.1878185272216797, -0.18137359619140625, -0.1749286651611328, -0.16848373413085938, -0.16203880310058594, -0.1555938720703125, -0.14914894104003906, -0.14270401000976562, -0.1362590789794922, -0.12981414794921875, -0.12336921691894531, -0.11692428588867188, -0.11047935485839844, -0.104034423828125, -0.09758949279785156, -0.09114456176757812, -0.08469963073730469, -0.07825469970703125, -0.07180976867675781, -0.06536483764648438, -0.05891990661621094, -0.0524749755859375, -0.04603004455566406, -0.039585113525390625, -0.03314018249511719, -0.02669525146484375, -0.020250320434570312, -0.013805389404296875, -0.0073604583740234375, -0.00091552734375, 0.0055294036865234375, 0.011974334716796875, 0.018419265747070312, 0.02486419677734375, 0.03130912780761719, 0.037754058837890625, 0.04419898986816406, 0.0506439208984375, 0.05708885192871094, 0.06353378295898438, 0.06997871398925781, 0.07642364501953125, 0.08286857604980469, 0.08931350708007812, 0.09575843811035156, 0.102203369140625, 0.10864830017089844, 0.11509323120117188, 0.12153816223144531, 0.12798309326171875, 0.1344280242919922, 0.14087295532226562, 0.14731788635253906, 0.1537628173828125, 0.16020774841308594, 0.16665267944335938, 0.1730976104736328, 0.17954254150390625, 0.1859874725341797, 0.19243240356445312, 0.19887733459472656, 0.205322265625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 15.0, 18.0, 40.0, 57.0, 84.0, 196.0, 257.0, 160.0, 72.0, 35.0, 22.0, 13.0, 11.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039211470633745193, -0.03753205016255379, -0.03585263341665268, -0.03417321294546127, -0.03249379247426987, -0.03081437572836876, -0.029134955257177353, -0.027455536648631096, -0.02577611804008484, -0.024096699431538582, -0.022417280822992325, -0.02073786035180092, -0.01905844174325466, -0.017379023134708405, -0.015699602663517, -0.014020184054970741, -0.012340765446424484, -0.010661346837878227, -0.008981927298009396, -0.007302508223801851, -0.005623089149594307, -0.00394367054104805, -0.0022642510011792183, -0.0005848314613103867, 0.0010945871472358704, 0.0027740062214434147, 0.004453425295650959, 0.006132844369858503, 0.007812263444066048, 0.009491682052612305, 0.011171101592481136, 0.012850521132349968, 0.014529936015605927, 0.016209354624152184, 0.01788877323269844, 0.019568193703889847, 0.021247612312436104, 0.02292703092098236, 0.024606451392173767, 0.026285870000720024, 0.02796528860926628, 0.029644707217812538, 0.031324125826358795, 0.0330035462975502, 0.03468296676874161, 0.036362383514642715, 0.03804180398583412, 0.03972122073173523, 0.041400641202926636, 0.04308006167411804, 0.04475947842001915, 0.046438898891210556, 0.048118315637111664, 0.04979773610830307, 0.051477156579494476, 0.05315657705068588, 0.05483599379658699, 0.0565154142677784, 0.058194831013679504, 0.05987425148487091, 0.06155367195606232, 0.06323309242725372, 0.06491250544786453, 0.06659192591905594, 0.06827134639024734]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 11.0, 5.0, 11.0, 10.0, 13.0, 13.0, 18.0, 16.0, 20.0, 27.0, 27.0, 29.0, 26.0, 37.0, 29.0, 35.0, 36.0, 37.0, 42.0, 39.0, 39.0, 36.0, 54.0, 36.0, 42.0, 37.0, 28.0, 36.0, 22.0, 22.0, 18.0, 25.0, 23.0, 26.0, 13.0, 12.0, 11.0, 9.0, 4.0, 3.0, 10.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.005060851573944092, -0.004908060654997826, -0.0047552697360515594, -0.004602478817105293, -0.004449687898159027, -0.004296896979212761, -0.004144106060266495, -0.003991315141320229, -0.0038385242223739624, -0.0036857333034276962, -0.00353294238448143, -0.003380151465535164, -0.0032273605465888977, -0.0030745696276426315, -0.0029217787086963654, -0.002768987789750099, -0.002616196870803833, -0.002463405951857567, -0.0023106150329113007, -0.0021578241139650345, -0.0020050331950187683, -0.0018522422760725021, -0.001699451357126236, -0.0015466604381799698, -0.0013938695192337036, -0.0012410786002874374, -0.0010882876813411713, -0.0009354967623949051, -0.0007827058434486389, -0.0006299149245023727, -0.00047712400555610657, -0.0003243330866098404, -0.00017154216766357422, -1.8751248717308044e-05, 0.00013403967022895813, 0.0002868305891752243, 0.0004396215081214905, 0.0005924124270677567, 0.0007452033460140228, 0.000897994264960289, 0.0010507851839065552, 0.0012035761028528214, 0.0013563670217990875, 0.0015091579407453537, 0.0016619488596916199, 0.001814739778637886, 0.0019675306975841522, 0.0021203216165304184, 0.0022731125354766846, 0.0024259034544229507, 0.002578694373369217, 0.002731485292315483, 0.0028842762112617493, 0.0030370671302080154, 0.0031898580491542816, 0.003342648968100548, 0.003495439887046814, 0.00364823080599308, 0.0038010217249393463, 0.0039538126438856125, 0.004106603562831879, 0.004259394481778145, 0.004412185400724411, 0.004564976319670677, 0.004717767238616943]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 7.0, 5.0, 11.0, 11.0, 11.0, 22.0, 14.0, 14.0, 19.0, 27.0, 32.0, 37.0, 29.0, 30.0, 34.0, 47.0, 34.0, 41.0, 38.0, 38.0, 45.0, 51.0, 36.0, 37.0, 34.0, 30.0, 38.0, 29.0, 28.0, 20.0, 25.0, 24.0, 17.0, 12.0, 12.0, 11.0, 11.0, 7.0, 7.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.296875, -7.06640625, -6.8359375, -6.60546875, -6.375, -6.14453125, -5.9140625, -5.68359375, -5.453125, -5.22265625, -4.9921875, -4.76171875, -4.53125, -4.30078125, -4.0703125, -3.83984375, -3.609375, -3.37890625, -3.1484375, -2.91796875, -2.6875, -2.45703125, -2.2265625, -1.99609375, -1.765625, -1.53515625, -1.3046875, -1.07421875, -0.84375, -0.61328125, -0.3828125, -0.15234375, 0.078125, 0.30859375, 0.5390625, 0.76953125, 1.0, 1.23046875, 1.4609375, 1.69140625, 1.921875, 2.15234375, 2.3828125, 2.61328125, 2.84375, 3.07421875, 3.3046875, 3.53515625, 3.765625, 3.99609375, 4.2265625, 4.45703125, 4.6875, 4.91796875, 5.1484375, 5.37890625, 5.609375, 5.83984375, 6.0703125, 6.30078125, 6.53125, 6.76171875, 6.9921875, 7.22265625, 7.453125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 9.0, 8.0, 13.0, 30.0, 27.0, 54.0, 52.0, 102.0, 134.0, 215.0, 275.0, 430.0, 646.0, 840.0, 1202.0, 1785.0, 2661.0, 3937.0, 6278.0, 10126.0, 18784.0, 39919.0, 110252.0, 363250.0, 312747.0, 94941.0, 35867.0, 17002.0, 9396.0, 5808.0, 3736.0, 2463.0, 1654.0, 1197.0, 820.0, 560.0, 387.0, 318.0, 196.0, 133.0, 95.0, 58.0, 44.0, 29.0, 23.0, 16.0, 15.0, 11.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.60546875, -5.42425537109375, -5.2430419921875, -5.06182861328125, -4.880615234375, -4.69940185546875, -4.5181884765625, -4.33697509765625, -4.15576171875, -3.97454833984375, -3.7933349609375, -3.61212158203125, -3.430908203125, -3.24969482421875, -3.0684814453125, -2.88726806640625, -2.7060546875, -2.52484130859375, -2.3436279296875, -2.16241455078125, -1.981201171875, -1.79998779296875, -1.6187744140625, -1.43756103515625, -1.25634765625, -1.07513427734375, -0.8939208984375, -0.71270751953125, -0.531494140625, -0.35028076171875, -0.1690673828125, 0.01214599609375, 0.193359375, 0.37457275390625, 0.5557861328125, 0.73699951171875, 0.918212890625, 1.09942626953125, 1.2806396484375, 1.46185302734375, 1.64306640625, 1.82427978515625, 2.0054931640625, 2.18670654296875, 2.367919921875, 2.54913330078125, 2.7303466796875, 2.91156005859375, 3.0927734375, 3.27398681640625, 3.4552001953125, 3.63641357421875, 3.817626953125, 3.99884033203125, 4.1800537109375, 4.36126708984375, 4.54248046875, 4.72369384765625, 4.9049072265625, 5.08612060546875, 5.267333984375, 5.44854736328125, 5.6297607421875, 5.81097412109375, 5.9921875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 8.0, 5.0, 4.0, 7.0, 8.0, 15.0, 11.0, 20.0, 13.0, 24.0, 26.0, 30.0, 25.0, 44.0, 46.0, 44.0, 64.0, 74.0, 123.0, 1696.0, 244.0, 88.0, 59.0, 42.0, 48.0, 41.0, 38.0, 43.0, 21.0, 21.0, 28.0, 16.0, 14.0, 14.0, 11.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.6875, -27.781982421875, -26.87646484375, -25.970947265625, -25.0654296875, -24.159912109375, -23.25439453125, -22.348876953125, -21.443359375, -20.537841796875, -19.63232421875, -18.726806640625, -17.8212890625, -16.915771484375, -16.01025390625, -15.104736328125, -14.19921875, -13.293701171875, -12.38818359375, -11.482666015625, -10.5771484375, -9.671630859375, -8.76611328125, -7.860595703125, -6.955078125, -6.049560546875, -5.14404296875, -4.238525390625, -3.3330078125, -2.427490234375, -1.52197265625, -0.616455078125, 0.2890625, 1.194580078125, 2.10009765625, 3.005615234375, 3.9111328125, 4.816650390625, 5.72216796875, 6.627685546875, 7.533203125, 8.438720703125, 9.34423828125, 10.249755859375, 11.1552734375, 12.060791015625, 12.96630859375, 13.871826171875, 14.77734375, 15.682861328125, 16.58837890625, 17.493896484375, 18.3994140625, 19.304931640625, 20.21044921875, 21.115966796875, 22.021484375, 22.927001953125, 23.83251953125, 24.738037109375, 25.6435546875, 26.549072265625, 27.45458984375, 28.360107421875, 29.265625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 6.0, 5.0, 3.0, 9.0, 11.0, 13.0, 18.0, 15.0, 33.0, 28.0, 44.0, 59.0, 80.0, 104.0, 135.0, 217.0, 347.0, 789.0, 6243.0, 1566145.0, 1563282.0, 6204.0, 795.0, 338.0, 193.0, 131.0, 103.0, 81.0, 55.0, 37.0, 31.0, 31.0, 30.0, 15.0, 18.0, 12.0, 6.0, 8.0, 7.0, 5.0, 4.0, 4.0, 0.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-58.34375, -56.5205078125, -54.697265625, -52.8740234375, -51.05078125, -49.2275390625, -47.404296875, -45.5810546875, -43.7578125, -41.9345703125, -40.111328125, -38.2880859375, -36.46484375, -34.6416015625, -32.818359375, -30.9951171875, -29.171875, -27.3486328125, -25.525390625, -23.7021484375, -21.87890625, -20.0556640625, -18.232421875, -16.4091796875, -14.5859375, -12.7626953125, -10.939453125, -9.1162109375, -7.29296875, -5.4697265625, -3.646484375, -1.8232421875, 0.0, 1.8232421875, 3.646484375, 5.4697265625, 7.29296875, 9.1162109375, 10.939453125, 12.7626953125, 14.5859375, 16.4091796875, 18.232421875, 20.0556640625, 21.87890625, 23.7021484375, 25.525390625, 27.3486328125, 29.171875, 30.9951171875, 32.818359375, 34.6416015625, 36.46484375, 38.2880859375, 40.111328125, 41.9345703125, 43.7578125, 45.5810546875, 47.404296875, 49.2275390625, 51.05078125, 52.8740234375, 54.697265625, 56.5205078125, 58.34375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 20.0, 103.0, 379.0, 367.0, 128.0, 19.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.058876037597656, -20.62887191772461, -17.198869705200195, -13.768866539001465, -10.338863372802734, -6.9088592529296875, -3.4788570404052734, -0.048854827880859375, 3.3811492919921875, 6.811152458190918, 10.241155624389648, 13.671158790588379, 17.10116195678711, 20.531166076660156, 23.96116828918457, 27.391170501708984, 30.82117462158203, 34.25117874145508, 37.681182861328125, 41.111183166503906, 44.54118728637695, 47.97119140625, 51.40119171142578, 54.83119583129883, 58.261199951171875, 61.69120407104492, 65.12120819091797, 68.55120849609375, 71.98121643066406, 75.41121673583984, 78.84121704101562, 82.27122497558594, 85.70123291015625, 89.13123321533203, 92.56124114990234, 95.99124145507812, 99.42124938964844, 102.85124969482422, 106.28125, 109.71125793457031, 113.1412582397461, 116.57125854492188, 120.00126647949219, 123.43126678466797, 126.86126708984375, 130.29127502441406, 133.72128295898438, 137.15127563476562, 140.58128356933594, 144.01129150390625, 147.4412841796875, 150.8712921142578, 154.30130004882812, 157.73129272460938, 161.1613006591797, 164.59130859375, 168.02130126953125, 171.45130920410156, 174.8813018798828, 178.31130981445312, 181.74131774902344, 185.17132568359375, 188.601318359375, 192.0313262939453, 195.46133422851562]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 0.0, 6.0, 14.0, 10.0, 14.0, 14.0, 20.0, 15.0, 19.0, 26.0, 24.0, 28.0, 24.0, 29.0, 32.0, 40.0, 36.0, 30.0, 31.0, 35.0, 40.0, 34.0, 46.0, 46.0, 51.0, 36.0, 34.0, 38.0, 28.0, 30.0, 28.0, 21.0, 12.0, 16.0, 20.0, 12.0, 16.0, 4.0, 10.0, 6.0, 6.0, 9.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.23607635498047, -58.20308303833008, -56.17009353637695, -54.13710021972656, -52.10411071777344, -50.07111740112305, -48.038124084472656, -46.00513458251953, -43.97214126586914, -41.93914794921875, -39.906158447265625, -37.873165130615234, -35.840171813964844, -33.80718231201172, -31.774188995361328, -29.74119758605957, -27.708206176757812, -25.675214767456055, -23.642223358154297, -21.609230041503906, -19.57623863220215, -17.54324722290039, -15.510254859924316, -13.477262496948242, -11.444271087646484, -9.411279678344727, -7.378287315368652, -5.345295429229736, -3.3123035430908203, -1.2793121337890625, 0.7536802291870117, 2.786672592163086, 4.8196563720703125, 6.8526482582092285, 8.885640144348145, 10.918632507324219, 12.951623916625977, 14.984615325927734, 17.017608642578125, 19.050600051879883, 21.08359146118164, 23.1165828704834, 25.149574279785156, 27.182567596435547, 29.215559005737305, 31.248550415039062, 33.28154373168945, 35.314537048339844, 37.34752655029297, 39.38051986694336, 41.413509368896484, 43.446502685546875, 45.4794921875, 47.51248550415039, 49.54547882080078, 51.578468322753906, 53.6114616394043, 55.64445495605469, 57.67744445800781, 59.7104377746582, 61.743431091308594, 63.77642059326172, 65.80941009521484, 67.8424072265625, 69.87539672851562]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 6.0, 3.0, 8.0, 6.0, 14.0, 13.0, 12.0, 21.0, 18.0, 14.0, 18.0, 23.0, 29.0, 33.0, 36.0, 39.0, 35.0, 46.0, 21.0, 43.0, 42.0, 41.0, 32.0, 54.0, 38.0, 32.0, 34.0, 26.0, 38.0, 29.0, 30.0, 16.0, 22.0, 19.0, 19.0, 24.0, 11.0, 12.0, 7.0, 7.0, 7.0, 5.0, 8.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.5078125, -7.27685546875, -7.0458984375, -6.81494140625, -6.583984375, -6.35302734375, -6.1220703125, -5.89111328125, -5.66015625, -5.42919921875, -5.1982421875, -4.96728515625, -4.736328125, -4.50537109375, -4.2744140625, -4.04345703125, -3.8125, -3.58154296875, -3.3505859375, -3.11962890625, -2.888671875, -2.65771484375, -2.4267578125, -2.19580078125, -1.96484375, -1.73388671875, -1.5029296875, -1.27197265625, -1.041015625, -0.81005859375, -0.5791015625, -0.34814453125, -0.1171875, 0.11376953125, 0.3447265625, 0.57568359375, 0.806640625, 1.03759765625, 1.2685546875, 1.49951171875, 1.73046875, 1.96142578125, 2.1923828125, 2.42333984375, 2.654296875, 2.88525390625, 3.1162109375, 3.34716796875, 3.578125, 3.80908203125, 4.0400390625, 4.27099609375, 4.501953125, 4.73291015625, 4.9638671875, 5.19482421875, 5.42578125, 5.65673828125, 5.8876953125, 6.11865234375, 6.349609375, 6.58056640625, 6.8115234375, 7.04248046875, 7.2734375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 7.0, 3.0, 4.0, 8.0, 14.0, 12.0, 24.0, 21.0, 31.0, 31.0, 33.0, 44.0, 76.0, 107.0, 175.0, 364.0, 1454.0, 10608.0, 156999.0, 3270498.0, 721743.0, 27929.0, 2832.0, 594.0, 207.0, 122.0, 73.0, 61.0, 41.0, 34.0, 23.0, 24.0, 28.0, 13.0, 10.0, 8.0, 12.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.3125, -35.2021484375, -34.091796875, -32.9814453125, -31.87109375, -30.7607421875, -29.650390625, -28.5400390625, -27.4296875, -26.3193359375, -25.208984375, -24.0986328125, -22.98828125, -21.8779296875, -20.767578125, -19.6572265625, -18.546875, -17.4365234375, -16.326171875, -15.2158203125, -14.10546875, -12.9951171875, -11.884765625, -10.7744140625, -9.6640625, -8.5537109375, -7.443359375, -6.3330078125, -5.22265625, -4.1123046875, -3.001953125, -1.8916015625, -0.78125, 0.3291015625, 1.439453125, 2.5498046875, 3.66015625, 4.7705078125, 5.880859375, 6.9912109375, 8.1015625, 9.2119140625, 10.322265625, 11.4326171875, 12.54296875, 13.6533203125, 14.763671875, 15.8740234375, 16.984375, 18.0947265625, 19.205078125, 20.3154296875, 21.42578125, 22.5361328125, 23.646484375, 24.7568359375, 25.8671875, 26.9775390625, 28.087890625, 29.1982421875, 30.30859375, 31.4189453125, 32.529296875, 33.6396484375, 34.75]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 8.0, 5.0, 7.0, 14.0, 16.0, 26.0, 42.0, 43.0, 58.0, 84.0, 135.0, 186.0, 206.0, 262.0, 366.0, 470.0, 426.0, 429.0, 314.0, 248.0, 171.0, 150.0, 110.0, 89.0, 68.0, 42.0, 25.0, 23.0, 11.0, 6.0, 15.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.265625, -19.67578125, -19.0859375, -18.49609375, -17.90625, -17.31640625, -16.7265625, -16.13671875, -15.546875, -14.95703125, -14.3671875, -13.77734375, -13.1875, -12.59765625, -12.0078125, -11.41796875, -10.828125, -10.23828125, -9.6484375, -9.05859375, -8.46875, -7.87890625, -7.2890625, -6.69921875, -6.109375, -5.51953125, -4.9296875, -4.33984375, -3.75, -3.16015625, -2.5703125, -1.98046875, -1.390625, -0.80078125, -0.2109375, 0.37890625, 0.96875, 1.55859375, 2.1484375, 2.73828125, 3.328125, 3.91796875, 4.5078125, 5.09765625, 5.6875, 6.27734375, 6.8671875, 7.45703125, 8.046875, 8.63671875, 9.2265625, 9.81640625, 10.40625, 10.99609375, 11.5859375, 12.17578125, 12.765625, 13.35546875, 13.9453125, 14.53515625, 15.125, 15.71484375, 16.3046875, 16.89453125, 17.484375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 12.0, 12.0, 21.0, 42.0, 48.0, 63.0, 125.0, 154.0, 241.0, 472.0, 1721.0, 17752.0, 586051.0, 3452435.0, 127162.0, 5976.0, 934.0, 393.0, 240.0, 134.0, 80.0, 61.0, 50.0, 36.0, 18.0, 15.0, 11.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.25, -58.384765625, -56.51953125, -54.654296875, -52.7890625, -50.923828125, -49.05859375, -47.193359375, -45.328125, -43.462890625, -41.59765625, -39.732421875, -37.8671875, -36.001953125, -34.13671875, -32.271484375, -30.40625, -28.541015625, -26.67578125, -24.810546875, -22.9453125, -21.080078125, -19.21484375, -17.349609375, -15.484375, -13.619140625, -11.75390625, -9.888671875, -8.0234375, -6.158203125, -4.29296875, -2.427734375, -0.5625, 1.302734375, 3.16796875, 5.033203125, 6.8984375, 8.763671875, 10.62890625, 12.494140625, 14.359375, 16.224609375, 18.08984375, 19.955078125, 21.8203125, 23.685546875, 25.55078125, 27.416015625, 29.28125, 31.146484375, 33.01171875, 34.876953125, 36.7421875, 38.607421875, 40.47265625, 42.337890625, 44.203125, 46.068359375, 47.93359375, 49.798828125, 51.6640625, 53.529296875, 55.39453125, 57.259765625, 59.125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 10.0, 35.0, 43.0, 77.0, 99.0, 141.0, 141.0, 128.0, 134.0, 86.0, 43.0, 27.0, 20.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-127.82731628417969, -123.79938507080078, -119.77145385742188, -115.7435302734375, -111.7155990600586, -107.68766784667969, -103.65974426269531, -99.6318130493164, -95.6038818359375, -91.5759506225586, -87.54801940917969, -83.52009582519531, -79.4921646118164, -75.4642333984375, -71.43630981445312, -67.40837860107422, -63.38044738769531, -59.352516174316406, -55.324588775634766, -51.296661376953125, -47.26873016357422, -43.24079895019531, -39.21287155151367, -35.18494415283203, -31.157012939453125, -27.12908363342285, -23.101154327392578, -19.073225021362305, -15.045295715332031, -11.017366409301758, -6.989437103271484, -2.961507797241211, 1.066436767578125, 5.094366073608398, 9.122295379638672, 13.150224685668945, 17.17815399169922, 21.206083297729492, 25.234012603759766, 29.26194190979004, 33.28987121582031, 37.31780242919922, 41.34572982788086, 45.3736572265625, 49.401588439941406, 53.42951965332031, 57.45744705200195, 61.485374450683594, 65.5133056640625, 69.5412368774414, 73.56916809082031, 77.59709167480469, 81.6250228881836, 85.6529541015625, 89.68087768554688, 93.70880889892578, 97.73674011230469, 101.7646713256836, 105.7926025390625, 109.82052612304688, 113.84845733642578, 117.87638854980469, 121.90431213378906, 125.93224334716797, 129.96017456054688]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 5.0, 1.0, 8.0, 11.0, 13.0, 8.0, 11.0, 18.0, 12.0, 25.0, 25.0, 28.0, 26.0, 22.0, 33.0, 37.0, 49.0, 46.0, 41.0, 50.0, 41.0, 47.0, 42.0, 42.0, 35.0, 35.0, 40.0, 30.0, 37.0, 23.0, 22.0, 31.0, 18.0, 19.0, 17.0, 11.0, 9.0, 5.0, 5.0, 10.0, 8.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-67.4093017578125, -65.42747497558594, -63.44565200805664, -61.46382522583008, -59.48200225830078, -57.50017547607422, -55.518348693847656, -53.536521911621094, -51.5546989440918, -49.572872161865234, -47.59104919433594, -45.609222412109375, -43.62739562988281, -41.645572662353516, -39.66374588012695, -37.681922912597656, -35.700096130371094, -33.71826934814453, -31.736446380615234, -29.754619598388672, -27.772794723510742, -25.790969848632812, -23.80914306640625, -21.82731819152832, -19.84549331665039, -17.86366844177246, -15.881842613220215, -13.900016784667969, -11.918191909790039, -9.93636703491211, -7.954541206359863, -5.972715377807617, -3.9908905029296875, -2.0090651512145996, -0.02723979949951172, 1.9545855522155762, 3.936410903930664, 5.918235778808594, 7.90006160736084, 9.881887435913086, 11.863712310791016, 13.845537185668945, 15.827363014221191, 17.809188842773438, 19.791013717651367, 21.772838592529297, 23.75466537475586, 25.73649024963379, 27.71831512451172, 29.70013999938965, 31.681964874267578, 33.66379165649414, 35.64561462402344, 37.62744140625, 39.60926818847656, 41.591094970703125, 43.57291793823242, 45.554744720458984, 47.53656768798828, 49.518394470214844, 51.500221252441406, 53.4820442199707, 55.463871002197266, 57.44569396972656, 59.427520751953125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 4.0, 4.0, 12.0, 8.0, 13.0, 8.0, 16.0, 23.0, 29.0, 16.0, 20.0, 29.0, 26.0, 43.0, 36.0, 31.0, 41.0, 40.0, 45.0, 43.0, 32.0, 43.0, 34.0, 37.0, 37.0, 35.0, 28.0, 30.0, 29.0, 26.0, 23.0, 18.0, 20.0, 15.0, 10.0, 14.0, 16.0, 12.0, 9.0, 8.0, 8.0, 9.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.39453125, -7.158203125, -6.921875, -6.685546875, -6.44921875, -6.212890625, -5.9765625, -5.740234375, -5.50390625, -5.267578125, -5.03125, -4.794921875, -4.55859375, -4.322265625, -4.0859375, -3.849609375, -3.61328125, -3.376953125, -3.140625, -2.904296875, -2.66796875, -2.431640625, -2.1953125, -1.958984375, -1.72265625, -1.486328125, -1.25, -1.013671875, -0.77734375, -0.541015625, -0.3046875, -0.068359375, 0.16796875, 0.404296875, 0.640625, 0.876953125, 1.11328125, 1.349609375, 1.5859375, 1.822265625, 2.05859375, 2.294921875, 2.53125, 2.767578125, 3.00390625, 3.240234375, 3.4765625, 3.712890625, 3.94921875, 4.185546875, 4.421875, 4.658203125, 4.89453125, 5.130859375, 5.3671875, 5.603515625, 5.83984375, 6.076171875, 6.3125, 6.548828125, 6.78515625, 7.021484375, 7.2578125, 7.494140625, 7.73046875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 11.0, 17.0, 28.0, 44.0, 57.0, 81.0, 116.0, 190.0, 307.0, 459.0, 720.0, 1116.0, 1839.0, 2831.0, 4425.0, 7146.0, 11626.0, 19136.0, 32232.0, 56451.0, 104388.0, 186974.0, 240011.0, 165219.0, 90262.0, 49618.0, 28335.0, 16918.0, 10280.0, 6527.0, 4090.0, 2632.0, 1552.0, 1048.0, 668.0, 417.0, 264.0, 172.0, 109.0, 82.0, 49.0, 34.0, 25.0, 17.0, 8.0, 6.0, 7.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.150390625, -1.1148681640625, -1.079345703125, -1.0438232421875, -1.00830078125, -0.9727783203125, -0.937255859375, -0.9017333984375, -0.8662109375, -0.8306884765625, -0.795166015625, -0.7596435546875, -0.72412109375, -0.6885986328125, -0.653076171875, -0.6175537109375, -0.58203125, -0.5465087890625, -0.510986328125, -0.4754638671875, -0.43994140625, -0.4044189453125, -0.368896484375, -0.3333740234375, -0.2978515625, -0.2623291015625, -0.226806640625, -0.1912841796875, -0.15576171875, -0.1202392578125, -0.084716796875, -0.0491943359375, -0.013671875, 0.0218505859375, 0.057373046875, 0.0928955078125, 0.12841796875, 0.1639404296875, 0.199462890625, 0.2349853515625, 0.2705078125, 0.3060302734375, 0.341552734375, 0.3770751953125, 0.41259765625, 0.4481201171875, 0.483642578125, 0.5191650390625, 0.5546875, 0.5902099609375, 0.625732421875, 0.6612548828125, 0.69677734375, 0.7322998046875, 0.767822265625, 0.8033447265625, 0.8388671875, 0.8743896484375, 0.909912109375, 0.9454345703125, 0.98095703125, 1.0164794921875, 1.052001953125, 1.0875244140625, 1.123046875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 1.0, 6.0, 4.0, 8.0, 10.0, 6.0, 13.0, 13.0, 18.0, 22.0, 27.0, 22.0, 30.0, 28.0, 25.0, 31.0, 24.0, 31.0, 49.0, 35.0, 36.0, 1064.0, 45.0, 46.0, 45.0, 39.0, 44.0, 35.0, 28.0, 21.0, 28.0, 21.0, 24.0, 35.0, 17.0, 17.0, 24.0, 6.0, 12.0, 4.0, 9.0, 4.0, 7.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.77734375, -4.62200927734375, -4.4666748046875, -4.31134033203125, -4.156005859375, -4.00067138671875, -3.8453369140625, -3.69000244140625, -3.53466796875, -3.37933349609375, -3.2239990234375, -3.06866455078125, -2.913330078125, -2.75799560546875, -2.6026611328125, -2.44732666015625, -2.2919921875, -2.13665771484375, -1.9813232421875, -1.82598876953125, -1.670654296875, -1.51531982421875, -1.3599853515625, -1.20465087890625, -1.04931640625, -0.89398193359375, -0.7386474609375, -0.58331298828125, -0.427978515625, -0.27264404296875, -0.1173095703125, 0.03802490234375, 0.193359375, 0.34869384765625, 0.5040283203125, 0.65936279296875, 0.814697265625, 0.97003173828125, 1.1253662109375, 1.28070068359375, 1.43603515625, 1.59136962890625, 1.7467041015625, 1.90203857421875, 2.057373046875, 2.21270751953125, 2.3680419921875, 2.52337646484375, 2.6787109375, 2.83404541015625, 2.9893798828125, 3.14471435546875, 3.300048828125, 3.45538330078125, 3.6107177734375, 3.76605224609375, 3.92138671875, 4.07672119140625, 4.2320556640625, 4.38739013671875, 4.542724609375, 4.69805908203125, 4.8533935546875, 5.00872802734375, 5.1640625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 9.0, 14.0, 15.0, 18.0, 28.0, 43.0, 90.0, 108.0, 160.0, 238.0, 349.0, 561.0, 892.0, 1386.0, 2225.0, 3548.0, 5900.0, 9946.0, 16932.0, 28974.0, 50884.0, 87146.0, 138660.0, 1089416.0, 329968.0, 132344.0, 81832.0, 47483.0, 27684.0, 15803.0, 9348.0, 5722.0, 3319.0, 2238.0, 1308.0, 863.0, 553.0, 387.0, 232.0, 165.0, 111.0, 56.0, 56.0, 33.0, 28.0, 20.0, 14.0, 9.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.7099609375, -0.6884078979492188, -0.6668548583984375, -0.6453018188476562, -0.623748779296875, -0.6021957397460938, -0.5806427001953125, -0.5590896606445312, -0.53753662109375, -0.5159835815429688, -0.4944305419921875, -0.47287750244140625, -0.451324462890625, -0.42977142333984375, -0.4082183837890625, -0.38666534423828125, -0.3651123046875, -0.34355926513671875, -0.3220062255859375, -0.30045318603515625, -0.278900146484375, -0.25734710693359375, -0.2357940673828125, -0.21424102783203125, -0.19268798828125, -0.17113494873046875, -0.1495819091796875, -0.12802886962890625, -0.106475830078125, -0.08492279052734375, -0.0633697509765625, -0.04181671142578125, -0.020263671875, 0.00128936767578125, 0.0228424072265625, 0.04439544677734375, 0.065948486328125, 0.08750152587890625, 0.1090545654296875, 0.13060760498046875, 0.15216064453125, 0.17371368408203125, 0.1952667236328125, 0.21681976318359375, 0.238372802734375, 0.25992584228515625, 0.2814788818359375, 0.30303192138671875, 0.3245849609375, 0.34613800048828125, 0.3676910400390625, 0.38924407958984375, 0.410797119140625, 0.43235015869140625, 0.4539031982421875, 0.47545623779296875, 0.49700927734375, 0.5185623168945312, 0.5401153564453125, 0.5616683959960938, 0.583221435546875, 0.6047744750976562, 0.6263275146484375, 0.6478805541992188, 0.66943359375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 11.0, 6.0, 10.0, 13.0, 19.0, 24.0, 23.0, 34.0, 47.0, 44.0, 51.0, 56.0, 62.0, 73.0, 64.0, 59.0, 70.0, 67.0, 58.0, 40.0, 33.0, 20.0, 16.0, 20.0, 17.0, 13.0, 12.0, 11.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.011566162109375, -0.011197924613952637, -0.010829687118530273, -0.01046144962310791, -0.010093212127685547, -0.009724974632263184, -0.00935673713684082, -0.008988499641418457, -0.008620262145996094, -0.00825202465057373, -0.007883787155151367, -0.007515549659729004, -0.007147312164306641, -0.006779074668884277, -0.006410837173461914, -0.006042599678039551, -0.0056743621826171875, -0.005306124687194824, -0.004937887191772461, -0.004569649696350098, -0.004201412200927734, -0.003833174705505371, -0.003464937210083008, -0.0030966997146606445, -0.0027284622192382812, -0.002360224723815918, -0.0019919872283935547, -0.0016237497329711914, -0.0012555122375488281, -0.0008872747421264648, -0.0005190372467041016, -0.00015079975128173828, 0.000217437744140625, 0.0005856752395629883, 0.0009539127349853516, 0.0013221502304077148, 0.0016903877258300781, 0.0020586252212524414, 0.0024268627166748047, 0.002795100212097168, 0.0031633377075195312, 0.0035315752029418945, 0.003899812698364258, 0.004268050193786621, 0.004636287689208984, 0.005004525184631348, 0.005372762680053711, 0.005741000175476074, 0.0061092376708984375, 0.006477475166320801, 0.006845712661743164, 0.007213950157165527, 0.007582187652587891, 0.007950425148010254, 0.008318662643432617, 0.00868690013885498, 0.009055137634277344, 0.009423375129699707, 0.00979161262512207, 0.010159850120544434, 0.010528087615966797, 0.01089632511138916, 0.011264562606811523, 0.011632800102233887, 0.01200103759765625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 19.0, 11.0, 19.0, 15.0, 24.0, 38.0, 73.0, 91.0, 199.0, 521.0, 3157.0, 69367.0, 925693.0, 45943.0, 2372.0, 472.0, 180.0, 108.0, 73.0, 42.0, 37.0, 27.0, 17.0, 9.0, 5.0, 6.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.250244140625, -0.24253082275390625, -0.2348175048828125, -0.22710418701171875, -0.219390869140625, -0.21167755126953125, -0.2039642333984375, -0.19625091552734375, -0.18853759765625, -0.18082427978515625, -0.1731109619140625, -0.16539764404296875, -0.157684326171875, -0.14997100830078125, -0.1422576904296875, -0.13454437255859375, -0.1268310546875, -0.11911773681640625, -0.1114044189453125, -0.10369110107421875, -0.095977783203125, -0.08826446533203125, -0.0805511474609375, -0.07283782958984375, -0.06512451171875, -0.05741119384765625, -0.0496978759765625, -0.04198455810546875, -0.034271240234375, -0.02655792236328125, -0.0188446044921875, -0.01113128662109375, -0.00341796875, 0.00429534912109375, 0.0120086669921875, 0.01972198486328125, 0.027435302734375, 0.03514862060546875, 0.0428619384765625, 0.05057525634765625, 0.05828857421875, 0.06600189208984375, 0.0737152099609375, 0.08142852783203125, 0.089141845703125, 0.09685516357421875, 0.1045684814453125, 0.11228179931640625, 0.1199951171875, 0.12770843505859375, 0.1354217529296875, 0.14313507080078125, 0.150848388671875, 0.15856170654296875, 0.1662750244140625, 0.17398834228515625, 0.18170166015625, 0.18941497802734375, 0.1971282958984375, 0.20484161376953125, 0.212554931640625, 0.22026824951171875, 0.2279815673828125, 0.23569488525390625, 0.243408203125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 23.0, 26.0, 53.0, 126.0, 375.0, 284.0, 79.0, 22.0, 11.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05454837530851364, -0.0522654764354229, -0.04998257756233215, -0.04769968241453171, -0.045416783541440964, -0.04313388466835022, -0.040850989520549774, -0.03856809064745903, -0.036285191774368286, -0.03400229290127754, -0.0317193940281868, -0.029436498880386353, -0.02715360000729561, -0.024870701134204865, -0.02258780412375927, -0.020304907113313675, -0.01802200824022293, -0.015739109367132187, -0.013456212356686592, -0.011173314414918423, -0.008890416473150253, -0.006607518531382084, -0.0043246205896139145, -0.0020417235791683197, 0.00024117529392242432, 0.0025240732356905937, 0.004806971177458763, 0.0070898691192269325, 0.009372767060995102, 0.011655665002763271, 0.01393856294453144, 0.016221459954977036, 0.018504351377487183, 0.020787250250577927, 0.02307014726102352, 0.025353044271469116, 0.02763594314455986, 0.029918842017650604, 0.03220173716545105, 0.034484636038541794, 0.03676753491163254, 0.03905043378472328, 0.041333332657814026, 0.04361622780561447, 0.045899126678705215, 0.04818202555179596, 0.050464920699596405, 0.05274781957268715, 0.05503071844577789, 0.05731361731886864, 0.05959651619195938, 0.06187941133975983, 0.06416231393814087, 0.06644520908594131, 0.06872810423374176, 0.0710110068321228, 0.07329390197992325, 0.0755767971277237, 0.07785969972610474, 0.08014259487390518, 0.08242549002170563, 0.08470839262008667, 0.08699128776788712, 0.08927418291568756, 0.0915570855140686]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 13.0, 5.0, 9.0, 6.0, 5.0, 5.0, 11.0, 16.0, 6.0, 14.0, 18.0, 16.0, 24.0, 16.0, 22.0, 30.0, 26.0, 28.0, 33.0, 29.0, 33.0, 41.0, 43.0, 30.0, 38.0, 44.0, 38.0, 37.0, 40.0, 38.0, 30.0, 34.0, 34.0, 31.0, 20.0, 15.0, 18.0, 23.0, 15.0, 7.0, 12.0, 7.0, 7.0, 8.0, 7.0, 5.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.006208837032318115, -0.006016128696501255, -0.005823420360684395, -0.005630712024867535, -0.0054380036890506744, -0.005245295353233814, -0.005052587017416954, -0.004859878681600094, -0.004667170345783234, -0.0044744620099663734, -0.004281753674149513, -0.004089045338332653, -0.003896337002515793, -0.0037036286666989326, -0.0035109203308820724, -0.0033182119950652122, -0.003125503659248352, -0.002932795323431492, -0.0027400869876146317, -0.0025473786517977715, -0.0023546703159809113, -0.002161961980164051, -0.001969253644347191, -0.0017765453085303307, -0.0015838369727134705, -0.0013911286368966103, -0.00119842030107975, -0.0010057119652628899, -0.0008130036294460297, -0.0006202952936291695, -0.00042758695781230927, -0.00023487862199544907, -4.217028617858887e-05, 0.00015053804963827133, 0.00034324638545513153, 0.0005359547212719917, 0.0007286630570888519, 0.0009213713929057121, 0.0011140797287225723, 0.0013067880645394325, 0.0014994964003562927, 0.001692204736173153, 0.0018849130719900131, 0.0020776214078068733, 0.0022703297436237335, 0.0024630380794405937, 0.002655746415257454, 0.002848454751074314, 0.0030411630868911743, 0.0032338714227080345, 0.0034265797585248947, 0.003619288094341755, 0.003811996430158615, 0.004004704765975475, 0.0041974131017923355, 0.004390121437609196, 0.004582829773426056, 0.004775538109242916, 0.004968246445059776, 0.0051609547808766365, 0.005353663116693497, 0.005546371452510357, 0.005739079788327217, 0.005931788124144077, 0.0061244964599609375]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 4.0, 4.0, 12.0, 8.0, 13.0, 8.0, 16.0, 23.0, 29.0, 16.0, 20.0, 29.0, 26.0, 43.0, 36.0, 31.0, 41.0, 40.0, 45.0, 43.0, 32.0, 43.0, 34.0, 37.0, 37.0, 35.0, 28.0, 30.0, 29.0, 25.0, 24.0, 18.0, 20.0, 15.0, 10.0, 14.0, 16.0, 12.0, 9.0, 8.0, 8.0, 9.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.39453125, -7.158203125, -6.921875, -6.685546875, -6.44921875, -6.212890625, -5.9765625, -5.740234375, -5.50390625, -5.267578125, -5.03125, -4.794921875, -4.55859375, -4.322265625, -4.0859375, -3.849609375, -3.61328125, -3.376953125, -3.140625, -2.904296875, -2.66796875, -2.431640625, -2.1953125, -1.958984375, -1.72265625, -1.486328125, -1.25, -1.013671875, -0.77734375, -0.541015625, -0.3046875, -0.068359375, 0.16796875, 0.404296875, 0.640625, 0.876953125, 1.11328125, 1.349609375, 1.5859375, 1.822265625, 2.05859375, 2.294921875, 2.53125, 2.767578125, 3.00390625, 3.240234375, 3.4765625, 3.712890625, 3.94921875, 4.185546875, 4.421875, 4.658203125, 4.89453125, 5.130859375, 5.3671875, 5.603515625, 5.83984375, 6.076171875, 6.3125, 6.548828125, 6.78515625, 7.021484375, 7.2578125, 7.494140625, 7.73046875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 10.0, 14.0, 15.0, 28.0, 37.0, 65.0, 83.0, 115.0, 156.0, 226.0, 326.0, 423.0, 618.0, 953.0, 1404.0, 2012.0, 3009.0, 4497.0, 7239.0, 11589.0, 20132.0, 37731.0, 85189.0, 253410.0, 383122.0, 122043.0, 49920.0, 25377.0, 13887.0, 8518.0, 5490.0, 3447.0, 2294.0, 1639.0, 1099.0, 708.0, 532.0, 366.0, 245.0, 195.0, 114.0, 93.0, 56.0, 30.0, 25.0, 26.0, 10.0, 19.0, 7.0, 2.0, 0.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.0078125, -4.84722900390625, -4.6866455078125, -4.52606201171875, -4.365478515625, -4.20489501953125, -4.0443115234375, -3.88372802734375, -3.72314453125, -3.56256103515625, -3.4019775390625, -3.24139404296875, -3.080810546875, -2.92022705078125, -2.7596435546875, -2.59906005859375, -2.4384765625, -2.27789306640625, -2.1173095703125, -1.95672607421875, -1.796142578125, -1.63555908203125, -1.4749755859375, -1.31439208984375, -1.15380859375, -0.99322509765625, -0.8326416015625, -0.67205810546875, -0.511474609375, -0.35089111328125, -0.1903076171875, -0.02972412109375, 0.130859375, 0.29144287109375, 0.4520263671875, 0.61260986328125, 0.773193359375, 0.93377685546875, 1.0943603515625, 1.25494384765625, 1.41552734375, 1.57611083984375, 1.7366943359375, 1.89727783203125, 2.057861328125, 2.21844482421875, 2.3790283203125, 2.53961181640625, 2.7001953125, 2.86077880859375, 3.0213623046875, 3.18194580078125, 3.342529296875, 3.50311279296875, 3.6636962890625, 3.82427978515625, 3.98486328125, 4.14544677734375, 4.3060302734375, 4.46661376953125, 4.627197265625, 4.78778076171875, 4.9483642578125, 5.10894775390625, 5.26953125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 12.0, 6.0, 12.0, 14.0, 19.0, 20.0, 20.0, 29.0, 23.0, 29.0, 28.0, 44.0, 44.0, 63.0, 78.0, 130.0, 316.0, 1563.0, 119.0, 88.0, 52.0, 44.0, 44.0, 34.0, 29.0, 29.0, 23.0, 23.0, 21.0, 28.0, 12.0, 10.0, 7.0, 4.0, 7.0, 2.0, 4.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.078125, -26.079833984375, -25.08154296875, -24.083251953125, -23.0849609375, -22.086669921875, -21.08837890625, -20.090087890625, -19.091796875, -18.093505859375, -17.09521484375, -16.096923828125, -15.0986328125, -14.100341796875, -13.10205078125, -12.103759765625, -11.10546875, -10.107177734375, -9.10888671875, -8.110595703125, -7.1123046875, -6.114013671875, -5.11572265625, -4.117431640625, -3.119140625, -2.120849609375, -1.12255859375, -0.124267578125, 0.8740234375, 1.872314453125, 2.87060546875, 3.868896484375, 4.8671875, 5.865478515625, 6.86376953125, 7.862060546875, 8.8603515625, 9.858642578125, 10.85693359375, 11.855224609375, 12.853515625, 13.851806640625, 14.85009765625, 15.848388671875, 16.8466796875, 17.844970703125, 18.84326171875, 19.841552734375, 20.83984375, 21.838134765625, 22.83642578125, 23.834716796875, 24.8330078125, 25.831298828125, 26.82958984375, 27.827880859375, 28.826171875, 29.824462890625, 30.82275390625, 31.821044921875, 32.8193359375, 33.817626953125, 34.81591796875, 35.814208984375, 36.8125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 7.0, 8.0, 11.0, 28.0, 27.0, 40.0, 63.0, 102.0, 119.0, 244.0, 461.0, 1746.0, 234454.0, 2904053.0, 3034.0, 606.0, 259.0, 152.0, 87.0, 66.0, 41.0, 29.0, 23.0, 8.0, 13.0, 7.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.9375, -86.6201171875, -83.302734375, -79.9853515625, -76.66796875, -73.3505859375, -70.033203125, -66.7158203125, -63.3984375, -60.0810546875, -56.763671875, -53.4462890625, -50.12890625, -46.8115234375, -43.494140625, -40.1767578125, -36.859375, -33.5419921875, -30.224609375, -26.9072265625, -23.58984375, -20.2724609375, -16.955078125, -13.6376953125, -10.3203125, -7.0029296875, -3.685546875, -0.3681640625, 2.94921875, 6.2666015625, 9.583984375, 12.9013671875, 16.21875, 19.5361328125, 22.853515625, 26.1708984375, 29.48828125, 32.8056640625, 36.123046875, 39.4404296875, 42.7578125, 46.0751953125, 49.392578125, 52.7099609375, 56.02734375, 59.3447265625, 62.662109375, 65.9794921875, 69.296875, 72.6142578125, 75.931640625, 79.2490234375, 82.56640625, 85.8837890625, 89.201171875, 92.5185546875, 95.8359375, 99.1533203125, 102.470703125, 105.7880859375, 109.10546875, 112.4228515625, 115.740234375, 119.0576171875, 122.375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 42.0, 289.0, 536.0, 137.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.2476806640625, -88.46859741210938, -82.68950653076172, -76.9104232788086, -71.13133239746094, -65.35224914550781, -59.57316207885742, -53.79407501220703, -48.01498794555664, -42.23590087890625, -36.45681381225586, -30.6777286529541, -24.89864158630371, -19.11955451965332, -13.340469360351562, -7.561382293701172, -1.7822952270507812, 3.996791362762451, 9.775877952575684, 15.554964065551758, 21.33405113220215, 27.11313819885254, 32.8922233581543, 38.67131042480469, 44.45039749145508, 50.22948455810547, 56.00857162475586, 61.78765869140625, 67.56674194335938, 73.34583282470703, 79.12491607666016, 84.90400695800781, 90.68309020996094, 96.46217346191406, 102.24126434326172, 108.02034759521484, 113.7994384765625, 119.57852172851562, 125.35760498046875, 131.13668823242188, 136.91578674316406, 142.6948699951172, 148.4739532470703, 154.2530517578125, 160.03213500976562, 165.81121826171875, 171.59030151367188, 177.369384765625, 183.14846801757812, 188.92755126953125, 194.70663452148438, 200.48573303222656, 206.2648162841797, 212.0438995361328, 217.82298278808594, 223.60208129882812, 229.38116455078125, 235.16024780273438, 240.9393310546875, 246.7184295654297, 252.4975128173828, 258.276611328125, 264.0556945800781, 269.83477783203125, 275.6138610839844]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 5.0, 6.0, 7.0, 6.0, 9.0, 9.0, 14.0, 10.0, 20.0, 25.0, 19.0, 21.0, 36.0, 35.0, 31.0, 35.0, 41.0, 52.0, 39.0, 46.0, 38.0, 37.0, 48.0, 36.0, 34.0, 36.0, 31.0, 27.0, 28.0, 26.0, 28.0, 25.0, 27.0, 18.0, 11.0, 17.0, 12.0, 10.0, 7.0, 10.0, 4.0, 7.0, 8.0, 3.0, 3.0, 2.0, 5.0, 4.0, 0.0, 0.0, 2.0], "bins": [-93.29328155517578, -90.59674835205078, -87.90022277832031, -85.20368957519531, -82.50715637207031, -79.81063079833984, -77.11409759521484, -74.41757202148438, -71.72103881835938, -69.02450561523438, -66.3279800415039, -63.631446838378906, -60.93491744995117, -58.23838806152344, -55.54185485839844, -52.8453254699707, -50.14879608154297, -47.452266693115234, -44.7557373046875, -42.0592041015625, -39.362674713134766, -36.66614532470703, -33.96961212158203, -31.273082733154297, -28.576553344726562, -25.880023956298828, -23.18349266052246, -20.486961364746094, -17.79043197631836, -15.093901634216309, -12.397371292114258, -9.70083999633789, -7.004310607910156, -4.3077802658081055, -1.6112499237060547, 1.085280418395996, 3.781810760498047, 6.478341102600098, 9.174871444702148, 11.871402740478516, 14.56793212890625, 17.264461517333984, 19.96099281311035, 22.65752410888672, 25.354053497314453, 28.050582885742188, 30.747114181518555, 33.44364547729492, 36.140174865722656, 38.83670425415039, 41.533233642578125, 44.229766845703125, 46.92629623413086, 49.622825622558594, 52.319358825683594, 55.01588821411133, 57.71241760253906, 60.4089469909668, 63.10547637939453, 65.80200958251953, 68.49853515625, 71.195068359375, 73.8916015625, 76.588134765625, 79.28466033935547]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 11.0, 5.0, 6.0, 10.0, 16.0, 9.0, 15.0, 21.0, 20.0, 24.0, 26.0, 29.0, 38.0, 43.0, 41.0, 38.0, 27.0, 34.0, 53.0, 42.0, 41.0, 34.0, 39.0, 35.0, 45.0, 36.0, 31.0, 26.0, 30.0, 23.0, 14.0, 18.0, 16.0, 19.0, 10.0, 19.0, 13.0, 10.0, 9.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3046875, -8.043212890625, -7.78173828125, -7.520263671875, -7.2587890625, -6.997314453125, -6.73583984375, -6.474365234375, -6.212890625, -5.951416015625, -5.68994140625, -5.428466796875, -5.1669921875, -4.905517578125, -4.64404296875, -4.382568359375, -4.12109375, -3.859619140625, -3.59814453125, -3.336669921875, -3.0751953125, -2.813720703125, -2.55224609375, -2.290771484375, -2.029296875, -1.767822265625, -1.50634765625, -1.244873046875, -0.9833984375, -0.721923828125, -0.46044921875, -0.198974609375, 0.0625, 0.323974609375, 0.58544921875, 0.846923828125, 1.1083984375, 1.369873046875, 1.63134765625, 1.892822265625, 2.154296875, 2.415771484375, 2.67724609375, 2.938720703125, 3.2001953125, 3.461669921875, 3.72314453125, 3.984619140625, 4.24609375, 4.507568359375, 4.76904296875, 5.030517578125, 5.2919921875, 5.553466796875, 5.81494140625, 6.076416015625, 6.337890625, 6.599365234375, 6.86083984375, 7.122314453125, 7.3837890625, 7.645263671875, 7.90673828125, 8.168212890625, 8.4296875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 10.0, 8.0, 13.0, 18.0, 27.0, 44.0, 64.0, 95.0, 129.0, 227.0, 418.0, 791.0, 1662.0, 3535.0, 9570.0, 28836.0, 98254.0, 433757.0, 1530575.0, 1523357.0, 420569.0, 97652.0, 28233.0, 9438.0, 3598.0, 1564.0, 776.0, 424.0, 206.0, 118.0, 77.0, 72.0, 45.0, 30.0, 21.0, 19.0, 10.0, 16.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0], "bins": [-16.640625, -16.2138671875, -15.787109375, -15.3603515625, -14.93359375, -14.5068359375, -14.080078125, -13.6533203125, -13.2265625, -12.7998046875, -12.373046875, -11.9462890625, -11.51953125, -11.0927734375, -10.666015625, -10.2392578125, -9.8125, -9.3857421875, -8.958984375, -8.5322265625, -8.10546875, -7.6787109375, -7.251953125, -6.8251953125, -6.3984375, -5.9716796875, -5.544921875, -5.1181640625, -4.69140625, -4.2646484375, -3.837890625, -3.4111328125, -2.984375, -2.5576171875, -2.130859375, -1.7041015625, -1.27734375, -0.8505859375, -0.423828125, 0.0029296875, 0.4296875, 0.8564453125, 1.283203125, 1.7099609375, 2.13671875, 2.5634765625, 2.990234375, 3.4169921875, 3.84375, 4.2705078125, 4.697265625, 5.1240234375, 5.55078125, 5.9775390625, 6.404296875, 6.8310546875, 7.2578125, 7.6845703125, 8.111328125, 8.5380859375, 8.96484375, 9.3916015625, 9.818359375, 10.2451171875, 10.671875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 2.0, 5.0, 10.0, 10.0, 15.0, 12.0, 8.0, 14.0, 25.0, 38.0, 54.0, 57.0, 50.0, 73.0, 100.0, 121.0, 150.0, 212.0, 204.0, 268.0, 290.0, 328.0, 315.0, 309.0, 269.0, 204.0, 186.0, 140.0, 123.0, 89.0, 96.0, 64.0, 51.0, 25.0, 45.0, 39.0, 16.0, 10.0, 13.0, 9.0, 5.0, 5.0, 3.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.0078125, -14.5640869140625, -14.120361328125, -13.6766357421875, -13.23291015625, -12.7891845703125, -12.345458984375, -11.9017333984375, -11.4580078125, -11.0142822265625, -10.570556640625, -10.1268310546875, -9.68310546875, -9.2393798828125, -8.795654296875, -8.3519287109375, -7.908203125, -7.4644775390625, -7.020751953125, -6.5770263671875, -6.13330078125, -5.6895751953125, -5.245849609375, -4.8021240234375, -4.3583984375, -3.9146728515625, -3.470947265625, -3.0272216796875, -2.58349609375, -2.1397705078125, -1.696044921875, -1.2523193359375, -0.80859375, -0.3648681640625, 0.078857421875, 0.5225830078125, 0.96630859375, 1.4100341796875, 1.853759765625, 2.2974853515625, 2.7412109375, 3.1849365234375, 3.628662109375, 4.0723876953125, 4.51611328125, 4.9598388671875, 5.403564453125, 5.8472900390625, 6.291015625, 6.7347412109375, 7.178466796875, 7.6221923828125, 8.06591796875, 8.5096435546875, 8.953369140625, 9.3970947265625, 9.8408203125, 10.2845458984375, 10.728271484375, 11.1719970703125, 11.61572265625, 12.0594482421875, 12.503173828125, 12.9468994140625, 13.390625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 8.0, 18.0, 16.0, 10.0, 20.0, 20.0, 39.0, 30.0, 41.0, 58.0, 91.0, 109.0, 131.0, 219.0, 273.0, 463.0, 1009.0, 3151.0, 14676.0, 92087.0, 736507.0, 2712772.0, 545466.0, 70588.0, 11673.0, 2564.0, 861.0, 428.0, 243.0, 149.0, 112.0, 91.0, 81.0, 50.0, 35.0, 44.0, 39.0, 23.0, 12.0, 17.0, 13.0, 8.0, 8.0, 10.0, 3.0, 3.0, 7.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-28.640625, -27.699462890625, -26.75830078125, -25.817138671875, -24.8759765625, -23.934814453125, -22.99365234375, -22.052490234375, -21.111328125, -20.170166015625, -19.22900390625, -18.287841796875, -17.3466796875, -16.405517578125, -15.46435546875, -14.523193359375, -13.58203125, -12.640869140625, -11.69970703125, -10.758544921875, -9.8173828125, -8.876220703125, -7.93505859375, -6.993896484375, -6.052734375, -5.111572265625, -4.17041015625, -3.229248046875, -2.2880859375, -1.346923828125, -0.40576171875, 0.535400390625, 1.4765625, 2.417724609375, 3.35888671875, 4.300048828125, 5.2412109375, 6.182373046875, 7.12353515625, 8.064697265625, 9.005859375, 9.947021484375, 10.88818359375, 11.829345703125, 12.7705078125, 13.711669921875, 14.65283203125, 15.593994140625, 16.53515625, 17.476318359375, 18.41748046875, 19.358642578125, 20.2998046875, 21.240966796875, 22.18212890625, 23.123291015625, 24.064453125, 25.005615234375, 25.94677734375, 26.887939453125, 27.8291015625, 28.770263671875, 29.71142578125, 30.652587890625, 31.59375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 15.0, 24.0, 49.0, 67.0, 104.0, 124.0, 118.0, 144.0, 105.0, 103.0, 69.0, 35.0, 25.0, 8.0, 7.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.75611877441406, -179.90872192382812, -176.0613250732422, -172.21392822265625, -168.3665313720703, -164.51913452148438, -160.6717529296875, -156.82435607910156, -152.97695922851562, -149.1295623779297, -145.28216552734375, -141.4347686767578, -137.58737182617188, -133.739990234375, -129.89259338378906, -126.04519653320312, -122.19779968261719, -118.35040283203125, -114.50300598144531, -110.6556167602539, -106.80821990966797, -102.96082305908203, -99.1134262084961, -95.26603698730469, -91.41863250732422, -87.57123565673828, -83.72383880615234, -79.87644958496094, -76.029052734375, -72.18165588378906, -68.33425903320312, -64.48686218261719, -60.63947296142578, -56.792076110839844, -52.94468307495117, -49.097286224365234, -45.24989318847656, -41.402496337890625, -37.55509948730469, -33.707706451416016, -29.86031150817871, -26.012916564941406, -22.1655216217041, -18.318126678466797, -14.470730781555176, -10.623334884643555, -6.77593994140625, -2.9285449981689453, 0.9188499450683594, 4.766244888305664, 8.613639831542969, 12.46103572845459, 16.308429718017578, 20.155826568603516, 24.00322151184082, 27.850616455078125, 31.69801139831543, 35.545406341552734, 39.39280319213867, 43.240196228027344, 47.08759307861328, 50.93498992919922, 54.78238296508789, 58.62977600097656, 62.4771728515625]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 10.0, 4.0, 10.0, 12.0, 22.0, 15.0, 21.0, 17.0, 26.0, 29.0, 32.0, 38.0, 44.0, 54.0, 57.0, 38.0, 54.0, 51.0, 39.0, 36.0, 42.0, 36.0, 33.0, 46.0, 33.0, 19.0, 33.0, 31.0, 23.0, 16.0, 18.0, 9.0, 12.0, 13.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-73.991943359375, -71.91132354736328, -69.8307113647461, -67.75009155273438, -65.66947174072266, -63.5888557434082, -61.50823974609375, -59.42761993408203, -57.34700393676758, -55.266387939453125, -53.185768127441406, -51.10515213012695, -49.0245361328125, -46.94391632080078, -44.86330032348633, -42.782684326171875, -40.702064514160156, -38.6214485168457, -36.540828704833984, -34.46021270751953, -32.37959289550781, -30.29897689819336, -28.218360900878906, -26.13774299621582, -24.057125091552734, -21.97650718688965, -19.895889282226562, -17.81527328491211, -15.734655380249023, -13.654037475585938, -11.573420524597168, -9.492803573608398, -7.4121856689453125, -5.331568241119385, -3.250950813293457, -1.1703333854675293, 0.9102840423583984, 2.9909019470214844, 5.071518898010254, 7.152135848999023, 9.23275375366211, 11.313371658325195, 13.393988609313965, 15.474605560302734, 17.55522346496582, 19.635841369628906, 21.71645736694336, 23.797075271606445, 25.87769317626953, 27.958311080932617, 30.038928985595703, 32.119544982910156, 34.200164794921875, 36.28078079223633, 38.36139678955078, 40.4420166015625, 42.52263259887695, 44.603248596191406, 46.683868408203125, 48.76448440551758, 50.84510040283203, 52.92572021484375, 55.0063362121582, 57.086952209472656, 59.167572021484375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 2.0, 8.0, 8.0, 12.0, 11.0, 10.0, 13.0, 17.0, 21.0, 27.0, 28.0, 30.0, 20.0, 28.0, 35.0, 29.0, 32.0, 33.0, 52.0, 45.0, 43.0, 42.0, 41.0, 39.0, 28.0, 29.0, 35.0, 35.0, 32.0, 27.0, 24.0, 22.0, 16.0, 19.0, 14.0, 17.0, 12.0, 13.0, 5.0, 9.0, 6.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.4921875, -8.24090576171875, -7.9896240234375, -7.73834228515625, -7.487060546875, -7.23577880859375, -6.9844970703125, -6.73321533203125, -6.48193359375, -6.23065185546875, -5.9793701171875, -5.72808837890625, -5.476806640625, -5.22552490234375, -4.9742431640625, -4.72296142578125, -4.4716796875, -4.22039794921875, -3.9691162109375, -3.71783447265625, -3.466552734375, -3.21527099609375, -2.9639892578125, -2.71270751953125, -2.46142578125, -2.21014404296875, -1.9588623046875, -1.70758056640625, -1.456298828125, -1.20501708984375, -0.9537353515625, -0.70245361328125, -0.451171875, -0.19989013671875, 0.0513916015625, 0.30267333984375, 0.553955078125, 0.80523681640625, 1.0565185546875, 1.30780029296875, 1.55908203125, 1.81036376953125, 2.0616455078125, 2.31292724609375, 2.564208984375, 2.81549072265625, 3.0667724609375, 3.31805419921875, 3.5693359375, 3.82061767578125, 4.0718994140625, 4.32318115234375, 4.574462890625, 4.82574462890625, 5.0770263671875, 5.32830810546875, 5.57958984375, 5.83087158203125, 6.0821533203125, 6.33343505859375, 6.584716796875, 6.83599853515625, 7.0872802734375, 7.33856201171875, 7.58984375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 6.0, 15.0, 11.0, 22.0, 22.0, 42.0, 66.0, 92.0, 167.0, 223.0, 377.0, 600.0, 941.0, 1547.0, 2644.0, 4281.0, 7009.0, 12392.0, 21586.0, 37960.0, 69790.0, 130790.0, 223792.0, 229510.0, 137501.0, 73268.0, 39907.0, 22183.0, 12796.0, 7664.0, 4345.0, 2665.0, 1592.0, 1049.0, 589.0, 366.0, 258.0, 152.0, 106.0, 79.0, 47.0, 39.0, 22.0, 4.0, 16.0, 9.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0], "bins": [-1.40234375, -1.3623199462890625, -1.322296142578125, -1.2822723388671875, -1.24224853515625, -1.2022247314453125, -1.162200927734375, -1.1221771240234375, -1.0821533203125, -1.0421295166015625, -1.002105712890625, -0.9620819091796875, -0.92205810546875, -0.8820343017578125, -0.842010498046875, -0.8019866943359375, -0.761962890625, -0.7219390869140625, -0.681915283203125, -0.6418914794921875, -0.60186767578125, -0.5618438720703125, -0.521820068359375, -0.4817962646484375, -0.4417724609375, -0.4017486572265625, -0.361724853515625, -0.3217010498046875, -0.28167724609375, -0.2416534423828125, -0.201629638671875, -0.1616058349609375, -0.12158203125, -0.0815582275390625, -0.041534423828125, -0.0015106201171875, 0.03851318359375, 0.0785369873046875, 0.118560791015625, 0.1585845947265625, 0.1986083984375, 0.2386322021484375, 0.278656005859375, 0.3186798095703125, 0.35870361328125, 0.3987274169921875, 0.438751220703125, 0.4787750244140625, 0.518798828125, 0.5588226318359375, 0.598846435546875, 0.6388702392578125, 0.67889404296875, 0.7189178466796875, 0.758941650390625, 0.7989654541015625, 0.8389892578125, 0.8790130615234375, 0.919036865234375, 0.9590606689453125, 0.99908447265625, 1.0391082763671875, 1.079132080078125, 1.1191558837890625, 1.1591796875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 4.0, 4.0, 10.0, 4.0, 7.0, 7.0, 10.0, 16.0, 15.0, 17.0, 20.0, 13.0, 25.0, 22.0, 24.0, 18.0, 29.0, 35.0, 37.0, 40.0, 37.0, 41.0, 37.0, 1069.0, 43.0, 41.0, 36.0, 33.0, 36.0, 42.0, 39.0, 22.0, 20.0, 19.0, 27.0, 24.0, 13.0, 19.0, 12.0, 8.0, 9.0, 7.0, 8.0, 5.0, 6.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0], "bins": [-6.00390625, -5.8387451171875, -5.673583984375, -5.5084228515625, -5.34326171875, -5.1781005859375, -5.012939453125, -4.8477783203125, -4.6826171875, -4.5174560546875, -4.352294921875, -4.1871337890625, -4.02197265625, -3.8568115234375, -3.691650390625, -3.5264892578125, -3.361328125, -3.1961669921875, -3.031005859375, -2.8658447265625, -2.70068359375, -2.5355224609375, -2.370361328125, -2.2052001953125, -2.0400390625, -1.8748779296875, -1.709716796875, -1.5445556640625, -1.37939453125, -1.2142333984375, -1.049072265625, -0.8839111328125, -0.71875, -0.5535888671875, -0.388427734375, -0.2232666015625, -0.05810546875, 0.1070556640625, 0.272216796875, 0.4373779296875, 0.6025390625, 0.7677001953125, 0.932861328125, 1.0980224609375, 1.26318359375, 1.4283447265625, 1.593505859375, 1.7586669921875, 1.923828125, 2.0889892578125, 2.254150390625, 2.4193115234375, 2.58447265625, 2.7496337890625, 2.914794921875, 3.0799560546875, 3.2451171875, 3.4102783203125, 3.575439453125, 3.7406005859375, 3.90576171875, 4.0709228515625, 4.236083984375, 4.4012451171875, 4.56640625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 9.0, 13.0, 17.0, 31.0, 48.0, 76.0, 87.0, 150.0, 224.0, 315.0, 474.0, 720.0, 1132.0, 1712.0, 2699.0, 4192.0, 6408.0, 10073.0, 16388.0, 25700.0, 42592.0, 67869.0, 105228.0, 149891.0, 1219873.0, 150019.0, 107307.0, 69253.0, 43021.0, 26617.0, 16266.0, 10318.0, 6570.0, 4057.0, 2721.0, 1730.0, 1143.0, 747.0, 505.0, 346.0, 203.0, 137.0, 87.0, 60.0, 38.0, 29.0, 16.0, 6.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.60205078125, -0.5823211669921875, -0.562591552734375, -0.5428619384765625, -0.52313232421875, -0.5034027099609375, -0.483673095703125, -0.4639434814453125, -0.4442138671875, -0.4244842529296875, -0.404754638671875, -0.3850250244140625, -0.36529541015625, -0.3455657958984375, -0.325836181640625, -0.3061065673828125, -0.286376953125, -0.2666473388671875, -0.246917724609375, -0.2271881103515625, -0.20745849609375, -0.1877288818359375, -0.167999267578125, -0.1482696533203125, -0.1285400390625, -0.1088104248046875, -0.089080810546875, -0.0693511962890625, -0.04962158203125, -0.0298919677734375, -0.010162353515625, 0.0095672607421875, 0.029296875, 0.0490264892578125, 0.068756103515625, 0.0884857177734375, 0.10821533203125, 0.1279449462890625, 0.147674560546875, 0.1674041748046875, 0.1871337890625, 0.2068634033203125, 0.226593017578125, 0.2463226318359375, 0.26605224609375, 0.2857818603515625, 0.305511474609375, 0.3252410888671875, 0.344970703125, 0.3647003173828125, 0.384429931640625, 0.4041595458984375, 0.42388916015625, 0.4436187744140625, 0.463348388671875, 0.4830780029296875, 0.5028076171875, 0.5225372314453125, 0.542266845703125, 0.5619964599609375, 0.58172607421875, 0.6014556884765625, 0.621185302734375, 0.6409149169921875, 0.66064453125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 0.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 5.0, 5.0, 13.0, 7.0, 17.0, 13.0, 21.0, 18.0, 41.0, 47.0, 59.0, 68.0, 67.0, 83.0, 88.0, 73.0, 78.0, 57.0, 40.0, 40.0, 30.0, 19.0, 21.0, 12.0, 13.0, 7.0, 7.0, 11.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006145477294921875, -0.005910098552703857, -0.00567471981048584, -0.005439341068267822, -0.005203962326049805, -0.004968583583831787, -0.0047332048416137695, -0.004497826099395752, -0.004262447357177734, -0.004027068614959717, -0.0037916898727416992, -0.0035563111305236816, -0.003320932388305664, -0.0030855536460876465, -0.002850174903869629, -0.0026147961616516113, -0.0023794174194335938, -0.002144038677215576, -0.0019086599349975586, -0.001673281192779541, -0.0014379024505615234, -0.0012025237083435059, -0.0009671449661254883, -0.0007317662239074707, -0.0004963874816894531, -0.00026100873947143555, -2.562999725341797e-05, 0.0002097487449645996, 0.0004451274871826172, 0.0006805062294006348, 0.0009158849716186523, 0.00115126371383667, 0.0013866424560546875, 0.001622021198272705, 0.0018573999404907227, 0.0020927786827087402, 0.002328157424926758, 0.0025635361671447754, 0.002798914909362793, 0.0030342936515808105, 0.003269672393798828, 0.0035050511360168457, 0.0037404298782348633, 0.003975808620452881, 0.0042111873626708984, 0.004446566104888916, 0.004681944847106934, 0.004917323589324951, 0.005152702331542969, 0.005388081073760986, 0.005623459815979004, 0.0058588385581970215, 0.006094217300415039, 0.006329596042633057, 0.006564974784851074, 0.006800353527069092, 0.007035732269287109, 0.007271111011505127, 0.0075064897537231445, 0.007741868495941162, 0.00797724723815918, 0.008212625980377197, 0.008448004722595215, 0.008683383464813232, 0.00891876220703125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 2.0, 4.0, 16.0, 8.0, 13.0, 13.0, 19.0, 21.0, 25.0, 43.0, 73.0, 116.0, 300.0, 816.0, 3883.0, 28533.0, 433508.0, 541615.0, 33551.0, 4367.0, 902.0, 307.0, 147.0, 76.0, 38.0, 29.0, 33.0, 17.0, 16.0, 11.0, 9.0, 8.0, 4.0, 4.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1571044921875, -0.1526203155517578, -0.14813613891601562, -0.14365196228027344, -0.13916778564453125, -0.13468360900878906, -0.13019943237304688, -0.1257152557373047, -0.1212310791015625, -0.11674690246582031, -0.11226272583007812, -0.10777854919433594, -0.10329437255859375, -0.09881019592285156, -0.09432601928710938, -0.08984184265136719, -0.085357666015625, -0.08087348937988281, -0.07638931274414062, -0.07190513610839844, -0.06742095947265625, -0.06293678283691406, -0.058452606201171875, -0.05396842956542969, -0.0494842529296875, -0.04500007629394531, -0.040515899658203125, -0.03603172302246094, -0.03154754638671875, -0.027063369750976562, -0.022579193115234375, -0.018095016479492188, -0.01361083984375, -0.009126663208007812, -0.004642486572265625, -0.0001583099365234375, 0.00432586669921875, 0.008810043334960938, 0.013294219970703125, 0.017778396606445312, 0.0222625732421875, 0.026746749877929688, 0.031230926513671875, 0.03571510314941406, 0.04019927978515625, 0.04468345642089844, 0.049167633056640625, 0.05365180969238281, 0.058135986328125, 0.06262016296386719, 0.06710433959960938, 0.07158851623535156, 0.07607269287109375, 0.08055686950683594, 0.08504104614257812, 0.08952522277832031, 0.0940093994140625, 0.09849357604980469, 0.10297775268554688, 0.10746192932128906, 0.11194610595703125, 0.11643028259277344, 0.12091445922851562, 0.1253986358642578, 0.1298828125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 8.0, 13.0, 15.0, 16.0, 17.0, 30.0, 49.0, 75.0, 107.0, 158.0, 184.0, 118.0, 70.0, 42.0, 33.0, 22.0, 12.0, 11.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.029162703081965446, -0.02835770882666111, -0.027552714571356773, -0.026747722178697586, -0.02594272792339325, -0.025137733668088913, -0.024332739412784576, -0.02352774515748024, -0.022722750902175903, -0.021917756646871567, -0.02111276239156723, -0.020307768136262894, -0.019502775743603706, -0.01869778148829937, -0.017892787232995033, -0.017087792977690697, -0.01628280058503151, -0.015477806329727173, -0.014672813005745411, -0.013867818750441074, -0.013062824495136738, -0.012257831171154976, -0.01145283691585064, -0.010647842660546303, -0.009842848405241966, -0.00903785414993763, -0.008232860825955868, -0.007427866570651531, -0.006622872315347195, -0.005817878525704145, -0.005012884736061096, -0.00420789048075676, -0.003402896225452423, -0.00259790220297873, -0.0017929082969203591, -0.000987914390861988, -0.00018292036838829517, 0.0006220736540853977, 0.001427067443728447, 0.0022320616990327835, 0.0030370554886758327, 0.0038420495111495256, 0.0046470435336232185, 0.005452037323266268, 0.006257031112909317, 0.0070620253682136536, 0.00786701962351799, 0.008672013878822327, 0.009477007202804089, 0.010282001458108425, 0.011086994782090187, 0.011891989037394524, 0.01269698329269886, 0.013501977548003197, 0.014306970871984959, 0.015111965127289295, 0.015916958451271057, 0.016721952706575394, 0.01752694696187973, 0.018331941217184067, 0.019136933609843254, 0.01994192786514759, 0.020746922120451927, 0.021551916375756264, 0.0223569106310606]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 13.0, 7.0, 12.0, 11.0, 17.0, 16.0, 23.0, 25.0, 19.0, 38.0, 26.0, 45.0, 37.0, 42.0, 46.0, 46.0, 54.0, 55.0, 49.0, 39.0, 37.0, 50.0, 30.0, 35.0, 28.0, 30.0, 21.0, 21.0, 25.0, 17.0, 11.0, 19.0, 10.0, 7.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.005162954330444336, -0.005024814046919346, -0.004886673763394356, -0.004748533479869366, -0.004610393196344376, -0.0044722529128193855, -0.0043341126292943954, -0.004195972345769405, -0.004057832062244415, -0.003919691778719425, -0.003781551495194435, -0.003643411211669445, -0.003505270928144455, -0.003367130644619465, -0.003228990361094475, -0.0030908500775694847, -0.0029527097940444946, -0.0028145695105195045, -0.0026764292269945145, -0.0025382889434695244, -0.0024001486599445343, -0.0022620083764195442, -0.002123868092894554, -0.001985727809369564, -0.001847587525844574, -0.001709447242319584, -0.0015713069587945938, -0.0014331666752696037, -0.0012950263917446136, -0.0011568861082196236, -0.0010187458246946335, -0.0008806055411696434, -0.0007424652576446533, -0.0006043249741196632, -0.00046618469059467316, -0.0003280444070696831, -0.000189904123544693, -5.176384001970291e-05, 8.637644350528717e-05, 0.00022451672703027725, 0.00036265701055526733, 0.0005007972940802574, 0.0006389375776052475, 0.0007770778611302376, 0.0009152181446552277, 0.0010533584281802177, 0.0011914987117052078, 0.001329638995230198, 0.001467779278755188, 0.001605919562280178, 0.0017440598458051682, 0.0018822001293301582, 0.0020203404128551483, 0.0021584806963801384, 0.0022966209799051285, 0.0024347612634301186, 0.0025729015469551086, 0.0027110418304800987, 0.002849182114005089, 0.002987322397530079, 0.003125462681055069, 0.003263602964580059, 0.003401743248105049, 0.003539883531630039, 0.0036780238151550293]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 2.0, 8.0, 8.0, 12.0, 11.0, 10.0, 13.0, 17.0, 21.0, 27.0, 28.0, 30.0, 20.0, 27.0, 36.0, 29.0, 32.0, 33.0, 52.0, 45.0, 43.0, 42.0, 41.0, 39.0, 28.0, 29.0, 35.0, 35.0, 32.0, 27.0, 24.0, 22.0, 16.0, 19.0, 14.0, 17.0, 12.0, 13.0, 5.0, 9.0, 6.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.4921875, -8.24090576171875, -7.9896240234375, -7.73834228515625, -7.487060546875, -7.23577880859375, -6.9844970703125, -6.73321533203125, -6.48193359375, -6.23065185546875, -5.9793701171875, -5.72808837890625, -5.476806640625, -5.22552490234375, -4.9742431640625, -4.72296142578125, -4.4716796875, -4.22039794921875, -3.9691162109375, -3.71783447265625, -3.466552734375, -3.21527099609375, -2.9639892578125, -2.71270751953125, -2.46142578125, -2.21014404296875, -1.9588623046875, -1.70758056640625, -1.456298828125, -1.20501708984375, -0.9537353515625, -0.70245361328125, -0.451171875, -0.19989013671875, 0.0513916015625, 0.30267333984375, 0.553955078125, 0.80523681640625, 1.0565185546875, 1.30780029296875, 1.55908203125, 1.81036376953125, 2.0616455078125, 2.31292724609375, 2.564208984375, 2.81549072265625, 3.0667724609375, 3.31805419921875, 3.5693359375, 3.82061767578125, 4.0718994140625, 4.32318115234375, 4.574462890625, 4.82574462890625, 5.0770263671875, 5.32830810546875, 5.57958984375, 5.83087158203125, 6.0821533203125, 6.33343505859375, 6.584716796875, 6.83599853515625, 7.0872802734375, 7.33856201171875, 7.58984375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 6.0, 8.0, 19.0, 14.0, 16.0, 22.0, 48.0, 60.0, 91.0, 96.0, 143.0, 226.0, 349.0, 571.0, 962.0, 1572.0, 2870.0, 5349.0, 10340.0, 20657.0, 44473.0, 100128.0, 229147.0, 337907.0, 159529.0, 69729.0, 31846.0, 15144.0, 7607.0, 4030.0, 2189.0, 1228.0, 747.0, 448.0, 296.0, 207.0, 130.0, 96.0, 57.0, 37.0, 39.0, 34.0, 28.0, 12.0, 21.0, 9.0, 6.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.84765625, -4.69268798828125, -4.5377197265625, -4.38275146484375, -4.227783203125, -4.07281494140625, -3.9178466796875, -3.76287841796875, -3.60791015625, -3.45294189453125, -3.2979736328125, -3.14300537109375, -2.988037109375, -2.83306884765625, -2.6781005859375, -2.52313232421875, -2.3681640625, -2.21319580078125, -2.0582275390625, -1.90325927734375, -1.748291015625, -1.59332275390625, -1.4383544921875, -1.28338623046875, -1.12841796875, -0.97344970703125, -0.8184814453125, -0.66351318359375, -0.508544921875, -0.35357666015625, -0.1986083984375, -0.04364013671875, 0.111328125, 0.26629638671875, 0.4212646484375, 0.57623291015625, 0.731201171875, 0.88616943359375, 1.0411376953125, 1.19610595703125, 1.35107421875, 1.50604248046875, 1.6610107421875, 1.81597900390625, 1.970947265625, 2.12591552734375, 2.2808837890625, 2.43585205078125, 2.5908203125, 2.74578857421875, 2.9007568359375, 3.05572509765625, 3.210693359375, 3.36566162109375, 3.5206298828125, 3.67559814453125, 3.83056640625, 3.98553466796875, 4.1405029296875, 4.29547119140625, 4.450439453125, 4.60540771484375, 4.7603759765625, 4.91534423828125, 5.0703125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 3.0, 3.0, 6.0, 6.0, 9.0, 4.0, 6.0, 11.0, 13.0, 17.0, 28.0, 25.0, 35.0, 34.0, 37.0, 55.0, 62.0, 80.0, 225.0, 1766.0, 180.0, 76.0, 62.0, 58.0, 43.0, 28.0, 35.0, 27.0, 23.0, 17.0, 13.0, 10.0, 13.0, 12.0, 9.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.59375, -38.33154296875, -37.0693359375, -35.80712890625, -34.544921875, -33.28271484375, -32.0205078125, -30.75830078125, -29.49609375, -28.23388671875, -26.9716796875, -25.70947265625, -24.447265625, -23.18505859375, -21.9228515625, -20.66064453125, -19.3984375, -18.13623046875, -16.8740234375, -15.61181640625, -14.349609375, -13.08740234375, -11.8251953125, -10.56298828125, -9.30078125, -8.03857421875, -6.7763671875, -5.51416015625, -4.251953125, -2.98974609375, -1.7275390625, -0.46533203125, 0.796875, 2.05908203125, 3.3212890625, 4.58349609375, 5.845703125, 7.10791015625, 8.3701171875, 9.63232421875, 10.89453125, 12.15673828125, 13.4189453125, 14.68115234375, 15.943359375, 17.20556640625, 18.4677734375, 19.72998046875, 20.9921875, 22.25439453125, 23.5166015625, 24.77880859375, 26.041015625, 27.30322265625, 28.5654296875, 29.82763671875, 31.08984375, 32.35205078125, 33.6142578125, 34.87646484375, 36.138671875, 37.40087890625, 38.6630859375, 39.92529296875, 41.1875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 12.0, 9.0, 16.0, 22.0, 12.0, 25.0, 27.0, 52.0, 74.0, 89.0, 101.0, 182.0, 249.0, 486.0, 1368.0, 106006.0, 3032017.0, 3380.0, 609.0, 270.0, 175.0, 159.0, 88.0, 48.0, 57.0, 36.0, 30.0, 27.0, 16.0, 9.0, 4.0, 8.0, 8.0, 6.0, 2.0, 5.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-90.75, -88.015625, -85.28125, -82.546875, -79.8125, -77.078125, -74.34375, -71.609375, -68.875, -66.140625, -63.40625, -60.671875, -57.9375, -55.203125, -52.46875, -49.734375, -47.0, -44.265625, -41.53125, -38.796875, -36.0625, -33.328125, -30.59375, -27.859375, -25.125, -22.390625, -19.65625, -16.921875, -14.1875, -11.453125, -8.71875, -5.984375, -3.25, -0.515625, 2.21875, 4.953125, 7.6875, 10.421875, 13.15625, 15.890625, 18.625, 21.359375, 24.09375, 26.828125, 29.5625, 32.296875, 35.03125, 37.765625, 40.5, 43.234375, 45.96875, 48.703125, 51.4375, 54.171875, 56.90625, 59.640625, 62.375, 65.109375, 67.84375, 70.578125, 73.3125, 76.046875, 78.78125, 81.515625, 84.25]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 512.0, 504.0], "bins": [-1027.9271240234375, -1011.6064453125, -995.2857666015625, -978.965087890625, -962.6444091796875, -946.32373046875, -930.0030517578125, -913.682373046875, -897.3616943359375, -881.041015625, -864.7203369140625, -848.399658203125, -832.0789794921875, -815.75830078125, -799.4376220703125, -783.116943359375, -766.7963256835938, -750.4756469726562, -734.1549682617188, -717.8342895507812, -701.5136108398438, -685.1929321289062, -668.8722534179688, -652.5516357421875, -636.23095703125, -619.9102783203125, -603.589599609375, -587.2689208984375, -570.9482421875, -554.6275634765625, -538.306884765625, -521.9862060546875, -505.6655578613281, -489.3448791503906, -473.0242004394531, -456.7035217285156, -440.38287353515625, -424.06219482421875, -407.74151611328125, -391.42083740234375, -375.10015869140625, -358.77947998046875, -342.45880126953125, -326.13812255859375, -309.81744384765625, -293.49676513671875, -277.1761169433594, -260.8554382324219, -244.53475952148438, -228.21408081054688, -211.89340209960938, -195.57273864746094, -179.25205993652344, -162.93138122558594, -146.6107177734375, -130.2900390625, -113.96936798095703, -97.64869689941406, -81.32801818847656, -65.00733947753906, -48.686668395996094, -32.365989685058594, -16.045318603515625, 0.27535247802734375, 16.596031188964844]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 4.0, 5.0, 12.0, 10.0, 10.0, 18.0, 17.0, 20.0, 22.0, 21.0, 32.0, 25.0, 26.0, 44.0, 34.0, 36.0, 45.0, 32.0, 39.0, 39.0, 46.0, 36.0, 45.0, 47.0, 33.0, 29.0, 34.0, 32.0, 23.0, 23.0, 22.0, 7.0, 16.0, 13.0, 9.0, 14.0, 9.0, 14.0, 9.0, 11.0, 7.0, 2.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.90977478027344, -68.4876937866211, -66.06561279296875, -63.64353561401367, -61.221458435058594, -58.79937744140625, -56.377296447753906, -53.95521926879883, -51.53314208984375, -49.111061096191406, -46.68898391723633, -44.266902923583984, -41.844825744628906, -39.42274475097656, -37.00066375732422, -34.57858657836914, -32.1565055847168, -29.734426498413086, -27.312347412109375, -24.89026641845703, -22.468189239501953, -20.04610824584961, -17.6240291595459, -15.201950073242188, -12.779870986938477, -10.357791900634766, -7.9357123374938965, -5.513632774353027, -3.0915536880493164, -0.6694746017456055, 1.7526054382324219, 4.174684524536133, 6.596763610839844, 9.018842697143555, 11.440921783447266, 13.863001823425293, 16.285079956054688, 18.70716094970703, 21.129240036010742, 23.551319122314453, 25.973398208618164, 28.395477294921875, 30.817556381225586, 33.2396354675293, 35.66171646118164, 38.08379364013672, 40.50587463378906, 42.927955627441406, 45.350032806396484, 47.77211380004883, 50.194190979003906, 52.61627197265625, 55.03834915161133, 57.46043014526367, 59.88250732421875, 62.304588317871094, 64.72666931152344, 67.14875030517578, 69.57083129882812, 71.99290466308594, 74.41498565673828, 76.83706665039062, 79.25914764404297, 81.68122863769531, 84.10330200195312]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 2.0, 4.0, 11.0, 16.0, 8.0, 9.0, 13.0, 17.0, 19.0, 33.0, 32.0, 28.0, 31.0, 23.0, 31.0, 28.0, 32.0, 44.0, 39.0, 42.0, 43.0, 48.0, 41.0, 31.0, 25.0, 36.0, 41.0, 25.0, 33.0, 23.0, 27.0, 19.0, 17.0, 15.0, 20.0, 16.0, 11.0, 7.0, 9.0, 6.0, 9.0, 4.0, 8.0, 6.0, 8.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.875, -8.61865234375, -8.3623046875, -8.10595703125, -7.849609375, -7.59326171875, -7.3369140625, -7.08056640625, -6.82421875, -6.56787109375, -6.3115234375, -6.05517578125, -5.798828125, -5.54248046875, -5.2861328125, -5.02978515625, -4.7734375, -4.51708984375, -4.2607421875, -4.00439453125, -3.748046875, -3.49169921875, -3.2353515625, -2.97900390625, -2.72265625, -2.46630859375, -2.2099609375, -1.95361328125, -1.697265625, -1.44091796875, -1.1845703125, -0.92822265625, -0.671875, -0.41552734375, -0.1591796875, 0.09716796875, 0.353515625, 0.60986328125, 0.8662109375, 1.12255859375, 1.37890625, 1.63525390625, 1.8916015625, 2.14794921875, 2.404296875, 2.66064453125, 2.9169921875, 3.17333984375, 3.4296875, 3.68603515625, 3.9423828125, 4.19873046875, 4.455078125, 4.71142578125, 4.9677734375, 5.22412109375, 5.48046875, 5.73681640625, 5.9931640625, 6.24951171875, 6.505859375, 6.76220703125, 7.0185546875, 7.27490234375, 7.53125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 6.0, 5.0, 4.0, 10.0, 14.0, 10.0, 18.0, 21.0, 24.0, 26.0, 26.0, 32.0, 48.0, 66.0, 125.0, 355.0, 1444.0, 8442.0, 92159.0, 1903833.0, 2072794.0, 103531.0, 9047.0, 1457.0, 333.0, 104.0, 63.0, 50.0, 42.0, 21.0, 22.0, 19.0, 18.0, 9.0, 20.0, 15.0, 7.0, 12.0, 11.0, 5.0, 8.0, 8.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-34.25, -33.27197265625, -32.2939453125, -31.31591796875, -30.337890625, -29.35986328125, -28.3818359375, -27.40380859375, -26.42578125, -25.44775390625, -24.4697265625, -23.49169921875, -22.513671875, -21.53564453125, -20.5576171875, -19.57958984375, -18.6015625, -17.62353515625, -16.6455078125, -15.66748046875, -14.689453125, -13.71142578125, -12.7333984375, -11.75537109375, -10.77734375, -9.79931640625, -8.8212890625, -7.84326171875, -6.865234375, -5.88720703125, -4.9091796875, -3.93115234375, -2.953125, -1.97509765625, -0.9970703125, -0.01904296875, 0.958984375, 1.93701171875, 2.9150390625, 3.89306640625, 4.87109375, 5.84912109375, 6.8271484375, 7.80517578125, 8.783203125, 9.76123046875, 10.7392578125, 11.71728515625, 12.6953125, 13.67333984375, 14.6513671875, 15.62939453125, 16.607421875, 17.58544921875, 18.5634765625, 19.54150390625, 20.51953125, 21.49755859375, 22.4755859375, 23.45361328125, 24.431640625, 25.40966796875, 26.3876953125, 27.36572265625, 28.34375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 8.0, 16.0, 19.0, 31.0, 47.0, 67.0, 90.0, 130.0, 186.0, 272.0, 335.0, 489.0, 542.0, 517.0, 389.0, 271.0, 191.0, 141.0, 106.0, 76.0, 49.0, 29.0, 13.0, 15.0, 14.0, 5.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.96875, -28.2724609375, -27.576171875, -26.8798828125, -26.18359375, -25.4873046875, -24.791015625, -24.0947265625, -23.3984375, -22.7021484375, -22.005859375, -21.3095703125, -20.61328125, -19.9169921875, -19.220703125, -18.5244140625, -17.828125, -17.1318359375, -16.435546875, -15.7392578125, -15.04296875, -14.3466796875, -13.650390625, -12.9541015625, -12.2578125, -11.5615234375, -10.865234375, -10.1689453125, -9.47265625, -8.7763671875, -8.080078125, -7.3837890625, -6.6875, -5.9912109375, -5.294921875, -4.5986328125, -3.90234375, -3.2060546875, -2.509765625, -1.8134765625, -1.1171875, -0.4208984375, 0.275390625, 0.9716796875, 1.66796875, 2.3642578125, 3.060546875, 3.7568359375, 4.453125, 5.1494140625, 5.845703125, 6.5419921875, 7.23828125, 7.9345703125, 8.630859375, 9.3271484375, 10.0234375, 10.7197265625, 11.416015625, 12.1123046875, 12.80859375, 13.5048828125, 14.201171875, 14.8974609375, 15.59375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 17.0, 15.0, 29.0, 32.0, 48.0, 57.0, 84.0, 130.0, 161.0, 204.0, 387.0, 791.0, 2221.0, 15913.0, 240311.0, 3143445.0, 744139.0, 39660.0, 4203.0, 1041.0, 431.0, 237.0, 178.0, 135.0, 98.0, 72.0, 64.0, 44.0, 24.0, 21.0, 11.0, 15.0, 4.0, 10.0, 8.0, 8.0, 1.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.0, -31.6630859375, -30.326171875, -28.9892578125, -27.65234375, -26.3154296875, -24.978515625, -23.6416015625, -22.3046875, -20.9677734375, -19.630859375, -18.2939453125, -16.95703125, -15.6201171875, -14.283203125, -12.9462890625, -11.609375, -10.2724609375, -8.935546875, -7.5986328125, -6.26171875, -4.9248046875, -3.587890625, -2.2509765625, -0.9140625, 0.4228515625, 1.759765625, 3.0966796875, 4.43359375, 5.7705078125, 7.107421875, 8.4443359375, 9.78125, 11.1181640625, 12.455078125, 13.7919921875, 15.12890625, 16.4658203125, 17.802734375, 19.1396484375, 20.4765625, 21.8134765625, 23.150390625, 24.4873046875, 25.82421875, 27.1611328125, 28.498046875, 29.8349609375, 31.171875, 32.5087890625, 33.845703125, 35.1826171875, 36.51953125, 37.8564453125, 39.193359375, 40.5302734375, 41.8671875, 43.2041015625, 44.541015625, 45.8779296875, 47.21484375, 48.5517578125, 49.888671875, 51.2255859375, 52.5625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 92.0, 393.0, 414.0, 98.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-395.8339538574219, -382.196044921875, -368.55816650390625, -354.9202575683594, -341.2823486328125, -327.64447021484375, -314.0065612792969, -300.36865234375, -286.7307434082031, -273.09283447265625, -259.4549560546875, -245.81704711914062, -232.17913818359375, -218.54124450683594, -204.90335083007812, -191.26544189453125, -177.62754821777344, -163.98965454101562, -150.35174560546875, -136.71385192871094, -123.07594299316406, -109.43804931640625, -95.8001480102539, -82.16224670410156, -68.52434539794922, -54.886444091796875, -41.24854278564453, -27.610645294189453, -13.97274398803711, -0.33484649658203125, 13.303054809570312, 26.940956115722656, 40.578857421875, 54.216758728027344, 67.85466003417969, 81.4925537109375, 95.13046264648438, 108.76835632324219, 122.40625762939453, 136.04415893554688, 149.68206787109375, 163.31996154785156, 176.95787048339844, 190.59576416015625, 204.23367309570312, 217.87156677246094, 231.50946044921875, 245.14736938476562, 258.7852783203125, 272.4231872558594, 286.0610656738281, 299.698974609375, 313.3368835449219, 326.97479248046875, 340.6126708984375, 354.2505798339844, 367.8884582519531, 381.5263671875, 395.16424560546875, 408.8021545410156, 422.4400634765625, 436.07794189453125, 449.7158508300781, 463.353759765625, 476.9916687011719]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 4.0, 7.0, 7.0, 11.0, 13.0, 8.0, 18.0, 13.0, 20.0, 25.0, 22.0, 28.0, 30.0, 29.0, 45.0, 35.0, 32.0, 53.0, 34.0, 39.0, 40.0, 54.0, 28.0, 39.0, 31.0, 34.0, 33.0, 23.0, 26.0, 28.0, 30.0, 24.0, 20.0, 24.0, 10.0, 13.0, 13.0, 10.0, 9.0, 3.0, 5.0, 6.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.87067413330078, -55.0738525390625, -53.27703094482422, -51.48020553588867, -49.68338394165039, -47.88656234741211, -46.08974075317383, -44.29291534423828, -42.49609375, -40.69927215576172, -38.90245056152344, -37.10562515258789, -35.30880355834961, -33.51198196411133, -31.715160369873047, -29.918336868286133, -28.12151527404785, -26.32469367980957, -24.527870178222656, -22.731048583984375, -20.93422508239746, -19.13740348815918, -17.340579986572266, -15.543758392333984, -13.746935844421387, -11.950113296508789, -10.153290748596191, -8.356468200683594, -6.559646129608154, -4.762824058532715, -2.966001510620117, -1.1691789627075195, 0.6276435852050781, 2.424466133117676, 4.221288681030273, 6.018110752105713, 7.8149333000183105, 9.61175537109375, 11.408577919006348, 13.205400466918945, 15.002223014831543, 16.79904556274414, 18.595867156982422, 20.392690658569336, 22.189512252807617, 23.98633575439453, 25.783157348632812, 27.579978942871094, 29.376802444458008, 31.17362403869629, 32.9704475402832, 34.767269134521484, 36.564090728759766, 38.36091613769531, 40.157737731933594, 41.954559326171875, 43.751380920410156, 45.54820251464844, 47.34502410888672, 49.141849517822266, 50.93867111206055, 52.73549270629883, 54.53231430053711, 56.329139709472656, 58.12596130371094]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 8.0, 15.0, 17.0, 16.0, 19.0, 23.0, 20.0, 30.0, 32.0, 32.0, 43.0, 49.0, 30.0, 46.0, 35.0, 50.0, 55.0, 38.0, 40.0, 39.0, 38.0, 25.0, 41.0, 28.0, 24.0, 25.0, 17.0, 19.0, 22.0, 18.0, 18.0, 14.0, 14.0, 13.0, 6.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.3065185546875, -9.027099609375, -8.7476806640625, -8.46826171875, -8.1888427734375, -7.909423828125, -7.6300048828125, -7.3505859375, -7.0711669921875, -6.791748046875, -6.5123291015625, -6.23291015625, -5.9534912109375, -5.674072265625, -5.3946533203125, -5.115234375, -4.8358154296875, -4.556396484375, -4.2769775390625, -3.99755859375, -3.7181396484375, -3.438720703125, -3.1593017578125, -2.8798828125, -2.6004638671875, -2.321044921875, -2.0416259765625, -1.76220703125, -1.4827880859375, -1.203369140625, -0.9239501953125, -0.64453125, -0.3651123046875, -0.085693359375, 0.1937255859375, 0.47314453125, 0.7525634765625, 1.031982421875, 1.3114013671875, 1.5908203125, 1.8702392578125, 2.149658203125, 2.4290771484375, 2.70849609375, 2.9879150390625, 3.267333984375, 3.5467529296875, 3.826171875, 4.1055908203125, 4.385009765625, 4.6644287109375, 4.94384765625, 5.2232666015625, 5.502685546875, 5.7821044921875, 6.0615234375, 6.3409423828125, 6.620361328125, 6.8997802734375, 7.17919921875, 7.4586181640625, 7.738037109375, 8.0174560546875, 8.296875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 9.0, 14.0, 15.0, 23.0, 43.0, 56.0, 62.0, 127.0, 170.0, 227.0, 396.0, 559.0, 798.0, 1196.0, 1861.0, 2705.0, 4107.0, 6258.0, 9637.0, 15315.0, 24891.0, 42649.0, 73332.0, 128032.0, 203227.0, 207512.0, 133045.0, 76747.0, 44478.0, 26017.0, 15831.0, 10010.0, 6455.0, 4275.0, 2811.0, 1877.0, 1185.0, 837.0, 570.0, 392.0, 253.0, 184.0, 114.0, 79.0, 57.0, 38.0, 25.0, 15.0, 11.0, 14.0, 8.0, 2.0, 4.0, 1.0, 2.0, 3.0], "bins": [-1.2119140625, -1.17523193359375, -1.1385498046875, -1.10186767578125, -1.065185546875, -1.02850341796875, -0.9918212890625, -0.95513916015625, -0.91845703125, -0.88177490234375, -0.8450927734375, -0.80841064453125, -0.771728515625, -0.73504638671875, -0.6983642578125, -0.66168212890625, -0.625, -0.58831787109375, -0.5516357421875, -0.51495361328125, -0.478271484375, -0.44158935546875, -0.4049072265625, -0.36822509765625, -0.33154296875, -0.29486083984375, -0.2581787109375, -0.22149658203125, -0.184814453125, -0.14813232421875, -0.1114501953125, -0.07476806640625, -0.0380859375, -0.00140380859375, 0.0352783203125, 0.07196044921875, 0.108642578125, 0.14532470703125, 0.1820068359375, 0.21868896484375, 0.25537109375, 0.29205322265625, 0.3287353515625, 0.36541748046875, 0.402099609375, 0.43878173828125, 0.4754638671875, 0.51214599609375, 0.548828125, 0.58551025390625, 0.6221923828125, 0.65887451171875, 0.695556640625, 0.73223876953125, 0.7689208984375, 0.80560302734375, 0.84228515625, 0.87896728515625, 0.9156494140625, 0.95233154296875, 0.989013671875, 1.02569580078125, 1.0623779296875, 1.09906005859375, 1.1357421875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 7.0, 6.0, 7.0, 15.0, 10.0, 7.0, 24.0, 15.0, 24.0, 27.0, 21.0, 25.0, 34.0, 23.0, 38.0, 30.0, 41.0, 44.0, 29.0, 40.0, 1078.0, 27.0, 39.0, 36.0, 43.0, 36.0, 40.0, 23.0, 30.0, 27.0, 20.0, 19.0, 21.0, 13.0, 13.0, 17.0, 11.0, 9.0, 7.0, 12.0, 9.0, 4.0, 9.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.17578125, -5.010009765625, -4.84423828125, -4.678466796875, -4.5126953125, -4.346923828125, -4.18115234375, -4.015380859375, -3.849609375, -3.683837890625, -3.51806640625, -3.352294921875, -3.1865234375, -3.020751953125, -2.85498046875, -2.689208984375, -2.5234375, -2.357666015625, -2.19189453125, -2.026123046875, -1.8603515625, -1.694580078125, -1.52880859375, -1.363037109375, -1.197265625, -1.031494140625, -0.86572265625, -0.699951171875, -0.5341796875, -0.368408203125, -0.20263671875, -0.036865234375, 0.12890625, 0.294677734375, 0.46044921875, 0.626220703125, 0.7919921875, 0.957763671875, 1.12353515625, 1.289306640625, 1.455078125, 1.620849609375, 1.78662109375, 1.952392578125, 2.1181640625, 2.283935546875, 2.44970703125, 2.615478515625, 2.78125, 2.947021484375, 3.11279296875, 3.278564453125, 3.4443359375, 3.610107421875, 3.77587890625, 3.941650390625, 4.107421875, 4.273193359375, 4.43896484375, 4.604736328125, 4.7705078125, 4.936279296875, 5.10205078125, 5.267822265625, 5.43359375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 9.0, 8.0, 11.0, 19.0, 22.0, 48.0, 61.0, 77.0, 97.0, 161.0, 242.0, 359.0, 558.0, 720.0, 1080.0, 1571.0, 2513.0, 3559.0, 5563.0, 8335.0, 13069.0, 20766.0, 32344.0, 51291.0, 80306.0, 117364.0, 191522.0, 1172923.0, 132091.0, 92524.0, 60583.0, 38264.0, 24540.0, 15461.0, 9917.0, 6453.0, 4233.0, 2744.0, 1870.0, 1208.0, 876.0, 554.0, 343.0, 305.0, 190.0, 127.0, 74.0, 54.0, 38.0, 21.0, 23.0, 17.0, 6.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0], "bins": [-0.60986328125, -0.590301513671875, -0.57073974609375, -0.551177978515625, -0.5316162109375, -0.512054443359375, -0.49249267578125, -0.472930908203125, -0.453369140625, -0.433807373046875, -0.41424560546875, -0.394683837890625, -0.3751220703125, -0.355560302734375, -0.33599853515625, -0.316436767578125, -0.296875, -0.277313232421875, -0.25775146484375, -0.238189697265625, -0.2186279296875, -0.199066162109375, -0.17950439453125, -0.159942626953125, -0.140380859375, -0.120819091796875, -0.10125732421875, -0.081695556640625, -0.0621337890625, -0.042572021484375, -0.02301025390625, -0.003448486328125, 0.01611328125, 0.035675048828125, 0.05523681640625, 0.074798583984375, 0.0943603515625, 0.113922119140625, 0.13348388671875, 0.153045654296875, 0.172607421875, 0.192169189453125, 0.21173095703125, 0.231292724609375, 0.2508544921875, 0.270416259765625, 0.28997802734375, 0.309539794921875, 0.3291015625, 0.348663330078125, 0.36822509765625, 0.387786865234375, 0.4073486328125, 0.426910400390625, 0.44647216796875, 0.466033935546875, 0.485595703125, 0.505157470703125, 0.52471923828125, 0.544281005859375, 0.5638427734375, 0.583404541015625, 0.60296630859375, 0.622528076171875, 0.64208984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 5.0, 7.0, 9.0, 10.0, 7.0, 14.0, 18.0, 16.0, 22.0, 33.0, 42.0, 61.0, 99.0, 99.0, 103.0, 95.0, 82.0, 65.0, 44.0, 32.0, 24.0, 26.0, 11.0, 16.0, 8.0, 14.0, 12.0, 12.0, 2.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0150604248046875, -0.01462101936340332, -0.01418161392211914, -0.013742208480834961, -0.013302803039550781, -0.012863397598266602, -0.012423992156982422, -0.011984586715698242, -0.011545181274414062, -0.011105775833129883, -0.010666370391845703, -0.010226964950561523, -0.009787559509277344, -0.009348154067993164, -0.008908748626708984, -0.008469343185424805, -0.008029937744140625, -0.007590532302856445, -0.007151126861572266, -0.006711721420288086, -0.006272315979003906, -0.0058329105377197266, -0.005393505096435547, -0.004954099655151367, -0.0045146942138671875, -0.004075288772583008, -0.003635883331298828, -0.0031964778900146484, -0.0027570724487304688, -0.002317667007446289, -0.0018782615661621094, -0.0014388561248779297, -0.00099945068359375, -0.0005600452423095703, -0.00012063980102539062, 0.00031876564025878906, 0.0007581710815429688, 0.0011975765228271484, 0.0016369819641113281, 0.002076387405395508, 0.0025157928466796875, 0.002955198287963867, 0.003394603729248047, 0.0038340091705322266, 0.004273414611816406, 0.004712820053100586, 0.005152225494384766, 0.005591630935668945, 0.006031036376953125, 0.006470441818237305, 0.006909847259521484, 0.007349252700805664, 0.007788658142089844, 0.008228063583374023, 0.008667469024658203, 0.009106874465942383, 0.009546279907226562, 0.009985685348510742, 0.010425090789794922, 0.010864496231079102, 0.011303901672363281, 0.011743307113647461, 0.01218271255493164, 0.01262211799621582, 0.0130615234375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 8.0, 4.0, 12.0, 17.0, 13.0, 16.0, 19.0, 32.0, 42.0, 74.0, 105.0, 240.0, 1405.0, 28528.0, 961845.0, 53544.0, 2038.0, 296.0, 114.0, 59.0, 34.0, 24.0, 17.0, 18.0, 12.0, 6.0, 7.0, 9.0, 6.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.292236328125, -0.28235626220703125, -0.2724761962890625, -0.26259613037109375, -0.252716064453125, -0.24283599853515625, -0.2329559326171875, -0.22307586669921875, -0.21319580078125, -0.20331573486328125, -0.1934356689453125, -0.18355560302734375, -0.173675537109375, -0.16379547119140625, -0.1539154052734375, -0.14403533935546875, -0.1341552734375, -0.12427520751953125, -0.1143951416015625, -0.10451507568359375, -0.094635009765625, -0.08475494384765625, -0.0748748779296875, -0.06499481201171875, -0.05511474609375, -0.04523468017578125, -0.0353546142578125, -0.02547454833984375, -0.015594482421875, -0.00571441650390625, 0.0041656494140625, 0.01404571533203125, 0.02392578125, 0.03380584716796875, 0.0436859130859375, 0.05356597900390625, 0.063446044921875, 0.07332611083984375, 0.0832061767578125, 0.09308624267578125, 0.10296630859375, 0.11284637451171875, 0.1227264404296875, 0.13260650634765625, 0.142486572265625, 0.15236663818359375, 0.1622467041015625, 0.17212677001953125, 0.1820068359375, 0.19188690185546875, 0.2017669677734375, 0.21164703369140625, 0.221527099609375, 0.23140716552734375, 0.2412872314453125, 0.25116729736328125, 0.26104736328125, 0.27092742919921875, 0.2808074951171875, 0.29068756103515625, 0.300567626953125, 0.31044769287109375, 0.3203277587890625, 0.33020782470703125, 0.340087890625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 12.0, 10.0, 10.0, 33.0, 52.0, 85.0, 157.0, 305.0, 215.0, 60.0, 37.0, 16.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04302098974585533, -0.041349172592163086, -0.03967735916376114, -0.03800554573535919, -0.036333728581666946, -0.0346619114279747, -0.032990097999572754, -0.03131828457117081, -0.02964646741747856, -0.027974652126431465, -0.02630283683538437, -0.024631021544337273, -0.022959206253290176, -0.02128739096224308, -0.019615575671195984, -0.017943760380148888, -0.01627194508910179, -0.014600129798054695, -0.012928314507007599, -0.011256499215960503, -0.009584683924913406, -0.00791286863386631, -0.006241053342819214, -0.004569238051772118, -0.0028974227607250214, -0.0012256074696779251, 0.00044620782136917114, 0.0021180231124162674, 0.0037898384034633636, 0.00546165369451046, 0.007133468985557556, 0.008805284276604652, 0.010477103292942047, 0.012148918583989143, 0.01382073387503624, 0.015492549166083336, 0.017164364457130432, 0.01883617974817753, 0.020507995039224625, 0.02217981033027172, 0.023851625621318817, 0.025523440912365913, 0.02719525620341301, 0.028867071494460106, 0.030538886785507202, 0.03221070021390915, 0.033882517367601395, 0.03555433452129364, 0.03722614794969559, 0.038897961378097534, 0.04056977853178978, 0.042241595685482025, 0.04391340911388397, 0.04558522254228592, 0.047257039695978165, 0.04892885684967041, 0.05060067027807236, 0.052272483706474304, 0.05394430086016655, 0.055616118013858795, 0.05728793144226074, 0.05895974487066269, 0.060631562024354935, 0.06230337917804718, 0.06397519260644913]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 10.0, 7.0, 9.0, 14.0, 20.0, 17.0, 22.0, 23.0, 33.0, 26.0, 23.0, 42.0, 38.0, 32.0, 31.0, 35.0, 40.0, 35.0, 43.0, 35.0, 39.0, 53.0, 41.0, 37.0, 36.0, 32.0, 26.0, 25.0, 19.0, 21.0, 18.0, 11.0, 8.0, 14.0, 16.0, 6.0, 5.0, 5.0, 6.0, 9.0, 4.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.006184577941894531, -0.005975761450827122, -0.005766944959759712, -0.005558128468692303, -0.005349311977624893, -0.005140495486557484, -0.004931678995490074, -0.004722862504422665, -0.004514046013355255, -0.004305229522287846, -0.004096413031220436, -0.0038875965401530266, -0.003678780049085617, -0.0034699635580182076, -0.003261147066950798, -0.0030523305758833885, -0.002843514084815979, -0.0026346975937485695, -0.00242588110268116, -0.0022170646116137505, -0.002008248120546341, -0.0017994316294789314, -0.001590615138411522, -0.0013817986473441124, -0.0011729821562767029, -0.0009641656652092934, -0.0007553491741418839, -0.0005465326830744743, -0.0003377161920070648, -0.0001288997009396553, 7.991679012775421e-05, 0.0002887332811951637, 0.0004975497722625732, 0.0007063662633299828, 0.0009151827543973923, 0.0011239992454648018, 0.0013328157365322113, 0.0015416322275996208, 0.0017504487186670303, 0.00195926520973444, 0.0021680817008018494, 0.002376898191869259, 0.0025857146829366684, 0.002794531174004078, 0.0030033476650714874, 0.003212164156138897, 0.0034209806472063065, 0.003629797138273716, 0.0038386136293411255, 0.004047430120408535, 0.0042562466114759445, 0.004465063102543354, 0.0046738795936107635, 0.004882696084678173, 0.005091512575745583, 0.005300329066812992, 0.005509145557880402, 0.005717962048947811, 0.005926778540015221, 0.00613559503108263, 0.00634441152215004, 0.006553228013217449, 0.006762044504284859, 0.006970860995352268, 0.007179677486419678]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 8.0, 15.0, 17.0, 16.0, 19.0, 23.0, 20.0, 30.0, 32.0, 32.0, 43.0, 49.0, 30.0, 46.0, 36.0, 49.0, 55.0, 38.0, 40.0, 39.0, 38.0, 25.0, 41.0, 28.0, 24.0, 25.0, 17.0, 19.0, 22.0, 18.0, 18.0, 14.0, 14.0, 13.0, 6.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.3065185546875, -9.027099609375, -8.7476806640625, -8.46826171875, -8.1888427734375, -7.909423828125, -7.6300048828125, -7.3505859375, -7.0711669921875, -6.791748046875, -6.5123291015625, -6.23291015625, -5.9534912109375, -5.674072265625, -5.3946533203125, -5.115234375, -4.8358154296875, -4.556396484375, -4.2769775390625, -3.99755859375, -3.7181396484375, -3.438720703125, -3.1593017578125, -2.8798828125, -2.6004638671875, -2.321044921875, -2.0416259765625, -1.76220703125, -1.4827880859375, -1.203369140625, -0.9239501953125, -0.64453125, -0.3651123046875, -0.085693359375, 0.1937255859375, 0.47314453125, 0.7525634765625, 1.031982421875, 1.3114013671875, 1.5908203125, 1.8702392578125, 2.149658203125, 2.4290771484375, 2.70849609375, 2.9879150390625, 3.267333984375, 3.5467529296875, 3.826171875, 4.1055908203125, 4.385009765625, 4.6644287109375, 4.94384765625, 5.2232666015625, 5.502685546875, 5.7821044921875, 6.0615234375, 6.3409423828125, 6.620361328125, 6.8997802734375, 7.17919921875, 7.4586181640625, 7.738037109375, 8.0174560546875, 8.296875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 9.0, 11.0, 17.0, 13.0, 30.0, 49.0, 65.0, 106.0, 150.0, 170.0, 287.0, 443.0, 642.0, 948.0, 1539.0, 2403.0, 3957.0, 6512.0, 10670.0, 18070.0, 31126.0, 55995.0, 106326.0, 250282.0, 293553.0, 119707.0, 61474.0, 34087.0, 19679.0, 11551.0, 7032.0, 4190.0, 2612.0, 1710.0, 1047.0, 698.0, 444.0, 298.0, 200.0, 153.0, 83.0, 60.0, 55.0, 27.0, 23.0, 14.0, 4.0, 11.0, 11.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.10546875, -4.93572998046875, -4.7659912109375, -4.59625244140625, -4.426513671875, -4.25677490234375, -4.0870361328125, -3.91729736328125, -3.74755859375, -3.57781982421875, -3.4080810546875, -3.23834228515625, -3.068603515625, -2.89886474609375, -2.7291259765625, -2.55938720703125, -2.3896484375, -2.21990966796875, -2.0501708984375, -1.88043212890625, -1.710693359375, -1.54095458984375, -1.3712158203125, -1.20147705078125, -1.03173828125, -0.86199951171875, -0.6922607421875, -0.52252197265625, -0.352783203125, -0.18304443359375, -0.0133056640625, 0.15643310546875, 0.326171875, 0.49591064453125, 0.6656494140625, 0.83538818359375, 1.005126953125, 1.17486572265625, 1.3446044921875, 1.51434326171875, 1.68408203125, 1.85382080078125, 2.0235595703125, 2.19329833984375, 2.363037109375, 2.53277587890625, 2.7025146484375, 2.87225341796875, 3.0419921875, 3.21173095703125, 3.3814697265625, 3.55120849609375, 3.720947265625, 3.89068603515625, 4.0604248046875, 4.23016357421875, 4.39990234375, 4.56964111328125, 4.7393798828125, 4.90911865234375, 5.078857421875, 5.24859619140625, 5.4183349609375, 5.58807373046875, 5.7578125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 4.0, 5.0, 7.0, 8.0, 12.0, 16.0, 18.0, 18.0, 25.0, 23.0, 26.0, 31.0, 45.0, 44.0, 48.0, 68.0, 47.0, 105.0, 312.0, 1570.0, 147.0, 89.0, 54.0, 48.0, 50.0, 34.0, 30.0, 27.0, 21.0, 20.0, 17.0, 16.0, 14.0, 6.0, 18.0, 3.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-28.75, -27.7646484375, -26.779296875, -25.7939453125, -24.80859375, -23.8232421875, -22.837890625, -21.8525390625, -20.8671875, -19.8818359375, -18.896484375, -17.9111328125, -16.92578125, -15.9404296875, -14.955078125, -13.9697265625, -12.984375, -11.9990234375, -11.013671875, -10.0283203125, -9.04296875, -8.0576171875, -7.072265625, -6.0869140625, -5.1015625, -4.1162109375, -3.130859375, -2.1455078125, -1.16015625, -0.1748046875, 0.810546875, 1.7958984375, 2.78125, 3.7666015625, 4.751953125, 5.7373046875, 6.72265625, 7.7080078125, 8.693359375, 9.6787109375, 10.6640625, 11.6494140625, 12.634765625, 13.6201171875, 14.60546875, 15.5908203125, 16.576171875, 17.5615234375, 18.546875, 19.5322265625, 20.517578125, 21.5029296875, 22.48828125, 23.4736328125, 24.458984375, 25.4443359375, 26.4296875, 27.4150390625, 28.400390625, 29.3857421875, 30.37109375, 31.3564453125, 32.341796875, 33.3271484375, 34.3125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 13.0, 19.0, 21.0, 26.0, 31.0, 46.0, 62.0, 101.0, 119.0, 184.0, 305.0, 727.0, 3513.0, 391213.0, 2741322.0, 5926.0, 946.0, 348.0, 215.0, 152.0, 105.0, 72.0, 62.0, 39.0, 33.0, 16.0, 20.0, 10.0, 8.0, 9.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-81.0, -78.3095703125, -75.619140625, -72.9287109375, -70.23828125, -67.5478515625, -64.857421875, -62.1669921875, -59.4765625, -56.7861328125, -54.095703125, -51.4052734375, -48.71484375, -46.0244140625, -43.333984375, -40.6435546875, -37.953125, -35.2626953125, -32.572265625, -29.8818359375, -27.19140625, -24.5009765625, -21.810546875, -19.1201171875, -16.4296875, -13.7392578125, -11.048828125, -8.3583984375, -5.66796875, -2.9775390625, -0.287109375, 2.4033203125, 5.09375, 7.7841796875, 10.474609375, 13.1650390625, 15.85546875, 18.5458984375, 21.236328125, 23.9267578125, 26.6171875, 29.3076171875, 31.998046875, 34.6884765625, 37.37890625, 40.0693359375, 42.759765625, 45.4501953125, 48.140625, 50.8310546875, 53.521484375, 56.2119140625, 58.90234375, 61.5927734375, 64.283203125, 66.9736328125, 69.6640625, 72.3544921875, 75.044921875, 77.7353515625, 80.42578125, 83.1162109375, 85.806640625, 88.4970703125, 91.1875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 6.0, 12.0, 48.0, 102.0, 213.0, 236.0, 214.0, 122.0, 43.0, 12.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.385229110717773, -20.651582717895508, -17.917936325073242, -15.184290885925293, -12.450644493103027, -9.716998100280762, -6.9833526611328125, -4.249706268310547, -1.5160598754882812, 1.2175862789154053, 3.951232433319092, 6.684878349304199, 9.418524742126465, 12.15217113494873, 14.88581657409668, 17.619462966918945, 20.35310935974121, 23.086755752563477, 25.820402145385742, 28.554046630859375, 31.28769302368164, 34.021339416503906, 36.75498580932617, 39.48863220214844, 42.2222785949707, 44.95592498779297, 47.689571380615234, 50.4232177734375, 53.156864166259766, 55.89051055908203, 58.62415313720703, 61.35780334472656, 64.0914535522461, 66.8250961303711, 69.55874633789062, 72.29238891601562, 75.02603912353516, 77.75968170166016, 80.49333190917969, 83.22697448730469, 85.96062469482422, 88.69426727294922, 91.42791748046875, 94.16156005859375, 96.89521026611328, 99.62885284423828, 102.36250305175781, 105.09614562988281, 107.82978820800781, 110.56343078613281, 113.29708099365234, 116.03072357177734, 118.76437377929688, 121.49801635742188, 124.2316665649414, 126.9653091430664, 129.69895935058594, 132.43260192871094, 135.16624450683594, 137.89990234375, 140.633544921875, 143.3671875, 146.100830078125, 148.83448791503906, 151.56813049316406]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 1.0, 1.0, 8.0, 6.0, 5.0, 5.0, 11.0, 14.0, 10.0, 12.0, 15.0, 21.0, 15.0, 20.0, 27.0, 25.0, 15.0, 38.0, 25.0, 27.0, 29.0, 40.0, 34.0, 39.0, 41.0, 45.0, 27.0, 27.0, 33.0, 39.0, 29.0, 29.0, 31.0, 37.0, 31.0, 19.0, 20.0, 31.0, 14.0, 18.0, 23.0, 9.0, 10.0, 3.0, 12.0, 7.0, 11.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0], "bins": [-80.02446746826172, -77.65386962890625, -75.28326416015625, -72.91265869140625, -70.54206085205078, -68.17146301269531, -65.80085754394531, -63.43025588989258, -61.059654235839844, -58.68905258178711, -56.318450927734375, -53.94784927368164, -51.577247619628906, -49.20664596557617, -46.83604431152344, -44.4654426574707, -42.09484100341797, -39.724239349365234, -37.3536376953125, -34.983036041259766, -32.61243438720703, -30.241832733154297, -27.871231079101562, -25.500629425048828, -23.130027770996094, -20.75942611694336, -18.388824462890625, -16.01822280883789, -13.647621154785156, -11.277019500732422, -8.906417846679688, -6.535816192626953, -4.165214538574219, -1.7946128845214844, 0.57598876953125, 2.9465904235839844, 5.317192077636719, 7.687793731689453, 10.058395385742188, 12.428997039794922, 14.799598693847656, 17.17020034790039, 19.540802001953125, 21.91140365600586, 24.282005310058594, 26.652606964111328, 29.023208618164062, 31.393810272216797, 33.76441192626953, 36.135013580322266, 38.505615234375, 40.876216888427734, 43.24681854248047, 45.6174201965332, 47.98802185058594, 50.35862350463867, 52.729225158691406, 55.09982681274414, 57.470428466796875, 59.84103012084961, 62.211631774902344, 64.58222961425781, 66.95283508300781, 69.32344055175781, 71.69403839111328]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 8.0, 5.0, 2.0, 8.0, 6.0, 10.0, 19.0, 16.0, 23.0, 21.0, 30.0, 22.0, 36.0, 34.0, 35.0, 40.0, 47.0, 45.0, 42.0, 46.0, 48.0, 41.0, 40.0, 39.0, 38.0, 33.0, 33.0, 28.0, 26.0, 27.0, 27.0, 14.0, 18.0, 13.0, 24.0, 15.0, 10.0, 6.0, 9.0, 3.0, 8.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.734375, -10.42919921875, -10.1240234375, -9.81884765625, -9.513671875, -9.20849609375, -8.9033203125, -8.59814453125, -8.29296875, -7.98779296875, -7.6826171875, -7.37744140625, -7.072265625, -6.76708984375, -6.4619140625, -6.15673828125, -5.8515625, -5.54638671875, -5.2412109375, -4.93603515625, -4.630859375, -4.32568359375, -4.0205078125, -3.71533203125, -3.41015625, -3.10498046875, -2.7998046875, -2.49462890625, -2.189453125, -1.88427734375, -1.5791015625, -1.27392578125, -0.96875, -0.66357421875, -0.3583984375, -0.05322265625, 0.251953125, 0.55712890625, 0.8623046875, 1.16748046875, 1.47265625, 1.77783203125, 2.0830078125, 2.38818359375, 2.693359375, 2.99853515625, 3.3037109375, 3.60888671875, 3.9140625, 4.21923828125, 4.5244140625, 4.82958984375, 5.134765625, 5.43994140625, 5.7451171875, 6.05029296875, 6.35546875, 6.66064453125, 6.9658203125, 7.27099609375, 7.576171875, 7.88134765625, 8.1865234375, 8.49169921875, 8.796875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 11.0, 8.0, 6.0, 13.0, 17.0, 10.0, 20.0, 22.0, 30.0, 49.0, 59.0, 76.0, 214.0, 517.0, 1621.0, 7642.0, 63293.0, 1092566.0, 2751643.0, 251499.0, 20285.0, 3115.0, 816.0, 319.0, 121.0, 68.0, 45.0, 25.0, 29.0, 22.0, 25.0, 17.0, 13.0, 13.0, 10.0, 13.0, 6.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-32.78125, -31.851318359375, -30.92138671875, -29.991455078125, -29.0615234375, -28.131591796875, -27.20166015625, -26.271728515625, -25.341796875, -24.411865234375, -23.48193359375, -22.552001953125, -21.6220703125, -20.692138671875, -19.76220703125, -18.832275390625, -17.90234375, -16.972412109375, -16.04248046875, -15.112548828125, -14.1826171875, -13.252685546875, -12.32275390625, -11.392822265625, -10.462890625, -9.532958984375, -8.60302734375, -7.673095703125, -6.7431640625, -5.813232421875, -4.88330078125, -3.953369140625, -3.0234375, -2.093505859375, -1.16357421875, -0.233642578125, 0.6962890625, 1.626220703125, 2.55615234375, 3.486083984375, 4.416015625, 5.345947265625, 6.27587890625, 7.205810546875, 8.1357421875, 9.065673828125, 9.99560546875, 10.925537109375, 11.85546875, 12.785400390625, 13.71533203125, 14.645263671875, 15.5751953125, 16.505126953125, 17.43505859375, 18.364990234375, 19.294921875, 20.224853515625, 21.15478515625, 22.084716796875, 23.0146484375, 23.944580078125, 24.87451171875, 25.804443359375, 26.734375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 7.0, 14.0, 15.0, 16.0, 25.0, 35.0, 39.0, 70.0, 92.0, 120.0, 142.0, 190.0, 234.0, 318.0, 387.0, 442.0, 420.0, 329.0, 299.0, 202.0, 167.0, 117.0, 91.0, 62.0, 49.0, 40.0, 38.0, 18.0, 22.0, 14.0, 11.0, 2.0, 7.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.3662109375, -15.794921875, -15.2236328125, -14.65234375, -14.0810546875, -13.509765625, -12.9384765625, -12.3671875, -11.7958984375, -11.224609375, -10.6533203125, -10.08203125, -9.5107421875, -8.939453125, -8.3681640625, -7.796875, -7.2255859375, -6.654296875, -6.0830078125, -5.51171875, -4.9404296875, -4.369140625, -3.7978515625, -3.2265625, -2.6552734375, -2.083984375, -1.5126953125, -0.94140625, -0.3701171875, 0.201171875, 0.7724609375, 1.34375, 1.9150390625, 2.486328125, 3.0576171875, 3.62890625, 4.2001953125, 4.771484375, 5.3427734375, 5.9140625, 6.4853515625, 7.056640625, 7.6279296875, 8.19921875, 8.7705078125, 9.341796875, 9.9130859375, 10.484375, 11.0556640625, 11.626953125, 12.1982421875, 12.76953125, 13.3408203125, 13.912109375, 14.4833984375, 15.0546875, 15.6259765625, 16.197265625, 16.7685546875, 17.33984375, 17.9111328125, 18.482421875, 19.0537109375, 19.625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 6.0, 6.0, 6.0, 15.0, 12.0, 20.0, 10.0, 43.0, 46.0, 54.0, 74.0, 82.0, 106.0, 181.0, 206.0, 308.0, 604.0, 2627.0, 35049.0, 1822734.0, 2283353.0, 44023.0, 2934.0, 608.0, 303.0, 202.0, 171.0, 133.0, 92.0, 67.0, 40.0, 39.0, 28.0, 24.0, 17.0, 14.0, 11.0, 8.0, 4.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-59.53125, -57.72900390625, -55.9267578125, -54.12451171875, -52.322265625, -50.52001953125, -48.7177734375, -46.91552734375, -45.11328125, -43.31103515625, -41.5087890625, -39.70654296875, -37.904296875, -36.10205078125, -34.2998046875, -32.49755859375, -30.6953125, -28.89306640625, -27.0908203125, -25.28857421875, -23.486328125, -21.68408203125, -19.8818359375, -18.07958984375, -16.27734375, -14.47509765625, -12.6728515625, -10.87060546875, -9.068359375, -7.26611328125, -5.4638671875, -3.66162109375, -1.859375, -0.05712890625, 1.7451171875, 3.54736328125, 5.349609375, 7.15185546875, 8.9541015625, 10.75634765625, 12.55859375, 14.36083984375, 16.1630859375, 17.96533203125, 19.767578125, 21.56982421875, 23.3720703125, 25.17431640625, 26.9765625, 28.77880859375, 30.5810546875, 32.38330078125, 34.185546875, 35.98779296875, 37.7900390625, 39.59228515625, 41.39453125, 43.19677734375, 44.9990234375, 46.80126953125, 48.603515625, 50.40576171875, 52.2080078125, 54.01025390625, 55.8125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 89.0, 366.0, 419.0, 117.0, 14.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-403.6581115722656, -390.6505432128906, -377.6429748535156, -364.6353759765625, -351.6278076171875, -338.6202392578125, -325.6126708984375, -312.6051025390625, -299.5975341796875, -286.5899658203125, -273.5823974609375, -260.5748291015625, -247.56724548339844, -234.55966186523438, -221.55209350585938, -208.54452514648438, -195.5369415283203, -182.5293731689453, -169.52178955078125, -156.51422119140625, -143.50665283203125, -130.49908447265625, -117.49150085449219, -104.48393249511719, -91.47635650634766, -78.46878051757812, -65.46121215820312, -52.453636169433594, -39.44606399536133, -26.438491821289062, -13.430915832519531, -0.42334747314453125, 12.584228515625, 25.591800689697266, 38.59937286376953, 51.60694885253906, 64.61451721191406, 77.6220932006836, 90.62966918945312, 103.63723754882812, 116.64481353759766, 129.6523895263672, 142.6599578857422, 155.66754150390625, 168.67510986328125, 181.68267822265625, 194.69024658203125, 207.69781494140625, 220.7053985595703, 233.7129669189453, 246.72055053710938, 259.7281188964844, 272.7356872558594, 285.7432556152344, 298.7508544921875, 311.7584228515625, 324.7659912109375, 337.7735595703125, 350.7811279296875, 363.7886962890625, 376.7962951660156, 389.8038635253906, 402.8114318847656, 415.8190002441406, 428.8265686035156]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 10.0, 5.0, 11.0, 12.0, 12.0, 15.0, 16.0, 11.0, 8.0, 18.0, 28.0, 22.0, 21.0, 29.0, 27.0, 30.0, 32.0, 39.0, 30.0, 38.0, 30.0, 44.0, 45.0, 31.0, 29.0, 39.0, 38.0, 40.0, 46.0, 38.0, 31.0, 19.0, 23.0, 26.0, 16.0, 14.0, 12.0, 13.0, 19.0, 5.0, 6.0, 3.0, 10.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.1649169921875, -54.21916198730469, -52.27340316772461, -50.32764434814453, -48.38188934326172, -46.436134338378906, -44.49037551879883, -42.54461669921875, -40.59886169433594, -38.653106689453125, -36.70734786987305, -34.76158905029297, -32.815834045410156, -30.87007713317871, -28.924320220947266, -26.97856330871582, -25.032806396484375, -23.08704948425293, -21.141292572021484, -19.19553565979004, -17.249778747558594, -15.304021835327148, -13.358264923095703, -11.412508010864258, -9.466751098632812, -7.520994186401367, -5.575237274169922, -3.6294803619384766, -1.6837234497070312, 0.26203346252441406, 2.2077903747558594, 4.153547286987305, 6.09930419921875, 8.045061111450195, 9.99081802368164, 11.936574935913086, 13.882331848144531, 15.828088760375977, 17.773845672607422, 19.719602584838867, 21.665359497070312, 23.611116409301758, 25.556873321533203, 27.50263023376465, 29.448387145996094, 31.39414405822754, 33.339900970458984, 35.28565979003906, 37.231414794921875, 39.17716979980469, 41.122928619384766, 43.068687438964844, 45.014442443847656, 46.96019744873047, 48.90595626831055, 50.851715087890625, 52.79747009277344, 54.74322509765625, 56.68898391723633, 58.634742736816406, 60.58049774169922, 62.52625274658203, 64.47201538085938, 66.41777038574219, 68.363525390625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 8.0, 11.0, 3.0, 9.0, 16.0, 17.0, 23.0, 21.0, 28.0, 20.0, 32.0, 36.0, 35.0, 46.0, 50.0, 47.0, 40.0, 40.0, 46.0, 41.0, 42.0, 44.0, 32.0, 44.0, 30.0, 25.0, 34.0, 23.0, 32.0, 23.0, 12.0, 16.0, 12.0, 17.0, 12.0, 4.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.46875, -10.171875, -9.875, -9.578125, -9.28125, -8.984375, -8.6875, -8.390625, -8.09375, -7.796875, -7.5, -7.203125, -6.90625, -6.609375, -6.3125, -6.015625, -5.71875, -5.421875, -5.125, -4.828125, -4.53125, -4.234375, -3.9375, -3.640625, -3.34375, -3.046875, -2.75, -2.453125, -2.15625, -1.859375, -1.5625, -1.265625, -0.96875, -0.671875, -0.375, -0.078125, 0.21875, 0.515625, 0.8125, 1.109375, 1.40625, 1.703125, 2.0, 2.296875, 2.59375, 2.890625, 3.1875, 3.484375, 3.78125, 4.078125, 4.375, 4.671875, 4.96875, 5.265625, 5.5625, 5.859375, 6.15625, 6.453125, 6.75, 7.046875, 7.34375, 7.640625, 7.9375, 8.234375, 8.53125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 15.0, 21.0, 21.0, 37.0, 55.0, 85.0, 134.0, 217.0, 252.0, 408.0, 585.0, 900.0, 1323.0, 2006.0, 3021.0, 4507.0, 6531.0, 10078.0, 15849.0, 25413.0, 42252.0, 72362.0, 123347.0, 189654.0, 200842.0, 138896.0, 82308.0, 47525.0, 28840.0, 17692.0, 11107.0, 7374.0, 4832.0, 3338.0, 2209.0, 1529.0, 1001.0, 609.0, 449.0, 317.0, 212.0, 135.0, 84.0, 61.0, 33.0, 34.0, 20.0, 10.0, 6.0, 9.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.1025390625, -1.067108154296875, -1.03167724609375, -0.996246337890625, -0.9608154296875, -0.925384521484375, -0.88995361328125, -0.854522705078125, -0.819091796875, -0.783660888671875, -0.74822998046875, -0.712799072265625, -0.6773681640625, -0.641937255859375, -0.60650634765625, -0.571075439453125, -0.53564453125, -0.500213623046875, -0.46478271484375, -0.429351806640625, -0.3939208984375, -0.358489990234375, -0.32305908203125, -0.287628173828125, -0.252197265625, -0.216766357421875, -0.18133544921875, -0.145904541015625, -0.1104736328125, -0.075042724609375, -0.03961181640625, -0.004180908203125, 0.03125, 0.066680908203125, 0.10211181640625, 0.137542724609375, 0.1729736328125, 0.208404541015625, 0.24383544921875, 0.279266357421875, 0.314697265625, 0.350128173828125, 0.38555908203125, 0.420989990234375, 0.4564208984375, 0.491851806640625, 0.52728271484375, 0.562713623046875, 0.59814453125, 0.633575439453125, 0.66900634765625, 0.704437255859375, 0.7398681640625, 0.775299072265625, 0.81072998046875, 0.846160888671875, 0.881591796875, 0.917022705078125, 0.95245361328125, 0.987884521484375, 1.0233154296875, 1.058746337890625, 1.09417724609375, 1.129608154296875, 1.1650390625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 7.0, 5.0, 8.0, 5.0, 12.0, 12.0, 12.0, 15.0, 14.0, 16.0, 21.0, 32.0, 26.0, 33.0, 37.0, 26.0, 38.0, 31.0, 34.0, 30.0, 35.0, 37.0, 1058.0, 47.0, 38.0, 39.0, 34.0, 26.0, 28.0, 28.0, 28.0, 23.0, 33.0, 23.0, 26.0, 18.0, 17.0, 16.0, 9.0, 11.0, 7.0, 5.0, 4.0, 5.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.78125, -4.6175537109375, -4.453857421875, -4.2901611328125, -4.12646484375, -3.9627685546875, -3.799072265625, -3.6353759765625, -3.4716796875, -3.3079833984375, -3.144287109375, -2.9805908203125, -2.81689453125, -2.6531982421875, -2.489501953125, -2.3258056640625, -2.162109375, -1.9984130859375, -1.834716796875, -1.6710205078125, -1.50732421875, -1.3436279296875, -1.179931640625, -1.0162353515625, -0.8525390625, -0.6888427734375, -0.525146484375, -0.3614501953125, -0.19775390625, -0.0340576171875, 0.129638671875, 0.2933349609375, 0.45703125, 0.6207275390625, 0.784423828125, 0.9481201171875, 1.11181640625, 1.2755126953125, 1.439208984375, 1.6029052734375, 1.7666015625, 1.9302978515625, 2.093994140625, 2.2576904296875, 2.42138671875, 2.5850830078125, 2.748779296875, 2.9124755859375, 3.076171875, 3.2398681640625, 3.403564453125, 3.5672607421875, 3.73095703125, 3.8946533203125, 4.058349609375, 4.2220458984375, 4.3857421875, 4.5494384765625, 4.713134765625, 4.8768310546875, 5.04052734375, 5.2042236328125, 5.367919921875, 5.5316162109375, 5.6953125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 10.0, 7.0, 12.0, 13.0, 29.0, 41.0, 53.0, 90.0, 121.0, 173.0, 285.0, 459.0, 664.0, 1021.0, 1613.0, 2437.0, 3992.0, 6110.0, 10055.0, 16444.0, 27200.0, 44352.0, 72075.0, 114568.0, 162145.0, 1220736.0, 146806.0, 101815.0, 63707.0, 38817.0, 23421.0, 14231.0, 8706.0, 5474.0, 3435.0, 2094.0, 1389.0, 887.0, 588.0, 364.0, 230.0, 154.0, 98.0, 77.0, 46.0, 35.0, 19.0, 9.0, 10.0, 14.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64501953125, -0.6237716674804688, -0.6025238037109375, -0.5812759399414062, -0.560028076171875, -0.5387802124023438, -0.5175323486328125, -0.49628448486328125, -0.47503662109375, -0.45378875732421875, -0.4325408935546875, -0.41129302978515625, -0.390045166015625, -0.36879730224609375, -0.3475494384765625, -0.32630157470703125, -0.3050537109375, -0.28380584716796875, -0.2625579833984375, -0.24131011962890625, -0.220062255859375, -0.19881439208984375, -0.1775665283203125, -0.15631866455078125, -0.13507080078125, -0.11382293701171875, -0.0925750732421875, -0.07132720947265625, -0.050079345703125, -0.02883148193359375, -0.0075836181640625, 0.01366424560546875, 0.034912109375, 0.05615997314453125, 0.0774078369140625, 0.09865570068359375, 0.119903564453125, 0.14115142822265625, 0.1623992919921875, 0.18364715576171875, 0.20489501953125, 0.22614288330078125, 0.2473907470703125, 0.26863861083984375, 0.289886474609375, 0.31113433837890625, 0.3323822021484375, 0.35363006591796875, 0.3748779296875, 0.39612579345703125, 0.4173736572265625, 0.43862152099609375, 0.459869384765625, 0.48111724853515625, 0.5023651123046875, 0.5236129760742188, 0.54486083984375, 0.5661087036132812, 0.5873565673828125, 0.6086044311523438, 0.629852294921875, 0.6511001586914062, 0.6723480224609375, 0.6935958862304688, 0.71484375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 12.0, 9.0, 10.0, 15.0, 17.0, 16.0, 28.0, 28.0, 42.0, 45.0, 68.0, 78.0, 87.0, 108.0, 99.0, 78.0, 58.0, 44.0, 31.0, 20.0, 18.0, 18.0, 14.0, 9.0, 7.0, 3.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01471710205078125, -0.01423180103302002, -0.013746500015258789, -0.013261198997497559, -0.012775897979736328, -0.012290596961975098, -0.011805295944213867, -0.011319994926452637, -0.010834693908691406, -0.010349392890930176, -0.009864091873168945, -0.009378790855407715, -0.008893489837646484, -0.008408188819885254, -0.007922887802124023, -0.007437586784362793, -0.0069522857666015625, -0.006466984748840332, -0.0059816837310791016, -0.005496382713317871, -0.005011081695556641, -0.00452578067779541, -0.00404047966003418, -0.0035551786422729492, -0.0030698776245117188, -0.0025845766067504883, -0.002099275588989258, -0.0016139745712280273, -0.0011286735534667969, -0.0006433725357055664, -0.00015807151794433594, 0.00032722949981689453, 0.000812530517578125, 0.0012978315353393555, 0.001783132553100586, 0.0022684335708618164, 0.002753734588623047, 0.0032390356063842773, 0.003724336624145508, 0.004209637641906738, 0.004694938659667969, 0.005180239677429199, 0.00566554069519043, 0.00615084171295166, 0.006636142730712891, 0.007121443748474121, 0.0076067447662353516, 0.008092045783996582, 0.008577346801757812, 0.009062647819519043, 0.009547948837280273, 0.010033249855041504, 0.010518550872802734, 0.011003851890563965, 0.011489152908325195, 0.011974453926086426, 0.012459754943847656, 0.012945055961608887, 0.013430356979370117, 0.013915657997131348, 0.014400959014892578, 0.014886260032653809, 0.015371561050415039, 0.01585686206817627, 0.0163421630859375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 5.0, 9.0, 4.0, 6.0, 8.0, 11.0, 19.0, 30.0, 37.0, 48.0, 70.0, 140.0, 473.0, 5637.0, 856454.0, 182549.0, 2316.0, 321.0, 109.0, 71.0, 58.0, 42.0, 19.0, 23.0, 16.0, 19.0, 7.0, 11.0, 9.0, 8.0, 5.0, 2.0, 6.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3818359375, -0.3708839416503906, -0.35993194580078125, -0.3489799499511719, -0.3380279541015625, -0.3270759582519531, -0.31612396240234375, -0.3051719665527344, -0.294219970703125, -0.2832679748535156, -0.27231597900390625, -0.2613639831542969, -0.2504119873046875, -0.23945999145507812, -0.22850799560546875, -0.21755599975585938, -0.20660400390625, -0.19565200805664062, -0.18470001220703125, -0.17374801635742188, -0.1627960205078125, -0.15184402465820312, -0.14089202880859375, -0.12994003295898438, -0.118988037109375, -0.10803604125976562, -0.09708404541015625, -0.08613204956054688, -0.0751800537109375, -0.06422805786132812, -0.05327606201171875, -0.042324066162109375, -0.0313720703125, -0.020420074462890625, -0.00946807861328125, 0.001483917236328125, 0.0124359130859375, 0.023387908935546875, 0.03433990478515625, 0.045291900634765625, 0.056243896484375, 0.06719589233398438, 0.07814788818359375, 0.08909988403320312, 0.1000518798828125, 0.11100387573242188, 0.12195587158203125, 0.13290786743164062, 0.14385986328125, 0.15481185913085938, 0.16576385498046875, 0.17671585083007812, 0.1876678466796875, 0.19861984252929688, 0.20957183837890625, 0.22052383422851562, 0.231475830078125, 0.24242782592773438, 0.25337982177734375, 0.2643318176269531, 0.2752838134765625, 0.2862358093261719, 0.29718780517578125, 0.3081398010253906, 0.319091796875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 42.0, 239.0, 682.0, 44.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29820582270622253, -0.29261165857315063, -0.28701749444007874, -0.28142333030700684, -0.27582916617393494, -0.27023500204086304, -0.26464080810546875, -0.25904667377471924, -0.25345247983932495, -0.24785831570625305, -0.24226415157318115, -0.23666998744010925, -0.23107580840587616, -0.22548164427280426, -0.21988748013973236, -0.21429331600666046, -0.20869916677474976, -0.20310500264167786, -0.19751083850860596, -0.19191667437553406, -0.18632249534130096, -0.18072833120822906, -0.17513416707515717, -0.16954000294208527, -0.16394582390785217, -0.15835165977478027, -0.15275749564170837, -0.14716333150863647, -0.14156915247440338, -0.13597498834133148, -0.13038082420825958, -0.12478666007518768, -0.11919249594211578, -0.11359833180904388, -0.10800416022539139, -0.10240999609231949, -0.09681583195924759, -0.09122166037559509, -0.0856274962425232, -0.0800333321094513, -0.0744391605257988, -0.0688449963927269, -0.0632508248090744, -0.0576566606760025, -0.0520624965429306, -0.046468328684568405, -0.04087416082620621, -0.03527999669313431, -0.02968582883477211, -0.02409166283905506, -0.018497496843338013, -0.012903328984975815, -0.007309162989258766, -0.0017149969935417175, 0.0038791708648204803, 0.00947333499789238, 0.015067502856254578, 0.020661668851971626, 0.026255834847688675, 0.03185000270605087, 0.03744416683912277, 0.04303833469748497, 0.04863250255584717, 0.05422666668891907, 0.059820834547281265]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 0.0, 5.0, 5.0, 5.0, 6.0, 8.0, 10.0, 4.0, 19.0, 12.0, 23.0, 27.0, 24.0, 20.0, 41.0, 36.0, 22.0, 49.0, 41.0, 33.0, 48.0, 40.0, 31.0, 38.0, 41.0, 32.0, 36.0, 31.0, 42.0, 32.0, 25.0, 33.0, 27.0, 28.0, 22.0, 14.0, 14.0, 12.0, 10.0, 12.0, 12.0, 11.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.011814773082733154, -0.011457051150500774, -0.011099329218268394, -0.010741607286036015, -0.010383885353803635, -0.010026163421571255, -0.009668441489338875, -0.009310719557106495, -0.008952997624874115, -0.008595275692641735, -0.008237553760409355, -0.007879831828176975, -0.007522109895944595, -0.007164387963712215, -0.0068066660314798355, -0.006448944099247456, -0.006091222167015076, -0.005733500234782696, -0.005375778302550316, -0.005018056370317936, -0.004660334438085556, -0.004302612505853176, -0.003944890573620796, -0.0035871686413884163, -0.0032294467091560364, -0.0028717247769236565, -0.0025140028446912766, -0.0021562809124588966, -0.0017985589802265167, -0.0014408370479941368, -0.001083115115761757, -0.000725393183529377, -0.00036767125129699707, -9.949319064617157e-06, 0.00034777261316776276, 0.0007054945454001427, 0.0010632164776325226, 0.0014209384098649025, 0.0017786603420972824, 0.0021363822743296623, 0.0024941042065620422, 0.002851826138794422, 0.003209548071026802, 0.003567270003259182, 0.003924991935491562, 0.004282713867723942, 0.004640435799956322, 0.004998157732188702, 0.0053558796644210815, 0.0057136015966534615, 0.006071323528885841, 0.006429045461118221, 0.006786767393350601, 0.007144489325582981, 0.007502211257815361, 0.007859933190047741, 0.00821765512228012, 0.0085753770545125, 0.00893309898674488, 0.00929082091897726, 0.00964854285120964, 0.01000626478344202, 0.0103639867156744, 0.01072170864790678, 0.01107943058013916]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 8.0, 11.0, 3.0, 9.0, 16.0, 17.0, 23.0, 21.0, 28.0, 20.0, 32.0, 36.0, 35.0, 46.0, 50.0, 47.0, 40.0, 40.0, 46.0, 41.0, 42.0, 44.0, 32.0, 44.0, 30.0, 25.0, 34.0, 23.0, 32.0, 23.0, 12.0, 16.0, 12.0, 17.0, 12.0, 4.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.46875, -10.171875, -9.875, -9.578125, -9.28125, -8.984375, -8.6875, -8.390625, -8.09375, -7.796875, -7.5, -7.203125, -6.90625, -6.609375, -6.3125, -6.015625, -5.71875, -5.421875, -5.125, -4.828125, -4.53125, -4.234375, -3.9375, -3.640625, -3.34375, -3.046875, -2.75, -2.453125, -2.15625, -1.859375, -1.5625, -1.265625, -0.96875, -0.671875, -0.375, -0.078125, 0.21875, 0.515625, 0.8125, 1.109375, 1.40625, 1.703125, 2.0, 2.296875, 2.59375, 2.890625, 3.1875, 3.484375, 3.78125, 4.078125, 4.375, 4.671875, 4.96875, 5.265625, 5.5625, 5.859375, 6.15625, 6.453125, 6.75, 7.046875, 7.34375, 7.640625, 7.9375, 8.234375, 8.53125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 9.0, 11.0, 20.0, 12.0, 27.0, 35.0, 73.0, 89.0, 137.0, 204.0, 286.0, 405.0, 649.0, 1028.0, 1547.0, 2414.0, 3779.0, 5677.0, 8893.0, 14762.0, 28782.0, 77576.0, 269834.0, 418469.0, 123839.0, 41043.0, 18824.0, 10908.0, 6706.0, 4269.0, 2830.0, 1900.0, 1230.0, 720.0, 498.0, 304.0, 220.0, 179.0, 106.0, 76.0, 48.0, 32.0, 31.0, 23.0, 17.0, 10.0, 6.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.0546875, -6.8355712890625, -6.616455078125, -6.3973388671875, -6.17822265625, -5.9591064453125, -5.739990234375, -5.5208740234375, -5.3017578125, -5.0826416015625, -4.863525390625, -4.6444091796875, -4.42529296875, -4.2061767578125, -3.987060546875, -3.7679443359375, -3.548828125, -3.3297119140625, -3.110595703125, -2.8914794921875, -2.67236328125, -2.4532470703125, -2.234130859375, -2.0150146484375, -1.7958984375, -1.5767822265625, -1.357666015625, -1.1385498046875, -0.91943359375, -0.7003173828125, -0.481201171875, -0.2620849609375, -0.04296875, 0.1761474609375, 0.395263671875, 0.6143798828125, 0.83349609375, 1.0526123046875, 1.271728515625, 1.4908447265625, 1.7099609375, 1.9290771484375, 2.148193359375, 2.3673095703125, 2.58642578125, 2.8055419921875, 3.024658203125, 3.2437744140625, 3.462890625, 3.6820068359375, 3.901123046875, 4.1202392578125, 4.33935546875, 4.5584716796875, 4.777587890625, 4.9967041015625, 5.2158203125, 5.4349365234375, 5.654052734375, 5.8731689453125, 6.09228515625, 6.3114013671875, 6.530517578125, 6.7496337890625, 6.96875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 8.0, 6.0, 15.0, 7.0, 15.0, 21.0, 18.0, 28.0, 20.0, 29.0, 52.0, 40.0, 34.0, 62.0, 87.0, 110.0, 1668.0, 310.0, 98.0, 59.0, 49.0, 52.0, 35.0, 29.0, 30.0, 32.0, 16.0, 20.0, 32.0, 17.0, 10.0, 6.0, 3.0, 9.0, 3.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.484375, -29.426025390625, -28.36767578125, -27.309326171875, -26.2509765625, -25.192626953125, -24.13427734375, -23.075927734375, -22.017578125, -20.959228515625, -19.90087890625, -18.842529296875, -17.7841796875, -16.725830078125, -15.66748046875, -14.609130859375, -13.55078125, -12.492431640625, -11.43408203125, -10.375732421875, -9.3173828125, -8.259033203125, -7.20068359375, -6.142333984375, -5.083984375, -4.025634765625, -2.96728515625, -1.908935546875, -0.8505859375, 0.207763671875, 1.26611328125, 2.324462890625, 3.3828125, 4.441162109375, 5.49951171875, 6.557861328125, 7.6162109375, 8.674560546875, 9.73291015625, 10.791259765625, 11.849609375, 12.907958984375, 13.96630859375, 15.024658203125, 16.0830078125, 17.141357421875, 18.19970703125, 19.258056640625, 20.31640625, 21.374755859375, 22.43310546875, 23.491455078125, 24.5498046875, 25.608154296875, 26.66650390625, 27.724853515625, 28.783203125, 29.841552734375, 30.89990234375, 31.958251953125, 33.0166015625, 34.074951171875, 35.13330078125, 36.191650390625, 37.25]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 8.0, 25.0, 15.0, 28.0, 63.0, 79.0, 127.0, 195.0, 317.0, 615.0, 13001.0, 3122751.0, 7118.0, 552.0, 314.0, 156.0, 112.0, 75.0, 44.0, 34.0, 22.0, 11.0, 8.0, 4.0, 4.0, 4.0, 3.0, 4.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.3125, -84.3779296875, -80.443359375, -76.5087890625, -72.57421875, -68.6396484375, -64.705078125, -60.7705078125, -56.8359375, -52.9013671875, -48.966796875, -45.0322265625, -41.09765625, -37.1630859375, -33.228515625, -29.2939453125, -25.359375, -21.4248046875, -17.490234375, -13.5556640625, -9.62109375, -5.6865234375, -1.751953125, 2.1826171875, 6.1171875, 10.0517578125, 13.986328125, 17.9208984375, 21.85546875, 25.7900390625, 29.724609375, 33.6591796875, 37.59375, 41.5283203125, 45.462890625, 49.3974609375, 53.33203125, 57.2666015625, 61.201171875, 65.1357421875, 69.0703125, 73.0048828125, 76.939453125, 80.8740234375, 84.80859375, 88.7431640625, 92.677734375, 96.6123046875, 100.546875, 104.4814453125, 108.416015625, 112.3505859375, 116.28515625, 120.2197265625, 124.154296875, 128.0888671875, 132.0234375, 135.9580078125, 139.892578125, 143.8271484375, 147.76171875, 151.6962890625, 155.630859375, 159.5654296875, 163.5]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 205.0, 769.0, 43.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.40789031982422, -54.23567199707031, -44.063453674316406, -33.8912353515625, -23.719017028808594, -13.546798706054688, -3.3745803833007812, 6.797637939453125, 16.96985626220703, 27.142074584960938, 37.314292907714844, 47.48651123046875, 57.658729553222656, 67.83094787597656, 78.00316619873047, 88.17538452148438, 98.34760284423828, 108.51982116699219, 118.6920394897461, 128.8642578125, 139.03646850585938, 149.2086944580078, 159.38092041015625, 169.55313110351562, 179.725341796875, 189.89755249023438, 200.0697784423828, 210.24200439453125, 220.41421508789062, 230.58642578125, 240.75865173339844, 250.93087768554688, 261.10308837890625, 271.2752990722656, 281.447509765625, 291.6197509765625, 301.7919616699219, 311.96417236328125, 322.13641357421875, 332.3086242675781, 342.4808349609375, 352.6530456542969, 362.82525634765625, 372.99749755859375, 383.1697082519531, 393.3419189453125, 403.51416015625, 413.6863708496094, 423.85858154296875, 434.0307922363281, 444.2030029296875, 454.375244140625, 464.5474548339844, 474.71966552734375, 484.89190673828125, 495.0641174316406, 505.236328125, 515.4085693359375, 525.5807495117188, 535.7529907226562, 545.9251708984375, 556.097412109375, 566.2696533203125, 576.4418334960938, 586.6140747070312]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 11.0, 8.0, 15.0, 12.0, 10.0, 17.0, 20.0, 19.0, 24.0, 14.0, 24.0, 27.0, 31.0, 34.0, 39.0, 49.0, 42.0, 51.0, 44.0, 37.0, 58.0, 39.0, 24.0, 30.0, 29.0, 34.0, 33.0, 36.0, 34.0, 23.0, 23.0, 22.0, 10.0, 7.0, 18.0, 8.0, 7.0, 7.0, 5.0, 8.0, 3.0, 5.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-74.53298950195312, -72.13226318359375, -69.73152923583984, -67.33080291748047, -64.93006896972656, -62.52933883666992, -60.12860870361328, -57.727882385253906, -55.3271484375, -52.92641830444336, -50.52568817138672, -48.12495803833008, -45.72422790527344, -43.3234977722168, -40.922767639160156, -38.52204132080078, -36.12131118774414, -33.7205810546875, -31.31985092163086, -28.91912078857422, -26.518390655517578, -24.117660522460938, -21.71693229675293, -19.31620216369629, -16.91547203063965, -14.514741897583008, -12.114011764526367, -9.713282585144043, -7.312552452087402, -4.911822319030762, -2.5110931396484375, -0.11036300659179688, 2.2903671264648438, 4.691097259521484, 7.091826915740967, 9.49255657196045, 11.89328670501709, 14.29401683807373, 16.694746017456055, 19.095476150512695, 21.496206283569336, 23.896936416625977, 26.297666549682617, 28.698394775390625, 31.099124908447266, 33.499855041503906, 35.90058517456055, 38.30131530761719, 40.70204544067383, 43.10277557373047, 45.50350570678711, 47.90423583984375, 50.30496597290039, 52.70569610595703, 55.106422424316406, 57.50715637207031, 59.90788269042969, 62.30861282348633, 64.70934295654297, 67.11006927490234, 69.51080322265625, 71.91152954101562, 74.31226348876953, 76.7129898071289, 79.11372375488281]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 10.0, 4.0, 9.0, 20.0, 9.0, 27.0, 24.0, 26.0, 19.0, 40.0, 32.0, 41.0, 41.0, 53.0, 51.0, 38.0, 45.0, 50.0, 49.0, 47.0, 45.0, 34.0, 31.0, 31.0, 30.0, 28.0, 25.0, 28.0, 20.0, 26.0, 16.0, 10.0, 6.0, 4.0, 7.0, 5.0, 5.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.484375, -11.1551513671875, -10.825927734375, -10.4967041015625, -10.16748046875, -9.8382568359375, -9.509033203125, -9.1798095703125, -8.8505859375, -8.5213623046875, -8.192138671875, -7.8629150390625, -7.53369140625, -7.2044677734375, -6.875244140625, -6.5460205078125, -6.216796875, -5.8875732421875, -5.558349609375, -5.2291259765625, -4.89990234375, -4.5706787109375, -4.241455078125, -3.9122314453125, -3.5830078125, -3.2537841796875, -2.924560546875, -2.5953369140625, -2.26611328125, -1.9368896484375, -1.607666015625, -1.2784423828125, -0.94921875, -0.6199951171875, -0.290771484375, 0.0384521484375, 0.36767578125, 0.6968994140625, 1.026123046875, 1.3553466796875, 1.6845703125, 2.0137939453125, 2.343017578125, 2.6722412109375, 3.00146484375, 3.3306884765625, 3.659912109375, 3.9891357421875, 4.318359375, 4.6475830078125, 4.976806640625, 5.3060302734375, 5.63525390625, 5.9644775390625, 6.293701171875, 6.6229248046875, 6.9521484375, 7.2813720703125, 7.610595703125, 7.9398193359375, 8.26904296875, 8.5982666015625, 8.927490234375, 9.2567138671875, 9.5859375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 8.0, 12.0, 10.0, 15.0, 21.0, 20.0, 31.0, 36.0, 76.0, 101.0, 158.0, 322.0, 577.0, 1512.0, 4209.0, 15879.0, 77116.0, 521652.0, 2162391.0, 1185089.0, 181419.0, 31575.0, 7671.0, 2413.0, 938.0, 448.0, 201.0, 113.0, 98.0, 39.0, 30.0, 23.0, 12.0, 15.0, 15.0, 11.0, 5.0, 5.0, 6.0, 3.0, 0.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-21.96875, -21.37060546875, -20.7724609375, -20.17431640625, -19.576171875, -18.97802734375, -18.3798828125, -17.78173828125, -17.18359375, -16.58544921875, -15.9873046875, -15.38916015625, -14.791015625, -14.19287109375, -13.5947265625, -12.99658203125, -12.3984375, -11.80029296875, -11.2021484375, -10.60400390625, -10.005859375, -9.40771484375, -8.8095703125, -8.21142578125, -7.61328125, -7.01513671875, -6.4169921875, -5.81884765625, -5.220703125, -4.62255859375, -4.0244140625, -3.42626953125, -2.828125, -2.22998046875, -1.6318359375, -1.03369140625, -0.435546875, 0.16259765625, 0.7607421875, 1.35888671875, 1.95703125, 2.55517578125, 3.1533203125, 3.75146484375, 4.349609375, 4.94775390625, 5.5458984375, 6.14404296875, 6.7421875, 7.34033203125, 7.9384765625, 8.53662109375, 9.134765625, 9.73291015625, 10.3310546875, 10.92919921875, 11.52734375, 12.12548828125, 12.7236328125, 13.32177734375, 13.919921875, 14.51806640625, 15.1162109375, 15.71435546875, 16.3125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 10.0, 16.0, 29.0, 32.0, 60.0, 80.0, 113.0, 152.0, 241.0, 320.0, 421.0, 525.0, 553.0, 429.0, 351.0, 207.0, 167.0, 105.0, 89.0, 56.0, 31.0, 20.0, 14.0, 13.0, 10.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-26.90625, -26.216552734375, -25.52685546875, -24.837158203125, -24.1474609375, -23.457763671875, -22.76806640625, -22.078369140625, -21.388671875, -20.698974609375, -20.00927734375, -19.319580078125, -18.6298828125, -17.940185546875, -17.25048828125, -16.560791015625, -15.87109375, -15.181396484375, -14.49169921875, -13.802001953125, -13.1123046875, -12.422607421875, -11.73291015625, -11.043212890625, -10.353515625, -9.663818359375, -8.97412109375, -8.284423828125, -7.5947265625, -6.905029296875, -6.21533203125, -5.525634765625, -4.8359375, -4.146240234375, -3.45654296875, -2.766845703125, -2.0771484375, -1.387451171875, -0.69775390625, -0.008056640625, 0.681640625, 1.371337890625, 2.06103515625, 2.750732421875, 3.4404296875, 4.130126953125, 4.81982421875, 5.509521484375, 6.19921875, 6.888916015625, 7.57861328125, 8.268310546875, 8.9580078125, 9.647705078125, 10.33740234375, 11.027099609375, 11.716796875, 12.406494140625, 13.09619140625, 13.785888671875, 14.4755859375, 15.165283203125, 15.85498046875, 16.544677734375, 17.234375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 8.0, 9.0, 9.0, 21.0, 12.0, 32.0, 34.0, 67.0, 97.0, 124.0, 199.0, 322.0, 479.0, 1038.0, 8104.0, 559457.0, 3565780.0, 54389.0, 2291.0, 649.0, 387.0, 232.0, 183.0, 118.0, 75.0, 57.0, 31.0, 35.0, 18.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.34375, -52.19189453125, -50.0400390625, -47.88818359375, -45.736328125, -43.58447265625, -41.4326171875, -39.28076171875, -37.12890625, -34.97705078125, -32.8251953125, -30.67333984375, -28.521484375, -26.36962890625, -24.2177734375, -22.06591796875, -19.9140625, -17.76220703125, -15.6103515625, -13.45849609375, -11.306640625, -9.15478515625, -7.0029296875, -4.85107421875, -2.69921875, -0.54736328125, 1.6044921875, 3.75634765625, 5.908203125, 8.06005859375, 10.2119140625, 12.36376953125, 14.515625, 16.66748046875, 18.8193359375, 20.97119140625, 23.123046875, 25.27490234375, 27.4267578125, 29.57861328125, 31.73046875, 33.88232421875, 36.0341796875, 38.18603515625, 40.337890625, 42.48974609375, 44.6416015625, 46.79345703125, 48.9453125, 51.09716796875, 53.2490234375, 55.40087890625, 57.552734375, 59.70458984375, 61.8564453125, 64.00830078125, 66.16015625, 68.31201171875, 70.4638671875, 72.61572265625, 74.767578125, 76.91943359375, 79.0712890625, 81.22314453125, 83.375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 11.0, 17.0, 22.0, 41.0, 64.0, 86.0, 121.0, 129.0, 109.0, 110.0, 96.0, 76.0, 48.0, 30.0, 20.0, 15.0, 9.0, 3.0, 1.0, 2.0], "bins": [-162.29354858398438, -159.1786651611328, -156.06378173828125, -152.94888305664062, -149.83399963378906, -146.7191162109375, -143.60423278808594, -140.4893341064453, -137.37445068359375, -134.2595672607422, -131.14468383789062, -128.02978515625, -124.91490173339844, -121.80001831054688, -118.68512725830078, -115.57024383544922, -112.45535278320312, -109.34046936035156, -106.22557830810547, -103.1106948852539, -99.99580383300781, -96.88092041015625, -93.76602935791016, -90.6511459350586, -87.53626251220703, -84.42137908935547, -81.30648803710938, -78.19160461425781, -75.07671356201172, -71.96183013916016, -68.84693908691406, -65.7320556640625, -62.61716079711914, -59.50227355957031, -56.387386322021484, -53.272499084472656, -50.15761184692383, -47.042724609375, -43.92784118652344, -40.812950134277344, -37.69806671142578, -34.58317947387695, -31.468292236328125, -28.353404998779297, -25.23851776123047, -22.12363052368164, -19.008745193481445, -15.893857955932617, -12.778968811035156, -9.664081573486328, -6.549194812774658, -3.4343080520629883, -0.31942081451416016, 2.795466423034668, 5.91035270690918, 9.025239944458008, 12.140127182006836, 15.255014419555664, 18.369901657104492, 21.484786987304688, 24.599674224853516, 27.714561462402344, 30.829448699951172, 33.9443359375, 37.05922317504883]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 6.0, 8.0, 9.0, 13.0, 17.0, 16.0, 9.0, 17.0, 17.0, 23.0, 24.0, 28.0, 31.0, 27.0, 35.0, 31.0, 42.0, 41.0, 38.0, 49.0, 32.0, 31.0, 43.0, 31.0, 41.0, 22.0, 37.0, 30.0, 32.0, 23.0, 22.0, 25.0, 15.0, 18.0, 16.0, 22.0, 18.0, 16.0, 6.0, 4.0, 5.0, 9.0, 6.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-56.75421142578125, -55.05633544921875, -53.35845947265625, -51.660587310791016, -49.962711334228516, -48.264835357666016, -46.56696319580078, -44.86908721923828, -43.17121124267578, -41.47333526611328, -39.77545928955078, -38.07758712768555, -36.37971115112305, -34.68183517456055, -32.98396301269531, -31.286087036132812, -29.588211059570312, -27.890335083007812, -26.192461013793945, -24.494586944580078, -22.796710968017578, -21.098834991455078, -19.40096092224121, -17.703086853027344, -16.005210876464844, -14.30733585357666, -12.609460830688477, -10.911585807800293, -9.21371078491211, -7.515835762023926, -5.817960739135742, -4.120085716247559, -2.422210693359375, -0.7243356704711914, 0.9735393524169922, 2.671414375305176, 4.369289398193359, 6.067164421081543, 7.765039443969727, 9.46291446685791, 11.160789489746094, 12.858664512634277, 14.556539535522461, 16.254413604736328, 17.952289581298828, 19.650165557861328, 21.348039627075195, 23.045913696289062, 24.743789672851562, 26.441665649414062, 28.13953971862793, 29.837413787841797, 31.535289764404297, 33.2331657409668, 34.93103790283203, 36.62891387939453, 38.32678985595703, 40.02466583251953, 41.72254180908203, 43.420413970947266, 45.118289947509766, 46.816165924072266, 48.5140380859375, 50.2119140625, 51.9097900390625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 9.0, 10.0, 16.0, 16.0, 16.0, 19.0, 18.0, 25.0, 32.0, 35.0, 46.0, 43.0, 51.0, 52.0, 39.0, 44.0, 38.0, 44.0, 43.0, 40.0, 42.0, 42.0, 34.0, 39.0, 24.0, 22.0, 29.0, 28.0, 21.0, 12.0, 20.0, 9.0, 6.0, 6.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0390625, -10.7198486328125, -10.400634765625, -10.0814208984375, -9.76220703125, -9.4429931640625, -9.123779296875, -8.8045654296875, -8.4853515625, -8.1661376953125, -7.846923828125, -7.5277099609375, -7.20849609375, -6.8892822265625, -6.570068359375, -6.2508544921875, -5.931640625, -5.6124267578125, -5.293212890625, -4.9739990234375, -4.65478515625, -4.3355712890625, -4.016357421875, -3.6971435546875, -3.3779296875, -3.0587158203125, -2.739501953125, -2.4202880859375, -2.10107421875, -1.7818603515625, -1.462646484375, -1.1434326171875, -0.82421875, -0.5050048828125, -0.185791015625, 0.1334228515625, 0.45263671875, 0.7718505859375, 1.091064453125, 1.4102783203125, 1.7294921875, 2.0487060546875, 2.367919921875, 2.6871337890625, 3.00634765625, 3.3255615234375, 3.644775390625, 3.9639892578125, 4.283203125, 4.6024169921875, 4.921630859375, 5.2408447265625, 5.56005859375, 5.8792724609375, 6.198486328125, 6.5177001953125, 6.8369140625, 7.1561279296875, 7.475341796875, 7.7945556640625, 8.11376953125, 8.4329833984375, 8.752197265625, 9.0714111328125, 9.390625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 8.0, 16.0, 22.0, 28.0, 69.0, 106.0, 135.0, 167.0, 257.0, 347.0, 516.0, 758.0, 1065.0, 1527.0, 2038.0, 3107.0, 4558.0, 6647.0, 9864.0, 14816.0, 22729.0, 35688.0, 58476.0, 94663.0, 146947.0, 185460.0, 162838.0, 108434.0, 68015.0, 41597.0, 25919.0, 16839.0, 11048.0, 7342.0, 5213.0, 3476.0, 2343.0, 1684.0, 1164.0, 834.0, 545.0, 392.0, 266.0, 206.0, 127.0, 86.0, 47.0, 48.0, 24.0, 26.0, 7.0, 16.0, 5.0, 2.0, 3.0, 1.0], "bins": [-1.0361328125, -1.005340576171875, -0.97454833984375, -0.943756103515625, -0.9129638671875, -0.882171630859375, -0.85137939453125, -0.820587158203125, -0.789794921875, -0.759002685546875, -0.72821044921875, -0.697418212890625, -0.6666259765625, -0.635833740234375, -0.60504150390625, -0.574249267578125, -0.54345703125, -0.512664794921875, -0.48187255859375, -0.451080322265625, -0.4202880859375, -0.389495849609375, -0.35870361328125, -0.327911376953125, -0.297119140625, -0.266326904296875, -0.23553466796875, -0.204742431640625, -0.1739501953125, -0.143157958984375, -0.11236572265625, -0.081573486328125, -0.05078125, -0.019989013671875, 0.01080322265625, 0.041595458984375, 0.0723876953125, 0.103179931640625, 0.13397216796875, 0.164764404296875, 0.195556640625, 0.226348876953125, 0.25714111328125, 0.287933349609375, 0.3187255859375, 0.349517822265625, 0.38031005859375, 0.411102294921875, 0.44189453125, 0.472686767578125, 0.50347900390625, 0.534271240234375, 0.5650634765625, 0.595855712890625, 0.62664794921875, 0.657440185546875, 0.688232421875, 0.719024658203125, 0.74981689453125, 0.780609130859375, 0.8114013671875, 0.842193603515625, 0.87298583984375, 0.903778076171875, 0.9345703125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 8.0, 5.0, 10.0, 9.0, 14.0, 16.0, 14.0, 23.0, 22.0, 18.0, 32.0, 29.0, 24.0, 28.0, 38.0, 32.0, 34.0, 42.0, 41.0, 1062.0, 54.0, 47.0, 30.0, 37.0, 46.0, 32.0, 34.0, 23.0, 29.0, 25.0, 30.0, 16.0, 24.0, 18.0, 9.0, 9.0, 10.0, 13.0, 6.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.66015625, -5.483154296875, -5.30615234375, -5.129150390625, -4.9521484375, -4.775146484375, -4.59814453125, -4.421142578125, -4.244140625, -4.067138671875, -3.89013671875, -3.713134765625, -3.5361328125, -3.359130859375, -3.18212890625, -3.005126953125, -2.828125, -2.651123046875, -2.47412109375, -2.297119140625, -2.1201171875, -1.943115234375, -1.76611328125, -1.589111328125, -1.412109375, -1.235107421875, -1.05810546875, -0.881103515625, -0.7041015625, -0.527099609375, -0.35009765625, -0.173095703125, 0.00390625, 0.180908203125, 0.35791015625, 0.534912109375, 0.7119140625, 0.888916015625, 1.06591796875, 1.242919921875, 1.419921875, 1.596923828125, 1.77392578125, 1.950927734375, 2.1279296875, 2.304931640625, 2.48193359375, 2.658935546875, 2.8359375, 3.012939453125, 3.18994140625, 3.366943359375, 3.5439453125, 3.720947265625, 3.89794921875, 4.074951171875, 4.251953125, 4.428955078125, 4.60595703125, 4.782958984375, 4.9599609375, 5.136962890625, 5.31396484375, 5.490966796875, 5.66796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 16.0, 7.0, 21.0, 27.0, 49.0, 75.0, 101.0, 172.0, 285.0, 430.0, 684.0, 1131.0, 1865.0, 3055.0, 5002.0, 8287.0, 14073.0, 23876.0, 41248.0, 69676.0, 114240.0, 168459.0, 1238277.0, 155171.0, 101742.0, 61457.0, 35686.0, 21120.0, 12309.0, 7346.0, 4401.0, 2512.0, 1678.0, 1004.0, 576.0, 423.0, 216.0, 162.0, 91.0, 57.0, 43.0, 33.0, 16.0, 12.0, 6.0, 10.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74072265625, -0.716339111328125, -0.69195556640625, -0.667572021484375, -0.6431884765625, -0.618804931640625, -0.59442138671875, -0.570037841796875, -0.545654296875, -0.521270751953125, -0.49688720703125, -0.472503662109375, -0.4481201171875, -0.423736572265625, -0.39935302734375, -0.374969482421875, -0.3505859375, -0.326202392578125, -0.30181884765625, -0.277435302734375, -0.2530517578125, -0.228668212890625, -0.20428466796875, -0.179901123046875, -0.155517578125, -0.131134033203125, -0.10675048828125, -0.082366943359375, -0.0579833984375, -0.033599853515625, -0.00921630859375, 0.015167236328125, 0.03955078125, 0.063934326171875, 0.08831787109375, 0.112701416015625, 0.1370849609375, 0.161468505859375, 0.18585205078125, 0.210235595703125, 0.234619140625, 0.259002685546875, 0.28338623046875, 0.307769775390625, 0.3321533203125, 0.356536865234375, 0.38092041015625, 0.405303955078125, 0.4296875, 0.454071044921875, 0.47845458984375, 0.502838134765625, 0.5272216796875, 0.551605224609375, 0.57598876953125, 0.600372314453125, 0.624755859375, 0.649139404296875, 0.67352294921875, 0.697906494140625, 0.7222900390625, 0.746673583984375, 0.77105712890625, 0.795440673828125, 0.81982421875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 7.0, 9.0, 10.0, 27.0, 27.0, 26.0, 68.0, 90.0, 135.0, 144.0, 127.0, 91.0, 81.0, 55.0, 26.0, 23.0, 15.0, 7.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015289306640625, -0.014698028564453125, -0.01410675048828125, -0.013515472412109375, -0.0129241943359375, -0.012332916259765625, -0.01174163818359375, -0.011150360107421875, -0.01055908203125, -0.009967803955078125, -0.00937652587890625, -0.008785247802734375, -0.0081939697265625, -0.007602691650390625, -0.00701141357421875, -0.006420135498046875, -0.005828857421875, -0.005237579345703125, -0.00464630126953125, -0.004055023193359375, -0.0034637451171875, -0.002872467041015625, -0.00228118896484375, -0.001689910888671875, -0.0010986328125, -0.000507354736328125, 8.392333984375e-05, 0.000675201416015625, 0.0012664794921875, 0.001857757568359375, 0.00244903564453125, 0.003040313720703125, 0.003631591796875, 0.004222869873046875, 0.00481414794921875, 0.005405426025390625, 0.0059967041015625, 0.006587982177734375, 0.00717926025390625, 0.007770538330078125, 0.00836181640625, 0.008953094482421875, 0.00954437255859375, 0.010135650634765625, 0.0107269287109375, 0.011318206787109375, 0.01190948486328125, 0.012500762939453125, 0.013092041015625, 0.013683319091796875, 0.01427459716796875, 0.014865875244140625, 0.0154571533203125, 0.016048431396484375, 0.01663970947265625, 0.017230987548828125, 0.017822265625, 0.018413543701171875, 0.01900482177734375, 0.019596099853515625, 0.0201873779296875, 0.020778656005859375, 0.02136993408203125, 0.021961212158203125, 0.022552490234375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 5.0, 3.0, 6.0, 7.0, 9.0, 18.0, 17.0, 37.0, 40.0, 93.0, 158.0, 748.0, 92870.0, 951575.0, 2412.0, 257.0, 102.0, 69.0, 39.0, 27.0, 19.0, 15.0, 12.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5159072875976562, -0.5020294189453125, -0.48815155029296875, -0.474273681640625, -0.46039581298828125, -0.4465179443359375, -0.43264007568359375, -0.41876220703125, -0.40488433837890625, -0.3910064697265625, -0.37712860107421875, -0.363250732421875, -0.34937286376953125, -0.3354949951171875, -0.32161712646484375, -0.3077392578125, -0.29386138916015625, -0.2799835205078125, -0.26610565185546875, -0.252227783203125, -0.23834991455078125, -0.2244720458984375, -0.21059417724609375, -0.19671630859375, -0.18283843994140625, -0.1689605712890625, -0.15508270263671875, -0.141204833984375, -0.12732696533203125, -0.1134490966796875, -0.09957122802734375, -0.085693359375, -0.07181549072265625, -0.0579376220703125, -0.04405975341796875, -0.030181884765625, -0.01630401611328125, -0.0024261474609375, 0.01145172119140625, 0.02532958984375, 0.03920745849609375, 0.0530853271484375, 0.06696319580078125, 0.080841064453125, 0.09471893310546875, 0.1085968017578125, 0.12247467041015625, 0.1363525390625, 0.15023040771484375, 0.1641082763671875, 0.17798614501953125, 0.191864013671875, 0.20574188232421875, 0.2196197509765625, 0.23349761962890625, 0.24737548828125, 0.26125335693359375, 0.2751312255859375, 0.28900909423828125, 0.302886962890625, 0.31676483154296875, 0.3306427001953125, 0.34452056884765625, 0.3583984375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 16.0, 25.0, 67.0, 163.0, 460.0, 207.0, 43.0, 12.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11028064042329788, -0.1081043928861618, -0.10592814534902573, -0.10375189781188965, -0.10157565772533417, -0.09939941018819809, -0.09722316265106201, -0.09504691511392593, -0.09287066757678986, -0.09069442003965378, -0.0885181725025177, -0.08634192496538162, -0.08416567742824554, -0.08198943734169006, -0.07981318980455399, -0.07763694226741791, -0.07546069473028183, -0.07328444719314575, -0.07110819965600967, -0.0689319521188736, -0.06675571203231812, -0.06457946449518204, -0.06240321695804596, -0.06022696942090988, -0.058050721883773804, -0.055874474346637726, -0.05369822680950165, -0.05152198299765587, -0.04934573546051979, -0.04716948792338371, -0.04499324411153793, -0.042816996574401855, -0.040640752762556076, -0.03846450522542, -0.03628826141357422, -0.03411201387643814, -0.03193576633930206, -0.029759518802165985, -0.027583273127675056, -0.025407027453184128, -0.02323077991604805, -0.021054532378911972, -0.018878286704421043, -0.016702041029930115, -0.014525793492794037, -0.012349546886980534, -0.01017330028116703, -0.007997053675353527, -0.005820807069540024, -0.0036445604637265205, -0.0014683138579130173, 0.000707932747900486, 0.0028841793537139893, 0.0050604259595274925, 0.007236672565340996, 0.009412919171154499, 0.011589165776968002, 0.013765412382781506, 0.01594165898859501, 0.018117904663085938, 0.020294152200222015, 0.022470399737358093, 0.024646645411849022, 0.02682289108633995, 0.02899913862347603]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 6.0, 7.0, 9.0, 15.0, 12.0, 18.0, 12.0, 14.0, 28.0, 19.0, 28.0, 39.0, 34.0, 40.0, 38.0, 50.0, 31.0, 42.0, 48.0, 36.0, 40.0, 43.0, 32.0, 39.0, 40.0, 29.0, 33.0, 30.0, 18.0, 16.0, 19.0, 27.0, 18.0, 17.0, 14.0, 6.0, 14.0, 7.0, 8.0, 7.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.009732306003570557, -0.009420500136911869, -0.009108694270253181, -0.008796888403594494, -0.008485082536935806, -0.008173276670277119, -0.007861470803618431, -0.0075496649369597435, -0.007237859070301056, -0.006926053203642368, -0.006614247336983681, -0.006302441470324993, -0.0059906356036663055, -0.005678829737007618, -0.00536702387034893, -0.005055218003690243, -0.004743412137031555, -0.004431606270372868, -0.00411980040371418, -0.0038079945370554924, -0.003496188670396805, -0.0031843828037381172, -0.0028725769370794296, -0.002560771070420742, -0.0022489652037620544, -0.0019371593371033669, -0.0016253534704446793, -0.0013135476037859917, -0.001001741737127304, -0.0006899358704686165, -0.0003781300038099289, -6.63241371512413e-05, 0.0002454817295074463, 0.0005572875961661339, 0.0008690934628248215, 0.001180899329483509, 0.0014927051961421967, 0.0018045110628008842, 0.002116316929459572, 0.0024281227961182594, 0.002739928662776947, 0.0030517345294356346, 0.003363540396094322, 0.00367534626275301, 0.003987152129411697, 0.004298957996070385, 0.004610763862729073, 0.00492256972938776, 0.005234375596046448, 0.005546181462705135, 0.005857987329363823, 0.0061697931960225105, 0.006481599062681198, 0.006793404929339886, 0.007105210795998573, 0.007417016662657261, 0.0077288225293159485, 0.008040628395974636, 0.008352434262633324, 0.008664240129292011, 0.008976045995950699, 0.009287851862609386, 0.009599657729268074, 0.009911463595926762, 0.01022326946258545]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 9.0, 10.0, 16.0, 16.0, 16.0, 19.0, 18.0, 25.0, 32.0, 35.0, 46.0, 43.0, 52.0, 51.0, 39.0, 44.0, 38.0, 44.0, 43.0, 40.0, 42.0, 42.0, 34.0, 39.0, 24.0, 22.0, 29.0, 28.0, 21.0, 12.0, 20.0, 9.0, 6.0, 6.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0390625, -10.7198486328125, -10.400634765625, -10.0814208984375, -9.76220703125, -9.4429931640625, -9.123779296875, -8.8045654296875, -8.4853515625, -8.1661376953125, -7.846923828125, -7.5277099609375, -7.20849609375, -6.8892822265625, -6.570068359375, -6.2508544921875, -5.931640625, -5.6124267578125, -5.293212890625, -4.9739990234375, -4.65478515625, -4.3355712890625, -4.016357421875, -3.6971435546875, -3.3779296875, -3.0587158203125, -2.739501953125, -2.4202880859375, -2.10107421875, -1.7818603515625, -1.462646484375, -1.1434326171875, -0.82421875, -0.5050048828125, -0.185791015625, 0.1334228515625, 0.45263671875, 0.7718505859375, 1.091064453125, 1.4102783203125, 1.7294921875, 2.0487060546875, 2.367919921875, 2.6871337890625, 3.00634765625, 3.3255615234375, 3.644775390625, 3.9639892578125, 4.283203125, 4.6024169921875, 4.921630859375, 5.2408447265625, 5.56005859375, 5.8792724609375, 6.198486328125, 6.5177001953125, 6.8369140625, 7.1561279296875, 7.475341796875, 7.7945556640625, 8.11376953125, 8.4329833984375, 8.752197265625, 9.0714111328125, 9.390625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 8.0, 10.0, 12.0, 13.0, 23.0, 38.0, 56.0, 86.0, 125.0, 264.0, 459.0, 701.0, 1426.0, 2471.0, 4924.0, 10442.0, 28483.0, 132774.0, 621418.0, 185472.0, 35325.0, 12228.0, 5436.0, 2799.0, 1504.0, 874.0, 457.0, 248.0, 183.0, 99.0, 60.0, 45.0, 34.0, 16.0, 9.0, 10.0, 7.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.546875, -10.241943359375, -9.93701171875, -9.632080078125, -9.3271484375, -9.022216796875, -8.71728515625, -8.412353515625, -8.107421875, -7.802490234375, -7.49755859375, -7.192626953125, -6.8876953125, -6.582763671875, -6.27783203125, -5.972900390625, -5.66796875, -5.363037109375, -5.05810546875, -4.753173828125, -4.4482421875, -4.143310546875, -3.83837890625, -3.533447265625, -3.228515625, -2.923583984375, -2.61865234375, -2.313720703125, -2.0087890625, -1.703857421875, -1.39892578125, -1.093994140625, -0.7890625, -0.484130859375, -0.17919921875, 0.125732421875, 0.4306640625, 0.735595703125, 1.04052734375, 1.345458984375, 1.650390625, 1.955322265625, 2.26025390625, 2.565185546875, 2.8701171875, 3.175048828125, 3.47998046875, 3.784912109375, 4.08984375, 4.394775390625, 4.69970703125, 5.004638671875, 5.3095703125, 5.614501953125, 5.91943359375, 6.224365234375, 6.529296875, 6.834228515625, 7.13916015625, 7.444091796875, 7.7490234375, 8.053955078125, 8.35888671875, 8.663818359375, 8.96875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 9.0, 5.0, 3.0, 16.0, 17.0, 13.0, 13.0, 18.0, 19.0, 35.0, 37.0, 33.0, 34.0, 36.0, 40.0, 40.0, 55.0, 114.0, 1723.0, 276.0, 63.0, 58.0, 37.0, 47.0, 42.0, 27.0, 34.0, 31.0, 32.0, 25.0, 22.0, 26.0, 8.0, 6.0, 10.0, 6.0, 5.0, 9.0, 6.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.765625, -27.797119140625, -26.82861328125, -25.860107421875, -24.8916015625, -23.923095703125, -22.95458984375, -21.986083984375, -21.017578125, -20.049072265625, -19.08056640625, -18.112060546875, -17.1435546875, -16.175048828125, -15.20654296875, -14.238037109375, -13.26953125, -12.301025390625, -11.33251953125, -10.364013671875, -9.3955078125, -8.427001953125, -7.45849609375, -6.489990234375, -5.521484375, -4.552978515625, -3.58447265625, -2.615966796875, -1.6474609375, -0.678955078125, 0.28955078125, 1.258056640625, 2.2265625, 3.195068359375, 4.16357421875, 5.132080078125, 6.1005859375, 7.069091796875, 8.03759765625, 9.006103515625, 9.974609375, 10.943115234375, 11.91162109375, 12.880126953125, 13.8486328125, 14.817138671875, 15.78564453125, 16.754150390625, 17.72265625, 18.691162109375, 19.65966796875, 20.628173828125, 21.5966796875, 22.565185546875, 23.53369140625, 24.502197265625, 25.470703125, 26.439208984375, 27.40771484375, 28.376220703125, 29.3447265625, 30.313232421875, 31.28173828125, 32.250244140625, 33.21875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 10.0, 9.0, 9.0, 12.0, 13.0, 32.0, 44.0, 55.0, 72.0, 79.0, 117.0, 203.0, 256.0, 472.0, 1671.0, 77881.0, 3058073.0, 5030.0, 656.0, 304.0, 199.0, 125.0, 104.0, 84.0, 30.0, 34.0, 22.0, 22.0, 19.0, 9.0, 10.0, 6.0, 0.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.4375, -74.873046875, -72.30859375, -69.744140625, -67.1796875, -64.615234375, -62.05078125, -59.486328125, -56.921875, -54.357421875, -51.79296875, -49.228515625, -46.6640625, -44.099609375, -41.53515625, -38.970703125, -36.40625, -33.841796875, -31.27734375, -28.712890625, -26.1484375, -23.583984375, -21.01953125, -18.455078125, -15.890625, -13.326171875, -10.76171875, -8.197265625, -5.6328125, -3.068359375, -0.50390625, 2.060546875, 4.625, 7.189453125, 9.75390625, 12.318359375, 14.8828125, 17.447265625, 20.01171875, 22.576171875, 25.140625, 27.705078125, 30.26953125, 32.833984375, 35.3984375, 37.962890625, 40.52734375, 43.091796875, 45.65625, 48.220703125, 50.78515625, 53.349609375, 55.9140625, 58.478515625, 61.04296875, 63.607421875, 66.171875, 68.736328125, 71.30078125, 73.865234375, 76.4296875, 78.994140625, 81.55859375, 84.123046875, 86.6875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [2.0, 4.0, 7.0, 7.0, 12.0, 30.0, 32.0, 43.0, 70.0, 81.0, 99.0, 111.0, 110.0, 97.0, 73.0, 73.0, 58.0, 40.0, 32.0, 12.0, 8.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.293408393859863, -7.600240230560303, -6.9070725440979, -6.21390438079834, -5.5207366943359375, -4.827568531036377, -4.134400367736816, -3.441232681274414, -2.7480645179748535, -2.054896593093872, -1.361728549003601, -0.6685605049133301, 0.024607419967651367, 0.7177753448486328, 1.4109435081481934, 2.1041111946105957, 2.7972793579101562, 3.4904472827911377, 4.183615207672119, 4.87678337097168, 5.569951057434082, 6.263119220733643, 6.956287384033203, 7.6494550704956055, 8.342622756958008, 9.03579044342041, 9.728959083557129, 10.422126770019531, 11.115294456481934, 11.808462142944336, 12.501630783081055, 13.194798469543457, 13.887968063354492, 14.581135749816895, 15.274304389953613, 15.967472076416016, 16.660640716552734, 17.35380744934082, 18.04697608947754, 18.740142822265625, 19.433311462402344, 20.126480102539062, 20.81964683532715, 21.512815475463867, 22.205984115600586, 22.899150848388672, 23.59231948852539, 24.28548812866211, 24.978656768798828, 25.671825408935547, 26.364992141723633, 27.05816078186035, 27.75132942199707, 28.444496154785156, 29.137664794921875, 29.830833435058594, 30.52400016784668, 31.2171688079834, 31.910335540771484, 32.6035041809082, 33.29667282104492, 33.98984146118164, 34.683006286621094, 35.37617492675781, 36.06934356689453]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 8.0, 3.0, 5.0, 4.0, 6.0, 15.0, 11.0, 10.0, 14.0, 13.0, 23.0, 23.0, 22.0, 29.0, 32.0, 32.0, 30.0, 35.0, 39.0, 43.0, 38.0, 51.0, 45.0, 45.0, 37.0, 39.0, 35.0, 24.0, 31.0, 33.0, 28.0, 26.0, 27.0, 19.0, 18.0, 22.0, 13.0, 12.0, 10.0, 12.0, 12.0, 6.0, 10.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.42304992675781, -79.01300811767578, -76.60296630859375, -74.19292449951172, -71.78288269042969, -69.37284088134766, -66.96279907226562, -64.5527572631836, -62.14271545410156, -59.73267364501953, -57.3226318359375, -54.91259002685547, -52.50254821777344, -50.092506408691406, -47.682464599609375, -45.272422790527344, -42.86237716674805, -40.452335357666016, -38.042293548583984, -35.63225173950195, -33.22220993041992, -30.81216812133789, -28.402124404907227, -25.992082595825195, -23.582040786743164, -21.171998977661133, -18.7619571685791, -16.351913452148438, -13.941872596740723, -11.531830787658691, -9.121788024902344, -6.7117462158203125, -4.301704406738281, -1.891662359237671, 0.5183796882629395, 2.928421974182129, 5.33846378326416, 7.748505592346191, 10.158548355102539, 12.56859016418457, 14.978631973266602, 17.388673782348633, 19.798715591430664, 22.208759307861328, 24.61880111694336, 27.02884292602539, 29.438884735107422, 31.848926544189453, 34.258968353271484, 36.669010162353516, 39.07905197143555, 41.48909378051758, 43.89913558959961, 46.30917739868164, 48.71922302246094, 51.12926483154297, 53.539306640625, 55.94934844970703, 58.35939025878906, 60.769432067871094, 63.179473876953125, 65.58951568603516, 67.99955749511719, 70.40959930419922, 72.81964111328125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 9.0, 5.0, 7.0, 13.0, 16.0, 11.0, 16.0, 23.0, 15.0, 31.0, 30.0, 47.0, 46.0, 48.0, 45.0, 47.0, 49.0, 45.0, 46.0, 38.0, 45.0, 37.0, 33.0, 38.0, 40.0, 28.0, 27.0, 33.0, 25.0, 28.0, 17.0, 17.0, 12.0, 6.0, 6.0, 8.0, 7.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.515625, -11.178466796875, -10.84130859375, -10.504150390625, -10.1669921875, -9.829833984375, -9.49267578125, -9.155517578125, -8.818359375, -8.481201171875, -8.14404296875, -7.806884765625, -7.4697265625, -7.132568359375, -6.79541015625, -6.458251953125, -6.12109375, -5.783935546875, -5.44677734375, -5.109619140625, -4.7724609375, -4.435302734375, -4.09814453125, -3.760986328125, -3.423828125, -3.086669921875, -2.74951171875, -2.412353515625, -2.0751953125, -1.738037109375, -1.40087890625, -1.063720703125, -0.7265625, -0.389404296875, -0.05224609375, 0.284912109375, 0.6220703125, 0.959228515625, 1.29638671875, 1.633544921875, 1.970703125, 2.307861328125, 2.64501953125, 2.982177734375, 3.3193359375, 3.656494140625, 3.99365234375, 4.330810546875, 4.66796875, 5.005126953125, 5.34228515625, 5.679443359375, 6.0166015625, 6.353759765625, 6.69091796875, 7.028076171875, 7.365234375, 7.702392578125, 8.03955078125, 8.376708984375, 8.7138671875, 9.051025390625, 9.38818359375, 9.725341796875, 10.0625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 7.0, 5.0, 4.0, 6.0, 15.0, 17.0, 25.0, 14.0, 25.0, 37.0, 45.0, 66.0, 90.0, 119.0, 216.0, 384.0, 816.0, 1873.0, 5604.0, 21779.0, 124806.0, 1002876.0, 2364229.0, 574881.0, 74521.0, 14562.0, 4133.0, 1475.0, 639.0, 343.0, 170.0, 135.0, 84.0, 66.0, 50.0, 47.0, 32.0, 19.0, 21.0, 10.0, 7.0, 11.0, 4.0, 6.0, 1.0, 6.0, 3.0, 2.0, 1.0, 2.0], "bins": [-23.4375, -22.79296875, -22.1484375, -21.50390625, -20.859375, -20.21484375, -19.5703125, -18.92578125, -18.28125, -17.63671875, -16.9921875, -16.34765625, -15.703125, -15.05859375, -14.4140625, -13.76953125, -13.125, -12.48046875, -11.8359375, -11.19140625, -10.546875, -9.90234375, -9.2578125, -8.61328125, -7.96875, -7.32421875, -6.6796875, -6.03515625, -5.390625, -4.74609375, -4.1015625, -3.45703125, -2.8125, -2.16796875, -1.5234375, -0.87890625, -0.234375, 0.41015625, 1.0546875, 1.69921875, 2.34375, 2.98828125, 3.6328125, 4.27734375, 4.921875, 5.56640625, 6.2109375, 6.85546875, 7.5, 8.14453125, 8.7890625, 9.43359375, 10.078125, 10.72265625, 11.3671875, 12.01171875, 12.65625, 13.30078125, 13.9453125, 14.58984375, 15.234375, 15.87890625, 16.5234375, 17.16796875, 17.8125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 10.0, 17.0, 20.0, 24.0, 37.0, 64.0, 85.0, 145.0, 198.0, 245.0, 405.0, 598.0, 615.0, 517.0, 362.0, 257.0, 171.0, 89.0, 74.0, 56.0, 19.0, 17.0, 18.0, 16.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.453125, -30.671875, -29.890625, -29.109375, -28.328125, -27.546875, -26.765625, -25.984375, -25.203125, -24.421875, -23.640625, -22.859375, -22.078125, -21.296875, -20.515625, -19.734375, -18.953125, -18.171875, -17.390625, -16.609375, -15.828125, -15.046875, -14.265625, -13.484375, -12.703125, -11.921875, -11.140625, -10.359375, -9.578125, -8.796875, -8.015625, -7.234375, -6.453125, -5.671875, -4.890625, -4.109375, -3.328125, -2.546875, -1.765625, -0.984375, -0.203125, 0.578125, 1.359375, 2.140625, 2.921875, 3.703125, 4.484375, 5.265625, 6.046875, 6.828125, 7.609375, 8.390625, 9.171875, 9.953125, 10.734375, 11.515625, 12.296875, 13.078125, 13.859375, 14.640625, 15.421875, 16.203125, 16.984375, 17.765625, 18.546875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 7.0, 20.0, 11.0, 19.0, 31.0, 42.0, 66.0, 102.0, 145.0, 219.0, 304.0, 619.0, 1694.0, 54062.0, 3996453.0, 136506.0, 2333.0, 547.0, 349.0, 232.0, 150.0, 105.0, 83.0, 51.0, 37.0, 22.0, 18.0, 19.0, 8.0, 9.0, 8.0, 3.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.375, -68.5849609375, -65.794921875, -63.0048828125, -60.21484375, -57.4248046875, -54.634765625, -51.8447265625, -49.0546875, -46.2646484375, -43.474609375, -40.6845703125, -37.89453125, -35.1044921875, -32.314453125, -29.5244140625, -26.734375, -23.9443359375, -21.154296875, -18.3642578125, -15.57421875, -12.7841796875, -9.994140625, -7.2041015625, -4.4140625, -1.6240234375, 1.166015625, 3.9560546875, 6.74609375, 9.5361328125, 12.326171875, 15.1162109375, 17.90625, 20.6962890625, 23.486328125, 26.2763671875, 29.06640625, 31.8564453125, 34.646484375, 37.4365234375, 40.2265625, 43.0166015625, 45.806640625, 48.5966796875, 51.38671875, 54.1767578125, 56.966796875, 59.7568359375, 62.546875, 65.3369140625, 68.126953125, 70.9169921875, 73.70703125, 76.4970703125, 79.287109375, 82.0771484375, 84.8671875, 87.6572265625, 90.447265625, 93.2373046875, 96.02734375, 98.8173828125, 101.607421875, 104.3974609375, 107.1875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 17.0, 22.0, 39.0, 60.0, 73.0, 81.0, 114.0, 104.0, 112.0, 106.0, 79.0, 64.0, 48.0, 33.0, 21.0, 12.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.5018539428711, -95.68376159667969, -92.86566925048828, -90.04757690429688, -87.22948455810547, -84.41139221191406, -81.59329223632812, -78.77520751953125, -75.95710754394531, -73.1390151977539, -70.3209228515625, -67.5028305053711, -64.68473815917969, -61.86664581298828, -59.04854965209961, -56.2304573059082, -53.41236877441406, -50.594276428222656, -47.77618408203125, -44.958091735839844, -42.13999938964844, -39.32190704345703, -36.50381088256836, -33.68571853637695, -30.867626190185547, -28.04953384399414, -25.231441497802734, -22.413347244262695, -19.59525489807129, -16.777162551879883, -13.959068298339844, -11.140975952148438, -8.322891235351562, -5.504798412322998, -2.6867055892944336, 0.13138771057128906, 2.9494800567626953, 5.767572402954102, 8.58566665649414, 11.403759002685547, 14.221851348876953, 17.03994369506836, 19.858036041259766, 22.676130294799805, 25.49422264099121, 28.312314987182617, 31.130409240722656, 33.94850158691406, 36.76659393310547, 39.584686279296875, 42.40277862548828, 45.22087097167969, 48.038963317871094, 50.8570556640625, 53.67515182495117, 56.49324417114258, 59.311336517333984, 62.12942886352539, 64.94752502441406, 67.76561737060547, 70.58370971679688, 73.40180206298828, 76.21989440917969, 79.0379867553711, 81.8560791015625]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 11.0, 11.0, 9.0, 11.0, 14.0, 20.0, 22.0, 19.0, 28.0, 23.0, 36.0, 20.0, 35.0, 37.0, 34.0, 46.0, 43.0, 37.0, 44.0, 44.0, 36.0, 33.0, 34.0, 28.0, 38.0, 38.0, 23.0, 28.0, 31.0, 28.0, 25.0, 14.0, 15.0, 11.0, 12.0, 11.0, 8.0, 8.0, 10.0, 7.0, 2.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.1654052734375, -53.2896728515625, -51.413944244384766, -49.538211822509766, -47.66248321533203, -45.78675079345703, -43.91101837158203, -42.03528594970703, -40.1595573425293, -38.2838249206543, -36.40809631347656, -34.53236389160156, -32.65663146972656, -30.780902862548828, -28.905170440673828, -27.02943992614746, -25.153709411621094, -23.277978897094727, -21.40224838256836, -19.52651596069336, -17.650785446166992, -15.775054931640625, -13.899323463439941, -12.023591995239258, -10.14786148071289, -8.272130966186523, -6.39639949798584, -4.5206685066223145, -2.644937515258789, -0.7692070007324219, 1.1065244674682617, 2.9822559356689453, 4.8579864501953125, 6.733717441558838, 8.609448432922363, 10.485179901123047, 12.360910415649414, 14.236640930175781, 16.11237335205078, 17.98810386657715, 19.863834381103516, 21.739564895629883, 23.61529541015625, 25.49102783203125, 27.366758346557617, 29.242488861083984, 31.118221282958984, 32.99394989013672, 34.86968231201172, 36.74541473388672, 38.62114334106445, 40.49687576293945, 42.37260437011719, 44.24833679199219, 46.12406921386719, 47.99980163574219, 49.87553024291992, 51.75126266479492, 53.626991271972656, 55.502723693847656, 57.378456115722656, 59.25418472290039, 61.12991714477539, 63.005645751953125, 64.88137817382812]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 10.0, 14.0, 10.0, 20.0, 22.0, 17.0, 24.0, 28.0, 35.0, 42.0, 44.0, 35.0, 54.0, 51.0, 51.0, 45.0, 35.0, 52.0, 49.0, 42.0, 41.0, 35.0, 35.0, 34.0, 32.0, 30.0, 20.0, 11.0, 18.0, 20.0, 11.0, 9.0, 6.0, 3.0, 1.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8125, -11.4732666015625, -11.134033203125, -10.7947998046875, -10.45556640625, -10.1163330078125, -9.777099609375, -9.4378662109375, -9.0986328125, -8.7593994140625, -8.420166015625, -8.0809326171875, -7.74169921875, -7.4024658203125, -7.063232421875, -6.7239990234375, -6.384765625, -6.0455322265625, -5.706298828125, -5.3670654296875, -5.02783203125, -4.6885986328125, -4.349365234375, -4.0101318359375, -3.6708984375, -3.3316650390625, -2.992431640625, -2.6531982421875, -2.31396484375, -1.9747314453125, -1.635498046875, -1.2962646484375, -0.95703125, -0.6177978515625, -0.278564453125, 0.0606689453125, 0.39990234375, 0.7391357421875, 1.078369140625, 1.4176025390625, 1.7568359375, 2.0960693359375, 2.435302734375, 2.7745361328125, 3.11376953125, 3.4530029296875, 3.792236328125, 4.1314697265625, 4.470703125, 4.8099365234375, 5.149169921875, 5.4884033203125, 5.82763671875, 6.1668701171875, 6.506103515625, 6.8453369140625, 7.1845703125, 7.5238037109375, 7.863037109375, 8.2022705078125, 8.54150390625, 8.8807373046875, 9.219970703125, 9.5592041015625, 9.8984375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 1.0, 6.0, 14.0, 21.0, 27.0, 32.0, 55.0, 76.0, 115.0, 178.0, 256.0, 353.0, 541.0, 725.0, 1163.0, 1745.0, 2536.0, 3859.0, 5742.0, 8691.0, 13148.0, 20785.0, 33923.0, 56898.0, 98318.0, 154748.0, 194485.0, 169456.0, 110757.0, 64646.0, 38220.0, 23518.0, 14699.0, 9659.0, 6274.0, 4254.0, 2808.0, 1922.0, 1202.0, 890.0, 585.0, 377.0, 275.0, 164.0, 161.0, 78.0, 64.0, 41.0, 20.0, 20.0, 12.0, 5.0, 8.0, 4.0, 0.0, 1.0, 3.0, 1.0], "bins": [-1.0517578125, -1.0195159912109375, -0.987274169921875, -0.9550323486328125, -0.92279052734375, -0.8905487060546875, -0.858306884765625, -0.8260650634765625, -0.7938232421875, -0.7615814208984375, -0.729339599609375, -0.6970977783203125, -0.66485595703125, -0.6326141357421875, -0.600372314453125, -0.5681304931640625, -0.535888671875, -0.5036468505859375, -0.471405029296875, -0.4391632080078125, -0.40692138671875, -0.3746795654296875, -0.342437744140625, -0.3101959228515625, -0.2779541015625, -0.2457122802734375, -0.213470458984375, -0.1812286376953125, -0.14898681640625, -0.1167449951171875, -0.084503173828125, -0.0522613525390625, -0.02001953125, 0.0122222900390625, 0.044464111328125, 0.0767059326171875, 0.10894775390625, 0.1411895751953125, 0.173431396484375, 0.2056732177734375, 0.2379150390625, 0.2701568603515625, 0.302398681640625, 0.3346405029296875, 0.36688232421875, 0.3991241455078125, 0.431365966796875, 0.4636077880859375, 0.495849609375, 0.5280914306640625, 0.560333251953125, 0.5925750732421875, 0.62481689453125, 0.6570587158203125, 0.689300537109375, 0.7215423583984375, 0.7537841796875, 0.7860260009765625, 0.818267822265625, 0.8505096435546875, 0.88275146484375, 0.9149932861328125, 0.947235107421875, 0.9794769287109375, 1.01171875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 10.0, 9.0, 7.0, 15.0, 13.0, 19.0, 13.0, 21.0, 20.0, 29.0, 40.0, 33.0, 46.0, 44.0, 39.0, 56.0, 43.0, 1055.0, 44.0, 44.0, 42.0, 37.0, 50.0, 27.0, 42.0, 45.0, 30.0, 32.0, 18.0, 21.0, 17.0, 14.0, 8.0, 7.0, 9.0, 10.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.53125, -7.31561279296875, -7.0999755859375, -6.88433837890625, -6.668701171875, -6.45306396484375, -6.2374267578125, -6.02178955078125, -5.80615234375, -5.59051513671875, -5.3748779296875, -5.15924072265625, -4.943603515625, -4.72796630859375, -4.5123291015625, -4.29669189453125, -4.0810546875, -3.86541748046875, -3.6497802734375, -3.43414306640625, -3.218505859375, -3.00286865234375, -2.7872314453125, -2.57159423828125, -2.35595703125, -2.14031982421875, -1.9246826171875, -1.70904541015625, -1.493408203125, -1.27777099609375, -1.0621337890625, -0.84649658203125, -0.630859375, -0.41522216796875, -0.1995849609375, 0.01605224609375, 0.231689453125, 0.44732666015625, 0.6629638671875, 0.87860107421875, 1.09423828125, 1.30987548828125, 1.5255126953125, 1.74114990234375, 1.956787109375, 2.17242431640625, 2.3880615234375, 2.60369873046875, 2.8193359375, 3.03497314453125, 3.2506103515625, 3.46624755859375, 3.681884765625, 3.89752197265625, 4.1131591796875, 4.32879638671875, 4.54443359375, 4.76007080078125, 4.9757080078125, 5.19134521484375, 5.406982421875, 5.62261962890625, 5.8382568359375, 6.05389404296875, 6.26953125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 16.0, 23.0, 31.0, 42.0, 79.0, 107.0, 190.0, 292.0, 482.0, 787.0, 1424.0, 2223.0, 3789.0, 6215.0, 10215.0, 17874.0, 31736.0, 56218.0, 98656.0, 156007.0, 1244275.0, 181561.0, 119786.0, 70725.0, 39677.0, 22424.0, 12984.0, 7670.0, 4490.0, 2778.0, 1697.0, 1063.0, 594.0, 377.0, 238.0, 141.0, 95.0, 53.0, 37.0, 20.0, 13.0, 8.0, 6.0, 6.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.9130859375, -0.88751220703125, -0.8619384765625, -0.83636474609375, -0.810791015625, -0.78521728515625, -0.7596435546875, -0.73406982421875, -0.70849609375, -0.68292236328125, -0.6573486328125, -0.63177490234375, -0.606201171875, -0.58062744140625, -0.5550537109375, -0.52947998046875, -0.50390625, -0.47833251953125, -0.4527587890625, -0.42718505859375, -0.401611328125, -0.37603759765625, -0.3504638671875, -0.32489013671875, -0.29931640625, -0.27374267578125, -0.2481689453125, -0.22259521484375, -0.197021484375, -0.17144775390625, -0.1458740234375, -0.12030029296875, -0.0947265625, -0.06915283203125, -0.0435791015625, -0.01800537109375, 0.007568359375, 0.03314208984375, 0.0587158203125, 0.08428955078125, 0.10986328125, 0.13543701171875, 0.1610107421875, 0.18658447265625, 0.212158203125, 0.23773193359375, 0.2633056640625, 0.28887939453125, 0.314453125, 0.34002685546875, 0.3656005859375, 0.39117431640625, 0.416748046875, 0.44232177734375, 0.4678955078125, 0.49346923828125, 0.51904296875, 0.54461669921875, 0.5701904296875, 0.59576416015625, 0.621337890625, 0.64691162109375, 0.6724853515625, 0.69805908203125, 0.7236328125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 4.0, 9.0, 10.0, 6.0, 8.0, 24.0, 21.0, 29.0, 41.0, 48.0, 54.0, 78.0, 73.0, 77.0, 97.0, 73.0, 58.0, 50.0, 39.0, 35.0, 35.0, 20.0, 13.0, 22.0, 7.0, 8.0, 10.0, 7.0, 7.0, 3.0, 2.0, 3.0, 4.0, 3.0, 0.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.0169830322265625, -0.016495585441589355, -0.01600813865661621, -0.015520691871643066, -0.015033245086669922, -0.014545798301696777, -0.014058351516723633, -0.013570904731750488, -0.013083457946777344, -0.0125960111618042, -0.012108564376831055, -0.01162111759185791, -0.011133670806884766, -0.010646224021911621, -0.010158777236938477, -0.009671330451965332, -0.009183883666992188, -0.008696436882019043, -0.008208990097045898, -0.007721543312072754, -0.007234096527099609, -0.006746649742126465, -0.00625920295715332, -0.005771756172180176, -0.005284309387207031, -0.004796862602233887, -0.004309415817260742, -0.0038219690322875977, -0.003334522247314453, -0.0028470754623413086, -0.002359628677368164, -0.0018721818923950195, -0.001384735107421875, -0.0008972883224487305, -0.00040984153747558594, 7.76052474975586e-05, 0.0005650520324707031, 0.0010524988174438477, 0.0015399456024169922, 0.0020273923873901367, 0.0025148391723632812, 0.0030022859573364258, 0.0034897327423095703, 0.003977179527282715, 0.004464626312255859, 0.004952073097229004, 0.0054395198822021484, 0.005926966667175293, 0.0064144134521484375, 0.006901860237121582, 0.0073893070220947266, 0.007876753807067871, 0.008364200592041016, 0.00885164737701416, 0.009339094161987305, 0.00982654094696045, 0.010313987731933594, 0.010801434516906738, 0.011288881301879883, 0.011776328086853027, 0.012263774871826172, 0.012751221656799316, 0.013238668441772461, 0.013726115226745605, 0.01421356201171875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 11.0, 12.0, 9.0, 13.0, 29.0, 26.0, 30.0, 34.0, 54.0, 65.0, 112.0, 209.0, 581.0, 29919.0, 1010696.0, 5823.0, 421.0, 147.0, 95.0, 54.0, 38.0, 38.0, 30.0, 18.0, 15.0, 13.0, 5.0, 5.0, 4.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.347412109375, -0.3355751037597656, -0.32373809814453125, -0.3119010925292969, -0.3000640869140625, -0.2882270812988281, -0.27639007568359375, -0.2645530700683594, -0.252716064453125, -0.24087905883789062, -0.22904205322265625, -0.21720504760742188, -0.2053680419921875, -0.19353103637695312, -0.18169403076171875, -0.16985702514648438, -0.15802001953125, -0.14618301391601562, -0.13434600830078125, -0.12250900268554688, -0.1106719970703125, -0.09883499145507812, -0.08699798583984375, -0.07516098022460938, -0.063323974609375, -0.051486968994140625, -0.03964996337890625, -0.027812957763671875, -0.0159759521484375, -0.004138946533203125, 0.00769805908203125, 0.019535064697265625, 0.0313720703125, 0.043209075927734375, 0.05504608154296875, 0.06688308715820312, 0.0787200927734375, 0.09055709838867188, 0.10239410400390625, 0.11423110961914062, 0.126068115234375, 0.13790512084960938, 0.14974212646484375, 0.16157913208007812, 0.1734161376953125, 0.18525314331054688, 0.19709014892578125, 0.20892715454101562, 0.22076416015625, 0.23260116577148438, 0.24443817138671875, 0.2562751770019531, 0.2681121826171875, 0.2799491882324219, 0.29178619384765625, 0.3036231994628906, 0.315460205078125, 0.3272972106933594, 0.33913421630859375, 0.3509712219238281, 0.3628082275390625, 0.3746452331542969, 0.38648223876953125, 0.3983192443847656, 0.41015625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 15.0, 58.0, 604.0, 316.0, 19.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12497041374444962, -0.12049411982297897, -0.11601781845092773, -0.11154152452945709, -0.10706523060798645, -0.10258892923593521, -0.09811263531446457, -0.09363633394241333, -0.08916004002094269, -0.08468374609947205, -0.0802074447274208, -0.07573115080595016, -0.07125484943389893, -0.06677855551242828, -0.06230226159095764, -0.0578259639441967, -0.05334966629743576, -0.04887336865067482, -0.04439707100391388, -0.03992077708244324, -0.0354444794356823, -0.030968181788921356, -0.026491886004805565, -0.022015590220689774, -0.017539292573928833, -0.013062995858490467, -0.008586699143052101, -0.004110402427613735, 0.00036589428782463074, 0.004842191934585571, 0.009318487718701363, 0.013794783502817154, 0.01827108860015869, 0.022747386246919632, 0.027223682031035423, 0.031699977815151215, 0.036176275461912155, 0.040652573108673096, 0.04512886703014374, 0.04960516467690468, 0.05408146232366562, 0.05855775997042656, 0.0630340576171875, 0.06751035153865814, 0.07198664546012878, 0.07646294683218002, 0.08093924075365067, 0.0854155421257019, 0.08989183604717255, 0.09436812996864319, 0.09884443134069443, 0.10332072526216507, 0.10779702663421631, 0.11227332055568695, 0.11674961447715759, 0.12122590839862823, 0.12570220232009888, 0.13017849624156952, 0.13465479016304016, 0.139131098985672, 0.14360739290714264, 0.14808368682861328, 0.15255998075008392, 0.15703627467155457, 0.1615125834941864]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 11.0, 6.0, 5.0, 15.0, 20.0, 20.0, 19.0, 27.0, 31.0, 38.0, 44.0, 46.0, 43.0, 41.0, 48.0, 56.0, 38.0, 40.0, 50.0, 37.0, 43.0, 46.0, 36.0, 43.0, 30.0, 31.0, 33.0, 25.0, 14.0, 10.0, 14.0, 12.0, 6.0, 7.0, 1.0, 2.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.018219470977783203, -0.017660925164818764, -0.017102379351854324, -0.016543833538889885, -0.015985287725925446, -0.015426741912961006, -0.014868196099996567, -0.014309650287032127, -0.013751104474067688, -0.013192558661103249, -0.01263401284813881, -0.01207546703517437, -0.01151692122220993, -0.010958375409245491, -0.010399829596281052, -0.009841283783316612, -0.009282737970352173, -0.008724192157387733, -0.008165646344423294, -0.007607100531458855, -0.007048554718494415, -0.006490008905529976, -0.0059314630925655365, -0.005372917279601097, -0.004814371466636658, -0.004255825653672218, -0.003697279840707779, -0.0031387340277433395, -0.0025801882147789, -0.0020216424018144608, -0.0014630965888500214, -0.000904550775885582, -0.0003460049629211426, 0.00021254085004329681, 0.0007710866630077362, 0.0013296324759721756, 0.001888178288936615, 0.0024467241019010544, 0.0030052699148654938, 0.003563815727829933, 0.0041223615407943726, 0.004680907353758812, 0.005239453166723251, 0.005797998979687691, 0.00635654479265213, 0.0069150906056165695, 0.007473636418581009, 0.008032182231545448, 0.008590728044509888, 0.009149273857474327, 0.009707819670438766, 0.010266365483403206, 0.010824911296367645, 0.011383457109332085, 0.011942002922296524, 0.012500548735260963, 0.013059094548225403, 0.013617640361189842, 0.014176186174154282, 0.014734731987118721, 0.01529327780008316, 0.0158518236130476, 0.01641036942601204, 0.01696891523897648, 0.017527461051940918]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 10.0, 14.0, 10.0, 20.0, 22.0, 17.0, 24.0, 28.0, 35.0, 42.0, 44.0, 35.0, 55.0, 50.0, 51.0, 44.0, 36.0, 52.0, 49.0, 42.0, 42.0, 34.0, 35.0, 34.0, 32.0, 30.0, 20.0, 11.0, 18.0, 20.0, 11.0, 9.0, 6.0, 3.0, 1.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8125, -11.4732666015625, -11.134033203125, -10.7947998046875, -10.45556640625, -10.1163330078125, -9.777099609375, -9.4378662109375, -9.0986328125, -8.7593994140625, -8.420166015625, -8.0809326171875, -7.74169921875, -7.4024658203125, -7.063232421875, -6.7239990234375, -6.384765625, -6.0455322265625, -5.706298828125, -5.3670654296875, -5.02783203125, -4.6885986328125, -4.349365234375, -4.0101318359375, -3.6708984375, -3.3316650390625, -2.992431640625, -2.6531982421875, -2.31396484375, -1.9747314453125, -1.635498046875, -1.2962646484375, -0.95703125, -0.6177978515625, -0.278564453125, 0.0606689453125, 0.39990234375, 0.7391357421875, 1.078369140625, 1.4176025390625, 1.7568359375, 2.0960693359375, 2.435302734375, 2.7745361328125, 3.11376953125, 3.4530029296875, 3.792236328125, 4.1314697265625, 4.470703125, 4.8099365234375, 5.149169921875, 5.4884033203125, 5.82763671875, 6.1668701171875, 6.506103515625, 6.8453369140625, 7.1845703125, 7.5238037109375, 7.863037109375, 8.2022705078125, 8.54150390625, 8.8807373046875, 9.219970703125, 9.5592041015625, 9.8984375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 11.0, 15.0, 23.0, 48.0, 68.0, 121.0, 188.0, 282.0, 433.0, 768.0, 1369.0, 2550.0, 4628.0, 8469.0, 16099.0, 31501.0, 66543.0, 155666.0, 365028.0, 220273.0, 88868.0, 41370.0, 20348.0, 10775.0, 5745.0, 3111.0, 1752.0, 1020.0, 572.0, 340.0, 192.0, 117.0, 86.0, 53.0, 38.0, 17.0, 21.0, 10.0, 9.0, 6.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.6746826171875, -6.470458984375, -6.2662353515625, -6.06201171875, -5.8577880859375, -5.653564453125, -5.4493408203125, -5.2451171875, -5.0408935546875, -4.836669921875, -4.6324462890625, -4.42822265625, -4.2239990234375, -4.019775390625, -3.8155517578125, -3.611328125, -3.4071044921875, -3.202880859375, -2.9986572265625, -2.79443359375, -2.5902099609375, -2.385986328125, -2.1817626953125, -1.9775390625, -1.7733154296875, -1.569091796875, -1.3648681640625, -1.16064453125, -0.9564208984375, -0.752197265625, -0.5479736328125, -0.34375, -0.1395263671875, 0.064697265625, 0.2689208984375, 0.47314453125, 0.6773681640625, 0.881591796875, 1.0858154296875, 1.2900390625, 1.4942626953125, 1.698486328125, 1.9027099609375, 2.10693359375, 2.3111572265625, 2.515380859375, 2.7196044921875, 2.923828125, 3.1280517578125, 3.332275390625, 3.5364990234375, 3.74072265625, 3.9449462890625, 4.149169921875, 4.3533935546875, 4.5576171875, 4.7618408203125, 4.966064453125, 5.1702880859375, 5.37451171875, 5.5787353515625, 5.782958984375, 5.9871826171875, 6.19140625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 7.0, 13.0, 9.0, 15.0, 20.0, 16.0, 15.0, 16.0, 22.0, 30.0, 27.0, 28.0, 33.0, 47.0, 49.0, 52.0, 106.0, 259.0, 1578.0, 178.0, 91.0, 69.0, 54.0, 36.0, 42.0, 36.0, 25.0, 27.0, 26.0, 17.0, 19.0, 18.0, 12.0, 17.0, 4.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.34375, -33.3447265625, -32.345703125, -31.3466796875, -30.34765625, -29.3486328125, -28.349609375, -27.3505859375, -26.3515625, -25.3525390625, -24.353515625, -23.3544921875, -22.35546875, -21.3564453125, -20.357421875, -19.3583984375, -18.359375, -17.3603515625, -16.361328125, -15.3623046875, -14.36328125, -13.3642578125, -12.365234375, -11.3662109375, -10.3671875, -9.3681640625, -8.369140625, -7.3701171875, -6.37109375, -5.3720703125, -4.373046875, -3.3740234375, -2.375, -1.3759765625, -0.376953125, 0.6220703125, 1.62109375, 2.6201171875, 3.619140625, 4.6181640625, 5.6171875, 6.6162109375, 7.615234375, 8.6142578125, 9.61328125, 10.6123046875, 11.611328125, 12.6103515625, 13.609375, 14.6083984375, 15.607421875, 16.6064453125, 17.60546875, 18.6044921875, 19.603515625, 20.6025390625, 21.6015625, 22.6005859375, 23.599609375, 24.5986328125, 25.59765625, 26.5966796875, 27.595703125, 28.5947265625, 29.59375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 1.0, 3.0, 3.0, 5.0, 12.0, 11.0, 17.0, 21.0, 37.0, 52.0, 56.0, 92.0, 151.0, 204.0, 273.0, 470.0, 1774.0, 282423.0, 2855166.0, 3445.0, 512.0, 296.0, 197.0, 138.0, 94.0, 52.0, 55.0, 38.0, 30.0, 24.0, 17.0, 15.0, 7.0, 4.0, 1.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.0625, -100.0419921875, -97.021484375, -94.0009765625, -90.98046875, -87.9599609375, -84.939453125, -81.9189453125, -78.8984375, -75.8779296875, -72.857421875, -69.8369140625, -66.81640625, -63.7958984375, -60.775390625, -57.7548828125, -54.734375, -51.7138671875, -48.693359375, -45.6728515625, -42.65234375, -39.6318359375, -36.611328125, -33.5908203125, -30.5703125, -27.5498046875, -24.529296875, -21.5087890625, -18.48828125, -15.4677734375, -12.447265625, -9.4267578125, -6.40625, -3.3857421875, -0.365234375, 2.6552734375, 5.67578125, 8.6962890625, 11.716796875, 14.7373046875, 17.7578125, 20.7783203125, 23.798828125, 26.8193359375, 29.83984375, 32.8603515625, 35.880859375, 38.9013671875, 41.921875, 44.9423828125, 47.962890625, 50.9833984375, 54.00390625, 57.0244140625, 60.044921875, 63.0654296875, 66.0859375, 69.1064453125, 72.126953125, 75.1474609375, 78.16796875, 81.1884765625, 84.208984375, 87.2294921875, 90.25]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 9.0, 206.0, 656.0, 144.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.7839241027832, -28.421607971191406, -22.05929183959961, -15.696977615356445, -9.334661483764648, -2.9723453521728516, 3.3899688720703125, 9.75228500366211, 16.114601135253906, 22.476917266845703, 28.8392333984375, 35.20154571533203, 41.563865661621094, 47.926177978515625, 54.28849411010742, 60.65081024169922, 67.01312255859375, 73.37543487548828, 79.73775482177734, 86.10006713867188, 92.46238708496094, 98.82469940185547, 105.18701171875, 111.54933166503906, 117.91165161132812, 124.27396392822266, 130.6362762451172, 136.99859619140625, 143.3609161376953, 149.72323608398438, 156.08554077148438, 162.44786071777344, 168.81016540527344, 175.1724853515625, 181.5347900390625, 187.89710998535156, 194.25942993164062, 200.6217498779297, 206.9840545654297, 213.34637451171875, 219.7086944580078, 226.07101440429688, 232.43331909179688, 238.79563903808594, 245.157958984375, 251.52027893066406, 257.8825988769531, 264.2449035644531, 270.6072082519531, 276.9695129394531, 283.33184814453125, 289.69415283203125, 296.05645751953125, 302.4187927246094, 308.7810974121094, 315.1434326171875, 321.5057373046875, 327.8680419921875, 334.2303771972656, 340.5926818847656, 346.9549865722656, 353.31732177734375, 359.67962646484375, 366.04193115234375, 372.4042663574219]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 10.0, 7.0, 9.0, 10.0, 12.0, 15.0, 25.0, 19.0, 22.0, 26.0, 30.0, 24.0, 23.0, 35.0, 35.0, 26.0, 40.0, 36.0, 39.0, 36.0, 36.0, 39.0, 46.0, 26.0, 30.0, 36.0, 31.0, 28.0, 24.0, 41.0, 33.0, 16.0, 19.0, 21.0, 14.0, 9.0, 9.0, 9.0, 16.0, 6.0, 2.0, 1.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0], "bins": [-72.6746597290039, -70.47612762451172, -68.27760314941406, -66.07907104492188, -63.88053894042969, -61.6820068359375, -59.48347854614258, -57.284950256347656, -55.08641815185547, -52.88788604736328, -50.68935775756836, -48.49082946777344, -46.29229736328125, -44.09376525878906, -41.89523696899414, -39.69670867919922, -37.49817657470703, -35.299644470214844, -33.10111618041992, -30.902585983276367, -28.704055786132812, -26.505525588989258, -24.306995391845703, -22.10846519470215, -19.909934997558594, -17.71140480041504, -15.512874603271484, -13.31434440612793, -11.115814208984375, -8.91728401184082, -6.718753814697266, -4.520223617553711, -2.3217010498046875, -0.12317085266113281, 2.075359344482422, 4.273889541625977, 6.472419738769531, 8.670949935913086, 10.86948013305664, 13.068010330200195, 15.26654052734375, 17.465070724487305, 19.66360092163086, 21.862131118774414, 24.06066131591797, 26.259191513061523, 28.457721710205078, 30.656251907348633, 32.85478210449219, 35.053314208984375, 37.2518424987793, 39.45037078857422, 41.648902893066406, 43.847434997558594, 46.045963287353516, 48.24449157714844, 50.443023681640625, 52.64155578613281, 54.840084075927734, 57.038612365722656, 59.237144470214844, 61.43567657470703, 63.63420486450195, 65.83273315429688, 68.03126525878906]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 8.0, 8.0, 7.0, 14.0, 14.0, 19.0, 29.0, 24.0, 28.0, 25.0, 32.0, 42.0, 37.0, 48.0, 49.0, 50.0, 51.0, 37.0, 41.0, 55.0, 41.0, 38.0, 34.0, 41.0, 31.0, 32.0, 33.0, 24.0, 19.0, 17.0, 13.0, 19.0, 12.0, 8.0, 4.0, 5.0, 6.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0546875, -11.704345703125, -11.35400390625, -11.003662109375, -10.6533203125, -10.302978515625, -9.95263671875, -9.602294921875, -9.251953125, -8.901611328125, -8.55126953125, -8.200927734375, -7.8505859375, -7.500244140625, -7.14990234375, -6.799560546875, -6.44921875, -6.098876953125, -5.74853515625, -5.398193359375, -5.0478515625, -4.697509765625, -4.34716796875, -3.996826171875, -3.646484375, -3.296142578125, -2.94580078125, -2.595458984375, -2.2451171875, -1.894775390625, -1.54443359375, -1.194091796875, -0.84375, -0.493408203125, -0.14306640625, 0.207275390625, 0.5576171875, 0.907958984375, 1.25830078125, 1.608642578125, 1.958984375, 2.309326171875, 2.65966796875, 3.010009765625, 3.3603515625, 3.710693359375, 4.06103515625, 4.411376953125, 4.76171875, 5.112060546875, 5.46240234375, 5.812744140625, 6.1630859375, 6.513427734375, 6.86376953125, 7.214111328125, 7.564453125, 7.914794921875, 8.26513671875, 8.615478515625, 8.9658203125, 9.316162109375, 9.66650390625, 10.016845703125, 10.3671875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 1.0, 3.0, 7.0, 10.0, 9.0, 11.0, 15.0, 17.0, 18.0, 29.0, 32.0, 42.0, 69.0, 132.0, 303.0, 786.0, 3021.0, 15816.0, 185923.0, 2628808.0, 1281334.0, 66368.0, 8393.0, 1916.0, 638.0, 222.0, 104.0, 62.0, 37.0, 31.0, 28.0, 17.0, 16.0, 15.0, 12.0, 14.0, 7.0, 3.0, 7.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.875, -32.92919921875, -31.9833984375, -31.03759765625, -30.091796875, -29.14599609375, -28.2001953125, -27.25439453125, -26.30859375, -25.36279296875, -24.4169921875, -23.47119140625, -22.525390625, -21.57958984375, -20.6337890625, -19.68798828125, -18.7421875, -17.79638671875, -16.8505859375, -15.90478515625, -14.958984375, -14.01318359375, -13.0673828125, -12.12158203125, -11.17578125, -10.22998046875, -9.2841796875, -8.33837890625, -7.392578125, -6.44677734375, -5.5009765625, -4.55517578125, -3.609375, -2.66357421875, -1.7177734375, -0.77197265625, 0.173828125, 1.11962890625, 2.0654296875, 3.01123046875, 3.95703125, 4.90283203125, 5.8486328125, 6.79443359375, 7.740234375, 8.68603515625, 9.6318359375, 10.57763671875, 11.5234375, 12.46923828125, 13.4150390625, 14.36083984375, 15.306640625, 16.25244140625, 17.1982421875, 18.14404296875, 19.08984375, 20.03564453125, 20.9814453125, 21.92724609375, 22.873046875, 23.81884765625, 24.7646484375, 25.71044921875, 26.65625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 11.0, 20.0, 14.0, 37.0, 52.0, 80.0, 109.0, 159.0, 281.0, 491.0, 655.0, 712.0, 516.0, 328.0, 245.0, 126.0, 88.0, 51.0, 40.0, 30.0, 16.0, 10.0, 4.0, 0.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-37.09375, -36.234375, -35.375, -34.515625, -33.65625, -32.796875, -31.9375, -31.078125, -30.21875, -29.359375, -28.5, -27.640625, -26.78125, -25.921875, -25.0625, -24.203125, -23.34375, -22.484375, -21.625, -20.765625, -19.90625, -19.046875, -18.1875, -17.328125, -16.46875, -15.609375, -14.75, -13.890625, -13.03125, -12.171875, -11.3125, -10.453125, -9.59375, -8.734375, -7.875, -7.015625, -6.15625, -5.296875, -4.4375, -3.578125, -2.71875, -1.859375, -1.0, -0.140625, 0.71875, 1.578125, 2.4375, 3.296875, 4.15625, 5.015625, 5.875, 6.734375, 7.59375, 8.453125, 9.3125, 10.171875, 11.03125, 11.890625, 12.75, 13.609375, 14.46875, 15.328125, 16.1875, 17.046875, 17.90625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 12.0, 18.0, 24.0, 40.0, 53.0, 94.0, 148.0, 225.0, 433.0, 773.0, 3348.0, 973057.0, 3207785.0, 6255.0, 944.0, 417.0, 248.0, 151.0, 105.0, 54.0, 31.0, 32.0, 12.0, 9.0, 13.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.5625, -78.1767578125, -74.791015625, -71.4052734375, -68.01953125, -64.6337890625, -61.248046875, -57.8623046875, -54.4765625, -51.0908203125, -47.705078125, -44.3193359375, -40.93359375, -37.5478515625, -34.162109375, -30.7763671875, -27.390625, -24.0048828125, -20.619140625, -17.2333984375, -13.84765625, -10.4619140625, -7.076171875, -3.6904296875, -0.3046875, 3.0810546875, 6.466796875, 9.8525390625, 13.23828125, 16.6240234375, 20.009765625, 23.3955078125, 26.78125, 30.1669921875, 33.552734375, 36.9384765625, 40.32421875, 43.7099609375, 47.095703125, 50.4814453125, 53.8671875, 57.2529296875, 60.638671875, 64.0244140625, 67.41015625, 70.7958984375, 74.181640625, 77.5673828125, 80.953125, 84.3388671875, 87.724609375, 91.1103515625, 94.49609375, 97.8818359375, 101.267578125, 104.6533203125, 108.0390625, 111.4248046875, 114.810546875, 118.1962890625, 121.58203125, 124.9677734375, 128.353515625, 131.7392578125, 135.125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 17.0, 36.0, 111.0, 193.0, 198.0, 214.0, 130.0, 67.0, 33.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.51513671875, -113.29403686523438, -108.07292938232422, -102.8518295288086, -97.63072967529297, -92.40962219238281, -87.18852233886719, -81.96742248535156, -76.74632263183594, -71.52522277832031, -66.30411529541016, -61.08301544189453, -55.861915588378906, -50.640811920166016, -45.419708251953125, -40.1986083984375, -34.977500915527344, -29.756399154663086, -24.535297393798828, -19.314193725585938, -14.09309196472168, -8.871990203857422, -3.6508865356445312, 1.5702133178710938, 6.791316986083984, 12.012418746948242, 17.2335205078125, 22.45462417602539, 27.67572593688965, 32.896827697753906, 38.1179313659668, 43.33903121948242, 48.56013488769531, 53.7812385559082, 59.00233840942383, 64.22344207763672, 69.44454193115234, 74.6656494140625, 79.88674926757812, 85.10784912109375, 90.32894897460938, 95.550048828125, 100.77115631103516, 105.99225616455078, 111.2133560180664, 116.43446350097656, 121.65556335449219, 126.87666320800781, 132.0977783203125, 137.31887817382812, 142.53997802734375, 147.76107788085938, 152.98219299316406, 158.2032928466797, 163.4243927001953, 168.64549255371094, 173.86659240722656, 179.0876922607422, 184.3087921142578, 189.5299072265625, 194.75100708007812, 199.97210693359375, 205.19320678710938, 210.414306640625, 215.63540649414062]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 2.0, 1.0, 3.0, 10.0, 10.0, 3.0, 10.0, 18.0, 13.0, 25.0, 13.0, 18.0, 23.0, 36.0, 25.0, 31.0, 27.0, 35.0, 28.0, 28.0, 32.0, 35.0, 43.0, 55.0, 43.0, 39.0, 35.0, 39.0, 25.0, 33.0, 34.0, 21.0, 22.0, 22.0, 19.0, 30.0, 18.0, 18.0, 8.0, 16.0, 8.0, 10.0, 6.0, 9.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-53.985565185546875, -52.30155563354492, -50.61754608154297, -48.933536529541016, -47.24952697753906, -45.56551742553711, -43.881507873535156, -42.1974983215332, -40.51348876953125, -38.8294792175293, -37.145469665527344, -35.46146011352539, -33.77745056152344, -32.093441009521484, -30.40943145751953, -28.725421905517578, -27.041412353515625, -25.357402801513672, -23.67339324951172, -21.989383697509766, -20.305374145507812, -18.62136459350586, -16.937355041503906, -15.253345489501953, -13.5693359375, -11.885326385498047, -10.201316833496094, -8.51730728149414, -6.8332977294921875, -5.149288177490234, -3.4652786254882812, -1.7812690734863281, -0.097259521484375, 1.5867500305175781, 3.2707595825195312, 4.954769134521484, 6.6387786865234375, 8.32278823852539, 10.006797790527344, 11.690807342529297, 13.37481689453125, 15.058826446533203, 16.742835998535156, 18.42684555053711, 20.110855102539062, 21.794864654541016, 23.47887420654297, 25.162883758544922, 26.846893310546875, 28.530902862548828, 30.21491241455078, 31.898921966552734, 33.58293151855469, 35.26694107055664, 36.950950622558594, 38.63496017456055, 40.3189697265625, 42.00297927856445, 43.686988830566406, 45.37099838256836, 47.05500793457031, 48.739017486572266, 50.42302703857422, 52.10703659057617, 53.791046142578125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 6.0, 5.0, 6.0, 8.0, 11.0, 11.0, 19.0, 28.0, 26.0, 24.0, 22.0, 42.0, 26.0, 40.0, 29.0, 44.0, 44.0, 47.0, 42.0, 39.0, 40.0, 47.0, 51.0, 37.0, 36.0, 32.0, 36.0, 29.0, 31.0, 26.0, 22.0, 14.0, 9.0, 10.0, 16.0, 8.0, 8.0, 7.0, 4.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.0, -10.677490234375, -10.35498046875, -10.032470703125, -9.7099609375, -9.387451171875, -9.06494140625, -8.742431640625, -8.419921875, -8.097412109375, -7.77490234375, -7.452392578125, -7.1298828125, -6.807373046875, -6.48486328125, -6.162353515625, -5.83984375, -5.517333984375, -5.19482421875, -4.872314453125, -4.5498046875, -4.227294921875, -3.90478515625, -3.582275390625, -3.259765625, -2.937255859375, -2.61474609375, -2.292236328125, -1.9697265625, -1.647216796875, -1.32470703125, -1.002197265625, -0.6796875, -0.357177734375, -0.03466796875, 0.287841796875, 0.6103515625, 0.932861328125, 1.25537109375, 1.577880859375, 1.900390625, 2.222900390625, 2.54541015625, 2.867919921875, 3.1904296875, 3.512939453125, 3.83544921875, 4.157958984375, 4.48046875, 4.802978515625, 5.12548828125, 5.447998046875, 5.7705078125, 6.093017578125, 6.41552734375, 6.738037109375, 7.060546875, 7.383056640625, 7.70556640625, 8.028076171875, 8.3505859375, 8.673095703125, 8.99560546875, 9.318115234375, 9.640625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 17.0, 28.0, 30.0, 56.0, 72.0, 116.0, 133.0, 240.0, 338.0, 529.0, 766.0, 1158.0, 1741.0, 2598.0, 3990.0, 5978.0, 9254.0, 14528.0, 23062.0, 37106.0, 60453.0, 99179.0, 148648.0, 186396.0, 160286.0, 109902.0, 68306.0, 41502.0, 26092.0, 16144.0, 10308.0, 6617.0, 4384.0, 2821.0, 1930.0, 1261.0, 846.0, 563.0, 386.0, 261.0, 170.0, 112.0, 78.0, 51.0, 35.0, 24.0, 17.0, 13.0, 9.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.9794921875, -0.949462890625, -0.91943359375, -0.889404296875, -0.859375, -0.829345703125, -0.79931640625, -0.769287109375, -0.7392578125, -0.709228515625, -0.67919921875, -0.649169921875, -0.619140625, -0.589111328125, -0.55908203125, -0.529052734375, -0.4990234375, -0.468994140625, -0.43896484375, -0.408935546875, -0.37890625, -0.348876953125, -0.31884765625, -0.288818359375, -0.2587890625, -0.228759765625, -0.19873046875, -0.168701171875, -0.138671875, -0.108642578125, -0.07861328125, -0.048583984375, -0.0185546875, 0.011474609375, 0.04150390625, 0.071533203125, 0.1015625, 0.131591796875, 0.16162109375, 0.191650390625, 0.2216796875, 0.251708984375, 0.28173828125, 0.311767578125, 0.341796875, 0.371826171875, 0.40185546875, 0.431884765625, 0.4619140625, 0.491943359375, 0.52197265625, 0.552001953125, 0.58203125, 0.612060546875, 0.64208984375, 0.672119140625, 0.7021484375, 0.732177734375, 0.76220703125, 0.792236328125, 0.822265625, 0.852294921875, 0.88232421875, 0.912353515625, 0.9423828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 8.0, 5.0, 4.0, 6.0, 6.0, 11.0, 9.0, 12.0, 10.0, 21.0, 14.0, 13.0, 29.0, 23.0, 23.0, 23.0, 39.0, 37.0, 43.0, 38.0, 31.0, 45.0, 34.0, 1057.0, 33.0, 46.0, 44.0, 32.0, 31.0, 36.0, 36.0, 24.0, 23.0, 26.0, 19.0, 22.0, 15.0, 13.0, 16.0, 15.0, 9.0, 7.0, 6.0, 8.0, 6.0, 7.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.50390625, -5.32318115234375, -5.1424560546875, -4.96173095703125, -4.781005859375, -4.60028076171875, -4.4195556640625, -4.23883056640625, -4.05810546875, -3.87738037109375, -3.6966552734375, -3.51593017578125, -3.335205078125, -3.15447998046875, -2.9737548828125, -2.79302978515625, -2.6123046875, -2.43157958984375, -2.2508544921875, -2.07012939453125, -1.889404296875, -1.70867919921875, -1.5279541015625, -1.34722900390625, -1.16650390625, -0.98577880859375, -0.8050537109375, -0.62432861328125, -0.443603515625, -0.26287841796875, -0.0821533203125, 0.09857177734375, 0.279296875, 0.46002197265625, 0.6407470703125, 0.82147216796875, 1.002197265625, 1.18292236328125, 1.3636474609375, 1.54437255859375, 1.72509765625, 1.90582275390625, 2.0865478515625, 2.26727294921875, 2.447998046875, 2.62872314453125, 2.8094482421875, 2.99017333984375, 3.1708984375, 3.35162353515625, 3.5323486328125, 3.71307373046875, 3.893798828125, 4.07452392578125, 4.2552490234375, 4.43597412109375, 4.61669921875, 4.79742431640625, 4.9781494140625, 5.15887451171875, 5.339599609375, 5.52032470703125, 5.7010498046875, 5.88177490234375, 6.0625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 10.0, 9.0, 13.0, 32.0, 51.0, 68.0, 116.0, 159.0, 267.0, 404.0, 596.0, 923.0, 1538.0, 2295.0, 3609.0, 5710.0, 9290.0, 15256.0, 25606.0, 42217.0, 68724.0, 108306.0, 153383.0, 1223093.0, 152778.0, 107634.0, 68441.0, 41748.0, 25199.0, 15125.0, 9153.0, 5560.0, 3539.0, 2251.0, 1456.0, 900.0, 596.0, 377.0, 248.0, 143.0, 100.0, 70.0, 53.0, 29.0, 20.0, 13.0, 8.0, 6.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.74560546875, -0.7233428955078125, -0.701080322265625, -0.6788177490234375, -0.65655517578125, -0.6342926025390625, -0.612030029296875, -0.5897674560546875, -0.5675048828125, -0.5452423095703125, -0.522979736328125, -0.5007171630859375, -0.47845458984375, -0.4561920166015625, -0.433929443359375, -0.4116668701171875, -0.389404296875, -0.3671417236328125, -0.344879150390625, -0.3226165771484375, -0.30035400390625, -0.2780914306640625, -0.255828857421875, -0.2335662841796875, -0.2113037109375, -0.1890411376953125, -0.166778564453125, -0.1445159912109375, -0.12225341796875, -0.0999908447265625, -0.077728271484375, -0.0554656982421875, -0.033203125, -0.0109405517578125, 0.011322021484375, 0.0335845947265625, 0.05584716796875, 0.0781097412109375, 0.100372314453125, 0.1226348876953125, 0.1448974609375, 0.1671600341796875, 0.189422607421875, 0.2116851806640625, 0.23394775390625, 0.2562103271484375, 0.278472900390625, 0.3007354736328125, 0.322998046875, 0.3452606201171875, 0.367523193359375, 0.3897857666015625, 0.41204833984375, 0.4343109130859375, 0.456573486328125, 0.4788360595703125, 0.5010986328125, 0.5233612060546875, 0.545623779296875, 0.5678863525390625, 0.59014892578125, 0.6124114990234375, 0.634674072265625, 0.6569366455078125, 0.67919921875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 4.0, 8.0, 8.0, 12.0, 18.0, 18.0, 34.0, 36.0, 42.0, 68.0, 75.0, 102.0, 111.0, 90.0, 74.0, 69.0, 48.0, 40.0, 28.0, 17.0, 16.0, 16.0, 11.0, 9.0, 4.0, 8.0, 4.0, 2.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0199127197265625, -0.019236087799072266, -0.01855945587158203, -0.017882823944091797, -0.017206192016601562, -0.016529560089111328, -0.015852928161621094, -0.01517629623413086, -0.014499664306640625, -0.01382303237915039, -0.013146400451660156, -0.012469768524169922, -0.011793136596679688, -0.011116504669189453, -0.010439872741699219, -0.009763240814208984, -0.00908660888671875, -0.008409976959228516, -0.007733345031738281, -0.007056713104248047, -0.0063800811767578125, -0.005703449249267578, -0.005026817321777344, -0.004350185394287109, -0.003673553466796875, -0.0029969215393066406, -0.0023202896118164062, -0.0016436576843261719, -0.0009670257568359375, -0.0002903938293457031, 0.00038623809814453125, 0.0010628700256347656, 0.001739501953125, 0.0024161338806152344, 0.0030927658081054688, 0.003769397735595703, 0.0044460296630859375, 0.005122661590576172, 0.005799293518066406, 0.006475925445556641, 0.007152557373046875, 0.00782918930053711, 0.008505821228027344, 0.009182453155517578, 0.009859085083007812, 0.010535717010498047, 0.011212348937988281, 0.011888980865478516, 0.01256561279296875, 0.013242244720458984, 0.013918876647949219, 0.014595508575439453, 0.015272140502929688, 0.015948772430419922, 0.016625404357910156, 0.01730203628540039, 0.017978668212890625, 0.01865530014038086, 0.019331932067871094, 0.020008563995361328, 0.020685195922851562, 0.021361827850341797, 0.02203845977783203, 0.022715091705322266, 0.0233917236328125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 1.0, 2.0, 7.0, 6.0, 5.0, 9.0, 19.0, 11.0, 20.0, 32.0, 37.0, 53.0, 81.0, 143.0, 268.0, 1033.0, 973216.0, 72478.0, 567.0, 187.0, 115.0, 72.0, 46.0, 35.0, 26.0, 22.0, 14.0, 7.0, 7.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.5615234375, -0.5458641052246094, -0.5302047729492188, -0.5145454406738281, -0.4988861083984375, -0.4832267761230469, -0.46756744384765625, -0.4519081115722656, -0.436248779296875, -0.4205894470214844, -0.40493011474609375, -0.3892707824707031, -0.3736114501953125, -0.3579521179199219, -0.34229278564453125, -0.3266334533691406, -0.31097412109375, -0.2953147888183594, -0.27965545654296875, -0.2639961242675781, -0.2483367919921875, -0.23267745971679688, -0.21701812744140625, -0.20135879516601562, -0.185699462890625, -0.17004013061523438, -0.15438079833984375, -0.13872146606445312, -0.1230621337890625, -0.10740280151367188, -0.09174346923828125, -0.07608413696289062, -0.0604248046875, -0.044765472412109375, -0.02910614013671875, -0.013446807861328125, 0.0022125244140625, 0.017871856689453125, 0.03353118896484375, 0.049190521240234375, 0.064849853515625, 0.08050918579101562, 0.09616851806640625, 0.11182785034179688, 0.1274871826171875, 0.14314651489257812, 0.15880584716796875, 0.17446517944335938, 0.19012451171875, 0.20578384399414062, 0.22144317626953125, 0.23710250854492188, 0.2527618408203125, 0.2684211730957031, 0.28408050537109375, 0.2997398376464844, 0.315399169921875, 0.3310585021972656, 0.34671783447265625, 0.3623771667480469, 0.3780364990234375, 0.3936958312988281, 0.40935516357421875, 0.4250144958496094, 0.440673828125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 11.0, 74.0, 793.0, 131.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036052290350198746, -0.03187992423772812, -0.027707558125257492, -0.023535193875432014, -0.019362827762961388, -0.01519046165049076, -0.011018097400665283, -0.006845731288194656, -0.0026733651757240295, 0.00149900047108531, 0.0056713661178946495, 0.009843731299042702, 0.014016097411513329, 0.018188463523983955, 0.022360827773809433, 0.02653319388628006, 0.030705559998750687, 0.034877926111221313, 0.03905029222369194, 0.04322265833616257, 0.047395020723342896, 0.05156739056110382, 0.05573975294828415, 0.059912119060754776, 0.0640844851732254, 0.06825684756040573, 0.07242921739816666, 0.07660157978534698, 0.08077394962310791, 0.08494631201028824, 0.08911867439746857, 0.09329104423522949, 0.09746341407299042, 0.10163577646017075, 0.10580814629793167, 0.109980508685112, 0.11415287852287292, 0.11832524091005325, 0.12249760329723358, 0.1266699731349945, 0.13084234297275543, 0.13501471281051636, 0.1391870677471161, 0.14335943758487701, 0.14753180742263794, 0.15170417726039886, 0.1558765321969986, 0.16004890203475952, 0.16422125697135925, 0.16839362680912018, 0.1725659817457199, 0.17673835158348083, 0.18091072142124176, 0.18508309125900269, 0.18925544619560242, 0.19342781603336334, 0.19760018587112427, 0.2017725557088852, 0.20594491064548492, 0.21011728048324585, 0.21428965032100677, 0.2184620201587677, 0.22263437509536743, 0.22680674493312836, 0.23097911477088928]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 5.0, 7.0, 9.0, 4.0, 10.0, 11.0, 13.0, 28.0, 30.0, 29.0, 25.0, 40.0, 53.0, 38.0, 58.0, 51.0, 49.0, 61.0, 65.0, 56.0, 50.0, 61.0, 54.0, 40.0, 22.0, 19.0, 25.0, 19.0, 19.0, 13.0, 16.0, 12.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023732244968414307, -0.022998768836259842, -0.022265294566750526, -0.02153182029724121, -0.020798344165086746, -0.02006486803293228, -0.019331393763422966, -0.01859791949391365, -0.017864443361759186, -0.01713096722960472, -0.016397492960095406, -0.01566401869058609, -0.014930542558431625, -0.014197067357599735, -0.013463592156767845, -0.012730116955935955, -0.011996641755104065, -0.011263166554272175, -0.010529691353440285, -0.009796216152608395, -0.009062740951776505, -0.008329265750944614, -0.007595790550112724, -0.006862315349280834, -0.006128840148448944, -0.005395364947617054, -0.004661889746785164, -0.003928414545953274, -0.0031949393451213837, -0.0024614641442894936, -0.0017279889434576035, -0.0009945137426257133, -0.00026103854179382324, 0.00047243665903806686, 0.001205911859869957, 0.001939387060701847, 0.002672862261533737, 0.0034063374623656273, 0.004139812663197517, 0.0048732878640294075, 0.005606763064861298, 0.006340238265693188, 0.007073713466525078, 0.007807188667356968, 0.008540663868188858, 0.009274139069020748, 0.010007614269852638, 0.010741089470684528, 0.011474564671516418, 0.012208039872348309, 0.012941515073180199, 0.013674990274012089, 0.014408465474843979, 0.015141940675675869, 0.01587541587650776, 0.016608890146017075, 0.01734236627817154, 0.018075842410326004, 0.01880931667983532, 0.019542790949344635, 0.0202762670814991, 0.021009743213653564, 0.02174321748316288, 0.022476691752672195, 0.02321016788482666]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 6.0, 5.0, 6.0, 8.0, 11.0, 11.0, 19.0, 28.0, 26.0, 24.0, 22.0, 42.0, 25.0, 41.0, 29.0, 43.0, 45.0, 47.0, 42.0, 40.0, 39.0, 47.0, 51.0, 36.0, 37.0, 32.0, 36.0, 29.0, 31.0, 26.0, 22.0, 14.0, 9.0, 10.0, 16.0, 8.0, 8.0, 7.0, 4.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.0, -10.677490234375, -10.35498046875, -10.032470703125, -9.7099609375, -9.387451171875, -9.06494140625, -8.742431640625, -8.419921875, -8.097412109375, -7.77490234375, -7.452392578125, -7.1298828125, -6.807373046875, -6.48486328125, -6.162353515625, -5.83984375, -5.517333984375, -5.19482421875, -4.872314453125, -4.5498046875, -4.227294921875, -3.90478515625, -3.582275390625, -3.259765625, -2.937255859375, -2.61474609375, -2.292236328125, -1.9697265625, -1.647216796875, -1.32470703125, -1.002197265625, -0.6796875, -0.357177734375, -0.03466796875, 0.287841796875, 0.6103515625, 0.932861328125, 1.25537109375, 1.577880859375, 1.900390625, 2.222900390625, 2.54541015625, 2.867919921875, 3.1904296875, 3.512939453125, 3.83544921875, 4.157958984375, 4.48046875, 4.802978515625, 5.12548828125, 5.447998046875, 5.7705078125, 6.093017578125, 6.41552734375, 6.738037109375, 7.060546875, 7.383056640625, 7.70556640625, 8.028076171875, 8.3505859375, 8.673095703125, 8.99560546875, 9.318115234375, 9.640625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 8.0, 5.0, 8.0, 9.0, 7.0, 9.0, 18.0, 26.0, 21.0, 31.0, 47.0, 57.0, 110.0, 142.0, 252.0, 348.0, 657.0, 1166.0, 2141.0, 4437.0, 9354.0, 20039.0, 47544.0, 137759.0, 444491.0, 248858.0, 75249.0, 29403.0, 13369.0, 6190.0, 3105.0, 1477.0, 843.0, 481.0, 282.0, 184.0, 115.0, 91.0, 54.0, 41.0, 36.0, 27.0, 16.0, 10.0, 7.0, 9.0, 7.0, 5.0, 6.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0], "bins": [-9.9609375, -9.6656494140625, -9.370361328125, -9.0750732421875, -8.77978515625, -8.4844970703125, -8.189208984375, -7.8939208984375, -7.5986328125, -7.3033447265625, -7.008056640625, -6.7127685546875, -6.41748046875, -6.1221923828125, -5.826904296875, -5.5316162109375, -5.236328125, -4.9410400390625, -4.645751953125, -4.3504638671875, -4.05517578125, -3.7598876953125, -3.464599609375, -3.1693115234375, -2.8740234375, -2.5787353515625, -2.283447265625, -1.9881591796875, -1.69287109375, -1.3975830078125, -1.102294921875, -0.8070068359375, -0.51171875, -0.2164306640625, 0.078857421875, 0.3741455078125, 0.66943359375, 0.9647216796875, 1.260009765625, 1.5552978515625, 1.8505859375, 2.1458740234375, 2.441162109375, 2.7364501953125, 3.03173828125, 3.3270263671875, 3.622314453125, 3.9176025390625, 4.212890625, 4.5081787109375, 4.803466796875, 5.0987548828125, 5.39404296875, 5.6893310546875, 5.984619140625, 6.2799072265625, 6.5751953125, 6.8704833984375, 7.165771484375, 7.4610595703125, 7.75634765625, 8.0516357421875, 8.346923828125, 8.6422119140625, 8.9375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 10.0, 13.0, 12.0, 11.0, 7.0, 19.0, 17.0, 21.0, 20.0, 21.0, 27.0, 39.0, 36.0, 47.0, 31.0, 48.0, 82.0, 190.0, 1685.0, 231.0, 91.0, 54.0, 24.0, 41.0, 38.0, 29.0, 31.0, 27.0, 37.0, 20.0, 17.0, 13.0, 14.0, 9.0, 10.0, 3.0, 4.0, 1.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.59375, -33.622314453125, -32.65087890625, -31.679443359375, -30.7080078125, -29.736572265625, -28.76513671875, -27.793701171875, -26.822265625, -25.850830078125, -24.87939453125, -23.907958984375, -22.9365234375, -21.965087890625, -20.99365234375, -20.022216796875, -19.05078125, -18.079345703125, -17.10791015625, -16.136474609375, -15.1650390625, -14.193603515625, -13.22216796875, -12.250732421875, -11.279296875, -10.307861328125, -9.33642578125, -8.364990234375, -7.3935546875, -6.422119140625, -5.45068359375, -4.479248046875, -3.5078125, -2.536376953125, -1.56494140625, -0.593505859375, 0.3779296875, 1.349365234375, 2.32080078125, 3.292236328125, 4.263671875, 5.235107421875, 6.20654296875, 7.177978515625, 8.1494140625, 9.120849609375, 10.09228515625, 11.063720703125, 12.03515625, 13.006591796875, 13.97802734375, 14.949462890625, 15.9208984375, 16.892333984375, 17.86376953125, 18.835205078125, 19.806640625, 20.778076171875, 21.74951171875, 22.720947265625, 23.6923828125, 24.663818359375, 25.63525390625, 26.606689453125, 27.578125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 6.0, 8.0, 5.0, 10.0, 11.0, 21.0, 27.0, 25.0, 49.0, 61.0, 90.0, 93.0, 143.0, 207.0, 271.0, 662.0, 4262.0, 980222.0, 2152601.0, 5046.0, 718.0, 309.0, 222.0, 161.0, 121.0, 76.0, 49.0, 40.0, 52.0, 27.0, 20.0, 27.0, 12.0, 14.0, 4.0, 8.0, 5.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.375, -68.998046875, -66.62109375, -64.244140625, -61.8671875, -59.490234375, -57.11328125, -54.736328125, -52.359375, -49.982421875, -47.60546875, -45.228515625, -42.8515625, -40.474609375, -38.09765625, -35.720703125, -33.34375, -30.966796875, -28.58984375, -26.212890625, -23.8359375, -21.458984375, -19.08203125, -16.705078125, -14.328125, -11.951171875, -9.57421875, -7.197265625, -4.8203125, -2.443359375, -0.06640625, 2.310546875, 4.6875, 7.064453125, 9.44140625, 11.818359375, 14.1953125, 16.572265625, 18.94921875, 21.326171875, 23.703125, 26.080078125, 28.45703125, 30.833984375, 33.2109375, 35.587890625, 37.96484375, 40.341796875, 42.71875, 45.095703125, 47.47265625, 49.849609375, 52.2265625, 54.603515625, 56.98046875, 59.357421875, 61.734375, 64.111328125, 66.48828125, 68.865234375, 71.2421875, 73.619140625, 75.99609375, 78.373046875, 80.75]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [10.0, 414.0, 580.0, 17.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.1107120513916, -8.980517387390137, -0.8503227233886719, 7.279870986938477, 15.410066604614258, 23.54026222229004, 31.670454025268555, 39.80065155029297, 47.93084716796875, 56.06104278564453, 64.19123840332031, 72.32142639160156, 80.45162963867188, 88.58181762695312, 96.7120132446289, 104.84220886230469, 112.97240447998047, 121.10260009765625, 129.2327880859375, 137.3629913330078, 145.49317932128906, 153.62338256835938, 161.75357055664062, 169.88375854492188, 178.0139617919922, 186.14414978027344, 194.27435302734375, 202.404541015625, 210.5347442626953, 218.66493225097656, 226.79513549804688, 234.92532348632812, 243.05551147460938, 251.18569946289062, 259.3158874511719, 267.44610595703125, 275.5762939453125, 283.70648193359375, 291.836669921875, 299.96685791015625, 308.0970764160156, 316.2272644042969, 324.3574523925781, 332.4876708984375, 340.61785888671875, 348.748046875, 356.87823486328125, 365.0084228515625, 373.13861083984375, 381.268798828125, 389.39898681640625, 397.5292053222656, 405.6593933105469, 413.7895812988281, 421.9197692871094, 430.04998779296875, 438.18017578125, 446.31036376953125, 454.4405517578125, 462.5707702636719, 470.7009582519531, 478.8311462402344, 486.9613342285156, 495.091552734375, 503.22174072265625]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 4.0, 7.0, 7.0, 6.0, 8.0, 12.0, 14.0, 20.0, 17.0, 24.0, 25.0, 24.0, 30.0, 46.0, 44.0, 32.0, 48.0, 40.0, 40.0, 58.0, 56.0, 39.0, 42.0, 47.0, 37.0, 39.0, 41.0, 30.0, 26.0, 21.0, 20.0, 22.0, 20.0, 11.0, 8.0, 8.0, 3.0, 4.0, 2.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.7317886352539, -79.25575256347656, -76.77970886230469, -74.30367279052734, -71.82762908935547, -69.35159301757812, -66.87554931640625, -64.3995132446289, -61.92347717285156, -59.44743728637695, -56.971397399902344, -54.495361328125, -52.01932144165039, -49.54328155517578, -47.06724166870117, -44.59120178222656, -42.11516189575195, -39.639122009277344, -37.163082122802734, -34.687042236328125, -32.21100616455078, -29.734966278076172, -27.258926391601562, -24.782888412475586, -22.306848526000977, -19.830808639526367, -17.35477066040039, -14.878730773925781, -12.402691841125488, -9.926652908325195, -7.450613021850586, -4.974575042724609, -2.49853515625, -0.02249598503112793, 2.453543186187744, 4.929582595825195, 7.405621528625488, 9.881660461425781, 12.35770034790039, 14.833738327026367, 17.309778213500977, 19.785818099975586, 22.261856079101562, 24.737895965576172, 27.21393585205078, 29.689973831176758, 32.166015625, 34.642051696777344, 37.11809158325195, 39.59413146972656, 42.07017135620117, 44.54621124267578, 47.022247314453125, 49.498287200927734, 51.974327087402344, 54.45036315917969, 56.92640686035156, 59.40244674682617, 61.87848663330078, 64.35452270507812, 66.83056640625, 69.30660247802734, 71.78263854980469, 74.25868225097656, 76.7347183227539]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 7.0, 6.0, 8.0, 3.0, 5.0, 12.0, 19.0, 15.0, 17.0, 29.0, 19.0, 33.0, 24.0, 32.0, 43.0, 30.0, 40.0, 48.0, 43.0, 52.0, 45.0, 37.0, 45.0, 40.0, 44.0, 38.0, 35.0, 32.0, 28.0, 28.0, 26.0, 15.0, 22.0, 13.0, 16.0, 12.0, 6.0, 8.0, 10.0, 2.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.8984375, -10.560546875, -10.22265625, -9.884765625, -9.546875, -9.208984375, -8.87109375, -8.533203125, -8.1953125, -7.857421875, -7.51953125, -7.181640625, -6.84375, -6.505859375, -6.16796875, -5.830078125, -5.4921875, -5.154296875, -4.81640625, -4.478515625, -4.140625, -3.802734375, -3.46484375, -3.126953125, -2.7890625, -2.451171875, -2.11328125, -1.775390625, -1.4375, -1.099609375, -0.76171875, -0.423828125, -0.0859375, 0.251953125, 0.58984375, 0.927734375, 1.265625, 1.603515625, 1.94140625, 2.279296875, 2.6171875, 2.955078125, 3.29296875, 3.630859375, 3.96875, 4.306640625, 4.64453125, 4.982421875, 5.3203125, 5.658203125, 5.99609375, 6.333984375, 6.671875, 7.009765625, 7.34765625, 7.685546875, 8.0234375, 8.361328125, 8.69921875, 9.037109375, 9.375, 9.712890625, 10.05078125, 10.388671875, 10.7265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 6.0, 6.0, 3.0, 4.0, 11.0, 4.0, 10.0, 13.0, 17.0, 7.0, 22.0, 22.0, 40.0, 43.0, 93.0, 122.0, 201.0, 425.0, 1059.0, 3478.0, 16821.0, 160413.0, 2237981.0, 1649715.0, 106348.0, 12693.0, 2821.0, 932.0, 379.0, 198.0, 118.0, 57.0, 38.0, 39.0, 25.0, 18.0, 22.0, 11.0, 12.0, 16.0, 4.0, 4.0, 9.0, 8.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.859375, -25.99072265625, -25.1220703125, -24.25341796875, -23.384765625, -22.51611328125, -21.6474609375, -20.77880859375, -19.91015625, -19.04150390625, -18.1728515625, -17.30419921875, -16.435546875, -15.56689453125, -14.6982421875, -13.82958984375, -12.9609375, -12.09228515625, -11.2236328125, -10.35498046875, -9.486328125, -8.61767578125, -7.7490234375, -6.88037109375, -6.01171875, -5.14306640625, -4.2744140625, -3.40576171875, -2.537109375, -1.66845703125, -0.7998046875, 0.06884765625, 0.9375, 1.80615234375, 2.6748046875, 3.54345703125, 4.412109375, 5.28076171875, 6.1494140625, 7.01806640625, 7.88671875, 8.75537109375, 9.6240234375, 10.49267578125, 11.361328125, 12.22998046875, 13.0986328125, 13.96728515625, 14.8359375, 15.70458984375, 16.5732421875, 17.44189453125, 18.310546875, 19.17919921875, 20.0478515625, 20.91650390625, 21.78515625, 22.65380859375, 23.5224609375, 24.39111328125, 25.259765625, 26.12841796875, 26.9970703125, 27.86572265625, 28.734375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 11.0, 14.0, 15.0, 40.0, 35.0, 49.0, 78.0, 118.0, 164.0, 225.0, 321.0, 482.0, 588.0, 530.0, 470.0, 253.0, 205.0, 144.0, 78.0, 81.0, 44.0, 39.0, 23.0, 18.0, 12.0, 9.0, 4.0, 7.0, 10.0, 4.0, 1.0, 1.0, 1.0, 0.0, 4.0], "bins": [-29.0625, -28.367919921875, -27.67333984375, -26.978759765625, -26.2841796875, -25.589599609375, -24.89501953125, -24.200439453125, -23.505859375, -22.811279296875, -22.11669921875, -21.422119140625, -20.7275390625, -20.032958984375, -19.33837890625, -18.643798828125, -17.94921875, -17.254638671875, -16.56005859375, -15.865478515625, -15.1708984375, -14.476318359375, -13.78173828125, -13.087158203125, -12.392578125, -11.697998046875, -11.00341796875, -10.308837890625, -9.6142578125, -8.919677734375, -8.22509765625, -7.530517578125, -6.8359375, -6.141357421875, -5.44677734375, -4.752197265625, -4.0576171875, -3.363037109375, -2.66845703125, -1.973876953125, -1.279296875, -0.584716796875, 0.10986328125, 0.804443359375, 1.4990234375, 2.193603515625, 2.88818359375, 3.582763671875, 4.27734375, 4.971923828125, 5.66650390625, 6.361083984375, 7.0556640625, 7.750244140625, 8.44482421875, 9.139404296875, 9.833984375, 10.528564453125, 11.22314453125, 11.917724609375, 12.6123046875, 13.306884765625, 14.00146484375, 14.696044921875, 15.390625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 3.0, 6.0, 8.0, 12.0, 10.0, 17.0, 18.0, 44.0, 51.0, 65.0, 100.0, 170.0, 220.0, 378.0, 731.0, 4861.0, 1701261.0, 2478397.0, 6031.0, 790.0, 379.0, 245.0, 161.0, 96.0, 67.0, 52.0, 38.0, 29.0, 13.0, 10.0, 7.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.875, -89.4384765625, -86.001953125, -82.5654296875, -79.12890625, -75.6923828125, -72.255859375, -68.8193359375, -65.3828125, -61.9462890625, -58.509765625, -55.0732421875, -51.63671875, -48.2001953125, -44.763671875, -41.3271484375, -37.890625, -34.4541015625, -31.017578125, -27.5810546875, -24.14453125, -20.7080078125, -17.271484375, -13.8349609375, -10.3984375, -6.9619140625, -3.525390625, -0.0888671875, 3.34765625, 6.7841796875, 10.220703125, 13.6572265625, 17.09375, 20.5302734375, 23.966796875, 27.4033203125, 30.83984375, 34.2763671875, 37.712890625, 41.1494140625, 44.5859375, 48.0224609375, 51.458984375, 54.8955078125, 58.33203125, 61.7685546875, 65.205078125, 68.6416015625, 72.078125, 75.5146484375, 78.951171875, 82.3876953125, 85.82421875, 89.2607421875, 92.697265625, 96.1337890625, 99.5703125, 103.0068359375, 106.443359375, 109.8798828125, 113.31640625, 116.7529296875, 120.189453125, 123.6259765625, 127.0625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 32.0, 257.0, 541.0, 172.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.66856384277344, -98.4273910522461, -85.18621826171875, -71.94503784179688, -58.7038688659668, -45.46269226074219, -32.221519470214844, -18.9803466796875, -5.739173889160156, 7.501999855041504, 20.743173599243164, 33.98434829711914, 47.225521087646484, 60.466697692871094, 73.70787048339844, 86.94904327392578, 100.19021606445312, 113.43138885498047, 126.67256164550781, 139.9137420654297, 153.1549072265625, 166.39608764648438, 179.63726806640625, 192.87843322753906, 206.11959838867188, 219.36077880859375, 232.60194396972656, 245.84312438964844, 259.08428955078125, 272.3254699707031, 285.566650390625, 298.80780029296875, 312.0489807128906, 325.2901611328125, 338.5313415527344, 351.7724914550781, 365.013671875, 378.2548522949219, 391.49603271484375, 404.7371826171875, 417.9783630371094, 431.21954345703125, 444.4607238769531, 457.7018737792969, 470.94305419921875, 484.1842346191406, 497.4254150390625, 510.66656494140625, 523.9077758789062, 537.14892578125, 550.39013671875, 563.6312866210938, 576.8724975585938, 590.1136474609375, 603.3547973632812, 616.5960083007812, 629.837158203125, 643.0783081054688, 656.3195190429688, 669.5606689453125, 682.8018798828125, 696.0430297851562, 709.2841796875, 722.525390625, 735.7665405273438]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 8.0, 5.0, 4.0, 12.0, 10.0, 16.0, 10.0, 11.0, 12.0, 13.0, 14.0, 14.0, 26.0, 26.0, 18.0, 34.0, 32.0, 23.0, 33.0, 43.0, 35.0, 26.0, 35.0, 42.0, 37.0, 22.0, 43.0, 30.0, 31.0, 16.0, 43.0, 29.0, 33.0, 24.0, 23.0, 27.0, 21.0, 23.0, 16.0, 17.0, 15.0, 16.0, 6.0, 5.0, 6.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-47.22540283203125, -45.613800048828125, -44.002201080322266, -42.390602111816406, -40.77899932861328, -39.167396545410156, -37.5557975769043, -35.94419860839844, -34.33259582519531, -32.72099304199219, -31.109394073486328, -29.497793197631836, -27.886192321777344, -26.27459144592285, -24.66299057006836, -23.051389694213867, -21.439788818359375, -19.828187942504883, -18.21658706665039, -16.6049861907959, -14.993385314941406, -13.381784439086914, -11.770183563232422, -10.15858268737793, -8.546981811523438, -6.935380935668945, -5.323780059814453, -3.712179183959961, -2.1005783081054688, -0.48897743225097656, 1.1226234436035156, 2.734224319458008, 4.3458251953125, 5.957426071166992, 7.569026947021484, 9.180627822875977, 10.792228698730469, 12.403829574584961, 14.015430450439453, 15.627031326293945, 17.238632202148438, 18.85023307800293, 20.461833953857422, 22.073434829711914, 23.685035705566406, 25.2966365814209, 26.90823745727539, 28.519838333129883, 30.131439208984375, 31.743040084838867, 33.35464096069336, 34.96623992919922, 36.577842712402344, 38.18944549560547, 39.80104446411133, 41.41264343261719, 43.02424621582031, 44.63584899902344, 46.2474479675293, 47.859046936035156, 49.47064971923828, 51.082252502441406, 52.693851470947266, 54.305450439453125, 55.91705322265625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 8.0, 4.0, 6.0, 10.0, 15.0, 23.0, 25.0, 30.0, 29.0, 26.0, 31.0, 34.0, 35.0, 41.0, 42.0, 40.0, 55.0, 41.0, 44.0, 60.0, 50.0, 43.0, 34.0, 39.0, 28.0, 24.0, 28.0, 31.0, 19.0, 15.0, 14.0, 8.0, 7.0, 12.0, 10.0, 7.0, 6.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.625, -11.2779541015625, -10.930908203125, -10.5838623046875, -10.23681640625, -9.8897705078125, -9.542724609375, -9.1956787109375, -8.8486328125, -8.5015869140625, -8.154541015625, -7.8074951171875, -7.46044921875, -7.1134033203125, -6.766357421875, -6.4193115234375, -6.072265625, -5.7252197265625, -5.378173828125, -5.0311279296875, -4.68408203125, -4.3370361328125, -3.989990234375, -3.6429443359375, -3.2958984375, -2.9488525390625, -2.601806640625, -2.2547607421875, -1.90771484375, -1.5606689453125, -1.213623046875, -0.8665771484375, -0.51953125, -0.1724853515625, 0.174560546875, 0.5216064453125, 0.86865234375, 1.2156982421875, 1.562744140625, 1.9097900390625, 2.2568359375, 2.6038818359375, 2.950927734375, 3.2979736328125, 3.64501953125, 3.9920654296875, 4.339111328125, 4.6861572265625, 5.033203125, 5.3802490234375, 5.727294921875, 6.0743408203125, 6.42138671875, 6.7684326171875, 7.115478515625, 7.4625244140625, 7.8095703125, 8.1566162109375, 8.503662109375, 8.8507080078125, 9.19775390625, 9.5447998046875, 9.891845703125, 10.2388916015625, 10.5859375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 19.0, 15.0, 22.0, 31.0, 45.0, 69.0, 120.0, 158.0, 233.0, 293.0, 448.0, 713.0, 1020.0, 1451.0, 2077.0, 2982.0, 4456.0, 6535.0, 10007.0, 15467.0, 24486.0, 39156.0, 63588.0, 101101.0, 147932.0, 181054.0, 154147.0, 106892.0, 67526.0, 41904.0, 25810.0, 16396.0, 10752.0, 6912.0, 4638.0, 3142.0, 2116.0, 1484.0, 1027.0, 744.0, 497.0, 325.0, 250.0, 150.0, 112.0, 95.0, 54.0, 33.0, 15.0, 26.0, 11.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.97509765625, -0.9442062377929688, -0.9133148193359375, -0.8824234008789062, -0.851531982421875, -0.8206405639648438, -0.7897491455078125, -0.7588577270507812, -0.72796630859375, -0.6970748901367188, -0.6661834716796875, -0.6352920532226562, -0.604400634765625, -0.5735092163085938, -0.5426177978515625, -0.5117263793945312, -0.4808349609375, -0.44994354248046875, -0.4190521240234375, -0.38816070556640625, -0.357269287109375, -0.32637786865234375, -0.2954864501953125, -0.26459503173828125, -0.23370361328125, -0.20281219482421875, -0.1719207763671875, -0.14102935791015625, -0.110137939453125, -0.07924652099609375, -0.0483551025390625, -0.01746368408203125, 0.013427734375, 0.04431915283203125, 0.0752105712890625, 0.10610198974609375, 0.136993408203125, 0.16788482666015625, 0.1987762451171875, 0.22966766357421875, 0.26055908203125, 0.29145050048828125, 0.3223419189453125, 0.35323333740234375, 0.384124755859375, 0.41501617431640625, 0.4459075927734375, 0.47679901123046875, 0.5076904296875, 0.5385818481445312, 0.5694732666015625, 0.6003646850585938, 0.631256103515625, 0.6621475219726562, 0.6930389404296875, 0.7239303588867188, 0.75482177734375, 0.7857131958007812, 0.8166046142578125, 0.8474960327148438, 0.878387451171875, 0.9092788696289062, 0.9401702880859375, 0.9710617065429688, 1.001953125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 4.0, 8.0, 10.0, 15.0, 7.0, 11.0, 16.0, 10.0, 14.0, 15.0, 25.0, 25.0, 35.0, 34.0, 33.0, 30.0, 36.0, 50.0, 39.0, 50.0, 1059.0, 43.0, 37.0, 34.0, 40.0, 33.0, 32.0, 37.0, 30.0, 31.0, 27.0, 24.0, 18.0, 14.0, 20.0, 11.0, 20.0, 7.0, 7.0, 12.0, 5.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.71484375, -6.502197265625, -6.28955078125, -6.076904296875, -5.8642578125, -5.651611328125, -5.43896484375, -5.226318359375, -5.013671875, -4.801025390625, -4.58837890625, -4.375732421875, -4.1630859375, -3.950439453125, -3.73779296875, -3.525146484375, -3.3125, -3.099853515625, -2.88720703125, -2.674560546875, -2.4619140625, -2.249267578125, -2.03662109375, -1.823974609375, -1.611328125, -1.398681640625, -1.18603515625, -0.973388671875, -0.7607421875, -0.548095703125, -0.33544921875, -0.122802734375, 0.08984375, 0.302490234375, 0.51513671875, 0.727783203125, 0.9404296875, 1.153076171875, 1.36572265625, 1.578369140625, 1.791015625, 2.003662109375, 2.21630859375, 2.428955078125, 2.6416015625, 2.854248046875, 3.06689453125, 3.279541015625, 3.4921875, 3.704833984375, 3.91748046875, 4.130126953125, 4.3427734375, 4.555419921875, 4.76806640625, 4.980712890625, 5.193359375, 5.406005859375, 5.61865234375, 5.831298828125, 6.0439453125, 6.256591796875, 6.46923828125, 6.681884765625, 6.89453125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 7.0, 12.0, 8.0, 22.0, 23.0, 48.0, 49.0, 89.0, 134.0, 187.0, 273.0, 392.0, 674.0, 1039.0, 1610.0, 2605.0, 4082.0, 6810.0, 10732.0, 17573.0, 29051.0, 47566.0, 75171.0, 113852.0, 165074.0, 1201297.0, 144595.0, 102008.0, 65604.0, 41115.0, 25079.0, 15283.0, 9356.0, 5758.0, 3568.0, 2280.0, 1443.0, 910.0, 618.0, 383.0, 250.0, 170.0, 115.0, 83.0, 45.0, 34.0, 15.0, 11.0, 16.0, 10.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.76171875, -0.7381744384765625, -0.714630126953125, -0.6910858154296875, -0.66754150390625, -0.6439971923828125, -0.620452880859375, -0.5969085693359375, -0.5733642578125, -0.5498199462890625, -0.526275634765625, -0.5027313232421875, -0.47918701171875, -0.4556427001953125, -0.432098388671875, -0.4085540771484375, -0.385009765625, -0.3614654541015625, -0.337921142578125, -0.3143768310546875, -0.29083251953125, -0.2672882080078125, -0.243743896484375, -0.2201995849609375, -0.1966552734375, -0.1731109619140625, -0.149566650390625, -0.1260223388671875, -0.10247802734375, -0.0789337158203125, -0.055389404296875, -0.0318450927734375, -0.00830078125, 0.0152435302734375, 0.038787841796875, 0.0623321533203125, 0.08587646484375, 0.1094207763671875, 0.132965087890625, 0.1565093994140625, 0.1800537109375, 0.2035980224609375, 0.227142333984375, 0.2506866455078125, 0.27423095703125, 0.2977752685546875, 0.321319580078125, 0.3448638916015625, 0.368408203125, 0.3919525146484375, 0.415496826171875, 0.4390411376953125, 0.46258544921875, 0.4861297607421875, 0.509674072265625, 0.5332183837890625, 0.5567626953125, 0.5803070068359375, 0.603851318359375, 0.6273956298828125, 0.65093994140625, 0.6744842529296875, 0.698028564453125, 0.7215728759765625, 0.7451171875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 0.0, 5.0, 8.0, 7.0, 9.0, 10.0, 18.0, 15.0, 28.0, 26.0, 41.0, 46.0, 59.0, 90.0, 97.0, 116.0, 92.0, 66.0, 57.0, 50.0, 31.0, 28.0, 17.0, 22.0, 15.0, 11.0, 7.0, 8.0, 2.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041229248046875, -0.040032386779785156, -0.03883552551269531, -0.03763866424560547, -0.036441802978515625, -0.03524494171142578, -0.03404808044433594, -0.032851219177246094, -0.03165435791015625, -0.030457496643066406, -0.029260635375976562, -0.02806377410888672, -0.026866912841796875, -0.02567005157470703, -0.024473190307617188, -0.023276329040527344, -0.0220794677734375, -0.020882606506347656, -0.019685745239257812, -0.01848888397216797, -0.017292022705078125, -0.01609516143798828, -0.014898300170898438, -0.013701438903808594, -0.01250457763671875, -0.011307716369628906, -0.010110855102539062, -0.008913993835449219, -0.007717132568359375, -0.006520271301269531, -0.0053234100341796875, -0.004126548767089844, -0.0029296875, -0.0017328262329101562, -0.0005359649658203125, 0.0006608963012695312, 0.001857757568359375, 0.0030546188354492188, 0.0042514801025390625, 0.005448341369628906, 0.00664520263671875, 0.007842063903808594, 0.009038925170898438, 0.010235786437988281, 0.011432647705078125, 0.012629508972167969, 0.013826370239257812, 0.015023231506347656, 0.0162200927734375, 0.017416954040527344, 0.018613815307617188, 0.01981067657470703, 0.021007537841796875, 0.02220439910888672, 0.023401260375976562, 0.024598121643066406, 0.02579498291015625, 0.026991844177246094, 0.028188705444335938, 0.02938556671142578, 0.030582427978515625, 0.03177928924560547, 0.03297615051269531, 0.034173011779785156, 0.035369873046875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 6.0, 7.0, 14.0, 14.0, 19.0, 35.0, 28.0, 37.0, 65.0, 105.0, 166.0, 366.0, 3176.0, 1040570.0, 3065.0, 361.0, 166.0, 91.0, 65.0, 49.0, 37.0, 16.0, 23.0, 17.0, 8.0, 9.0, 9.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80126953125, -0.7741012573242188, -0.7469329833984375, -0.7197647094726562, -0.692596435546875, -0.6654281616210938, -0.6382598876953125, -0.6110916137695312, -0.58392333984375, -0.5567550659179688, -0.5295867919921875, -0.5024185180664062, -0.475250244140625, -0.44808197021484375, -0.4209136962890625, -0.39374542236328125, -0.3665771484375, -0.33940887451171875, -0.3122406005859375, -0.28507232666015625, -0.257904052734375, -0.23073577880859375, -0.2035675048828125, -0.17639923095703125, -0.14923095703125, -0.12206268310546875, -0.0948944091796875, -0.06772613525390625, -0.040557861328125, -0.01338958740234375, 0.0137786865234375, 0.04094696044921875, 0.068115234375, 0.09528350830078125, 0.1224517822265625, 0.14962005615234375, 0.176788330078125, 0.20395660400390625, 0.2311248779296875, 0.25829315185546875, 0.28546142578125, 0.31262969970703125, 0.3397979736328125, 0.36696624755859375, 0.394134521484375, 0.42130279541015625, 0.4484710693359375, 0.47563934326171875, 0.5028076171875, 0.5299758911132812, 0.5571441650390625, 0.5843124389648438, 0.611480712890625, 0.6386489868164062, 0.6658172607421875, 0.6929855346679688, 0.72015380859375, 0.7473220825195312, 0.7744903564453125, 0.8016586303710938, 0.828826904296875, 0.8559951782226562, 0.8831634521484375, 0.9103317260742188, 0.9375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 11.0, 317.0, 678.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39834415912628174, -0.3870043158531189, -0.37566447257995605, -0.3643246293067932, -0.35298478603363037, -0.34164491295814514, -0.3303050696849823, -0.31896522641181946, -0.3076253831386566, -0.2962855398654938, -0.28494569659233093, -0.2736058533191681, -0.26226598024368286, -0.25092613697052, -0.23958629369735718, -0.22824645042419434, -0.2169066071510315, -0.20556676387786865, -0.1942269206047058, -0.18288706243038177, -0.17154721915721893, -0.1602073758840561, -0.14886751770973206, -0.1375276744365692, -0.12618783116340637, -0.11484798789024353, -0.10350813716650009, -0.09216828644275665, -0.08082844316959381, -0.06948859989643097, -0.05814874917268753, -0.04680889844894409, -0.03546902537345886, -0.024129178375005722, -0.012789331376552582, -0.0014494843780994415, 0.009890362620353699, 0.02123020961880684, 0.03257005661725998, 0.04390990734100342, 0.05524975061416626, 0.0665895938873291, 0.07792944461107254, 0.08926929533481598, 0.10060913860797882, 0.11194898188114166, 0.1232888326048851, 0.13462868332862854, 0.14596852660179138, 0.15730836987495422, 0.16864821314811707, 0.1799880713224411, 0.19132791459560394, 0.20266775786876678, 0.21400761604309082, 0.22534745931625366, 0.2366873025894165, 0.24802714586257935, 0.2593669891357422, 0.27070683240890503, 0.28204667568206787, 0.2933865487575531, 0.30472639203071594, 0.3160662353038788, 0.3274060785770416]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 9.0, 12.0, 3.0, 13.0, 12.0, 10.0, 18.0, 10.0, 15.0, 23.0, 31.0, 38.0, 35.0, 42.0, 46.0, 41.0, 41.0, 35.0, 45.0, 35.0, 35.0, 42.0, 31.0, 43.0, 30.0, 43.0, 41.0, 27.0, 25.0, 27.0, 23.0, 26.0, 14.0, 18.0, 11.0, 16.0, 9.0, 4.0, 3.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03758895397186279, -0.036430247128009796, -0.0352715402841568, -0.034112829715013504, -0.03295412287116051, -0.03179541602730751, -0.030636707320809364, -0.029477998614311218, -0.02831929177045822, -0.027160584926605225, -0.02600187622010708, -0.024843167513608932, -0.023684460669755936, -0.02252575382590294, -0.021367045119404793, -0.020208336412906647, -0.01904962956905365, -0.017890922725200653, -0.016732214018702507, -0.015573506243526936, -0.014414798468351364, -0.013256090693175793, -0.012097382918000221, -0.01093867514282465, -0.009779967367649078, -0.008621259592473507, -0.0074625518172979355, -0.006303844042122364, -0.005145136266946793, -0.003986428491771221, -0.0028277207165956497, -0.0016690129414200783, -0.0005103051662445068, 0.0006484026089310646, 0.001807110384106636, 0.0029658181592822075, 0.004124525934457779, 0.00528323370963335, 0.006441941484808922, 0.007600649259984493, 0.008759357035160065, 0.009918064810335636, 0.011076772585511208, 0.012235480360686779, 0.01339418813586235, 0.014552895911037922, 0.015711603686213493, 0.01687031239271164, 0.018029019236564636, 0.019187726080417633, 0.02034643478691578, 0.021505143493413925, 0.022663850337266922, 0.02382255718111992, 0.024981265887618065, 0.02613997459411621, 0.027298681437969208, 0.028457388281822205, 0.02961609698832035, 0.030774805694818497, 0.031933512538671494, 0.03309221938252449, 0.034250929951667786, 0.03540963679552078, 0.03656834363937378]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 8.0, 4.0, 6.0, 10.0, 15.0, 23.0, 25.0, 30.0, 29.0, 26.0, 31.0, 34.0, 35.0, 41.0, 42.0, 40.0, 55.0, 41.0, 44.0, 60.0, 50.0, 43.0, 33.0, 40.0, 28.0, 24.0, 27.0, 32.0, 19.0, 15.0, 14.0, 8.0, 7.0, 12.0, 10.0, 7.0, 6.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.625, -11.2779541015625, -10.930908203125, -10.5838623046875, -10.23681640625, -9.8897705078125, -9.542724609375, -9.1956787109375, -8.8486328125, -8.5015869140625, -8.154541015625, -7.8074951171875, -7.46044921875, -7.1134033203125, -6.766357421875, -6.4193115234375, -6.072265625, -5.7252197265625, -5.378173828125, -5.0311279296875, -4.68408203125, -4.3370361328125, -3.989990234375, -3.6429443359375, -3.2958984375, -2.9488525390625, -2.601806640625, -2.2547607421875, -1.90771484375, -1.5606689453125, -1.213623046875, -0.8665771484375, -0.51953125, -0.1724853515625, 0.174560546875, 0.5216064453125, 0.86865234375, 1.2156982421875, 1.562744140625, 1.9097900390625, 2.2568359375, 2.6038818359375, 2.950927734375, 3.2979736328125, 3.64501953125, 3.9920654296875, 4.339111328125, 4.6861572265625, 5.033203125, 5.3802490234375, 5.727294921875, 6.0743408203125, 6.42138671875, 6.7684326171875, 7.115478515625, 7.4625244140625, 7.8095703125, 8.1566162109375, 8.503662109375, 8.8507080078125, 9.19775390625, 9.5447998046875, 9.891845703125, 10.2388916015625, 10.5859375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 8.0, 15.0, 7.0, 12.0, 36.0, 41.0, 56.0, 92.0, 131.0, 168.0, 305.0, 479.0, 822.0, 1459.0, 3254.0, 8914.0, 34305.0, 204765.0, 676922.0, 87558.0, 18339.0, 5526.0, 2400.0, 1171.0, 664.0, 368.0, 238.0, 134.0, 101.0, 66.0, 53.0, 30.0, 23.0, 19.0, 20.0, 6.0, 10.0, 6.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.40625, -19.793212890625, -19.18017578125, -18.567138671875, -17.9541015625, -17.341064453125, -16.72802734375, -16.114990234375, -15.501953125, -14.888916015625, -14.27587890625, -13.662841796875, -13.0498046875, -12.436767578125, -11.82373046875, -11.210693359375, -10.59765625, -9.984619140625, -9.37158203125, -8.758544921875, -8.1455078125, -7.532470703125, -6.91943359375, -6.306396484375, -5.693359375, -5.080322265625, -4.46728515625, -3.854248046875, -3.2412109375, -2.628173828125, -2.01513671875, -1.402099609375, -0.7890625, -0.176025390625, 0.43701171875, 1.050048828125, 1.6630859375, 2.276123046875, 2.88916015625, 3.502197265625, 4.115234375, 4.728271484375, 5.34130859375, 5.954345703125, 6.5673828125, 7.180419921875, 7.79345703125, 8.406494140625, 9.01953125, 9.632568359375, 10.24560546875, 10.858642578125, 11.4716796875, 12.084716796875, 12.69775390625, 13.310791015625, 13.923828125, 14.536865234375, 15.14990234375, 15.762939453125, 16.3759765625, 16.989013671875, 17.60205078125, 18.215087890625, 18.828125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 7.0, 9.0, 13.0, 19.0, 17.0, 24.0, 31.0, 49.0, 40.0, 57.0, 64.0, 94.0, 159.0, 1766.0, 241.0, 99.0, 62.0, 47.0, 63.0, 35.0, 32.0, 38.0, 18.0, 18.0, 9.0, 13.0, 4.0, 6.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.625, -49.1201171875, -47.615234375, -46.1103515625, -44.60546875, -43.1005859375, -41.595703125, -40.0908203125, -38.5859375, -37.0810546875, -35.576171875, -34.0712890625, -32.56640625, -31.0615234375, -29.556640625, -28.0517578125, -26.546875, -25.0419921875, -23.537109375, -22.0322265625, -20.52734375, -19.0224609375, -17.517578125, -16.0126953125, -14.5078125, -13.0029296875, -11.498046875, -9.9931640625, -8.48828125, -6.9833984375, -5.478515625, -3.9736328125, -2.46875, -0.9638671875, 0.541015625, 2.0458984375, 3.55078125, 5.0556640625, 6.560546875, 8.0654296875, 9.5703125, 11.0751953125, 12.580078125, 14.0849609375, 15.58984375, 17.0947265625, 18.599609375, 20.1044921875, 21.609375, 23.1142578125, 24.619140625, 26.1240234375, 27.62890625, 29.1337890625, 30.638671875, 32.1435546875, 33.6484375, 35.1533203125, 36.658203125, 38.1630859375, 39.66796875, 41.1728515625, 42.677734375, 44.1826171875, 45.6875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 8.0, 6.0, 8.0, 11.0, 15.0, 17.0, 31.0, 29.0, 41.0, 58.0, 96.0, 143.0, 391.0, 1992.0, 38095.0, 3096755.0, 6454.0, 917.0, 233.0, 114.0, 77.0, 54.0, 46.0, 29.0, 18.0, 21.0, 10.0, 14.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.125, -127.76171875, -123.3984375, -119.03515625, -114.671875, -110.30859375, -105.9453125, -101.58203125, -97.21875, -92.85546875, -88.4921875, -84.12890625, -79.765625, -75.40234375, -71.0390625, -66.67578125, -62.3125, -57.94921875, -53.5859375, -49.22265625, -44.859375, -40.49609375, -36.1328125, -31.76953125, -27.40625, -23.04296875, -18.6796875, -14.31640625, -9.953125, -5.58984375, -1.2265625, 3.13671875, 7.5, 11.86328125, 16.2265625, 20.58984375, 24.953125, 29.31640625, 33.6796875, 38.04296875, 42.40625, 46.76953125, 51.1328125, 55.49609375, 59.859375, 64.22265625, 68.5859375, 72.94921875, 77.3125, 81.67578125, 86.0390625, 90.40234375, 94.765625, 99.12890625, 103.4921875, 107.85546875, 112.21875, 116.58203125, 120.9453125, 125.30859375, 129.671875, 134.03515625, 138.3984375, 142.76171875, 147.125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [9.0, 314.0, 672.0, 25.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.24610137939453, -14.97284984588623, -2.6995983123779297, 9.573654174804688, 21.846904754638672, 34.120155334472656, 46.393409729003906, 58.666656494140625, 70.93991088867188, 83.21316528320312, 95.48641204833984, 107.7596664428711, 120.03291320800781, 132.30616760253906, 144.5794219970703, 156.8526611328125, 169.12591552734375, 181.399169921875, 193.67242431640625, 205.9456787109375, 218.2189178466797, 230.49217224121094, 242.7654266357422, 255.03866577148438, 267.31195068359375, 279.585205078125, 291.85845947265625, 304.1317138671875, 316.40496826171875, 328.67822265625, 340.95147705078125, 353.2247009277344, 365.4979553222656, 377.7712097167969, 390.0444641113281, 402.3177185058594, 414.5909729003906, 426.86419677734375, 439.137451171875, 451.41070556640625, 463.6839599609375, 475.95721435546875, 488.23046875, 500.50372314453125, 512.7769775390625, 525.0502319335938, 537.323486328125, 549.5967407226562, 561.8699951171875, 574.1432495117188, 586.41650390625, 598.6897583007812, 610.9630126953125, 623.2362670898438, 635.509521484375, 647.7827758789062, 660.0559692382812, 672.3292236328125, 684.6024780273438, 696.875732421875, 709.1489868164062, 721.4222412109375, 733.6954956054688, 745.96875, 758.2420043945312]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 10.0, 8.0, 6.0, 15.0, 11.0, 18.0, 16.0, 14.0, 21.0, 20.0, 27.0, 26.0, 30.0, 30.0, 31.0, 41.0, 46.0, 46.0, 41.0, 33.0, 34.0, 41.0, 42.0, 41.0, 35.0, 32.0, 40.0, 31.0, 27.0, 23.0, 23.0, 28.0, 22.0, 15.0, 17.0, 8.0, 7.0, 6.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-115.62972259521484, -112.34939575195312, -109.0690689086914, -105.78874206542969, -102.50841522216797, -99.22808837890625, -95.94776153564453, -92.66743469238281, -89.3871078491211, -86.10678100585938, -82.82645416259766, -79.54612731933594, -76.26580047607422, -72.9854736328125, -69.70514678955078, -66.42481994628906, -63.14449691772461, -59.86417007446289, -56.58384323120117, -53.30351638793945, -50.023189544677734, -46.74286651611328, -43.46253967285156, -40.182212829589844, -36.901885986328125, -33.621559143066406, -30.341232299804688, -27.06090545654297, -23.78057861328125, -20.500253677368164, -17.219926834106445, -13.939599990844727, -10.659271240234375, -7.378944396972656, -4.098618030548096, -0.8182916641235352, 2.4620351791381836, 5.742361068725586, 9.022687911987305, 12.303014755249023, 15.583341598510742, 18.86366844177246, 22.14399528503418, 25.424320220947266, 28.704647064208984, 31.984973907470703, 35.26530075073242, 38.54562759399414, 41.82595443725586, 45.10628128051758, 48.3866081237793, 51.666934967041016, 54.947261810302734, 58.22758483886719, 61.507911682128906, 64.78823852539062, 68.06856536865234, 71.34889221191406, 74.62921905517578, 77.9095458984375, 81.18987274169922, 84.47019958496094, 87.75052642822266, 91.03085327148438, 94.3111801147461]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 10.0, 4.0, 4.0, 8.0, 8.0, 10.0, 6.0, 9.0, 22.0, 27.0, 35.0, 26.0, 26.0, 20.0, 27.0, 35.0, 32.0, 52.0, 53.0, 55.0, 52.0, 52.0, 49.0, 47.0, 43.0, 36.0, 42.0, 33.0, 39.0, 22.0, 22.0, 12.0, 8.0, 16.0, 13.0, 11.0, 11.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.28125, -11.892333984375, -11.50341796875, -11.114501953125, -10.7255859375, -10.336669921875, -9.94775390625, -9.558837890625, -9.169921875, -8.781005859375, -8.39208984375, -8.003173828125, -7.6142578125, -7.225341796875, -6.83642578125, -6.447509765625, -6.05859375, -5.669677734375, -5.28076171875, -4.891845703125, -4.5029296875, -4.114013671875, -3.72509765625, -3.336181640625, -2.947265625, -2.558349609375, -2.16943359375, -1.780517578125, -1.3916015625, -1.002685546875, -0.61376953125, -0.224853515625, 0.1640625, 0.552978515625, 0.94189453125, 1.330810546875, 1.7197265625, 2.108642578125, 2.49755859375, 2.886474609375, 3.275390625, 3.664306640625, 4.05322265625, 4.442138671875, 4.8310546875, 5.219970703125, 5.60888671875, 5.997802734375, 6.38671875, 6.775634765625, 7.16455078125, 7.553466796875, 7.9423828125, 8.331298828125, 8.72021484375, 9.109130859375, 9.498046875, 9.886962890625, 10.27587890625, 10.664794921875, 11.0537109375, 11.442626953125, 11.83154296875, 12.220458984375, 12.609375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 4.0, 9.0, 11.0, 17.0, 22.0, 35.0, 30.0, 53.0, 82.0, 135.0, 204.0, 352.0, 555.0, 1080.0, 2152.0, 4339.0, 10046.0, 26795.0, 86465.0, 319421.0, 1030901.0, 1597310.0, 789015.0, 226456.0, 62092.0, 20767.0, 8188.0, 3599.0, 1823.0, 904.0, 539.0, 293.0, 187.0, 124.0, 78.0, 50.0, 38.0, 33.0, 17.0, 21.0, 12.0, 10.0, 10.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.015625, -13.5826416015625, -13.149658203125, -12.7166748046875, -12.28369140625, -11.8507080078125, -11.417724609375, -10.9847412109375, -10.5517578125, -10.1187744140625, -9.685791015625, -9.2528076171875, -8.81982421875, -8.3868408203125, -7.953857421875, -7.5208740234375, -7.087890625, -6.6549072265625, -6.221923828125, -5.7889404296875, -5.35595703125, -4.9229736328125, -4.489990234375, -4.0570068359375, -3.6240234375, -3.1910400390625, -2.758056640625, -2.3250732421875, -1.89208984375, -1.4591064453125, -1.026123046875, -0.5931396484375, -0.16015625, 0.2728271484375, 0.705810546875, 1.1387939453125, 1.57177734375, 2.0047607421875, 2.437744140625, 2.8707275390625, 3.3037109375, 3.7366943359375, 4.169677734375, 4.6026611328125, 5.03564453125, 5.4686279296875, 5.901611328125, 6.3345947265625, 6.767578125, 7.2005615234375, 7.633544921875, 8.0665283203125, 8.49951171875, 8.9324951171875, 9.365478515625, 9.7984619140625, 10.2314453125, 10.6644287109375, 11.097412109375, 11.5303955078125, 11.96337890625, 12.3963623046875, 12.829345703125, 13.2623291015625, 13.6953125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 3.0, 5.0, 6.0, 7.0, 7.0, 10.0, 8.0, 19.0, 24.0, 37.0, 48.0, 56.0, 85.0, 77.0, 129.0, 161.0, 186.0, 254.0, 301.0, 358.0, 372.0, 347.0, 294.0, 244.0, 209.0, 160.0, 130.0, 120.0, 103.0, 67.0, 47.0, 41.0, 26.0, 28.0, 23.0, 23.0, 9.0, 15.0, 8.0, 7.0, 7.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.2109375, -14.6964111328125, -14.181884765625, -13.6673583984375, -13.15283203125, -12.6383056640625, -12.123779296875, -11.6092529296875, -11.0947265625, -10.5802001953125, -10.065673828125, -9.5511474609375, -9.03662109375, -8.5220947265625, -8.007568359375, -7.4930419921875, -6.978515625, -6.4639892578125, -5.949462890625, -5.4349365234375, -4.92041015625, -4.4058837890625, -3.891357421875, -3.3768310546875, -2.8623046875, -2.3477783203125, -1.833251953125, -1.3187255859375, -0.80419921875, -0.2896728515625, 0.224853515625, 0.7393798828125, 1.25390625, 1.7684326171875, 2.282958984375, 2.7974853515625, 3.31201171875, 3.8265380859375, 4.341064453125, 4.8555908203125, 5.3701171875, 5.8846435546875, 6.399169921875, 6.9136962890625, 7.42822265625, 7.9427490234375, 8.457275390625, 8.9718017578125, 9.486328125, 10.0008544921875, 10.515380859375, 11.0299072265625, 11.54443359375, 12.0589599609375, 12.573486328125, 13.0880126953125, 13.6025390625, 14.1170654296875, 14.631591796875, 15.1461181640625, 15.66064453125, 16.1751708984375, 16.689697265625, 17.2042236328125, 17.71875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 9.0, 7.0, 16.0, 9.0, 19.0, 25.0, 41.0, 37.0, 64.0, 73.0, 103.0, 136.0, 198.0, 253.0, 359.0, 619.0, 1697.0, 9251.0, 180093.0, 3673127.0, 311309.0, 12842.0, 2000.0, 683.0, 400.0, 225.0, 190.0, 115.0, 102.0, 75.0, 46.0, 38.0, 27.0, 25.0, 9.0, 19.0, 6.0, 7.0, 7.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-65.8125, -63.90869140625, -62.0048828125, -60.10107421875, -58.197265625, -56.29345703125, -54.3896484375, -52.48583984375, -50.58203125, -48.67822265625, -46.7744140625, -44.87060546875, -42.966796875, -41.06298828125, -39.1591796875, -37.25537109375, -35.3515625, -33.44775390625, -31.5439453125, -29.64013671875, -27.736328125, -25.83251953125, -23.9287109375, -22.02490234375, -20.12109375, -18.21728515625, -16.3134765625, -14.40966796875, -12.505859375, -10.60205078125, -8.6982421875, -6.79443359375, -4.890625, -2.98681640625, -1.0830078125, 0.82080078125, 2.724609375, 4.62841796875, 6.5322265625, 8.43603515625, 10.33984375, 12.24365234375, 14.1474609375, 16.05126953125, 17.955078125, 19.85888671875, 21.7626953125, 23.66650390625, 25.5703125, 27.47412109375, 29.3779296875, 31.28173828125, 33.185546875, 35.08935546875, 36.9931640625, 38.89697265625, 40.80078125, 42.70458984375, 44.6083984375, 46.51220703125, 48.416015625, 50.31982421875, 52.2236328125, 54.12744140625, 56.03125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 11.0, 30.0, 52.0, 95.0, 133.0, 136.0, 185.0, 118.0, 115.0, 65.0, 22.0, 15.0, 14.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.8058090209961, -112.04943084716797, -108.29306030273438, -104.53668212890625, -100.78030395507812, -97.02393341064453, -93.2675552368164, -89.51118469238281, -85.75480651855469, -81.99842834472656, -78.24205780029297, -74.48567962646484, -70.72930908203125, -66.97293090820312, -63.216552734375, -59.46017837524414, -55.70380401611328, -51.94742965698242, -48.19105529785156, -44.43467712402344, -40.67830276489258, -36.92192840576172, -33.165550231933594, -29.409175872802734, -25.652801513671875, -21.896427154541016, -18.140050888061523, -14.383675575256348, -10.627300262451172, -6.8709259033203125, -3.1145496368408203, 0.6418266296386719, 4.398193359375, 8.154568672180176, 11.910943984985352, 15.667319297790527, 19.423694610595703, 23.180068969726562, 26.936445236206055, 30.692821502685547, 34.449195861816406, 38.205570220947266, 41.961944580078125, 45.71832275390625, 49.47469711303711, 53.23107147216797, 56.987449645996094, 60.74382400512695, 64.50019836425781, 68.25657653808594, 72.01294708251953, 75.76932525634766, 79.52569580078125, 83.28207397460938, 87.0384521484375, 90.79483032226562, 94.55120086669922, 98.30757904052734, 102.06394958496094, 105.82032775878906, 109.57670593261719, 113.33307647705078, 117.0894546508789, 120.8458251953125, 124.60220336914062]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 2.0, 3.0, 4.0, 6.0, 6.0, 16.0, 12.0, 19.0, 13.0, 29.0, 19.0, 24.0, 38.0, 30.0, 25.0, 31.0, 41.0, 39.0, 39.0, 32.0, 55.0, 55.0, 22.0, 38.0, 41.0, 31.0, 31.0, 28.0, 26.0, 35.0, 28.0, 23.0, 23.0, 20.0, 18.0, 16.0, 15.0, 15.0, 11.0, 10.0, 7.0, 9.0, 6.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.02471923828125, -61.943668365478516, -59.86261749267578, -57.78157043457031, -55.70051956176758, -53.619468688964844, -51.538421630859375, -49.45737075805664, -47.376319885253906, -45.29526901245117, -43.21421813964844, -41.13317108154297, -39.052120208740234, -36.9710693359375, -34.89002227783203, -32.8089714050293, -30.727920532226562, -28.646869659423828, -26.565820693969727, -24.484771728515625, -22.40372085571289, -20.322669982910156, -18.241621017456055, -16.160572052001953, -14.079521179199219, -11.9984712600708, -9.917421340942383, -7.836371421813965, -5.755321502685547, -3.674271583557129, -1.593221664428711, 0.48782825469970703, 2.568878173828125, 4.649928092956543, 6.730978012084961, 8.812027931213379, 10.893077850341797, 12.974127769470215, 15.055177688598633, 17.136226654052734, 19.21727752685547, 21.298328399658203, 23.379377365112305, 25.460426330566406, 27.54147720336914, 29.622528076171875, 31.703577041625977, 33.78462600708008, 35.86567687988281, 37.94672775268555, 40.02777862548828, 42.10882568359375, 44.189876556396484, 46.27092742919922, 48.35197448730469, 50.43302536010742, 52.514076232910156, 54.59512710571289, 56.676177978515625, 58.757225036621094, 60.83827590942383, 62.91932678222656, 65.00037384033203, 67.08142852783203, 69.1624755859375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 11.0, 13.0, 7.0, 15.0, 17.0, 21.0, 17.0, 28.0, 16.0, 24.0, 30.0, 31.0, 49.0, 37.0, 36.0, 46.0, 43.0, 43.0, 55.0, 43.0, 47.0, 59.0, 32.0, 41.0, 29.0, 33.0, 29.0, 31.0, 17.0, 16.0, 17.0, 18.0, 9.0, 8.0, 8.0, 5.0, 9.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.1484375, -11.769775390625, -11.39111328125, -11.012451171875, -10.6337890625, -10.255126953125, -9.87646484375, -9.497802734375, -9.119140625, -8.740478515625, -8.36181640625, -7.983154296875, -7.6044921875, -7.225830078125, -6.84716796875, -6.468505859375, -6.08984375, -5.711181640625, -5.33251953125, -4.953857421875, -4.5751953125, -4.196533203125, -3.81787109375, -3.439208984375, -3.060546875, -2.681884765625, -2.30322265625, -1.924560546875, -1.5458984375, -1.167236328125, -0.78857421875, -0.409912109375, -0.03125, 0.347412109375, 0.72607421875, 1.104736328125, 1.4833984375, 1.862060546875, 2.24072265625, 2.619384765625, 2.998046875, 3.376708984375, 3.75537109375, 4.134033203125, 4.5126953125, 4.891357421875, 5.27001953125, 5.648681640625, 6.02734375, 6.406005859375, 6.78466796875, 7.163330078125, 7.5419921875, 7.920654296875, 8.29931640625, 8.677978515625, 9.056640625, 9.435302734375, 9.81396484375, 10.192626953125, 10.5712890625, 10.949951171875, 11.32861328125, 11.707275390625, 12.0859375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 10.0, 16.0, 23.0, 25.0, 40.0, 76.0, 111.0, 142.0, 196.0, 327.0, 487.0, 704.0, 1034.0, 1682.0, 2538.0, 3871.0, 6312.0, 9809.0, 15934.0, 26444.0, 45132.0, 79603.0, 135568.0, 201999.0, 198111.0, 130707.0, 76568.0, 43686.0, 25388.0, 15491.0, 9490.0, 6021.0, 3784.0, 2487.0, 1496.0, 1059.0, 751.0, 488.0, 285.0, 221.0, 140.0, 102.0, 55.0, 45.0, 39.0, 17.0, 12.0, 12.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2568359375, -1.21624755859375, -1.1756591796875, -1.13507080078125, -1.094482421875, -1.05389404296875, -1.0133056640625, -0.97271728515625, -0.93212890625, -0.89154052734375, -0.8509521484375, -0.81036376953125, -0.769775390625, -0.72918701171875, -0.6885986328125, -0.64801025390625, -0.607421875, -0.56683349609375, -0.5262451171875, -0.48565673828125, -0.445068359375, -0.40447998046875, -0.3638916015625, -0.32330322265625, -0.28271484375, -0.24212646484375, -0.2015380859375, -0.16094970703125, -0.120361328125, -0.07977294921875, -0.0391845703125, 0.00140380859375, 0.0419921875, 0.08258056640625, 0.1231689453125, 0.16375732421875, 0.204345703125, 0.24493408203125, 0.2855224609375, 0.32611083984375, 0.36669921875, 0.40728759765625, 0.4478759765625, 0.48846435546875, 0.529052734375, 0.56964111328125, 0.6102294921875, 0.65081787109375, 0.69140625, 0.73199462890625, 0.7725830078125, 0.81317138671875, 0.853759765625, 0.89434814453125, 0.9349365234375, 0.97552490234375, 1.01611328125, 1.05670166015625, 1.0972900390625, 1.13787841796875, 1.178466796875, 1.21905517578125, 1.2596435546875, 1.30023193359375, 1.3408203125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 11.0, 10.0, 10.0, 11.0, 11.0, 21.0, 13.0, 19.0, 25.0, 26.0, 26.0, 27.0, 18.0, 33.0, 26.0, 39.0, 45.0, 34.0, 37.0, 39.0, 1061.0, 36.0, 32.0, 27.0, 45.0, 37.0, 22.0, 19.0, 41.0, 28.0, 29.0, 24.0, 21.0, 17.0, 17.0, 11.0, 19.0, 15.0, 7.0, 8.0, 2.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-6.859375, -6.65045166015625, -6.4415283203125, -6.23260498046875, -6.023681640625, -5.81475830078125, -5.6058349609375, -5.39691162109375, -5.18798828125, -4.97906494140625, -4.7701416015625, -4.56121826171875, -4.352294921875, -4.14337158203125, -3.9344482421875, -3.72552490234375, -3.5166015625, -3.30767822265625, -3.0987548828125, -2.88983154296875, -2.680908203125, -2.47198486328125, -2.2630615234375, -2.05413818359375, -1.84521484375, -1.63629150390625, -1.4273681640625, -1.21844482421875, -1.009521484375, -0.80059814453125, -0.5916748046875, -0.38275146484375, -0.173828125, 0.03509521484375, 0.2440185546875, 0.45294189453125, 0.661865234375, 0.87078857421875, 1.0797119140625, 1.28863525390625, 1.49755859375, 1.70648193359375, 1.9154052734375, 2.12432861328125, 2.333251953125, 2.54217529296875, 2.7510986328125, 2.96002197265625, 3.1689453125, 3.37786865234375, 3.5867919921875, 3.79571533203125, 4.004638671875, 4.21356201171875, 4.4224853515625, 4.63140869140625, 4.84033203125, 5.04925537109375, 5.2581787109375, 5.46710205078125, 5.676025390625, 5.88494873046875, 6.0938720703125, 6.30279541015625, 6.51171875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 7.0, 16.0, 26.0, 31.0, 36.0, 70.0, 108.0, 168.0, 221.0, 342.0, 540.0, 751.0, 1093.0, 1718.0, 2676.0, 3958.0, 6020.0, 9373.0, 14403.0, 22479.0, 34833.0, 53933.0, 81219.0, 117318.0, 254829.0, 1100243.0, 128924.0, 90416.0, 60555.0, 39131.0, 25249.0, 16050.0, 10469.0, 6771.0, 4592.0, 2847.0, 1852.0, 1270.0, 878.0, 592.0, 379.0, 270.0, 160.0, 98.0, 68.0, 41.0, 39.0, 18.0, 16.0, 21.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.7607421875, -0.7377853393554688, -0.7148284912109375, -0.6918716430664062, -0.668914794921875, -0.6459579467773438, -0.6230010986328125, -0.6000442504882812, -0.57708740234375, -0.5541305541992188, -0.5311737060546875, -0.5082168579101562, -0.485260009765625, -0.46230316162109375, -0.4393463134765625, -0.41638946533203125, -0.3934326171875, -0.37047576904296875, -0.3475189208984375, -0.32456207275390625, -0.301605224609375, -0.27864837646484375, -0.2556915283203125, -0.23273468017578125, -0.20977783203125, -0.18682098388671875, -0.1638641357421875, -0.14090728759765625, -0.117950439453125, -0.09499359130859375, -0.0720367431640625, -0.04907989501953125, -0.026123046875, -0.00316619873046875, 0.0197906494140625, 0.04274749755859375, 0.065704345703125, 0.08866119384765625, 0.1116180419921875, 0.13457489013671875, 0.15753173828125, 0.18048858642578125, 0.2034454345703125, 0.22640228271484375, 0.249359130859375, 0.27231597900390625, 0.2952728271484375, 0.31822967529296875, 0.3411865234375, 0.36414337158203125, 0.3871002197265625, 0.41005706787109375, 0.433013916015625, 0.45597076416015625, 0.4789276123046875, 0.5018844604492188, 0.52484130859375, 0.5477981567382812, 0.5707550048828125, 0.5937118530273438, 0.616668701171875, 0.6396255493164062, 0.6625823974609375, 0.6855392456054688, 0.70849609375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 8.0, 3.0, 16.0, 14.0, 15.0, 12.0, 17.0, 18.0, 17.0, 31.0, 26.0, 35.0, 43.0, 46.0, 62.0, 59.0, 75.0, 70.0, 75.0, 39.0, 51.0, 34.0, 34.0, 36.0, 33.0, 18.0, 14.0, 21.0, 9.0, 9.0, 10.0, 4.0, 5.0, 6.0, 5.0, 4.0, 3.0, 9.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0294647216796875, -0.028639554977416992, -0.027814388275146484, -0.026989221572875977, -0.02616405487060547, -0.02533888816833496, -0.024513721466064453, -0.023688554763793945, -0.022863388061523438, -0.02203822135925293, -0.021213054656982422, -0.020387887954711914, -0.019562721252441406, -0.0187375545501709, -0.01791238784790039, -0.017087221145629883, -0.016262054443359375, -0.015436887741088867, -0.01461172103881836, -0.013786554336547852, -0.012961387634277344, -0.012136220932006836, -0.011311054229736328, -0.01048588752746582, -0.009660720825195312, -0.008835554122924805, -0.008010387420654297, -0.007185220718383789, -0.006360054016113281, -0.0055348873138427734, -0.004709720611572266, -0.003884553909301758, -0.00305938720703125, -0.002234220504760742, -0.0014090538024902344, -0.0005838871002197266, 0.00024127960205078125, 0.001066446304321289, 0.0018916130065917969, 0.0027167797088623047, 0.0035419464111328125, 0.00436711311340332, 0.005192279815673828, 0.006017446517944336, 0.006842613220214844, 0.0076677799224853516, 0.00849294662475586, 0.009318113327026367, 0.010143280029296875, 0.010968446731567383, 0.01179361343383789, 0.012618780136108398, 0.013443946838378906, 0.014269113540649414, 0.015094280242919922, 0.01591944694519043, 0.016744613647460938, 0.017569780349731445, 0.018394947052001953, 0.01922011375427246, 0.02004528045654297, 0.020870447158813477, 0.021695613861083984, 0.022520780563354492, 0.023345947265625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 3.0, 6.0, 4.0, 3.0, 4.0, 6.0, 6.0, 4.0, 15.0, 7.0, 13.0, 22.0, 25.0, 36.0, 40.0, 51.0, 62.0, 78.0, 118.0, 245.0, 479.0, 7937.0, 1034746.0, 3517.0, 457.0, 194.0, 112.0, 79.0, 50.0, 55.0, 40.0, 18.0, 30.0, 15.0, 11.0, 20.0, 12.0, 8.0, 9.0, 8.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.556640625, -0.5370635986328125, -0.517486572265625, -0.4979095458984375, -0.47833251953125, -0.4587554931640625, -0.439178466796875, -0.4196014404296875, -0.4000244140625, -0.3804473876953125, -0.360870361328125, -0.3412933349609375, -0.32171630859375, -0.3021392822265625, -0.282562255859375, -0.2629852294921875, -0.243408203125, -0.2238311767578125, -0.204254150390625, -0.1846771240234375, -0.16510009765625, -0.1455230712890625, -0.125946044921875, -0.1063690185546875, -0.0867919921875, -0.0672149658203125, -0.047637939453125, -0.0280609130859375, -0.00848388671875, 0.0110931396484375, 0.030670166015625, 0.0502471923828125, 0.06982421875, 0.0894012451171875, 0.108978271484375, 0.1285552978515625, 0.14813232421875, 0.1677093505859375, 0.187286376953125, 0.2068634033203125, 0.2264404296875, 0.2460174560546875, 0.265594482421875, 0.2851715087890625, 0.30474853515625, 0.3243255615234375, 0.343902587890625, 0.3634796142578125, 0.383056640625, 0.4026336669921875, 0.422210693359375, 0.4417877197265625, 0.46136474609375, 0.4809417724609375, 0.500518798828125, 0.5200958251953125, 0.5396728515625, 0.5592498779296875, 0.578826904296875, 0.5984039306640625, 0.61798095703125, 0.6375579833984375, 0.657135009765625, 0.6767120361328125, 0.6962890625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 118.0, 892.0, 3.0, 0.0, 1.0], "bins": [-0.87105393409729, -0.8566151261329651, -0.8421763181686401, -0.8277375102043152, -0.813298761844635, -0.7988599538803101, -0.7844211459159851, -0.7699823379516602, -0.7555435299873352, -0.7411047220230103, -0.7266659140586853, -0.7122271060943604, -0.6977883577346802, -0.6833495497703552, -0.6689107418060303, -0.6544719338417053, -0.6400331258773804, -0.6255943179130554, -0.6111555099487305, -0.5967167019844055, -0.5822779536247253, -0.5678391456604004, -0.5534003376960754, -0.5389615297317505, -0.5245227217674255, -0.5100839138031006, -0.495645135641098, -0.48120632767677307, -0.4667675197124481, -0.45232874155044556, -0.4378899335861206, -0.42345112562179565, -0.4090123176574707, -0.39457350969314575, -0.3801347315311432, -0.36569592356681824, -0.3512571156024933, -0.3368183374404907, -0.32237952947616577, -0.3079407215118408, -0.29350194334983826, -0.2790631353855133, -0.26462435722351074, -0.2501855492591858, -0.23574674129486084, -0.22130794823169708, -0.20686915516853333, -0.19243034720420837, -0.17799153923988342, -0.16355274617671967, -0.14911393821239471, -0.13467514514923096, -0.120236337184906, -0.10579754412174225, -0.0913587436079979, -0.07691994309425354, -0.062481142580509186, -0.04804234206676483, -0.03360354155302048, -0.01916474476456642, -0.004725944250822067, 0.009712852537631989, 0.024151653051376343, 0.0385904535651207, 0.05302925407886505]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 8.0, 15.0, 15.0, 23.0, 21.0, 28.0, 36.0, 28.0, 35.0, 36.0, 41.0, 28.0, 46.0, 37.0, 57.0, 50.0, 44.0, 52.0, 47.0, 37.0, 40.0, 38.0, 30.0, 36.0, 34.0, 24.0, 22.0, 14.0, 13.0, 10.0, 8.0, 9.0, 5.0, 8.0, 0.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.041173458099365234, -0.03997927904129028, -0.03878509998321533, -0.03759091719985008, -0.03639673814177513, -0.03520255908370018, -0.03400837630033493, -0.03281419724225998, -0.03162001818418503, -0.030425839126110077, -0.029231658205389977, -0.028037477284669876, -0.026843298226594925, -0.025649119168519974, -0.024454938247799873, -0.023260757327079773, -0.022066578269004822, -0.02087239921092987, -0.01967821829020977, -0.01848403736948967, -0.01728985831141472, -0.016095679253339767, -0.014901498332619667, -0.013707318343222141, -0.012513138353824615, -0.01131895836442709, -0.010124778375029564, -0.008930598385632038, -0.007736418396234512, -0.0065422384068369865, -0.005348058417439461, -0.004153878428041935, -0.002959698438644409, -0.0017655184492468834, -0.0005713384598493576, 0.0006228415295481682, 0.001817021518945694, 0.0030112015083432198, 0.0042053814977407455, 0.005399561487138271, 0.006593741476535797, 0.007787921465933323, 0.008982101455330849, 0.010176281444728374, 0.0113704614341259, 0.012564641423523426, 0.013758821412920952, 0.014953001402318478, 0.016147181391716003, 0.017341360449790955, 0.018535541370511055, 0.019729722291231155, 0.020923901349306107, 0.022118080407381058, 0.023312261328101158, 0.02450644224882126, 0.02570062130689621, 0.02689480036497116, 0.02808898128569126, 0.02928316220641136, 0.030477341264486313, 0.031671520322561264, 0.032865703105926514, 0.034059882164001465, 0.035254061222076416]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 11.0, 13.0, 7.0, 15.0, 17.0, 21.0, 17.0, 28.0, 16.0, 24.0, 29.0, 32.0, 50.0, 36.0, 35.0, 47.0, 43.0, 42.0, 55.0, 44.0, 47.0, 59.0, 31.0, 42.0, 29.0, 33.0, 30.0, 30.0, 17.0, 16.0, 17.0, 18.0, 9.0, 8.0, 8.0, 5.0, 9.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.1484375, -11.769775390625, -11.39111328125, -11.012451171875, -10.6337890625, -10.255126953125, -9.87646484375, -9.497802734375, -9.119140625, -8.740478515625, -8.36181640625, -7.983154296875, -7.6044921875, -7.225830078125, -6.84716796875, -6.468505859375, -6.08984375, -5.711181640625, -5.33251953125, -4.953857421875, -4.5751953125, -4.196533203125, -3.81787109375, -3.439208984375, -3.060546875, -2.681884765625, -2.30322265625, -1.924560546875, -1.5458984375, -1.167236328125, -0.78857421875, -0.409912109375, -0.03125, 0.347412109375, 0.72607421875, 1.104736328125, 1.4833984375, 1.862060546875, 2.24072265625, 2.619384765625, 2.998046875, 3.376708984375, 3.75537109375, 4.134033203125, 4.5126953125, 4.891357421875, 5.27001953125, 5.648681640625, 6.02734375, 6.406005859375, 6.78466796875, 7.163330078125, 7.5419921875, 7.920654296875, 8.29931640625, 8.677978515625, 9.056640625, 9.435302734375, 9.81396484375, 10.192626953125, 10.5712890625, 10.949951171875, 11.32861328125, 11.707275390625, 12.0859375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 11.0, 8.0, 14.0, 10.0, 20.0, 48.0, 68.0, 89.0, 171.0, 283.0, 493.0, 981.0, 1822.0, 3735.0, 7717.0, 16869.0, 40856.0, 110091.0, 334879.0, 343105.0, 112782.0, 41460.0, 17236.0, 7957.0, 3712.0, 1911.0, 1020.0, 512.0, 259.0, 161.0, 102.0, 48.0, 41.0, 20.0, 16.0, 11.0, 14.0, 6.0, 10.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.046875, -10.7017822265625, -10.356689453125, -10.0115966796875, -9.66650390625, -9.3214111328125, -8.976318359375, -8.6312255859375, -8.2861328125, -7.9410400390625, -7.595947265625, -7.2508544921875, -6.90576171875, -6.5606689453125, -6.215576171875, -5.8704833984375, -5.525390625, -5.1802978515625, -4.835205078125, -4.4901123046875, -4.14501953125, -3.7999267578125, -3.454833984375, -3.1097412109375, -2.7646484375, -2.4195556640625, -2.074462890625, -1.7293701171875, -1.38427734375, -1.0391845703125, -0.694091796875, -0.3489990234375, -0.00390625, 0.3411865234375, 0.686279296875, 1.0313720703125, 1.37646484375, 1.7215576171875, 2.066650390625, 2.4117431640625, 2.7568359375, 3.1019287109375, 3.447021484375, 3.7921142578125, 4.13720703125, 4.4822998046875, 4.827392578125, 5.1724853515625, 5.517578125, 5.8626708984375, 6.207763671875, 6.5528564453125, 6.89794921875, 7.2430419921875, 7.588134765625, 7.9332275390625, 8.2783203125, 8.6234130859375, 8.968505859375, 9.3135986328125, 9.65869140625, 10.0037841796875, 10.348876953125, 10.6939697265625, 11.0390625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 11.0, 17.0, 7.0, 11.0, 16.0, 20.0, 16.0, 21.0, 21.0, 33.0, 26.0, 38.0, 52.0, 39.0, 64.0, 71.0, 99.0, 234.0, 1466.0, 253.0, 82.0, 62.0, 37.0, 43.0, 36.0, 33.0, 27.0, 32.0, 34.0, 22.0, 27.0, 17.0, 15.0, 13.0, 9.0, 8.0, 5.0, 8.0, 7.0, 3.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.25, -33.1953125, -32.140625, -31.0859375, -30.03125, -28.9765625, -27.921875, -26.8671875, -25.8125, -24.7578125, -23.703125, -22.6484375, -21.59375, -20.5390625, -19.484375, -18.4296875, -17.375, -16.3203125, -15.265625, -14.2109375, -13.15625, -12.1015625, -11.046875, -9.9921875, -8.9375, -7.8828125, -6.828125, -5.7734375, -4.71875, -3.6640625, -2.609375, -1.5546875, -0.5, 0.5546875, 1.609375, 2.6640625, 3.71875, 4.7734375, 5.828125, 6.8828125, 7.9375, 8.9921875, 10.046875, 11.1015625, 12.15625, 13.2109375, 14.265625, 15.3203125, 16.375, 17.4296875, 18.484375, 19.5390625, 20.59375, 21.6484375, 22.703125, 23.7578125, 24.8125, 25.8671875, 26.921875, 27.9765625, 29.03125, 30.0859375, 31.140625, 32.1953125, 33.25]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 11.0, 3.0, 9.0, 9.0, 14.0, 14.0, 15.0, 22.0, 42.0, 54.0, 55.0, 81.0, 82.0, 111.0, 150.0, 202.0, 324.0, 811.0, 4702.0, 129647.0, 2965835.0, 39046.0, 2685.0, 669.0, 313.0, 193.0, 147.0, 100.0, 94.0, 65.0, 46.0, 28.0, 32.0, 19.0, 22.0, 13.0, 13.0, 8.0, 7.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-61.5625, -59.66015625, -57.7578125, -55.85546875, -53.953125, -52.05078125, -50.1484375, -48.24609375, -46.34375, -44.44140625, -42.5390625, -40.63671875, -38.734375, -36.83203125, -34.9296875, -33.02734375, -31.125, -29.22265625, -27.3203125, -25.41796875, -23.515625, -21.61328125, -19.7109375, -17.80859375, -15.90625, -14.00390625, -12.1015625, -10.19921875, -8.296875, -6.39453125, -4.4921875, -2.58984375, -0.6875, 1.21484375, 3.1171875, 5.01953125, 6.921875, 8.82421875, 10.7265625, 12.62890625, 14.53125, 16.43359375, 18.3359375, 20.23828125, 22.140625, 24.04296875, 25.9453125, 27.84765625, 29.75, 31.65234375, 33.5546875, 35.45703125, 37.359375, 39.26171875, 41.1640625, 43.06640625, 44.96875, 46.87109375, 48.7734375, 50.67578125, 52.578125, 54.48046875, 56.3828125, 58.28515625, 60.1875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 275.0, 713.0, 29.0], "bins": [-778.1177368164062, -765.5999755859375, -753.0822143554688, -740.564453125, -728.0467529296875, -715.5289916992188, -703.01123046875, -690.4934692382812, -677.9757080078125, -665.4579467773438, -652.940185546875, -640.4224243164062, -627.9047241210938, -615.386962890625, -602.8692016601562, -590.3514404296875, -577.8336791992188, -565.31591796875, -552.7981567382812, -540.2803955078125, -527.7626953125, -515.2449340820312, -502.7271728515625, -490.20941162109375, -477.6916809082031, -465.1739196777344, -452.65618896484375, -440.138427734375, -427.62066650390625, -415.1029052734375, -402.5851745605469, -390.0674133300781, -377.5496826171875, -365.03192138671875, -352.5141906738281, -339.9964294433594, -327.4786682128906, -314.9609069824219, -302.44317626953125, -289.9254150390625, -277.40765380859375, -264.889892578125, -252.3721466064453, -239.85440063476562, -227.33663940429688, -214.8188934326172, -202.3011474609375, -189.78338623046875, -177.265625, -164.7478790283203, -152.23011779785156, -139.71237182617188, -127.19461059570312, -114.67686462402344, -102.15911102294922, -89.641357421875, -77.12360382080078, -64.60585021972656, -52.088096618652344, -39.57034683227539, -27.052593231201172, -14.534839630126953, -2.01708984375, 10.500663757324219, 23.018417358398438]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 9.0, 9.0, 21.0, 13.0, 21.0, 21.0, 21.0, 28.0, 22.0, 25.0, 29.0, 38.0, 40.0, 31.0, 38.0, 38.0, 40.0, 48.0, 31.0, 45.0, 43.0, 37.0, 42.0, 26.0, 32.0, 29.0, 25.0, 34.0, 22.0, 27.0, 15.0, 15.0, 12.0, 10.0, 14.0, 4.0, 5.0, 6.0, 3.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.95528411865234, -71.37560272216797, -68.79592895507812, -66.21624755859375, -63.636566162109375, -61.056888580322266, -58.477210998535156, -55.89752960205078, -53.31785202026367, -50.73817443847656, -48.15849304199219, -45.57881546020508, -42.99913787841797, -40.419456481933594, -37.839778900146484, -35.260101318359375, -32.680419921875, -30.100740432739258, -27.521060943603516, -24.941383361816406, -22.361703872680664, -19.782024383544922, -17.202346801757812, -14.62266731262207, -12.042987823486328, -9.463308334350586, -6.88362979888916, -4.303950786590576, -1.7242717742919922, 0.85540771484375, 3.435086250305176, 6.014764785766602, 8.594436645507812, 11.174116134643555, 13.75379467010498, 16.333473205566406, 18.91315269470215, 21.49283218383789, 24.072509765625, 26.652189254760742, 29.231868743896484, 31.811548233032227, 34.39122772216797, 36.97090530395508, 39.55058288574219, 42.13026428222656, 44.70994186401367, 47.28961944580078, 49.869300842285156, 52.448978424072266, 55.02865982055664, 57.60833740234375, 60.188018798828125, 62.767696380615234, 65.34737396240234, 67.92705535888672, 70.50672912597656, 73.08641052246094, 75.66608428955078, 78.24576568603516, 80.82544708251953, 83.40512084960938, 85.98480224609375, 88.56448364257812, 91.1441650390625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 10.0, 8.0, 14.0, 17.0, 14.0, 21.0, 16.0, 25.0, 21.0, 27.0, 27.0, 29.0, 33.0, 44.0, 48.0, 33.0, 49.0, 44.0, 53.0, 47.0, 51.0, 48.0, 42.0, 35.0, 29.0, 40.0, 32.0, 17.0, 19.0, 21.0, 14.0, 15.0, 11.0, 12.0, 6.0, 9.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.6328125, -11.2457275390625, -10.858642578125, -10.4715576171875, -10.08447265625, -9.6973876953125, -9.310302734375, -8.9232177734375, -8.5361328125, -8.1490478515625, -7.761962890625, -7.3748779296875, -6.98779296875, -6.6007080078125, -6.213623046875, -5.8265380859375, -5.439453125, -5.0523681640625, -4.665283203125, -4.2781982421875, -3.89111328125, -3.5040283203125, -3.116943359375, -2.7298583984375, -2.3427734375, -1.9556884765625, -1.568603515625, -1.1815185546875, -0.79443359375, -0.4073486328125, -0.020263671875, 0.3668212890625, 0.75390625, 1.1409912109375, 1.528076171875, 1.9151611328125, 2.30224609375, 2.6893310546875, 3.076416015625, 3.4635009765625, 3.8505859375, 4.2376708984375, 4.624755859375, 5.0118408203125, 5.39892578125, 5.7860107421875, 6.173095703125, 6.5601806640625, 6.947265625, 7.3343505859375, 7.721435546875, 8.1085205078125, 8.49560546875, 8.8826904296875, 9.269775390625, 9.6568603515625, 10.0439453125, 10.4310302734375, 10.818115234375, 11.2052001953125, 11.59228515625, 11.9793701171875, 12.366455078125, 12.7535400390625, 13.140625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 5.0, 6.0, 12.0, 15.0, 15.0, 27.0, 29.0, 33.0, 47.0, 61.0, 95.0, 94.0, 148.0, 274.0, 599.0, 1722.0, 6874.0, 38566.0, 363243.0, 2797112.0, 893892.0, 74747.0, 12105.0, 2686.0, 824.0, 338.0, 167.0, 134.0, 95.0, 75.0, 60.0, 38.0, 34.0, 23.0, 23.0, 16.0, 8.0, 11.0, 10.0, 4.0, 1.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.65625, -23.76513671875, -22.8740234375, -21.98291015625, -21.091796875, -20.20068359375, -19.3095703125, -18.41845703125, -17.52734375, -16.63623046875, -15.7451171875, -14.85400390625, -13.962890625, -13.07177734375, -12.1806640625, -11.28955078125, -10.3984375, -9.50732421875, -8.6162109375, -7.72509765625, -6.833984375, -5.94287109375, -5.0517578125, -4.16064453125, -3.26953125, -2.37841796875, -1.4873046875, -0.59619140625, 0.294921875, 1.18603515625, 2.0771484375, 2.96826171875, 3.859375, 4.75048828125, 5.6416015625, 6.53271484375, 7.423828125, 8.31494140625, 9.2060546875, 10.09716796875, 10.98828125, 11.87939453125, 12.7705078125, 13.66162109375, 14.552734375, 15.44384765625, 16.3349609375, 17.22607421875, 18.1171875, 19.00830078125, 19.8994140625, 20.79052734375, 21.681640625, 22.57275390625, 23.4638671875, 24.35498046875, 25.24609375, 26.13720703125, 27.0283203125, 27.91943359375, 28.810546875, 29.70166015625, 30.5927734375, 31.48388671875, 32.375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 7.0, 19.0, 31.0, 31.0, 37.0, 66.0, 59.0, 96.0, 122.0, 166.0, 213.0, 278.0, 438.0, 443.0, 478.0, 368.0, 301.0, 230.0, 185.0, 112.0, 106.0, 61.0, 50.0, 40.0, 29.0, 22.0, 9.0, 14.0, 8.0, 5.0, 7.0, 2.0, 3.0, 1.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.516845703125, -18.90869140625, -18.300537109375, -17.6923828125, -17.084228515625, -16.47607421875, -15.867919921875, -15.259765625, -14.651611328125, -14.04345703125, -13.435302734375, -12.8271484375, -12.218994140625, -11.61083984375, -11.002685546875, -10.39453125, -9.786376953125, -9.17822265625, -8.570068359375, -7.9619140625, -7.353759765625, -6.74560546875, -6.137451171875, -5.529296875, -4.921142578125, -4.31298828125, -3.704833984375, -3.0966796875, -2.488525390625, -1.88037109375, -1.272216796875, -0.6640625, -0.055908203125, 0.55224609375, 1.160400390625, 1.7685546875, 2.376708984375, 2.98486328125, 3.593017578125, 4.201171875, 4.809326171875, 5.41748046875, 6.025634765625, 6.6337890625, 7.241943359375, 7.85009765625, 8.458251953125, 9.06640625, 9.674560546875, 10.28271484375, 10.890869140625, 11.4990234375, 12.107177734375, 12.71533203125, 13.323486328125, 13.931640625, 14.539794921875, 15.14794921875, 15.756103515625, 16.3642578125, 16.972412109375, 17.58056640625, 18.188720703125, 18.796875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 5.0, 13.0, 9.0, 11.0, 24.0, 17.0, 33.0, 53.0, 42.0, 72.0, 95.0, 115.0, 159.0, 227.0, 378.0, 816.0, 2395.0, 12569.0, 178782.0, 3562405.0, 409305.0, 20872.0, 3354.0, 1030.0, 455.0, 262.0, 164.0, 157.0, 96.0, 80.0, 78.0, 57.0, 40.0, 20.0, 19.0, 11.0, 9.0, 10.0, 14.0, 4.0, 6.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.3125, -61.42919921875, -59.5458984375, -57.66259765625, -55.779296875, -53.89599609375, -52.0126953125, -50.12939453125, -48.24609375, -46.36279296875, -44.4794921875, -42.59619140625, -40.712890625, -38.82958984375, -36.9462890625, -35.06298828125, -33.1796875, -31.29638671875, -29.4130859375, -27.52978515625, -25.646484375, -23.76318359375, -21.8798828125, -19.99658203125, -18.11328125, -16.22998046875, -14.3466796875, -12.46337890625, -10.580078125, -8.69677734375, -6.8134765625, -4.93017578125, -3.046875, -1.16357421875, 0.7197265625, 2.60302734375, 4.486328125, 6.36962890625, 8.2529296875, 10.13623046875, 12.01953125, 13.90283203125, 15.7861328125, 17.66943359375, 19.552734375, 21.43603515625, 23.3193359375, 25.20263671875, 27.0859375, 28.96923828125, 30.8525390625, 32.73583984375, 34.619140625, 36.50244140625, 38.3857421875, 40.26904296875, 42.15234375, 44.03564453125, 45.9189453125, 47.80224609375, 49.685546875, 51.56884765625, 53.4521484375, 55.33544921875, 57.21875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 20.0, 196.0, 500.0, 259.0, 33.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.19979858398438, -85.32376098632812, -72.44772338867188, -59.571693420410156, -46.695655822753906, -33.819618225097656, -20.943588256835938, -8.067550659179688, 4.8084869384765625, 17.68452262878418, 30.560558319091797, 43.43659210205078, 56.31262969970703, 69.18866729736328, 82.064697265625, 94.94073486328125, 107.8167724609375, 120.69281005859375, 133.56884765625, 146.44488525390625, 159.3209228515625, 172.19696044921875, 185.07298278808594, 197.9490203857422, 210.82505798339844, 223.7010955810547, 236.57713317871094, 249.45315551757812, 262.3291931152344, 275.2052307128906, 288.0812683105469, 300.9573059082031, 313.8333740234375, 326.70941162109375, 339.58544921875, 352.46148681640625, 365.3375244140625, 378.21356201171875, 391.089599609375, 403.96563720703125, 416.8416748046875, 429.71771240234375, 442.59375, 455.46978759765625, 468.3458251953125, 481.22186279296875, 494.097900390625, 506.97393798828125, 519.8499755859375, 532.7260131835938, 545.60205078125, 558.4780883789062, 571.3541259765625, 584.2301635742188, 597.106201171875, 609.9822387695312, 622.8582153320312, 635.7342529296875, 648.6102905273438, 661.486328125, 674.3623657226562, 687.2384033203125, 700.1144409179688, 712.990478515625, 725.8665161132812]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 6.0, 4.0, 3.0, 6.0, 6.0, 17.0, 14.0, 13.0, 15.0, 15.0, 22.0, 27.0, 22.0, 19.0, 35.0, 24.0, 41.0, 28.0, 39.0, 36.0, 28.0, 45.0, 35.0, 39.0, 41.0, 43.0, 41.0, 36.0, 35.0, 24.0, 27.0, 31.0, 30.0, 26.0, 24.0, 22.0, 13.0, 11.0, 12.0, 8.0, 11.0, 8.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0], "bins": [-66.94454956054688, -64.95384216308594, -62.963134765625, -60.97242736816406, -58.981719970703125, -56.99101257324219, -55.00030517578125, -53.00959777832031, -51.018890380859375, -49.02818298339844, -47.0374755859375, -45.04676818847656, -43.056060791015625, -41.06535339355469, -39.07464599609375, -37.08393859863281, -35.09322738647461, -33.10251998901367, -31.111812591552734, -29.121105194091797, -27.13039779663086, -25.139690399169922, -23.14898109436035, -21.158273696899414, -19.167566299438477, -17.17685890197754, -15.186151504516602, -13.195443153381348, -11.20473575592041, -9.214028358459473, -7.223320007324219, -5.232612609863281, -3.2419052124023438, -1.2511975765228271, 0.7395100593566895, 2.730217933654785, 4.720925331115723, 6.71163272857666, 8.702341079711914, 10.693048477172852, 12.683755874633789, 14.674463272094727, 16.665170669555664, 18.655879974365234, 20.646587371826172, 22.63729476928711, 24.628002166748047, 26.618709564208984, 28.609416961669922, 30.60012435913086, 32.5908317565918, 34.581539154052734, 36.57224655151367, 38.56295394897461, 40.55366516113281, 42.54437255859375, 44.53507995605469, 46.525787353515625, 48.51649475097656, 50.5072021484375, 52.49790954589844, 54.488616943359375, 56.47932434082031, 58.47003173828125, 60.46073913574219]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 5.0, 6.0, 12.0, 20.0, 17.0, 15.0, 12.0, 21.0, 25.0, 26.0, 34.0, 29.0, 30.0, 39.0, 32.0, 50.0, 47.0, 46.0, 48.0, 43.0, 31.0, 35.0, 49.0, 44.0, 36.0, 40.0, 28.0, 27.0, 30.0, 23.0, 20.0, 17.0, 8.0, 6.0, 10.0, 6.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.921875, -10.5531005859375, -10.184326171875, -9.8155517578125, -9.44677734375, -9.0780029296875, -8.709228515625, -8.3404541015625, -7.9716796875, -7.6029052734375, -7.234130859375, -6.8653564453125, -6.49658203125, -6.1278076171875, -5.759033203125, -5.3902587890625, -5.021484375, -4.6527099609375, -4.283935546875, -3.9151611328125, -3.54638671875, -3.1776123046875, -2.808837890625, -2.4400634765625, -2.0712890625, -1.7025146484375, -1.333740234375, -0.9649658203125, -0.59619140625, -0.2274169921875, 0.141357421875, 0.5101318359375, 0.87890625, 1.2476806640625, 1.616455078125, 1.9852294921875, 2.35400390625, 2.7227783203125, 3.091552734375, 3.4603271484375, 3.8291015625, 4.1978759765625, 4.566650390625, 4.9354248046875, 5.30419921875, 5.6729736328125, 6.041748046875, 6.4105224609375, 6.779296875, 7.1480712890625, 7.516845703125, 7.8856201171875, 8.25439453125, 8.6231689453125, 8.991943359375, 9.3607177734375, 9.7294921875, 10.0982666015625, 10.467041015625, 10.8358154296875, 11.20458984375, 11.5733642578125, 11.942138671875, 12.3109130859375, 12.6796875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 10.0, 14.0, 11.0, 26.0, 39.0, 58.0, 73.0, 114.0, 117.0, 175.0, 293.0, 426.0, 638.0, 913.0, 1376.0, 2051.0, 2933.0, 4578.0, 6731.0, 10172.0, 16040.0, 25658.0, 41905.0, 70077.0, 115646.0, 174284.0, 193923.0, 144704.0, 90545.0, 54068.0, 32794.0, 20412.0, 12792.0, 8381.0, 5451.0, 3624.0, 2323.0, 1548.0, 1135.0, 742.0, 534.0, 397.0, 239.0, 175.0, 132.0, 89.0, 57.0, 52.0, 29.0, 27.0, 7.0, 7.0, 8.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.017578125, -0.9827880859375, -0.947998046875, -0.9132080078125, -0.87841796875, -0.8436279296875, -0.808837890625, -0.7740478515625, -0.7392578125, -0.7044677734375, -0.669677734375, -0.6348876953125, -0.60009765625, -0.5653076171875, -0.530517578125, -0.4957275390625, -0.4609375, -0.4261474609375, -0.391357421875, -0.3565673828125, -0.32177734375, -0.2869873046875, -0.252197265625, -0.2174072265625, -0.1826171875, -0.1478271484375, -0.113037109375, -0.0782470703125, -0.04345703125, -0.0086669921875, 0.026123046875, 0.0609130859375, 0.095703125, 0.1304931640625, 0.165283203125, 0.2000732421875, 0.23486328125, 0.2696533203125, 0.304443359375, 0.3392333984375, 0.3740234375, 0.4088134765625, 0.443603515625, 0.4783935546875, 0.51318359375, 0.5479736328125, 0.582763671875, 0.6175537109375, 0.65234375, 0.6871337890625, 0.721923828125, 0.7567138671875, 0.79150390625, 0.8262939453125, 0.861083984375, 0.8958740234375, 0.9306640625, 0.9654541015625, 1.000244140625, 1.0350341796875, 1.06982421875, 1.1046142578125, 1.139404296875, 1.1741943359375, 1.208984375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 7.0, 4.0, 8.0, 8.0, 11.0, 9.0, 16.0, 15.0, 15.0, 19.0, 28.0, 26.0, 32.0, 27.0, 45.0, 34.0, 34.0, 36.0, 38.0, 27.0, 1064.0, 34.0, 45.0, 43.0, 35.0, 40.0, 38.0, 37.0, 18.0, 25.0, 20.0, 11.0, 27.0, 24.0, 18.0, 17.0, 14.0, 14.0, 16.0, 12.0, 6.0, 4.0, 4.0, 2.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.5234375, -6.318359375, -6.11328125, -5.908203125, -5.703125, -5.498046875, -5.29296875, -5.087890625, -4.8828125, -4.677734375, -4.47265625, -4.267578125, -4.0625, -3.857421875, -3.65234375, -3.447265625, -3.2421875, -3.037109375, -2.83203125, -2.626953125, -2.421875, -2.216796875, -2.01171875, -1.806640625, -1.6015625, -1.396484375, -1.19140625, -0.986328125, -0.78125, -0.576171875, -0.37109375, -0.166015625, 0.0390625, 0.244140625, 0.44921875, 0.654296875, 0.859375, 1.064453125, 1.26953125, 1.474609375, 1.6796875, 1.884765625, 2.08984375, 2.294921875, 2.5, 2.705078125, 2.91015625, 3.115234375, 3.3203125, 3.525390625, 3.73046875, 3.935546875, 4.140625, 4.345703125, 4.55078125, 4.755859375, 4.9609375, 5.166015625, 5.37109375, 5.576171875, 5.78125, 5.986328125, 6.19140625, 6.396484375, 6.6015625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 7.0, 6.0, 13.0, 20.0, 41.0, 53.0, 82.0, 132.0, 177.0, 255.0, 395.0, 599.0, 966.0, 1427.0, 2172.0, 3290.0, 5145.0, 7902.0, 12280.0, 19544.0, 30561.0, 47844.0, 74981.0, 111448.0, 156860.0, 1204083.0, 138391.0, 97939.0, 64897.0, 41436.0, 26614.0, 16869.0, 10824.0, 6908.0, 4531.0, 2964.0, 1889.0, 1221.0, 812.0, 485.0, 362.0, 255.0, 158.0, 100.0, 70.0, 56.0, 25.0, 13.0, 15.0, 7.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.7958984375, -0.7720184326171875, -0.748138427734375, -0.7242584228515625, -0.70037841796875, -0.6764984130859375, -0.652618408203125, -0.6287384033203125, -0.6048583984375, -0.5809783935546875, -0.557098388671875, -0.5332183837890625, -0.50933837890625, -0.4854583740234375, -0.461578369140625, -0.4376983642578125, -0.413818359375, -0.3899383544921875, -0.366058349609375, -0.3421783447265625, -0.31829833984375, -0.2944183349609375, -0.270538330078125, -0.2466583251953125, -0.2227783203125, -0.1988983154296875, -0.175018310546875, -0.1511383056640625, -0.12725830078125, -0.1033782958984375, -0.079498291015625, -0.0556182861328125, -0.03173828125, -0.0078582763671875, 0.016021728515625, 0.0399017333984375, 0.06378173828125, 0.0876617431640625, 0.111541748046875, 0.1354217529296875, 0.1593017578125, 0.1831817626953125, 0.207061767578125, 0.2309417724609375, 0.25482177734375, 0.2787017822265625, 0.302581787109375, 0.3264617919921875, 0.350341796875, 0.3742218017578125, 0.398101806640625, 0.4219818115234375, 0.44586181640625, 0.4697418212890625, 0.493621826171875, 0.5175018310546875, 0.5413818359375, 0.5652618408203125, 0.589141845703125, 0.6130218505859375, 0.63690185546875, 0.6607818603515625, 0.684661865234375, 0.7085418701171875, 0.732421875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 5.0, 6.0, 14.0, 18.0, 17.0, 32.0, 35.0, 41.0, 63.0, 67.0, 92.0, 104.0, 103.0, 74.0, 71.0, 52.0, 38.0, 22.0, 23.0, 27.0, 20.0, 15.0, 16.0, 12.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022064208984375, -0.021369218826293945, -0.02067422866821289, -0.019979238510131836, -0.01928424835205078, -0.018589258193969727, -0.017894268035888672, -0.017199277877807617, -0.016504287719726562, -0.015809297561645508, -0.015114307403564453, -0.014419317245483398, -0.013724327087402344, -0.013029336929321289, -0.012334346771240234, -0.01163935661315918, -0.010944366455078125, -0.01024937629699707, -0.009554386138916016, -0.008859395980834961, -0.008164405822753906, -0.0074694156646728516, -0.006774425506591797, -0.006079435348510742, -0.0053844451904296875, -0.004689455032348633, -0.003994464874267578, -0.0032994747161865234, -0.0026044845581054688, -0.001909494400024414, -0.0012145042419433594, -0.0005195140838623047, 0.00017547607421875, 0.0008704662322998047, 0.0015654563903808594, 0.002260446548461914, 0.0029554367065429688, 0.0036504268646240234, 0.004345417022705078, 0.005040407180786133, 0.0057353973388671875, 0.006430387496948242, 0.007125377655029297, 0.007820367813110352, 0.008515357971191406, 0.009210348129272461, 0.009905338287353516, 0.01060032844543457, 0.011295318603515625, 0.01199030876159668, 0.012685298919677734, 0.013380289077758789, 0.014075279235839844, 0.014770269393920898, 0.015465259552001953, 0.016160249710083008, 0.016855239868164062, 0.017550230026245117, 0.018245220184326172, 0.018940210342407227, 0.01963520050048828, 0.020330190658569336, 0.02102518081665039, 0.021720170974731445, 0.0224151611328125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 2.0, 8.0, 23.0, 15.0, 26.0, 36.0, 33.0, 47.0, 76.0, 100.0, 183.0, 453.0, 5028.0, 1039899.0, 1794.0, 338.0, 173.0, 86.0, 54.0, 45.0, 32.0, 29.0, 18.0, 11.0, 9.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52685546875, -0.5105972290039062, -0.4943389892578125, -0.47808074951171875, -0.461822509765625, -0.44556427001953125, -0.4293060302734375, -0.41304779052734375, -0.39678955078125, -0.38053131103515625, -0.3642730712890625, -0.34801483154296875, -0.331756591796875, -0.31549835205078125, -0.2992401123046875, -0.28298187255859375, -0.2667236328125, -0.25046539306640625, -0.2342071533203125, -0.21794891357421875, -0.201690673828125, -0.18543243408203125, -0.1691741943359375, -0.15291595458984375, -0.13665771484375, -0.12039947509765625, -0.1041412353515625, -0.08788299560546875, -0.071624755859375, -0.05536651611328125, -0.0391082763671875, -0.02285003662109375, -0.006591796875, 0.00966644287109375, 0.0259246826171875, 0.04218292236328125, 0.058441162109375, 0.07469940185546875, 0.0909576416015625, 0.10721588134765625, 0.12347412109375, 0.13973236083984375, 0.1559906005859375, 0.17224884033203125, 0.188507080078125, 0.20476531982421875, 0.2210235595703125, 0.23728179931640625, 0.2535400390625, 0.26979827880859375, 0.2860565185546875, 0.30231475830078125, 0.318572998046875, 0.33483123779296875, 0.3510894775390625, 0.36734771728515625, 0.38360595703125, 0.39986419677734375, 0.4161224365234375, 0.43238067626953125, 0.448638916015625, 0.46489715576171875, 0.4811553955078125, 0.49741363525390625, 0.513671875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 248.0, 759.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35202035307884216, -0.3443969190120697, -0.33677345514297485, -0.3291500210762024, -0.32152655720710754, -0.3139031231403351, -0.30627965927124023, -0.2986562252044678, -0.2910327613353729, -0.28340932726860046, -0.2757858633995056, -0.26816242933273315, -0.2605389654636383, -0.25291553139686584, -0.245292067527771, -0.23766863346099854, -0.23004518449306488, -0.22242173552513123, -0.21479828655719757, -0.20717483758926392, -0.19955138862133026, -0.1919279396533966, -0.18430450558662415, -0.1766810417175293, -0.16905760765075684, -0.16143415868282318, -0.15381070971488953, -0.14618726074695587, -0.13856381177902222, -0.13094036281108856, -0.1233169212937355, -0.11569347232580185, -0.1080700010061264, -0.10044655203819275, -0.0928231030702591, -0.08519965410232544, -0.07757620513439178, -0.06995275616645813, -0.06232931464910507, -0.05470586568117142, -0.04708241671323776, -0.03945896774530411, -0.03183551877737045, -0.024212073534727097, -0.016588624566793442, -0.008965175598859787, -0.0013417303562164307, 0.006281718611717224, 0.013905167579650879, 0.021528616547584534, 0.02915206365287304, 0.036775510758161545, 0.0443989597260952, 0.052022408694028854, 0.05964585393667221, 0.06726930290460587, 0.07489275187253952, 0.08251620084047318, 0.09013964980840683, 0.09776309132575989, 0.10538654029369354, 0.1130099892616272, 0.12063343822956085, 0.1282568871974945, 0.13588033616542816]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 8.0, 7.0, 4.0, 11.0, 8.0, 12.0, 12.0, 13.0, 13.0, 25.0, 24.0, 26.0, 35.0, 28.0, 33.0, 44.0, 52.0, 34.0, 46.0, 46.0, 35.0, 47.0, 43.0, 46.0, 42.0, 41.0, 38.0, 40.0, 38.0, 18.0, 24.0, 18.0, 19.0, 13.0, 21.0, 9.0, 8.0, 7.0, 4.0, 5.0, 6.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.021199345588684082, -0.020620128139853477, -0.020040910691022873, -0.01946169324219227, -0.018882475793361664, -0.01830325834453106, -0.017724040895700455, -0.01714482344686985, -0.016565605998039246, -0.01598638854920864, -0.015407171100378036, -0.014827953651547432, -0.014248736202716827, -0.013669518753886223, -0.013090301305055618, -0.012511083856225014, -0.01193186640739441, -0.011352648958563805, -0.0107734315097332, -0.010194214060902596, -0.009614996612071991, -0.009035779163241386, -0.008456561714410782, -0.007877344265580177, -0.007298126816749573, -0.006718909367918968, -0.006139691919088364, -0.005560474470257759, -0.0049812570214271545, -0.00440203957259655, -0.0038228221237659454, -0.003243604674935341, -0.0026643872261047363, -0.0020851697772741318, -0.0015059523284435272, -0.0009267348796129227, -0.0003475174307823181, 0.00023170001804828644, 0.000810917466878891, 0.0013901349157094955, 0.0019693523645401, 0.0025485698133707047, 0.003127787262201309, 0.0037070047110319138, 0.004286222159862518, 0.004865439608693123, 0.005444657057523727, 0.006023874506354332, 0.0066030919551849365, 0.007182309404015541, 0.007761526852846146, 0.00834074430167675, 0.008919961750507355, 0.00949917919933796, 0.010078396648168564, 0.010657614096999168, 0.011236831545829773, 0.011816048994660378, 0.012395266443490982, 0.012974483892321587, 0.013553701341152191, 0.014132918789982796, 0.0147121362388134, 0.015291353687644005, 0.01587057113647461]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 4.0, 7.0, 12.0, 19.0, 18.0, 15.0, 12.0, 21.0, 25.0, 26.0, 34.0, 29.0, 30.0, 39.0, 32.0, 50.0, 47.0, 46.0, 49.0, 42.0, 31.0, 36.0, 48.0, 44.0, 36.0, 40.0, 28.0, 27.0, 30.0, 23.0, 20.0, 17.0, 8.0, 6.0, 10.0, 6.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.921875, -10.5531005859375, -10.184326171875, -9.8155517578125, -9.44677734375, -9.0780029296875, -8.709228515625, -8.3404541015625, -7.9716796875, -7.6029052734375, -7.234130859375, -6.8653564453125, -6.49658203125, -6.1278076171875, -5.759033203125, -5.3902587890625, -5.021484375, -4.6527099609375, -4.283935546875, -3.9151611328125, -3.54638671875, -3.1776123046875, -2.808837890625, -2.4400634765625, -2.0712890625, -1.7025146484375, -1.333740234375, -0.9649658203125, -0.59619140625, -0.2274169921875, 0.141357421875, 0.5101318359375, 0.87890625, 1.2476806640625, 1.616455078125, 1.9852294921875, 2.35400390625, 2.7227783203125, 3.091552734375, 3.4603271484375, 3.8291015625, 4.1978759765625, 4.566650390625, 4.9354248046875, 5.30419921875, 5.6729736328125, 6.041748046875, 6.4105224609375, 6.779296875, 7.1480712890625, 7.516845703125, 7.8856201171875, 8.25439453125, 8.6231689453125, 8.991943359375, 9.3607177734375, 9.7294921875, 10.0982666015625, 10.467041015625, 10.8358154296875, 11.20458984375, 11.5733642578125, 11.942138671875, 12.3109130859375, 12.6796875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 9.0, 5.0, 8.0, 16.0, 18.0, 25.0, 30.0, 22.0, 41.0, 63.0, 84.0, 147.0, 224.0, 379.0, 710.0, 1599.0, 4266.0, 14781.0, 77046.0, 713541.0, 197162.0, 26987.0, 6957.0, 2180.0, 922.0, 503.0, 255.0, 165.0, 115.0, 79.0, 57.0, 45.0, 35.0, 13.0, 13.0, 13.0, 7.0, 12.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.71875, -20.987548828125, -20.25634765625, -19.525146484375, -18.7939453125, -18.062744140625, -17.33154296875, -16.600341796875, -15.869140625, -15.137939453125, -14.40673828125, -13.675537109375, -12.9443359375, -12.213134765625, -11.48193359375, -10.750732421875, -10.01953125, -9.288330078125, -8.55712890625, -7.825927734375, -7.0947265625, -6.363525390625, -5.63232421875, -4.901123046875, -4.169921875, -3.438720703125, -2.70751953125, -1.976318359375, -1.2451171875, -0.513916015625, 0.21728515625, 0.948486328125, 1.6796875, 2.410888671875, 3.14208984375, 3.873291015625, 4.6044921875, 5.335693359375, 6.06689453125, 6.798095703125, 7.529296875, 8.260498046875, 8.99169921875, 9.722900390625, 10.4541015625, 11.185302734375, 11.91650390625, 12.647705078125, 13.37890625, 14.110107421875, 14.84130859375, 15.572509765625, 16.3037109375, 17.034912109375, 17.76611328125, 18.497314453125, 19.228515625, 19.959716796875, 20.69091796875, 21.422119140625, 22.1533203125, 22.884521484375, 23.61572265625, 24.346923828125, 25.078125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 4.0, 7.0, 3.0, 7.0, 7.0, 10.0, 18.0, 13.0, 27.0, 34.0, 34.0, 27.0, 40.0, 49.0, 42.0, 54.0, 91.0, 172.0, 1692.0, 223.0, 83.0, 50.0, 51.0, 39.0, 30.0, 34.0, 31.0, 29.0, 25.0, 18.0, 28.0, 18.0, 17.0, 5.0, 9.0, 12.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.59375, -42.3681640625, -41.142578125, -39.9169921875, -38.69140625, -37.4658203125, -36.240234375, -35.0146484375, -33.7890625, -32.5634765625, -31.337890625, -30.1123046875, -28.88671875, -27.6611328125, -26.435546875, -25.2099609375, -23.984375, -22.7587890625, -21.533203125, -20.3076171875, -19.08203125, -17.8564453125, -16.630859375, -15.4052734375, -14.1796875, -12.9541015625, -11.728515625, -10.5029296875, -9.27734375, -8.0517578125, -6.826171875, -5.6005859375, -4.375, -3.1494140625, -1.923828125, -0.6982421875, 0.52734375, 1.7529296875, 2.978515625, 4.2041015625, 5.4296875, 6.6552734375, 7.880859375, 9.1064453125, 10.33203125, 11.5576171875, 12.783203125, 14.0087890625, 15.234375, 16.4599609375, 17.685546875, 18.9111328125, 20.13671875, 21.3623046875, 22.587890625, 23.8134765625, 25.0390625, 26.2646484375, 27.490234375, 28.7158203125, 29.94140625, 31.1669921875, 32.392578125, 33.6181640625, 34.84375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 10.0, 9.0, 11.0, 18.0, 17.0, 30.0, 28.0, 37.0, 42.0, 47.0, 70.0, 101.0, 155.0, 264.0, 668.0, 4306.0, 634472.0, 2497987.0, 5732.0, 823.0, 290.0, 161.0, 91.0, 74.0, 47.0, 44.0, 37.0, 31.0, 24.0, 10.0, 11.0, 10.0, 9.0, 5.0, 8.0, 5.0, 1.0, 5.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.9375, -77.1865234375, -74.435546875, -71.6845703125, -68.93359375, -66.1826171875, -63.431640625, -60.6806640625, -57.9296875, -55.1787109375, -52.427734375, -49.6767578125, -46.92578125, -44.1748046875, -41.423828125, -38.6728515625, -35.921875, -33.1708984375, -30.419921875, -27.6689453125, -24.91796875, -22.1669921875, -19.416015625, -16.6650390625, -13.9140625, -11.1630859375, -8.412109375, -5.6611328125, -2.91015625, -0.1591796875, 2.591796875, 5.3427734375, 8.09375, 10.8447265625, 13.595703125, 16.3466796875, 19.09765625, 21.8486328125, 24.599609375, 27.3505859375, 30.1015625, 32.8525390625, 35.603515625, 38.3544921875, 41.10546875, 43.8564453125, 46.607421875, 49.3583984375, 52.109375, 54.8603515625, 57.611328125, 60.3623046875, 63.11328125, 65.8642578125, 68.615234375, 71.3662109375, 74.1171875, 76.8681640625, 79.619140625, 82.3701171875, 85.12109375, 87.8720703125, 90.623046875, 93.3740234375, 96.125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 17.0, 144.0, 496.0, 312.0, 38.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-254.6855926513672, -249.45152282714844, -244.21746826171875, -238.9833984375, -233.74932861328125, -228.51527404785156, -223.2812042236328, -218.04714965820312, -212.81307983398438, -207.57901000976562, -202.34495544433594, -197.1108856201172, -191.87681579589844, -186.64276123046875, -181.40869140625, -176.17462158203125, -170.9405517578125, -165.70648193359375, -160.47242736816406, -155.2383575439453, -150.00428771972656, -144.77023315429688, -139.53616333007812, -134.30209350585938, -129.0680389404297, -123.83397674560547, -118.59990692138672, -113.3658447265625, -108.13178253173828, -102.89772033691406, -97.66365051269531, -92.4295883178711, -87.1955337524414, -81.96147155761719, -76.72740173339844, -71.49333953857422, -66.25927734375, -61.025211334228516, -55.79114532470703, -50.55708312988281, -45.32301712036133, -40.088951110839844, -34.854888916015625, -29.62082290649414, -24.38675880432129, -19.152694702148438, -13.918628692626953, -8.684566497802734, -3.45050048828125, 1.7835640907287598, 7.0176286697387695, 12.251693725585938, 17.48575782775879, 22.71982192993164, 27.953887939453125, 33.187950134277344, 38.42201614379883, 43.65608215332031, 48.89014434814453, 54.124210357666016, 59.3582763671875, 64.59233856201172, 69.82640075683594, 75.06047058105469, 80.2945327758789]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 13.0, 1.0, 9.0, 15.0, 10.0, 6.0, 19.0, 16.0, 11.0, 32.0, 19.0, 40.0, 38.0, 28.0, 37.0, 31.0, 49.0, 48.0, 42.0, 37.0, 41.0, 27.0, 33.0, 46.0, 37.0, 39.0, 33.0, 36.0, 35.0, 24.0, 19.0, 23.0, 15.0, 16.0, 11.0, 13.0, 12.0, 10.0, 7.0, 6.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-85.45774841308594, -82.7018814086914, -79.94601440429688, -77.19014739990234, -74.43428039550781, -71.67841339111328, -68.92254638671875, -66.16668701171875, -63.41081619262695, -60.65494918823242, -57.89908218383789, -55.143218994140625, -52.387351989746094, -49.63148498535156, -46.87561798095703, -44.1197509765625, -41.36388397216797, -38.60801696777344, -35.852149963378906, -33.096282958984375, -30.340417861938477, -27.584550857543945, -24.828685760498047, -22.072818756103516, -19.316951751708984, -16.561084747314453, -13.805218696594238, -11.049352645874023, -8.293485641479492, -5.537618637084961, -2.7817535400390625, -0.02588653564453125, 2.72998046875, 5.485846996307373, 8.241713523864746, 10.997579574584961, 13.753446578979492, 16.509313583374023, 19.265178680419922, 22.021045684814453, 24.776912689208984, 27.532779693603516, 30.288646697998047, 33.04450988769531, 35.800376892089844, 38.556243896484375, 41.312110900878906, 44.06797790527344, 46.82384490966797, 49.5797119140625, 52.33557891845703, 55.09144592285156, 57.847312927246094, 60.603179931640625, 63.35904312133789, 66.11491394042969, 68.87077331542969, 71.62664031982422, 74.38250732421875, 77.13837432861328, 79.89424133300781, 82.65010833740234, 85.40597534179688, 88.16183471679688, 90.91770935058594]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 9.0, 5.0, 7.0, 8.0, 20.0, 12.0, 21.0, 12.0, 23.0, 23.0, 21.0, 37.0, 40.0, 39.0, 35.0, 35.0, 45.0, 37.0, 46.0, 37.0, 49.0, 35.0, 37.0, 43.0, 47.0, 38.0, 41.0, 32.0, 28.0, 26.0, 21.0, 14.0, 14.0, 6.0, 14.0, 11.0, 5.0, 5.0, 9.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.34375, -10.958251953125, -10.57275390625, -10.187255859375, -9.8017578125, -9.416259765625, -9.03076171875, -8.645263671875, -8.259765625, -7.874267578125, -7.48876953125, -7.103271484375, -6.7177734375, -6.332275390625, -5.94677734375, -5.561279296875, -5.17578125, -4.790283203125, -4.40478515625, -4.019287109375, -3.6337890625, -3.248291015625, -2.86279296875, -2.477294921875, -2.091796875, -1.706298828125, -1.32080078125, -0.935302734375, -0.5498046875, -0.164306640625, 0.22119140625, 0.606689453125, 0.9921875, 1.377685546875, 1.76318359375, 2.148681640625, 2.5341796875, 2.919677734375, 3.30517578125, 3.690673828125, 4.076171875, 4.461669921875, 4.84716796875, 5.232666015625, 5.6181640625, 6.003662109375, 6.38916015625, 6.774658203125, 7.16015625, 7.545654296875, 7.93115234375, 8.316650390625, 8.7021484375, 9.087646484375, 9.47314453125, 9.858642578125, 10.244140625, 10.629638671875, 11.01513671875, 11.400634765625, 11.7861328125, 12.171630859375, 12.55712890625, 12.942626953125, 13.328125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 10.0, 4.0, 4.0, 14.0, 12.0, 15.0, 23.0, 29.0, 67.0, 61.0, 97.0, 153.0, 247.0, 435.0, 765.0, 1645.0, 3652.0, 10564.0, 36471.0, 190329.0, 1355578.0, 2130563.0, 377847.0, 60855.0, 15289.0, 5124.0, 2108.0, 965.0, 486.0, 293.0, 186.0, 127.0, 79.0, 47.0, 35.0, 33.0, 18.0, 17.0, 8.0, 5.0, 2.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.328125, -18.64208984375, -17.9560546875, -17.27001953125, -16.583984375, -15.89794921875, -15.2119140625, -14.52587890625, -13.83984375, -13.15380859375, -12.4677734375, -11.78173828125, -11.095703125, -10.40966796875, -9.7236328125, -9.03759765625, -8.3515625, -7.66552734375, -6.9794921875, -6.29345703125, -5.607421875, -4.92138671875, -4.2353515625, -3.54931640625, -2.86328125, -2.17724609375, -1.4912109375, -0.80517578125, -0.119140625, 0.56689453125, 1.2529296875, 1.93896484375, 2.625, 3.31103515625, 3.9970703125, 4.68310546875, 5.369140625, 6.05517578125, 6.7412109375, 7.42724609375, 8.11328125, 8.79931640625, 9.4853515625, 10.17138671875, 10.857421875, 11.54345703125, 12.2294921875, 12.91552734375, 13.6015625, 14.28759765625, 14.9736328125, 15.65966796875, 16.345703125, 17.03173828125, 17.7177734375, 18.40380859375, 19.08984375, 19.77587890625, 20.4619140625, 21.14794921875, 21.833984375, 22.52001953125, 23.2060546875, 23.89208984375, 24.578125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 1.0, 10.0, 7.0, 6.0, 8.0, 15.0, 20.0, 23.0, 35.0, 49.0, 46.0, 92.0, 116.0, 152.0, 206.0, 327.0, 424.0, 502.0, 506.0, 432.0, 338.0, 237.0, 158.0, 106.0, 64.0, 51.0, 39.0, 26.0, 23.0, 10.0, 12.0, 8.0, 10.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.84375, -24.19140625, -23.5390625, -22.88671875, -22.234375, -21.58203125, -20.9296875, -20.27734375, -19.625, -18.97265625, -18.3203125, -17.66796875, -17.015625, -16.36328125, -15.7109375, -15.05859375, -14.40625, -13.75390625, -13.1015625, -12.44921875, -11.796875, -11.14453125, -10.4921875, -9.83984375, -9.1875, -8.53515625, -7.8828125, -7.23046875, -6.578125, -5.92578125, -5.2734375, -4.62109375, -3.96875, -3.31640625, -2.6640625, -2.01171875, -1.359375, -0.70703125, -0.0546875, 0.59765625, 1.25, 1.90234375, 2.5546875, 3.20703125, 3.859375, 4.51171875, 5.1640625, 5.81640625, 6.46875, 7.12109375, 7.7734375, 8.42578125, 9.078125, 9.73046875, 10.3828125, 11.03515625, 11.6875, 12.33984375, 12.9921875, 13.64453125, 14.296875, 14.94921875, 15.6015625, 16.25390625, 16.90625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 18.0, 18.0, 13.0, 36.0, 29.0, 38.0, 55.0, 71.0, 130.0, 134.0, 209.0, 369.0, 602.0, 1343.0, 4351.0, 23321.0, 263167.0, 3370905.0, 484754.0, 35226.0, 5809.0, 1663.0, 743.0, 378.0, 224.0, 167.0, 128.0, 86.0, 56.0, 49.0, 37.0, 29.0, 28.0, 16.0, 15.0, 13.0, 16.0, 1.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-45.40625, -43.92236328125, -42.4384765625, -40.95458984375, -39.470703125, -37.98681640625, -36.5029296875, -35.01904296875, -33.53515625, -32.05126953125, -30.5673828125, -29.08349609375, -27.599609375, -26.11572265625, -24.6318359375, -23.14794921875, -21.6640625, -20.18017578125, -18.6962890625, -17.21240234375, -15.728515625, -14.24462890625, -12.7607421875, -11.27685546875, -9.79296875, -8.30908203125, -6.8251953125, -5.34130859375, -3.857421875, -2.37353515625, -0.8896484375, 0.59423828125, 2.078125, 3.56201171875, 5.0458984375, 6.52978515625, 8.013671875, 9.49755859375, 10.9814453125, 12.46533203125, 13.94921875, 15.43310546875, 16.9169921875, 18.40087890625, 19.884765625, 21.36865234375, 22.8525390625, 24.33642578125, 25.8203125, 27.30419921875, 28.7880859375, 30.27197265625, 31.755859375, 33.23974609375, 34.7236328125, 36.20751953125, 37.69140625, 39.17529296875, 40.6591796875, 42.14306640625, 43.626953125, 45.11083984375, 46.5947265625, 48.07861328125, 49.5625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 10.0, 60.0, 133.0, 272.0, 280.0, 161.0, 71.0, 21.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-281.91790771484375, -275.09027099609375, -268.26263427734375, -261.43499755859375, -254.6073455810547, -247.77969360351562, -240.95205688476562, -234.12442016601562, -227.29678344726562, -220.46914672851562, -213.64149475097656, -206.81385803222656, -199.98622131347656, -193.1585693359375, -186.3309326171875, -179.5032958984375, -172.67564392089844, -165.84800720214844, -159.02035522460938, -152.19271850585938, -145.36508178710938, -138.53744506835938, -131.7097930908203, -124.88215637207031, -118.05451202392578, -111.22686767578125, -104.39923095703125, -97.57158660888672, -90.74394226074219, -83.91630554199219, -77.08866119384766, -70.26101684570312, -63.433380126953125, -56.60573959350586, -49.778099060058594, -42.95045471191406, -36.1228141784668, -29.29517364501953, -22.467529296875, -15.639888763427734, -8.812248229980469, -1.9846067428588867, 4.843034744262695, 11.670677185058594, 18.49831771850586, 25.325958251953125, 32.153602600097656, 38.98124313354492, 45.80888366699219, 52.63652420043945, 59.46416473388672, 66.29180908203125, 73.11944580078125, 79.94709014892578, 86.77473449707031, 93.60237121582031, 100.43001556396484, 107.25765991210938, 114.08529663085938, 120.9129409790039, 127.74058532714844, 134.56822204589844, 141.3958740234375, 148.2235107421875, 155.0511474609375]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 2.0, 9.0, 5.0, 18.0, 9.0, 20.0, 23.0, 22.0, 18.0, 15.0, 23.0, 36.0, 33.0, 46.0, 28.0, 33.0, 46.0, 33.0, 40.0, 42.0, 35.0, 56.0, 42.0, 36.0, 49.0, 26.0, 33.0, 20.0, 25.0, 24.0, 25.0, 25.0, 15.0, 9.0, 16.0, 15.0, 7.0, 9.0, 2.0, 6.0, 2.0, 3.0, 2.0, 4.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.15093994140625, -61.1189079284668, -59.086875915527344, -57.05484390258789, -55.02281188964844, -52.990779876708984, -50.95874786376953, -48.926719665527344, -46.894683837890625, -44.86265182495117, -42.83061981201172, -40.798587799072266, -38.76655578613281, -36.73452377319336, -34.702491760253906, -32.67046356201172, -30.638431549072266, -28.606399536132812, -26.57436752319336, -24.542335510253906, -22.510303497314453, -20.478271484375, -18.44624137878418, -16.414209365844727, -14.382177352905273, -12.35014533996582, -10.318113327026367, -8.28608226776123, -6.254050254821777, -4.222018241882324, -2.1899871826171875, -0.15795516967773438, 1.8740768432617188, 3.9061086177825928, 5.938140392303467, 7.970171928405762, 10.002203941345215, 12.034235954284668, 14.066267013549805, 16.098299026489258, 18.13033103942871, 20.162363052368164, 22.194395065307617, 24.226425170898438, 26.25845718383789, 28.290489196777344, 30.322521209716797, 32.35455322265625, 34.3865852355957, 36.418617248535156, 38.45064926147461, 40.48268127441406, 42.514713287353516, 44.54674530029297, 46.578773498535156, 48.610809326171875, 50.64283752441406, 52.674869537353516, 54.70690155029297, 56.73893356323242, 58.770965576171875, 60.80299758911133, 62.83502960205078, 64.86705780029297, 66.89909362792969]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 0.0, 3.0, 3.0, 8.0, 5.0, 2.0, 11.0, 15.0, 9.0, 20.0, 14.0, 24.0, 27.0, 25.0, 33.0, 30.0, 36.0, 31.0, 45.0, 45.0, 55.0, 40.0, 54.0, 44.0, 55.0, 42.0, 38.0, 28.0, 33.0, 33.0, 29.0, 26.0, 29.0, 18.0, 21.0, 9.0, 12.0, 15.0, 7.0, 8.0, 6.0, 8.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.4296875, -12.03466796875, -11.6396484375, -11.24462890625, -10.849609375, -10.45458984375, -10.0595703125, -9.66455078125, -9.26953125, -8.87451171875, -8.4794921875, -8.08447265625, -7.689453125, -7.29443359375, -6.8994140625, -6.50439453125, -6.109375, -5.71435546875, -5.3193359375, -4.92431640625, -4.529296875, -4.13427734375, -3.7392578125, -3.34423828125, -2.94921875, -2.55419921875, -2.1591796875, -1.76416015625, -1.369140625, -0.97412109375, -0.5791015625, -0.18408203125, 0.2109375, 0.60595703125, 1.0009765625, 1.39599609375, 1.791015625, 2.18603515625, 2.5810546875, 2.97607421875, 3.37109375, 3.76611328125, 4.1611328125, 4.55615234375, 4.951171875, 5.34619140625, 5.7412109375, 6.13623046875, 6.53125, 6.92626953125, 7.3212890625, 7.71630859375, 8.111328125, 8.50634765625, 8.9013671875, 9.29638671875, 9.69140625, 10.08642578125, 10.4814453125, 10.87646484375, 11.271484375, 11.66650390625, 12.0615234375, 12.45654296875, 12.8515625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 11.0, 11.0, 14.0, 19.0, 26.0, 32.0, 54.0, 77.0, 93.0, 160.0, 250.0, 399.0, 504.0, 757.0, 1021.0, 1620.0, 2257.0, 3539.0, 5124.0, 7588.0, 11693.0, 18068.0, 27710.0, 43704.0, 67942.0, 103657.0, 146791.0, 173488.0, 143679.0, 100732.0, 66186.0, 42255.0, 27222.0, 17622.0, 11370.0, 7412.0, 4941.0, 3322.0, 2269.0, 1558.0, 1105.0, 726.0, 454.0, 375.0, 237.0, 159.0, 106.0, 67.0, 49.0, 30.0, 26.0, 17.0, 17.0, 6.0, 6.0, 7.0, 1.0, 1.0, 2.0], "bins": [-1.0009765625, -0.9701461791992188, -0.9393157958984375, -0.9084854125976562, -0.877655029296875, -0.8468246459960938, -0.8159942626953125, -0.7851638793945312, -0.75433349609375, -0.7235031127929688, -0.6926727294921875, -0.6618423461914062, -0.631011962890625, -0.6001815795898438, -0.5693511962890625, -0.5385208129882812, -0.5076904296875, -0.47686004638671875, -0.4460296630859375, -0.41519927978515625, -0.384368896484375, -0.35353851318359375, -0.3227081298828125, -0.29187774658203125, -0.26104736328125, -0.23021697998046875, -0.1993865966796875, -0.16855621337890625, -0.137725830078125, -0.10689544677734375, -0.0760650634765625, -0.04523468017578125, -0.014404296875, 0.01642608642578125, 0.0472564697265625, 0.07808685302734375, 0.108917236328125, 0.13974761962890625, 0.1705780029296875, 0.20140838623046875, 0.23223876953125, 0.26306915283203125, 0.2938995361328125, 0.32472991943359375, 0.355560302734375, 0.38639068603515625, 0.4172210693359375, 0.44805145263671875, 0.4788818359375, 0.5097122192382812, 0.5405426025390625, 0.5713729858398438, 0.602203369140625, 0.6330337524414062, 0.6638641357421875, 0.6946945190429688, 0.72552490234375, 0.7563552856445312, 0.7871856689453125, 0.8180160522460938, 0.848846435546875, 0.8796768188476562, 0.9105072021484375, 0.9413375854492188, 0.97216796875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 1.0, 7.0, 8.0, 6.0, 11.0, 16.0, 12.0, 11.0, 14.0, 10.0, 19.0, 18.0, 50.0, 24.0, 30.0, 39.0, 50.0, 44.0, 39.0, 40.0, 45.0, 1067.0, 34.0, 35.0, 43.0, 37.0, 31.0, 37.0, 26.0, 32.0, 16.0, 25.0, 26.0, 19.0, 15.0, 16.0, 14.0, 11.0, 13.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.21124267578125, -6.9732666015625, -6.73529052734375, -6.497314453125, -6.25933837890625, -6.0213623046875, -5.78338623046875, -5.54541015625, -5.30743408203125, -5.0694580078125, -4.83148193359375, -4.593505859375, -4.35552978515625, -4.1175537109375, -3.87957763671875, -3.6416015625, -3.40362548828125, -3.1656494140625, -2.92767333984375, -2.689697265625, -2.45172119140625, -2.2137451171875, -1.97576904296875, -1.73779296875, -1.49981689453125, -1.2618408203125, -1.02386474609375, -0.785888671875, -0.54791259765625, -0.3099365234375, -0.07196044921875, 0.166015625, 0.40399169921875, 0.6419677734375, 0.87994384765625, 1.117919921875, 1.35589599609375, 1.5938720703125, 1.83184814453125, 2.06982421875, 2.30780029296875, 2.5457763671875, 2.78375244140625, 3.021728515625, 3.25970458984375, 3.4976806640625, 3.73565673828125, 3.9736328125, 4.21160888671875, 4.4495849609375, 4.68756103515625, 4.925537109375, 5.16351318359375, 5.4014892578125, 5.63946533203125, 5.87744140625, 6.11541748046875, 6.3533935546875, 6.59136962890625, 6.829345703125, 7.06732177734375, 7.3052978515625, 7.54327392578125, 7.78125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 6.0, 20.0, 13.0, 30.0, 42.0, 59.0, 116.0, 217.0, 340.0, 548.0, 926.0, 1641.0, 2645.0, 4479.0, 7934.0, 13675.0, 23683.0, 41961.0, 73222.0, 121183.0, 183636.0, 1233802.0, 153429.0, 98395.0, 57500.0, 33126.0, 18672.0, 10733.0, 6161.0, 3595.0, 2197.0, 1334.0, 690.0, 444.0, 259.0, 159.0, 102.0, 70.0, 28.0, 19.0, 17.0, 11.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88037109375, -0.8503036499023438, -0.8202362060546875, -0.7901687622070312, -0.760101318359375, -0.7300338745117188, -0.6999664306640625, -0.6698989868164062, -0.63983154296875, -0.6097640991210938, -0.5796966552734375, -0.5496292114257812, -0.519561767578125, -0.48949432373046875, -0.4594268798828125, -0.42935943603515625, -0.3992919921875, -0.36922454833984375, -0.3391571044921875, -0.30908966064453125, -0.279022216796875, -0.24895477294921875, -0.2188873291015625, -0.18881988525390625, -0.15875244140625, -0.12868499755859375, -0.0986175537109375, -0.06855010986328125, -0.038482666015625, -0.00841522216796875, 0.0216522216796875, 0.05171966552734375, 0.081787109375, 0.11185455322265625, 0.1419219970703125, 0.17198944091796875, 0.202056884765625, 0.23212432861328125, 0.2621917724609375, 0.29225921630859375, 0.32232666015625, 0.35239410400390625, 0.3824615478515625, 0.41252899169921875, 0.442596435546875, 0.47266387939453125, 0.5027313232421875, 0.5327987670898438, 0.5628662109375, 0.5929336547851562, 0.6230010986328125, 0.6530685424804688, 0.683135986328125, 0.7132034301757812, 0.7432708740234375, 0.7733383178710938, 0.80340576171875, 0.8334732055664062, 0.8635406494140625, 0.8936080932617188, 0.923675537109375, 0.9537429809570312, 0.9838104248046875, 1.0138778686523438, 1.0439453125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 8.0, 2.0, 5.0, 4.0, 11.0, 12.0, 17.0, 11.0, 20.0, 27.0, 38.0, 50.0, 54.0, 55.0, 65.0, 81.0, 73.0, 93.0, 71.0, 48.0, 56.0, 35.0, 34.0, 32.0, 27.0, 13.0, 13.0, 10.0, 5.0, 9.0, 3.0, 2.0, 6.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0301513671875, -0.029270172119140625, -0.02838897705078125, -0.027507781982421875, -0.0266265869140625, -0.025745391845703125, -0.02486419677734375, -0.023983001708984375, -0.023101806640625, -0.022220611572265625, -0.02133941650390625, -0.020458221435546875, -0.0195770263671875, -0.018695831298828125, -0.01781463623046875, -0.016933441162109375, -0.01605224609375, -0.015171051025390625, -0.01428985595703125, -0.013408660888671875, -0.0125274658203125, -0.011646270751953125, -0.01076507568359375, -0.009883880615234375, -0.009002685546875, -0.008121490478515625, -0.00724029541015625, -0.006359100341796875, -0.0054779052734375, -0.004596710205078125, -0.00371551513671875, -0.002834320068359375, -0.001953125, -0.001071929931640625, -0.00019073486328125, 0.000690460205078125, 0.0015716552734375, 0.002452850341796875, 0.00333404541015625, 0.004215240478515625, 0.005096435546875, 0.005977630615234375, 0.00685882568359375, 0.007740020751953125, 0.0086212158203125, 0.009502410888671875, 0.01038360595703125, 0.011264801025390625, 0.01214599609375, 0.013027191162109375, 0.01390838623046875, 0.014789581298828125, 0.0156707763671875, 0.016551971435546875, 0.01743316650390625, 0.018314361572265625, 0.019195556640625, 0.020076751708984375, 0.02095794677734375, 0.021839141845703125, 0.0227203369140625, 0.023601531982421875, 0.02448272705078125, 0.025363922119140625, 0.0262451171875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 5.0, 3.0, 6.0, 10.0, 14.0, 17.0, 22.0, 20.0, 42.0, 40.0, 54.0, 86.0, 138.0, 205.0, 409.0, 2022.0, 1038912.0, 5325.0, 489.0, 246.0, 135.0, 94.0, 57.0, 46.0, 35.0, 19.0, 27.0, 22.0, 11.0, 6.0, 4.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5849609375, -0.5658493041992188, -0.5467376708984375, -0.5276260375976562, -0.508514404296875, -0.48940277099609375, -0.4702911376953125, -0.45117950439453125, -0.43206787109375, -0.41295623779296875, -0.3938446044921875, -0.37473297119140625, -0.355621337890625, -0.33650970458984375, -0.3173980712890625, -0.29828643798828125, -0.2791748046875, -0.26006317138671875, -0.2409515380859375, -0.22183990478515625, -0.202728271484375, -0.18361663818359375, -0.1645050048828125, -0.14539337158203125, -0.12628173828125, -0.10717010498046875, -0.0880584716796875, -0.06894683837890625, -0.049835205078125, -0.03072357177734375, -0.0116119384765625, 0.00749969482421875, 0.026611328125, 0.04572296142578125, 0.0648345947265625, 0.08394622802734375, 0.103057861328125, 0.12216949462890625, 0.1412811279296875, 0.16039276123046875, 0.17950439453125, 0.19861602783203125, 0.2177276611328125, 0.23683929443359375, 0.255950927734375, 0.27506256103515625, 0.2941741943359375, 0.31328582763671875, 0.3323974609375, 0.35150909423828125, 0.3706207275390625, 0.38973236083984375, 0.408843994140625, 0.42795562744140625, 0.4470672607421875, 0.46617889404296875, 0.48529052734375, 0.5044021606445312, 0.5235137939453125, 0.5426254272460938, 0.561737060546875, 0.5808486938476562, 0.5999603271484375, 0.6190719604492188, 0.63818359375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 44.0, 969.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43143337965011597, -0.4207538962364197, -0.4100744128227234, -0.3993949294090271, -0.3887154459953308, -0.3780359625816345, -0.36735647916793823, -0.35667699575424194, -0.34599751234054565, -0.33531802892684937, -0.3246385455131531, -0.3139590620994568, -0.3032795786857605, -0.2926000952720642, -0.2819206118583679, -0.27124112844467163, -0.26056161522865295, -0.24988213181495667, -0.23920264840126038, -0.2285231649875641, -0.2178436815738678, -0.2071641981601715, -0.19648469984531403, -0.18580521643161774, -0.17512573301792145, -0.16444624960422516, -0.15376676619052887, -0.1430872678756714, -0.1324077844619751, -0.1217283084988594, -0.11104881763458252, -0.10036933422088623, -0.08968988060951233, -0.07901039719581604, -0.06833091378211975, -0.057651422917842865, -0.046971939504146576, -0.03629245609045029, -0.0256129652261734, -0.014933481812477112, -0.004253998398780823, 0.0064254868775606155, 0.017104972153902054, 0.02778445929288864, 0.03846394270658493, 0.04914342612028122, 0.059822916984558105, 0.0705024003982544, 0.08118188381195068, 0.09186136722564697, 0.10254085063934326, 0.11322034150362015, 0.12389982491731644, 0.13457930088043213, 0.1452587991952896, 0.1559382826089859, 0.1666177660226822, 0.17729724943637848, 0.18797673285007477, 0.19865623116493225, 0.20933571457862854, 0.22001519799232483, 0.23069468140602112, 0.2413741648197174, 0.2520536482334137]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 3.0, 5.0, 8.0, 2.0, 7.0, 9.0, 11.0, 11.0, 10.0, 10.0, 14.0, 18.0, 23.0, 25.0, 23.0, 29.0, 34.0, 42.0, 29.0, 42.0, 28.0, 37.0, 34.0, 44.0, 44.0, 36.0, 49.0, 41.0, 45.0, 37.0, 26.0, 28.0, 24.0, 21.0, 21.0, 17.0, 14.0, 17.0, 13.0, 14.0, 12.0, 7.0, 10.0, 9.0, 6.0, 5.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02262049913406372, -0.021906554698944092, -0.021192610263824463, -0.020478665828704834, -0.019764721393585205, -0.019050776958465576, -0.018336832523345947, -0.01762288808822632, -0.01690894365310669, -0.01619499921798706, -0.015481054782867432, -0.014767110347747803, -0.014053165912628174, -0.013339221477508545, -0.012625277042388916, -0.011911332607269287, -0.011197388172149658, -0.01048344373703003, -0.0097694993019104, -0.009055554866790771, -0.008341610431671143, -0.007627665996551514, -0.006913721561431885, -0.006199777126312256, -0.005485832691192627, -0.004771888256072998, -0.004057943820953369, -0.0033439993858337402, -0.0026300549507141113, -0.0019161105155944824, -0.0012021660804748535, -0.0004882216453552246, 0.0002257227897644043, 0.0009396672248840332, 0.0016536116600036621, 0.002367556095123291, 0.00308150053024292, 0.003795444965362549, 0.004509389400482178, 0.005223333835601807, 0.0059372782707214355, 0.0066512227058410645, 0.007365167140960693, 0.008079111576080322, 0.008793056011199951, 0.00950700044631958, 0.010220944881439209, 0.010934889316558838, 0.011648833751678467, 0.012362778186798096, 0.013076722621917725, 0.013790667057037354, 0.014504611492156982, 0.015218555927276611, 0.01593250036239624, 0.01664644479751587, 0.017360389232635498, 0.018074333667755127, 0.018788278102874756, 0.019502222537994385, 0.020216166973114014, 0.020930111408233643, 0.02164405584335327, 0.0223580002784729, 0.02307194471359253]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 0.0, 3.0, 3.0, 8.0, 5.0, 2.0, 11.0, 15.0, 9.0, 20.0, 14.0, 22.0, 29.0, 24.0, 32.0, 31.0, 37.0, 31.0, 45.0, 45.0, 53.0, 42.0, 54.0, 44.0, 54.0, 43.0, 38.0, 28.0, 33.0, 33.0, 28.0, 27.0, 28.0, 18.0, 22.0, 9.0, 12.0, 15.0, 7.0, 8.0, 6.0, 8.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.4375, -12.0423583984375, -11.647216796875, -11.2520751953125, -10.85693359375, -10.4617919921875, -10.066650390625, -9.6715087890625, -9.2763671875, -8.8812255859375, -8.486083984375, -8.0909423828125, -7.69580078125, -7.3006591796875, -6.905517578125, -6.5103759765625, -6.115234375, -5.7200927734375, -5.324951171875, -4.9298095703125, -4.53466796875, -4.1395263671875, -3.744384765625, -3.3492431640625, -2.9541015625, -2.5589599609375, -2.163818359375, -1.7686767578125, -1.37353515625, -0.9783935546875, -0.583251953125, -0.1881103515625, 0.20703125, 0.6021728515625, 0.997314453125, 1.3924560546875, 1.78759765625, 2.1827392578125, 2.577880859375, 2.9730224609375, 3.3681640625, 3.7633056640625, 4.158447265625, 4.5535888671875, 4.94873046875, 5.3438720703125, 5.739013671875, 6.1341552734375, 6.529296875, 6.9244384765625, 7.319580078125, 7.7147216796875, 8.10986328125, 8.5050048828125, 8.900146484375, 9.2952880859375, 9.6904296875, 10.0855712890625, 10.480712890625, 10.8758544921875, 11.27099609375, 11.6661376953125, 12.061279296875, 12.4564208984375, 12.8515625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 0.0, 10.0, 4.0, 12.0, 9.0, 16.0, 23.0, 30.0, 30.0, 59.0, 67.0, 75.0, 123.0, 180.0, 228.0, 311.0, 451.0, 805.0, 1627.0, 4174.0, 14821.0, 88300.0, 834084.0, 81137.0, 13952.0, 4026.0, 1558.0, 831.0, 454.0, 320.0, 204.0, 185.0, 107.0, 83.0, 65.0, 36.0, 42.0, 33.0, 17.0, 17.0, 12.0, 14.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.828125, -29.848876953125, -28.86962890625, -27.890380859375, -26.9111328125, -25.931884765625, -24.95263671875, -23.973388671875, -22.994140625, -22.014892578125, -21.03564453125, -20.056396484375, -19.0771484375, -18.097900390625, -17.11865234375, -16.139404296875, -15.16015625, -14.180908203125, -13.20166015625, -12.222412109375, -11.2431640625, -10.263916015625, -9.28466796875, -8.305419921875, -7.326171875, -6.346923828125, -5.36767578125, -4.388427734375, -3.4091796875, -2.429931640625, -1.45068359375, -0.471435546875, 0.5078125, 1.487060546875, 2.46630859375, 3.445556640625, 4.4248046875, 5.404052734375, 6.38330078125, 7.362548828125, 8.341796875, 9.321044921875, 10.30029296875, 11.279541015625, 12.2587890625, 13.238037109375, 14.21728515625, 15.196533203125, 16.17578125, 17.155029296875, 18.13427734375, 19.113525390625, 20.0927734375, 21.072021484375, 22.05126953125, 23.030517578125, 24.009765625, 24.989013671875, 25.96826171875, 26.947509765625, 27.9267578125, 28.906005859375, 29.88525390625, 30.864501953125, 31.84375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 12.0, 5.0, 9.0, 13.0, 8.0, 15.0, 13.0, 10.0, 13.0, 23.0, 27.0, 27.0, 35.0, 39.0, 35.0, 61.0, 58.0, 77.0, 228.0, 1676.0, 139.0, 83.0, 48.0, 44.0, 45.0, 32.0, 41.0, 44.0, 23.0, 26.0, 23.0, 14.0, 15.0, 14.0, 9.0, 9.0, 6.0, 14.0, 6.0, 6.0, 4.0, 3.0, 6.0, 6.0, 3.0, 0.0, 2.0, 1.0], "bins": [-35.34375, -34.344970703125, -33.34619140625, -32.347412109375, -31.3486328125, -30.349853515625, -29.35107421875, -28.352294921875, -27.353515625, -26.354736328125, -25.35595703125, -24.357177734375, -23.3583984375, -22.359619140625, -21.36083984375, -20.362060546875, -19.36328125, -18.364501953125, -17.36572265625, -16.366943359375, -15.3681640625, -14.369384765625, -13.37060546875, -12.371826171875, -11.373046875, -10.374267578125, -9.37548828125, -8.376708984375, -7.3779296875, -6.379150390625, -5.38037109375, -4.381591796875, -3.3828125, -2.384033203125, -1.38525390625, -0.386474609375, 0.6123046875, 1.611083984375, 2.60986328125, 3.608642578125, 4.607421875, 5.606201171875, 6.60498046875, 7.603759765625, 8.6025390625, 9.601318359375, 10.60009765625, 11.598876953125, 12.59765625, 13.596435546875, 14.59521484375, 15.593994140625, 16.5927734375, 17.591552734375, 18.59033203125, 19.589111328125, 20.587890625, 21.586669921875, 22.58544921875, 23.584228515625, 24.5830078125, 25.581787109375, 26.58056640625, 27.579345703125, 28.578125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 6.0, 7.0, 8.0, 17.0, 10.0, 7.0, 25.0, 19.0, 28.0, 34.0, 47.0, 74.0, 100.0, 124.0, 255.0, 553.0, 5480.0, 3037046.0, 99182.0, 1731.0, 375.0, 169.0, 110.0, 60.0, 52.0, 36.0, 23.0, 24.0, 25.0, 12.0, 17.0, 13.0, 12.0, 7.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-115.3125, -111.796875, -108.28125, -104.765625, -101.25, -97.734375, -94.21875, -90.703125, -87.1875, -83.671875, -80.15625, -76.640625, -73.125, -69.609375, -66.09375, -62.578125, -59.0625, -55.546875, -52.03125, -48.515625, -45.0, -41.484375, -37.96875, -34.453125, -30.9375, -27.421875, -23.90625, -20.390625, -16.875, -13.359375, -9.84375, -6.328125, -2.8125, 0.703125, 4.21875, 7.734375, 11.25, 14.765625, 18.28125, 21.796875, 25.3125, 28.828125, 32.34375, 35.859375, 39.375, 42.890625, 46.40625, 49.921875, 53.4375, 56.953125, 60.46875, 63.984375, 67.5, 71.015625, 74.53125, 78.046875, 81.5625, 85.078125, 88.59375, 92.109375, 95.625, 99.140625, 102.65625, 106.171875, 109.6875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 53.0, 224.0, 412.0, 253.0, 57.0, 10.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.99071502685547, -85.3615951538086, -81.73248291015625, -78.10336303710938, -74.4742431640625, -70.84512329101562, -67.21601104736328, -63.586891174316406, -59.9577751159668, -56.32865905761719, -52.69953918457031, -49.0704231262207, -45.441307067871094, -41.81218719482422, -38.18307113647461, -34.553955078125, -30.924835205078125, -27.295717239379883, -23.66659927368164, -20.03748321533203, -16.40836524963379, -12.779247283935547, -9.150131225585938, -5.521013259887695, -1.8918952941894531, 1.7372221946716309, 5.366339683532715, 8.99545669555664, 12.624574661254883, 16.253692626953125, 19.882808685302734, 23.511926651000977, 27.141036987304688, 30.77015495300293, 34.39927291870117, 38.02838897705078, 41.657508850097656, 45.286624908447266, 48.915740966796875, 52.54486083984375, 56.17397689819336, 59.80309295654297, 63.432212829589844, 67.06132507324219, 70.69044494628906, 74.31956481933594, 77.94868469238281, 81.57779693603516, 85.20691680908203, 88.8360366821289, 92.46514892578125, 96.09426879882812, 99.723388671875, 103.35250854492188, 106.98162078857422, 110.6107406616211, 114.23985290527344, 117.86897277832031, 121.49808502197266, 125.12720489501953, 128.75631713867188, 132.38543701171875, 136.01455688476562, 139.6436767578125, 143.27279663085938]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 11.0, 5.0, 8.0, 12.0, 19.0, 11.0, 15.0, 11.0, 8.0, 24.0, 24.0, 31.0, 26.0, 21.0, 30.0, 37.0, 38.0, 48.0, 35.0, 56.0, 38.0, 54.0, 43.0, 43.0, 34.0, 38.0, 27.0, 30.0, 25.0, 26.0, 24.0, 31.0, 21.0, 10.0, 13.0, 18.0, 11.0, 10.0, 9.0, 7.0, 6.0, 5.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.14437866210938, -78.42566680908203, -75.70695495605469, -72.98824310302734, -70.26953125, -67.55081176757812, -64.83209991455078, -62.11338806152344, -59.394676208496094, -56.67596435546875, -53.957252502441406, -51.2385368347168, -48.51982498168945, -45.80111312866211, -43.0823974609375, -40.363685607910156, -37.64497375488281, -34.92626190185547, -32.207550048828125, -29.488834381103516, -26.770122528076172, -24.051410675048828, -21.33269691467285, -18.613983154296875, -15.895271301269531, -13.176558494567871, -10.457845687866211, -7.739132881164551, -5.020420074462891, -2.3017072677612305, 0.4170055389404297, 3.1357192993164062, 5.85443115234375, 8.57314395904541, 11.29185676574707, 14.01056957244873, 16.72928237915039, 19.447994232177734, 22.16670799255371, 24.885421752929688, 27.60413360595703, 30.322845458984375, 33.04155731201172, 35.76027297973633, 38.47898483276367, 41.197696685791016, 43.916412353515625, 46.63512420654297, 49.35383605957031, 52.072547912597656, 54.791259765625, 57.50997543334961, 60.22868728637695, 62.9473991394043, 65.6661148071289, 68.38482666015625, 71.1035385131836, 73.82225036621094, 76.54096221923828, 79.25967407226562, 81.9783935546875, 84.69710540771484, 87.41581726074219, 90.13452911376953, 92.85324096679688]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 3.0, 5.0, 9.0, 15.0, 12.0, 18.0, 19.0, 27.0, 27.0, 28.0, 35.0, 30.0, 36.0, 28.0, 39.0, 54.0, 51.0, 49.0, 50.0, 40.0, 51.0, 38.0, 40.0, 38.0, 43.0, 27.0, 33.0, 33.0, 14.0, 16.0, 20.0, 7.0, 15.0, 10.0, 7.0, 3.0, 8.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.7421875, -12.3323974609375, -11.922607421875, -11.5128173828125, -11.10302734375, -10.6932373046875, -10.283447265625, -9.8736572265625, -9.4638671875, -9.0540771484375, -8.644287109375, -8.2344970703125, -7.82470703125, -7.4149169921875, -7.005126953125, -6.5953369140625, -6.185546875, -5.7757568359375, -5.365966796875, -4.9561767578125, -4.54638671875, -4.1365966796875, -3.726806640625, -3.3170166015625, -2.9072265625, -2.4974365234375, -2.087646484375, -1.6778564453125, -1.26806640625, -0.8582763671875, -0.448486328125, -0.0386962890625, 0.37109375, 0.7808837890625, 1.190673828125, 1.6004638671875, 2.01025390625, 2.4200439453125, 2.829833984375, 3.2396240234375, 3.6494140625, 4.0592041015625, 4.468994140625, 4.8787841796875, 5.28857421875, 5.6983642578125, 6.108154296875, 6.5179443359375, 6.927734375, 7.3375244140625, 7.747314453125, 8.1571044921875, 8.56689453125, 8.9766845703125, 9.386474609375, 9.7962646484375, 10.2060546875, 10.6158447265625, 11.025634765625, 11.4354248046875, 11.84521484375, 12.2550048828125, 12.664794921875, 13.0745849609375, 13.484375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 5.0, 0.0, 1.0, 6.0, 3.0, 12.0, 8.0, 26.0, 26.0, 44.0, 52.0, 85.0, 121.0, 195.0, 301.0, 583.0, 970.0, 1751.0, 3688.0, 8068.0, 21470.0, 75812.0, 400023.0, 1928366.0, 1425999.0, 245980.0, 51435.0, 16163.0, 6483.0, 3018.0, 1495.0, 868.0, 458.0, 247.0, 158.0, 121.0, 75.0, 51.0, 36.0, 24.0, 18.0, 11.0, 7.0, 5.0, 10.0, 3.0, 6.0, 0.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.015625, -16.405029296875, -15.79443359375, -15.183837890625, -14.5732421875, -13.962646484375, -13.35205078125, -12.741455078125, -12.130859375, -11.520263671875, -10.90966796875, -10.299072265625, -9.6884765625, -9.077880859375, -8.46728515625, -7.856689453125, -7.24609375, -6.635498046875, -6.02490234375, -5.414306640625, -4.8037109375, -4.193115234375, -3.58251953125, -2.971923828125, -2.361328125, -1.750732421875, -1.14013671875, -0.529541015625, 0.0810546875, 0.691650390625, 1.30224609375, 1.912841796875, 2.5234375, 3.134033203125, 3.74462890625, 4.355224609375, 4.9658203125, 5.576416015625, 6.18701171875, 6.797607421875, 7.408203125, 8.018798828125, 8.62939453125, 9.239990234375, 9.8505859375, 10.461181640625, 11.07177734375, 11.682373046875, 12.29296875, 12.903564453125, 13.51416015625, 14.124755859375, 14.7353515625, 15.345947265625, 15.95654296875, 16.567138671875, 17.177734375, 17.788330078125, 18.39892578125, 19.009521484375, 19.6201171875, 20.230712890625, 20.84130859375, 21.451904296875, 22.0625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 9.0, 7.0, 23.0, 28.0, 45.0, 51.0, 65.0, 92.0, 163.0, 228.0, 364.0, 542.0, 607.0, 563.0, 389.0, 265.0, 175.0, 132.0, 93.0, 60.0, 57.0, 30.0, 22.0, 16.0, 9.0, 10.0, 3.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.4951171875, -16.787109375, -16.0791015625, -15.37109375, -14.6630859375, -13.955078125, -13.2470703125, -12.5390625, -11.8310546875, -11.123046875, -10.4150390625, -9.70703125, -8.9990234375, -8.291015625, -7.5830078125, -6.875, -6.1669921875, -5.458984375, -4.7509765625, -4.04296875, -3.3349609375, -2.626953125, -1.9189453125, -1.2109375, -0.5029296875, 0.205078125, 0.9130859375, 1.62109375, 2.3291015625, 3.037109375, 3.7451171875, 4.453125, 5.1611328125, 5.869140625, 6.5771484375, 7.28515625, 7.9931640625, 8.701171875, 9.4091796875, 10.1171875, 10.8251953125, 11.533203125, 12.2412109375, 12.94921875, 13.6572265625, 14.365234375, 15.0732421875, 15.78125, 16.4892578125, 17.197265625, 17.9052734375, 18.61328125, 19.3212890625, 20.029296875, 20.7373046875, 21.4453125, 22.1533203125, 22.861328125, 23.5693359375, 24.27734375, 24.9853515625, 25.693359375, 26.4013671875, 27.109375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 11.0, 11.0, 9.0, 10.0, 15.0, 22.0, 44.0, 52.0, 62.0, 119.0, 167.0, 263.0, 479.0, 1055.0, 3996.0, 28543.0, 498976.0, 3479130.0, 163188.0, 13813.0, 2498.0, 788.0, 371.0, 205.0, 127.0, 104.0, 75.0, 39.0, 38.0, 17.0, 15.0, 15.0, 10.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-61.3125, -59.5771484375, -57.841796875, -56.1064453125, -54.37109375, -52.6357421875, -50.900390625, -49.1650390625, -47.4296875, -45.6943359375, -43.958984375, -42.2236328125, -40.48828125, -38.7529296875, -37.017578125, -35.2822265625, -33.546875, -31.8115234375, -30.076171875, -28.3408203125, -26.60546875, -24.8701171875, -23.134765625, -21.3994140625, -19.6640625, -17.9287109375, -16.193359375, -14.4580078125, -12.72265625, -10.9873046875, -9.251953125, -7.5166015625, -5.78125, -4.0458984375, -2.310546875, -0.5751953125, 1.16015625, 2.8955078125, 4.630859375, 6.3662109375, 8.1015625, 9.8369140625, 11.572265625, 13.3076171875, 15.04296875, 16.7783203125, 18.513671875, 20.2490234375, 21.984375, 23.7197265625, 25.455078125, 27.1904296875, 28.92578125, 30.6611328125, 32.396484375, 34.1318359375, 35.8671875, 37.6025390625, 39.337890625, 41.0732421875, 42.80859375, 44.5439453125, 46.279296875, 48.0146484375, 49.75]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 14.0, 55.0, 114.0, 265.0, 287.0, 171.0, 73.0, 24.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.65559387207031, -97.23971557617188, -90.82383728027344, -84.407958984375, -77.99208068847656, -71.57620239257812, -65.16031646728516, -58.74443817138672, -52.32855987548828, -45.912681579589844, -39.496803283691406, -33.0809211730957, -26.665042877197266, -20.249164581298828, -13.833282470703125, -7.4174041748046875, -1.00152587890625, 5.414353370666504, 11.830232620239258, 18.246112823486328, 24.661991119384766, 31.077869415283203, 37.493751525878906, 43.909629821777344, 50.32550811767578, 56.74138641357422, 63.157264709472656, 69.57315063476562, 75.98902893066406, 82.4049072265625, 88.82078552246094, 95.23666381835938, 101.65255737304688, 108.06843566894531, 114.48431396484375, 120.90019226074219, 127.31607055664062, 133.73194885253906, 140.1478271484375, 146.563720703125, 152.97958374023438, 159.3954620361328, 165.81134033203125, 172.2272186279297, 178.64309692382812, 185.05897521972656, 191.474853515625, 197.8907470703125, 204.30662536621094, 210.72250366210938, 217.1383819580078, 223.55426025390625, 229.9701385498047, 236.38601684570312, 242.80191040039062, 249.2177734375, 255.6336669921875, 262.049560546875, 268.4654235839844, 274.8813171386719, 281.29718017578125, 287.71307373046875, 294.1289367675781, 300.5448303222656, 306.960693359375]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 6.0, 5.0, 14.0, 14.0, 11.0, 16.0, 14.0, 19.0, 23.0, 22.0, 24.0, 29.0, 40.0, 32.0, 45.0, 29.0, 41.0, 45.0, 39.0, 56.0, 36.0, 35.0, 53.0, 32.0, 39.0, 35.0, 35.0, 27.0, 30.0, 25.0, 31.0, 22.0, 16.0, 12.0, 16.0, 10.0, 7.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-71.3607177734375, -69.1150894165039, -66.86946105957031, -64.62382507324219, -62.378196716308594, -60.132568359375, -57.88693618774414, -55.64130401611328, -53.39567565917969, -51.150047302246094, -48.904415130615234, -46.658782958984375, -44.41315460205078, -42.16752624511719, -39.92189407348633, -37.67626190185547, -35.430633544921875, -33.18500518798828, -30.939373016357422, -28.693742752075195, -26.44811248779297, -24.202482223510742, -21.956851959228516, -19.71122169494629, -17.465591430664062, -15.219961166381836, -12.97433090209961, -10.728700637817383, -8.483070373535156, -6.23744010925293, -3.991809844970703, -1.7461795806884766, 0.49945068359375, 2.7450809478759766, 4.990711212158203, 7.23634147644043, 9.481971740722656, 11.727602005004883, 13.97323226928711, 16.218862533569336, 18.464492797851562, 20.71012306213379, 22.955753326416016, 25.201383590698242, 27.44701385498047, 29.692644119262695, 31.938274383544922, 34.18390655517578, 36.429534912109375, 38.67516326904297, 40.92079544067383, 43.16642761230469, 45.41205596923828, 47.657684326171875, 49.903316497802734, 52.148948669433594, 54.39457702636719, 56.64020538330078, 58.88583755493164, 61.1314697265625, 63.377098083496094, 65.62272644042969, 67.86836242675781, 70.1139907836914, 72.359619140625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 4.0, 3.0, 4.0, 8.0, 2.0, 13.0, 8.0, 18.0, 11.0, 17.0, 19.0, 34.0, 28.0, 25.0, 38.0, 33.0, 36.0, 46.0, 44.0, 37.0, 43.0, 41.0, 44.0, 35.0, 52.0, 35.0, 30.0, 36.0, 34.0, 51.0, 22.0, 28.0, 15.0, 18.0, 13.0, 15.0, 6.0, 13.0, 4.0, 6.0, 7.0, 10.0, 2.0, 6.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.2109375, -11.8359375, -11.4609375, -11.0859375, -10.7109375, -10.3359375, -9.9609375, -9.5859375, -9.2109375, -8.8359375, -8.4609375, -8.0859375, -7.7109375, -7.3359375, -6.9609375, -6.5859375, -6.2109375, -5.8359375, -5.4609375, -5.0859375, -4.7109375, -4.3359375, -3.9609375, -3.5859375, -3.2109375, -2.8359375, -2.4609375, -2.0859375, -1.7109375, -1.3359375, -0.9609375, -0.5859375, -0.2109375, 0.1640625, 0.5390625, 0.9140625, 1.2890625, 1.6640625, 2.0390625, 2.4140625, 2.7890625, 3.1640625, 3.5390625, 3.9140625, 4.2890625, 4.6640625, 5.0390625, 5.4140625, 5.7890625, 6.1640625, 6.5390625, 6.9140625, 7.2890625, 7.6640625, 8.0390625, 8.4140625, 8.7890625, 9.1640625, 9.5390625, 9.9140625, 10.2890625, 10.6640625, 11.0390625, 11.4140625, 11.7890625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 8.0, 5.0, 10.0, 11.0, 18.0, 44.0, 42.0, 49.0, 81.0, 123.0, 160.0, 232.0, 339.0, 466.0, 644.0, 883.0, 1213.0, 1797.0, 2563.0, 3691.0, 5466.0, 7837.0, 11689.0, 17573.0, 26696.0, 40368.0, 61322.0, 90446.0, 125779.0, 153210.0, 145755.0, 112960.0, 78863.0, 52638.0, 34859.0, 23049.0, 15175.0, 10413.0, 6780.0, 4583.0, 3142.0, 2150.0, 1624.0, 1110.0, 794.0, 540.0, 424.0, 275.0, 184.0, 148.0, 91.0, 77.0, 69.0, 33.0, 18.0, 16.0, 17.0, 8.0, 2.0, 4.0, 3.0, 3.0], "bins": [-0.93701171875, -0.907562255859375, -0.87811279296875, -0.848663330078125, -0.8192138671875, -0.789764404296875, -0.76031494140625, -0.730865478515625, -0.701416015625, -0.671966552734375, -0.64251708984375, -0.613067626953125, -0.5836181640625, -0.554168701171875, -0.52471923828125, -0.495269775390625, -0.4658203125, -0.436370849609375, -0.40692138671875, -0.377471923828125, -0.3480224609375, -0.318572998046875, -0.28912353515625, -0.259674072265625, -0.230224609375, -0.200775146484375, -0.17132568359375, -0.141876220703125, -0.1124267578125, -0.082977294921875, -0.05352783203125, -0.024078369140625, 0.00537109375, 0.034820556640625, 0.06427001953125, 0.093719482421875, 0.1231689453125, 0.152618408203125, 0.18206787109375, 0.211517333984375, 0.240966796875, 0.270416259765625, 0.29986572265625, 0.329315185546875, 0.3587646484375, 0.388214111328125, 0.41766357421875, 0.447113037109375, 0.4765625, 0.506011962890625, 0.53546142578125, 0.564910888671875, 0.5943603515625, 0.623809814453125, 0.65325927734375, 0.682708740234375, 0.712158203125, 0.741607666015625, 0.77105712890625, 0.800506591796875, 0.8299560546875, 0.859405517578125, 0.88885498046875, 0.918304443359375, 0.94775390625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 8.0, 8.0, 7.0, 13.0, 10.0, 12.0, 13.0, 18.0, 16.0, 28.0, 22.0, 21.0, 33.0, 46.0, 31.0, 51.0, 36.0, 36.0, 35.0, 41.0, 1069.0, 51.0, 34.0, 39.0, 28.0, 43.0, 30.0, 20.0, 34.0, 36.0, 25.0, 30.0, 20.0, 10.0, 14.0, 7.0, 6.0, 13.0, 5.0, 8.0, 6.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7109375, -6.4761962890625, -6.241455078125, -6.0067138671875, -5.77197265625, -5.5372314453125, -5.302490234375, -5.0677490234375, -4.8330078125, -4.5982666015625, -4.363525390625, -4.1287841796875, -3.89404296875, -3.6593017578125, -3.424560546875, -3.1898193359375, -2.955078125, -2.7203369140625, -2.485595703125, -2.2508544921875, -2.01611328125, -1.7813720703125, -1.546630859375, -1.3118896484375, -1.0771484375, -0.8424072265625, -0.607666015625, -0.3729248046875, -0.13818359375, 0.0965576171875, 0.331298828125, 0.5660400390625, 0.80078125, 1.0355224609375, 1.270263671875, 1.5050048828125, 1.73974609375, 1.9744873046875, 2.209228515625, 2.4439697265625, 2.6787109375, 2.9134521484375, 3.148193359375, 3.3829345703125, 3.61767578125, 3.8524169921875, 4.087158203125, 4.3218994140625, 4.556640625, 4.7913818359375, 5.026123046875, 5.2608642578125, 5.49560546875, 5.7303466796875, 5.965087890625, 6.1998291015625, 6.4345703125, 6.6693115234375, 6.904052734375, 7.1387939453125, 7.37353515625, 7.6082763671875, 7.843017578125, 8.0777587890625, 8.3125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 13.0, 9.0, 16.0, 14.0, 43.0, 48.0, 83.0, 130.0, 164.0, 320.0, 519.0, 859.0, 1319.0, 2103.0, 3515.0, 5732.0, 9878.0, 16466.0, 28511.0, 48684.0, 80697.0, 126416.0, 216488.0, 1184759.0, 141150.0, 91581.0, 56312.0, 33099.0, 19365.0, 11234.0, 6869.0, 4059.0, 2488.0, 1555.0, 981.0, 596.0, 377.0, 233.0, 156.0, 110.0, 65.0, 44.0, 25.0, 22.0, 7.0, 5.0, 12.0, 4.0, 2.0, 2.0], "bins": [-1.0634765625, -1.0348434448242188, -1.0062103271484375, -0.9775772094726562, -0.948944091796875, -0.9203109741210938, -0.8916778564453125, -0.8630447387695312, -0.83441162109375, -0.8057785034179688, -0.7771453857421875, -0.7485122680664062, -0.719879150390625, -0.6912460327148438, -0.6626129150390625, -0.6339797973632812, -0.6053466796875, -0.5767135620117188, -0.5480804443359375, -0.5194473266601562, -0.490814208984375, -0.46218109130859375, -0.4335479736328125, -0.40491485595703125, -0.37628173828125, -0.34764862060546875, -0.3190155029296875, -0.29038238525390625, -0.261749267578125, -0.23311614990234375, -0.2044830322265625, -0.17584991455078125, -0.147216796875, -0.11858367919921875, -0.0899505615234375, -0.06131744384765625, -0.032684326171875, -0.00405120849609375, 0.0245819091796875, 0.05321502685546875, 0.08184814453125, 0.11048126220703125, 0.1391143798828125, 0.16774749755859375, 0.196380615234375, 0.22501373291015625, 0.2536468505859375, 0.28227996826171875, 0.3109130859375, 0.33954620361328125, 0.3681793212890625, 0.39681243896484375, 0.425445556640625, 0.45407867431640625, 0.4827117919921875, 0.5113449096679688, 0.53997802734375, 0.5686111450195312, 0.5972442626953125, 0.6258773803710938, 0.654510498046875, 0.6831436157226562, 0.7117767333984375, 0.7404098510742188, 0.76904296875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 1.0, 2.0, 6.0, 8.0, 10.0, 10.0, 18.0, 24.0, 19.0, 28.0, 25.0, 44.0, 52.0, 57.0, 62.0, 87.0, 74.0, 79.0, 67.0, 53.0, 55.0, 50.0, 34.0, 26.0, 25.0, 15.0, 16.0, 11.0, 10.0, 12.0, 10.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0214691162109375, -0.020695924758911133, -0.019922733306884766, -0.0191495418548584, -0.01837635040283203, -0.017603158950805664, -0.016829967498779297, -0.01605677604675293, -0.015283584594726562, -0.014510393142700195, -0.013737201690673828, -0.012964010238647461, -0.012190818786621094, -0.011417627334594727, -0.01064443588256836, -0.009871244430541992, -0.009098052978515625, -0.008324861526489258, -0.007551670074462891, -0.0067784786224365234, -0.006005287170410156, -0.005232095718383789, -0.004458904266357422, -0.0036857128143310547, -0.0029125213623046875, -0.0021393299102783203, -0.0013661384582519531, -0.0005929470062255859, 0.00018024444580078125, 0.0009534358978271484, 0.0017266273498535156, 0.002499818801879883, 0.00327301025390625, 0.004046201705932617, 0.004819393157958984, 0.0055925846099853516, 0.006365776062011719, 0.007138967514038086, 0.007912158966064453, 0.00868535041809082, 0.009458541870117188, 0.010231733322143555, 0.011004924774169922, 0.011778116226196289, 0.012551307678222656, 0.013324499130249023, 0.01409769058227539, 0.014870882034301758, 0.015644073486328125, 0.016417264938354492, 0.01719045639038086, 0.017963647842407227, 0.018736839294433594, 0.01951003074645996, 0.020283222198486328, 0.021056413650512695, 0.021829605102539062, 0.02260279655456543, 0.023375988006591797, 0.024149179458618164, 0.02492237091064453, 0.0256955623626709, 0.026468753814697266, 0.027241945266723633, 0.02801513671875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 4.0, 7.0, 10.0, 19.0, 15.0, 11.0, 22.0, 35.0, 36.0, 51.0, 80.0, 120.0, 158.0, 306.0, 720.0, 249105.0, 796007.0, 890.0, 358.0, 162.0, 125.0, 78.0, 43.0, 52.0, 39.0, 28.0, 13.0, 16.0, 15.0, 6.0, 8.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.603515625, -0.5867729187011719, -0.5700302124023438, -0.5532875061035156, -0.5365447998046875, -0.5198020935058594, -0.5030593872070312, -0.4863166809082031, -0.469573974609375, -0.4528312683105469, -0.43608856201171875, -0.4193458557128906, -0.4026031494140625, -0.3858604431152344, -0.36911773681640625, -0.3523750305175781, -0.33563232421875, -0.3188896179199219, -0.30214691162109375, -0.2854042053222656, -0.2686614990234375, -0.2519187927246094, -0.23517608642578125, -0.21843338012695312, -0.201690673828125, -0.18494796752929688, -0.16820526123046875, -0.15146255493164062, -0.1347198486328125, -0.11797714233398438, -0.10123443603515625, -0.08449172973632812, -0.0677490234375, -0.051006317138671875, -0.03426361083984375, -0.017520904541015625, -0.0007781982421875, 0.015964508056640625, 0.03270721435546875, 0.049449920654296875, 0.066192626953125, 0.08293533325195312, 0.09967803955078125, 0.11642074584960938, 0.1331634521484375, 0.14990615844726562, 0.16664886474609375, 0.18339157104492188, 0.20013427734375, 0.21687698364257812, 0.23361968994140625, 0.2503623962402344, 0.2671051025390625, 0.2838478088378906, 0.30059051513671875, 0.3173332214355469, 0.334075927734375, 0.3508186340332031, 0.36756134033203125, 0.3843040466308594, 0.4010467529296875, 0.4177894592285156, 0.43453216552734375, 0.4512748718261719, 0.468017578125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 987.0, 21.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5541346669197083, -0.5417428016662598, -0.5293508768081665, -0.516959011554718, -0.5045671463012695, -0.49217525124549866, -0.47978338599205017, -0.4673914909362793, -0.4549996256828308, -0.44260773062705994, -0.43021586537361145, -0.4178239703178406, -0.4054321050643921, -0.3930402100086212, -0.38064834475517273, -0.36825644969940186, -0.35586458444595337, -0.3434726893901825, -0.331080824136734, -0.31868892908096313, -0.30629706382751465, -0.2939051687717438, -0.2815133035182953, -0.2691214084625244, -0.25672951340675354, -0.24433763325214386, -0.23194575309753418, -0.2195538729429245, -0.20716199278831482, -0.19477011263370514, -0.18237823247909546, -0.16998633742332458, -0.1575944721698761, -0.14520259201526642, -0.13281071186065674, -0.12041883170604706, -0.10802695155143738, -0.0956350713968277, -0.08324318379163742, -0.07085130363702774, -0.05845942348241806, -0.04606754332780838, -0.0336756631731987, -0.02128377929329872, -0.008891899138689041, 0.003499981015920639, 0.015891864895820618, 0.028283745050430298, 0.04067562520503998, 0.05306750535964966, 0.06545938551425934, 0.07785126566886902, 0.0902431458234787, 0.10263502597808838, 0.11502691358327866, 0.12741878628730774, 0.1398106813430786, 0.1522025614976883, 0.16459444165229797, 0.17698632180690765, 0.18937820196151733, 0.20177008211612701, 0.2141619622707367, 0.22655385732650757, 0.23894572257995605]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 14.0, 19.0, 17.0, 17.0, 26.0, 38.0, 33.0, 35.0, 43.0, 43.0, 42.0, 62.0, 63.0, 53.0, 48.0, 64.0, 59.0, 36.0, 44.0, 36.0, 35.0, 39.0, 30.0, 21.0, 14.0, 12.0, 17.0, 9.0, 6.0, 8.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029127895832061768, -0.028265831992030144, -0.02740376815199852, -0.026541704311966896, -0.025679640471935272, -0.02481757663190365, -0.023955512791872025, -0.0230934489518404, -0.022231385111808777, -0.021369321271777153, -0.02050725743174553, -0.019645193591713905, -0.01878312975168228, -0.017921065911650658, -0.017059002071619034, -0.01619693823158741, -0.015334874391555786, -0.014472810551524162, -0.013610746711492538, -0.012748682871460915, -0.01188661903142929, -0.011024555191397667, -0.010162491351366043, -0.00930042751133442, -0.008438363671302795, -0.007576299831271172, -0.006714235991239548, -0.005852172151207924, -0.0049901083111763, -0.004128044471144676, -0.0032659806311130524, -0.0024039167910814285, -0.0015418529510498047, -0.0006797891110181808, 0.000182274729013443, 0.0010443385690450668, 0.0019064024090766907, 0.0027684662491083145, 0.0036305300891399384, 0.004492593929171562, 0.005354657769203186, 0.00621672160923481, 0.007078785449266434, 0.007940849289298058, 0.008802913129329681, 0.009664976969361305, 0.010527040809392929, 0.011389104649424553, 0.012251168489456177, 0.0131132323294878, 0.013975296169519424, 0.014837360009551048, 0.015699423849582672, 0.016561487689614296, 0.01742355152964592, 0.018285615369677544, 0.019147679209709167, 0.02000974304974079, 0.020871806889772415, 0.02173387072980404, 0.022595934569835663, 0.023457998409867287, 0.02432006224989891, 0.025182126089930534, 0.026044189929962158]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 4.0, 3.0, 4.0, 8.0, 2.0, 13.0, 8.0, 18.0, 11.0, 17.0, 18.0, 35.0, 28.0, 25.0, 38.0, 33.0, 36.0, 46.0, 44.0, 37.0, 43.0, 41.0, 44.0, 35.0, 52.0, 35.0, 30.0, 36.0, 35.0, 50.0, 22.0, 28.0, 15.0, 17.0, 14.0, 15.0, 6.0, 13.0, 4.0, 6.0, 7.0, 10.0, 2.0, 6.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.2109375, -11.8359375, -11.4609375, -11.0859375, -10.7109375, -10.3359375, -9.9609375, -9.5859375, -9.2109375, -8.8359375, -8.4609375, -8.0859375, -7.7109375, -7.3359375, -6.9609375, -6.5859375, -6.2109375, -5.8359375, -5.4609375, -5.0859375, -4.7109375, -4.3359375, -3.9609375, -3.5859375, -3.2109375, -2.8359375, -2.4609375, -2.0859375, -1.7109375, -1.3359375, -0.9609375, -0.5859375, -0.2109375, 0.1640625, 0.5390625, 0.9140625, 1.2890625, 1.6640625, 2.0390625, 2.4140625, 2.7890625, 3.1640625, 3.5390625, 3.9140625, 4.2890625, 4.6640625, 5.0390625, 5.4140625, 5.7890625, 6.1640625, 6.5390625, 6.9140625, 7.2890625, 7.6640625, 8.0390625, 8.4140625, 8.7890625, 9.1640625, 9.5390625, 9.9140625, 10.2890625, 10.6640625, 11.0390625, 11.4140625, 11.7890625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 9.0, 12.0, 15.0, 10.0, 18.0, 24.0, 23.0, 40.0, 55.0, 81.0, 91.0, 144.0, 159.0, 330.0, 519.0, 775.0, 1430.0, 2384.0, 4594.0, 8957.0, 19249.0, 43576.0, 106950.0, 327732.0, 338203.0, 109120.0, 44315.0, 19498.0, 9373.0, 4688.0, 2482.0, 1405.0, 780.0, 498.0, 303.0, 186.0, 147.0, 96.0, 72.0, 55.0, 39.0, 25.0, 23.0, 20.0, 21.0, 9.0, 8.0, 2.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.671875, -15.1971435546875, -14.722412109375, -14.2476806640625, -13.77294921875, -13.2982177734375, -12.823486328125, -12.3487548828125, -11.8740234375, -11.3992919921875, -10.924560546875, -10.4498291015625, -9.97509765625, -9.5003662109375, -9.025634765625, -8.5509033203125, -8.076171875, -7.6014404296875, -7.126708984375, -6.6519775390625, -6.17724609375, -5.7025146484375, -5.227783203125, -4.7530517578125, -4.2783203125, -3.8035888671875, -3.328857421875, -2.8541259765625, -2.37939453125, -1.9046630859375, -1.429931640625, -0.9552001953125, -0.48046875, -0.0057373046875, 0.468994140625, 0.9437255859375, 1.41845703125, 1.8931884765625, 2.367919921875, 2.8426513671875, 3.3173828125, 3.7921142578125, 4.266845703125, 4.7415771484375, 5.21630859375, 5.6910400390625, 6.165771484375, 6.6405029296875, 7.115234375, 7.5899658203125, 8.064697265625, 8.5394287109375, 9.01416015625, 9.4888916015625, 9.963623046875, 10.4383544921875, 10.9130859375, 11.3878173828125, 11.862548828125, 12.3372802734375, 12.81201171875, 13.2867431640625, 13.761474609375, 14.2362060546875, 14.7109375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 2.0, 5.0, 6.0, 6.0, 2.0, 11.0, 10.0, 8.0, 14.0, 12.0, 26.0, 18.0, 21.0, 16.0, 28.0, 33.0, 39.0, 45.0, 31.0, 46.0, 54.0, 93.0, 141.0, 1519.0, 262.0, 111.0, 68.0, 53.0, 41.0, 36.0, 45.0, 25.0, 27.0, 34.0, 21.0, 32.0, 13.0, 12.0, 14.0, 10.0, 10.0, 8.0, 8.0, 5.0, 5.0, 3.0, 9.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-30.03125, -29.114990234375, -28.19873046875, -27.282470703125, -26.3662109375, -25.449951171875, -24.53369140625, -23.617431640625, -22.701171875, -21.784912109375, -20.86865234375, -19.952392578125, -19.0361328125, -18.119873046875, -17.20361328125, -16.287353515625, -15.37109375, -14.454833984375, -13.53857421875, -12.622314453125, -11.7060546875, -10.789794921875, -9.87353515625, -8.957275390625, -8.041015625, -7.124755859375, -6.20849609375, -5.292236328125, -4.3759765625, -3.459716796875, -2.54345703125, -1.627197265625, -0.7109375, 0.205322265625, 1.12158203125, 2.037841796875, 2.9541015625, 3.870361328125, 4.78662109375, 5.702880859375, 6.619140625, 7.535400390625, 8.45166015625, 9.367919921875, 10.2841796875, 11.200439453125, 12.11669921875, 13.032958984375, 13.94921875, 14.865478515625, 15.78173828125, 16.697998046875, 17.6142578125, 18.530517578125, 19.44677734375, 20.363037109375, 21.279296875, 22.195556640625, 23.11181640625, 24.028076171875, 24.9443359375, 25.860595703125, 26.77685546875, 27.693115234375, 28.609375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 5.0, 7.0, 12.0, 5.0, 10.0, 20.0, 23.0, 20.0, 22.0, 33.0, 48.0, 59.0, 63.0, 104.0, 183.0, 224.0, 397.0, 1077.0, 6285.0, 72529.0, 2567761.0, 469223.0, 23277.0, 2638.0, 649.0, 309.0, 177.0, 131.0, 93.0, 75.0, 58.0, 39.0, 32.0, 24.0, 16.0, 13.0, 14.0, 14.0, 13.0, 3.0, 4.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-51.125, -49.6552734375, -48.185546875, -46.7158203125, -45.24609375, -43.7763671875, -42.306640625, -40.8369140625, -39.3671875, -37.8974609375, -36.427734375, -34.9580078125, -33.48828125, -32.0185546875, -30.548828125, -29.0791015625, -27.609375, -26.1396484375, -24.669921875, -23.2001953125, -21.73046875, -20.2607421875, -18.791015625, -17.3212890625, -15.8515625, -14.3818359375, -12.912109375, -11.4423828125, -9.97265625, -8.5029296875, -7.033203125, -5.5634765625, -4.09375, -2.6240234375, -1.154296875, 0.3154296875, 1.78515625, 3.2548828125, 4.724609375, 6.1943359375, 7.6640625, 9.1337890625, 10.603515625, 12.0732421875, 13.54296875, 15.0126953125, 16.482421875, 17.9521484375, 19.421875, 20.8916015625, 22.361328125, 23.8310546875, 25.30078125, 26.7705078125, 28.240234375, 29.7099609375, 31.1796875, 32.6494140625, 34.119140625, 35.5888671875, 37.05859375, 38.5283203125, 39.998046875, 41.4677734375, 42.9375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 8.0, 21.0, 58.0, 118.0, 187.0, 207.0, 168.0, 143.0, 62.0, 25.0, 13.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.78714370727539, -24.27083396911621, -21.75452423095703, -19.238216400146484, -16.721906661987305, -14.205596923828125, -11.689288139343262, -9.172979354858398, -6.656669616699219, -4.140360355377197, -1.6240510940551758, 0.8922581672668457, 3.408567428588867, 5.924877166748047, 8.44118595123291, 10.957494735717773, 13.473804473876953, 15.990114212036133, 18.506423950195312, 21.02273178100586, 23.53904151916504, 26.05535125732422, 28.571659088134766, 31.087968826293945, 33.604278564453125, 36.12058639526367, 38.636898040771484, 41.15320587158203, 43.669517517089844, 46.18582534790039, 48.70213317871094, 51.21844482421875, 53.73475646972656, 56.25106430053711, 58.76737594604492, 61.28368377685547, 63.79999542236328, 66.31629943847656, 68.83261108398438, 71.34892272949219, 73.865234375, 76.38154602050781, 78.8978500366211, 81.4141616821289, 83.93047332763672, 86.44677734375, 88.96308898925781, 91.47940063476562, 93.9957046508789, 96.51201629638672, 99.0283203125, 101.54463195800781, 104.06094360351562, 106.57725524902344, 109.09355926513672, 111.60987091064453, 114.12617492675781, 116.64248657226562, 119.1587905883789, 121.67510223388672, 124.19141387939453, 126.70771789550781, 129.22402954101562, 131.74034118652344, 134.25665283203125]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 8.0, 12.0, 11.0, 8.0, 15.0, 13.0, 14.0, 23.0, 20.0, 26.0, 28.0, 21.0, 23.0, 35.0, 37.0, 41.0, 39.0, 36.0, 38.0, 42.0, 41.0, 55.0, 41.0, 42.0, 38.0, 36.0, 25.0, 23.0, 30.0, 36.0, 35.0, 18.0, 15.0, 10.0, 11.0, 8.0, 13.0, 8.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.00802612304688, -77.6344985961914, -75.26097869873047, -72.887451171875, -70.51393127441406, -68.1404037475586, -65.76688385009766, -63.39335632324219, -61.01983642578125, -58.64631271362305, -56.272789001464844, -53.89926528930664, -51.52574157714844, -49.152217864990234, -46.77869415283203, -44.40516662597656, -42.03164291381836, -39.658119201660156, -37.28459548950195, -34.91107177734375, -32.53754806518555, -30.164024353027344, -27.790498733520508, -25.416975021362305, -23.0434513092041, -20.6699275970459, -18.296403884887695, -15.922879219055176, -13.549355506896973, -11.17583179473877, -8.80230712890625, -6.428783416748047, -4.055259704589844, -1.6817357540130615, 0.6917881965637207, 3.065312385559082, 5.438836097717285, 7.812359809875488, 10.185884475708008, 12.559408187866211, 14.932931900024414, 17.306455612182617, 19.67997932434082, 22.053504943847656, 24.42702865600586, 26.800552368164062, 29.174076080322266, 31.54759979248047, 33.92112350463867, 36.294647216796875, 38.66817092895508, 41.04169464111328, 43.415218353271484, 45.78874206542969, 48.162269592285156, 50.535789489746094, 52.90931701660156, 55.282840728759766, 57.65636444091797, 60.02988815307617, 62.403411865234375, 64.77693939208984, 67.15045928955078, 69.52398681640625, 71.89750671386719]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 5.0, 8.0, 9.0, 8.0, 12.0, 17.0, 19.0, 17.0, 28.0, 25.0, 28.0, 35.0, 44.0, 26.0, 46.0, 31.0, 41.0, 57.0, 52.0, 49.0, 42.0, 37.0, 39.0, 42.0, 32.0, 40.0, 30.0, 26.0, 20.0, 27.0, 16.0, 11.0, 8.0, 9.0, 14.0, 11.0, 12.0, 4.0, 2.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.8515625, -12.4581298828125, -12.064697265625, -11.6712646484375, -11.27783203125, -10.8843994140625, -10.490966796875, -10.0975341796875, -9.7041015625, -9.3106689453125, -8.917236328125, -8.5238037109375, -8.13037109375, -7.7369384765625, -7.343505859375, -6.9500732421875, -6.556640625, -6.1632080078125, -5.769775390625, -5.3763427734375, -4.98291015625, -4.5894775390625, -4.196044921875, -3.8026123046875, -3.4091796875, -3.0157470703125, -2.622314453125, -2.2288818359375, -1.83544921875, -1.4420166015625, -1.048583984375, -0.6551513671875, -0.26171875, 0.1317138671875, 0.525146484375, 0.9185791015625, 1.31201171875, 1.7054443359375, 2.098876953125, 2.4923095703125, 2.8857421875, 3.2791748046875, 3.672607421875, 4.0660400390625, 4.45947265625, 4.8529052734375, 5.246337890625, 5.6397705078125, 6.033203125, 6.4266357421875, 6.820068359375, 7.2135009765625, 7.60693359375, 8.0003662109375, 8.393798828125, 8.7872314453125, 9.1806640625, 9.5740966796875, 9.967529296875, 10.3609619140625, 10.75439453125, 11.1478271484375, 11.541259765625, 11.9346923828125, 12.328125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 8.0, 7.0, 10.0, 18.0, 22.0, 32.0, 32.0, 58.0, 114.0, 181.0, 363.0, 742.0, 1746.0, 4786.0, 14407.0, 54218.0, 313773.0, 2055047.0, 1492977.0, 198511.0, 39183.0, 11313.0, 3810.0, 1487.0, 662.0, 311.0, 175.0, 80.0, 57.0, 35.0, 24.0, 25.0, 7.0, 9.0, 17.0, 6.0, 3.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.140625, -18.4287109375, -17.716796875, -17.0048828125, -16.29296875, -15.5810546875, -14.869140625, -14.1572265625, -13.4453125, -12.7333984375, -12.021484375, -11.3095703125, -10.59765625, -9.8857421875, -9.173828125, -8.4619140625, -7.75, -7.0380859375, -6.326171875, -5.6142578125, -4.90234375, -4.1904296875, -3.478515625, -2.7666015625, -2.0546875, -1.3427734375, -0.630859375, 0.0810546875, 0.79296875, 1.5048828125, 2.216796875, 2.9287109375, 3.640625, 4.3525390625, 5.064453125, 5.7763671875, 6.48828125, 7.2001953125, 7.912109375, 8.6240234375, 9.3359375, 10.0478515625, 10.759765625, 11.4716796875, 12.18359375, 12.8955078125, 13.607421875, 14.3193359375, 15.03125, 15.7431640625, 16.455078125, 17.1669921875, 17.87890625, 18.5908203125, 19.302734375, 20.0146484375, 20.7265625, 21.4384765625, 22.150390625, 22.8623046875, 23.57421875, 24.2861328125, 24.998046875, 25.7099609375, 26.421875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 10.0, 5.0, 12.0, 18.0, 16.0, 39.0, 40.0, 54.0, 111.0, 155.0, 213.0, 351.0, 531.0, 664.0, 598.0, 421.0, 269.0, 175.0, 134.0, 80.0, 52.0, 49.0, 31.0, 18.0, 14.0, 9.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.328125, -23.605224609375, -22.88232421875, -22.159423828125, -21.4365234375, -20.713623046875, -19.99072265625, -19.267822265625, -18.544921875, -17.822021484375, -17.09912109375, -16.376220703125, -15.6533203125, -14.930419921875, -14.20751953125, -13.484619140625, -12.76171875, -12.038818359375, -11.31591796875, -10.593017578125, -9.8701171875, -9.147216796875, -8.42431640625, -7.701416015625, -6.978515625, -6.255615234375, -5.53271484375, -4.809814453125, -4.0869140625, -3.364013671875, -2.64111328125, -1.918212890625, -1.1953125, -0.472412109375, 0.25048828125, 0.973388671875, 1.6962890625, 2.419189453125, 3.14208984375, 3.864990234375, 4.587890625, 5.310791015625, 6.03369140625, 6.756591796875, 7.4794921875, 8.202392578125, 8.92529296875, 9.648193359375, 10.37109375, 11.093994140625, 11.81689453125, 12.539794921875, 13.2626953125, 13.985595703125, 14.70849609375, 15.431396484375, 16.154296875, 16.877197265625, 17.60009765625, 18.322998046875, 19.0458984375, 19.768798828125, 20.49169921875, 21.214599609375, 21.9375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 8.0, 11.0, 11.0, 22.0, 20.0, 36.0, 45.0, 79.0, 131.0, 208.0, 361.0, 671.0, 1406.0, 3462.0, 10162.0, 34847.0, 143690.0, 963806.0, 2569555.0, 362307.0, 73181.0, 19685.0, 6190.0, 2310.0, 950.0, 452.0, 232.0, 149.0, 89.0, 60.0, 35.0, 34.0, 23.0, 15.0, 9.0, 7.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-29.921875, -29.073486328125, -28.22509765625, -27.376708984375, -26.5283203125, -25.679931640625, -24.83154296875, -23.983154296875, -23.134765625, -22.286376953125, -21.43798828125, -20.589599609375, -19.7412109375, -18.892822265625, -18.04443359375, -17.196044921875, -16.34765625, -15.499267578125, -14.65087890625, -13.802490234375, -12.9541015625, -12.105712890625, -11.25732421875, -10.408935546875, -9.560546875, -8.712158203125, -7.86376953125, -7.015380859375, -6.1669921875, -5.318603515625, -4.47021484375, -3.621826171875, -2.7734375, -1.925048828125, -1.07666015625, -0.228271484375, 0.6201171875, 1.468505859375, 2.31689453125, 3.165283203125, 4.013671875, 4.862060546875, 5.71044921875, 6.558837890625, 7.4072265625, 8.255615234375, 9.10400390625, 9.952392578125, 10.80078125, 11.649169921875, 12.49755859375, 13.345947265625, 14.1943359375, 15.042724609375, 15.89111328125, 16.739501953125, 17.587890625, 18.436279296875, 19.28466796875, 20.133056640625, 20.9814453125, 21.829833984375, 22.67822265625, 23.526611328125, 24.375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 25.0, 87.0, 160.0, 248.0, 240.0, 154.0, 66.0, 22.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.9603385925293, -31.562278747558594, -26.16421890258789, -20.766159057617188, -15.368099212646484, -9.970039367675781, -4.571979522705078, 0.826080322265625, 6.224140167236328, 11.622200012207031, 17.020259857177734, 22.418319702148438, 27.81637954711914, 33.214439392089844, 38.61249923706055, 44.01055908203125, 49.40861892700195, 54.806678771972656, 60.20473861694336, 65.60279846191406, 71.0008544921875, 76.39891815185547, 81.79698181152344, 87.19503784179688, 92.59309387207031, 97.99114990234375, 103.38921356201172, 108.78727722167969, 114.18533325195312, 119.58338928222656, 124.98145294189453, 130.3795166015625, 135.777587890625, 141.17564392089844, 146.57369995117188, 151.97177124023438, 157.3698272705078, 162.76788330078125, 168.16595458984375, 173.5640106201172, 178.96206665039062, 184.36012268066406, 189.7581787109375, 195.15625, 200.55430603027344, 205.95236206054688, 211.35043334960938, 216.7484893798828, 222.14654541015625, 227.5446014404297, 232.94265747070312, 238.34072875976562, 243.73878479003906, 249.1368408203125, 254.534912109375, 259.9329528808594, 265.3310241699219, 270.7290954589844, 276.12713623046875, 281.52520751953125, 286.92327880859375, 292.3213195800781, 297.7193908691406, 303.117431640625, 308.5155029296875]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 5.0, 4.0, 7.0, 9.0, 6.0, 16.0, 22.0, 21.0, 20.0, 19.0, 33.0, 24.0, 32.0, 25.0, 34.0, 47.0, 43.0, 50.0, 60.0, 46.0, 41.0, 59.0, 40.0, 37.0, 33.0, 41.0, 36.0, 20.0, 26.0, 26.0, 29.0, 16.0, 14.0, 20.0, 12.0, 14.0, 4.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.92107391357422, -66.84284210205078, -64.76461029052734, -62.686378479003906, -60.60814666748047, -58.52991485595703, -56.451683044433594, -54.373451232910156, -52.29521942138672, -50.21698760986328, -48.138755798339844, -46.060523986816406, -43.98229217529297, -41.90406036376953, -39.825828552246094, -37.747596740722656, -35.66936111450195, -33.591129302978516, -31.512897491455078, -29.43466567993164, -27.356433868408203, -25.278202056884766, -23.199968338012695, -21.121736526489258, -19.04350471496582, -16.965272903442383, -14.887041091918945, -12.808808326721191, -10.730576515197754, -8.652344703674316, -6.5741119384765625, -4.495880126953125, -2.4176483154296875, -0.3394162654876709, 1.7388157844543457, 3.8170480728149414, 5.895279884338379, 7.973511695861816, 10.05174446105957, 12.129976272583008, 14.208208084106445, 16.286439895629883, 18.36467170715332, 20.44290542602539, 22.521137237548828, 24.599369049072266, 26.677600860595703, 28.75583267211914, 30.834064483642578, 32.912296295166016, 34.99052810668945, 37.06875991821289, 39.14699172973633, 41.225223541259766, 43.30345916748047, 45.381690979003906, 47.459922790527344, 49.53815460205078, 51.61638641357422, 53.694618225097656, 55.772850036621094, 57.85108184814453, 59.92931365966797, 62.007545471191406, 64.08577728271484]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 3.0, 8.0, 3.0, 4.0, 12.0, 7.0, 12.0, 14.0, 26.0, 21.0, 20.0, 21.0, 31.0, 23.0, 26.0, 38.0, 35.0, 43.0, 32.0, 45.0, 51.0, 44.0, 52.0, 40.0, 42.0, 44.0, 36.0, 37.0, 30.0, 33.0, 24.0, 19.0, 25.0, 19.0, 13.0, 16.0, 12.0, 11.0, 7.0, 4.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.0625, -12.6593017578125, -12.256103515625, -11.8529052734375, -11.44970703125, -11.0465087890625, -10.643310546875, -10.2401123046875, -9.8369140625, -9.4337158203125, -9.030517578125, -8.6273193359375, -8.22412109375, -7.8209228515625, -7.417724609375, -7.0145263671875, -6.611328125, -6.2081298828125, -5.804931640625, -5.4017333984375, -4.99853515625, -4.5953369140625, -4.192138671875, -3.7889404296875, -3.3857421875, -2.9825439453125, -2.579345703125, -2.1761474609375, -1.77294921875, -1.3697509765625, -0.966552734375, -0.5633544921875, -0.16015625, 0.2430419921875, 0.646240234375, 1.0494384765625, 1.45263671875, 1.8558349609375, 2.259033203125, 2.6622314453125, 3.0654296875, 3.4686279296875, 3.871826171875, 4.2750244140625, 4.67822265625, 5.0814208984375, 5.484619140625, 5.8878173828125, 6.291015625, 6.6942138671875, 7.097412109375, 7.5006103515625, 7.90380859375, 8.3070068359375, 8.710205078125, 9.1134033203125, 9.5166015625, 9.9197998046875, 10.322998046875, 10.7261962890625, 11.12939453125, 11.5325927734375, 11.935791015625, 12.3389892578125, 12.7421875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 12.0, 15.0, 24.0, 32.0, 42.0, 74.0, 95.0, 146.0, 222.0, 330.0, 485.0, 732.0, 1050.0, 1613.0, 2452.0, 3793.0, 5913.0, 9338.0, 14861.0, 24767.0, 42024.0, 73265.0, 126643.0, 200097.0, 208807.0, 136517.0, 79458.0, 44938.0, 26498.0, 16121.0, 10016.0, 6298.0, 4018.0, 2655.0, 1750.0, 1136.0, 714.0, 529.0, 358.0, 231.0, 153.0, 119.0, 63.0, 44.0, 37.0, 21.0, 21.0, 11.0, 3.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.546875, -1.4986419677734375, -1.450408935546875, -1.4021759033203125, -1.35394287109375, -1.3057098388671875, -1.257476806640625, -1.2092437744140625, -1.1610107421875, -1.1127777099609375, -1.064544677734375, -1.0163116455078125, -0.96807861328125, -0.9198455810546875, -0.871612548828125, -0.8233795166015625, -0.775146484375, -0.7269134521484375, -0.678680419921875, -0.6304473876953125, -0.58221435546875, -0.5339813232421875, -0.485748291015625, -0.4375152587890625, -0.3892822265625, -0.3410491943359375, -0.292816162109375, -0.2445831298828125, -0.19635009765625, -0.1481170654296875, -0.099884033203125, -0.0516510009765625, -0.00341796875, 0.0448150634765625, 0.093048095703125, 0.1412811279296875, 0.18951416015625, 0.2377471923828125, 0.285980224609375, 0.3342132568359375, 0.3824462890625, 0.4306793212890625, 0.478912353515625, 0.5271453857421875, 0.57537841796875, 0.6236114501953125, 0.671844482421875, 0.7200775146484375, 0.768310546875, 0.8165435791015625, 0.864776611328125, 0.9130096435546875, 0.96124267578125, 1.0094757080078125, 1.057708740234375, 1.1059417724609375, 1.1541748046875, 1.2024078369140625, 1.250640869140625, 1.2988739013671875, 1.34710693359375, 1.3953399658203125, 1.443572998046875, 1.4918060302734375, 1.5400390625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 12.0, 11.0, 16.0, 20.0, 20.0, 26.0, 14.0, 21.0, 31.0, 36.0, 22.0, 49.0, 34.0, 40.0, 45.0, 48.0, 1060.0, 51.0, 51.0, 43.0, 42.0, 37.0, 27.0, 28.0, 28.0, 30.0, 20.0, 14.0, 19.0, 19.0, 15.0, 12.0, 12.0, 11.0, 11.0, 4.0, 8.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.41796875, -7.14093017578125, -6.8638916015625, -6.58685302734375, -6.309814453125, -6.03277587890625, -5.7557373046875, -5.47869873046875, -5.20166015625, -4.92462158203125, -4.6475830078125, -4.37054443359375, -4.093505859375, -3.81646728515625, -3.5394287109375, -3.26239013671875, -2.9853515625, -2.70831298828125, -2.4312744140625, -2.15423583984375, -1.877197265625, -1.60015869140625, -1.3231201171875, -1.04608154296875, -0.76904296875, -0.49200439453125, -0.2149658203125, 0.06207275390625, 0.339111328125, 0.61614990234375, 0.8931884765625, 1.17022705078125, 1.447265625, 1.72430419921875, 2.0013427734375, 2.27838134765625, 2.555419921875, 2.83245849609375, 3.1094970703125, 3.38653564453125, 3.66357421875, 3.94061279296875, 4.2176513671875, 4.49468994140625, 4.771728515625, 5.04876708984375, 5.3258056640625, 5.60284423828125, 5.8798828125, 6.15692138671875, 6.4339599609375, 6.71099853515625, 6.988037109375, 7.26507568359375, 7.5421142578125, 7.81915283203125, 8.09619140625, 8.37322998046875, 8.6502685546875, 8.92730712890625, 9.204345703125, 9.48138427734375, 9.7584228515625, 10.03546142578125, 10.3125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 18.0, 23.0, 37.0, 44.0, 75.0, 94.0, 147.0, 216.0, 363.0, 569.0, 906.0, 1425.0, 2331.0, 3758.0, 6307.0, 10818.0, 18348.0, 31447.0, 54269.0, 93172.0, 152533.0, 1221684.0, 208673.0, 120079.0, 70986.0, 40636.0, 23656.0, 13850.0, 7967.0, 4870.0, 2986.0, 1790.0, 1074.0, 729.0, 408.0, 291.0, 182.0, 123.0, 74.0, 56.0, 33.0, 21.0, 19.0, 17.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.14453125, -1.1084747314453125, -1.072418212890625, -1.0363616943359375, -1.00030517578125, -0.9642486572265625, -0.928192138671875, -0.8921356201171875, -0.8560791015625, -0.8200225830078125, -0.783966064453125, -0.7479095458984375, -0.71185302734375, -0.6757965087890625, -0.639739990234375, -0.6036834716796875, -0.567626953125, -0.5315704345703125, -0.495513916015625, -0.4594573974609375, -0.42340087890625, -0.3873443603515625, -0.351287841796875, -0.3152313232421875, -0.2791748046875, -0.2431182861328125, -0.207061767578125, -0.1710052490234375, -0.13494873046875, -0.0988922119140625, -0.062835693359375, -0.0267791748046875, 0.00927734375, 0.0453338623046875, 0.081390380859375, 0.1174468994140625, 0.15350341796875, 0.1895599365234375, 0.225616455078125, 0.2616729736328125, 0.2977294921875, 0.3337860107421875, 0.369842529296875, 0.4058990478515625, 0.44195556640625, 0.4780120849609375, 0.514068603515625, 0.5501251220703125, 0.586181640625, 0.6222381591796875, 0.658294677734375, 0.6943511962890625, 0.73040771484375, 0.7664642333984375, 0.802520751953125, 0.8385772705078125, 0.8746337890625, 0.9106903076171875, 0.946746826171875, 0.9828033447265625, 1.01885986328125, 1.0549163818359375, 1.090972900390625, 1.1270294189453125, 1.1630859375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 5.0, 5.0, 4.0, 8.0, 3.0, 11.0, 9.0, 14.0, 12.0, 11.0, 11.0, 27.0, 26.0, 33.0, 34.0, 35.0, 34.0, 40.0, 59.0, 60.0, 54.0, 63.0, 57.0, 43.0, 42.0, 39.0, 32.0, 46.0, 34.0, 20.0, 20.0, 20.0, 17.0, 10.0, 16.0, 13.0, 4.0, 8.0, 7.0, 5.0, 6.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0318603515625, -0.030825138092041016, -0.02978992462158203, -0.028754711151123047, -0.027719497680664062, -0.026684284210205078, -0.025649070739746094, -0.02461385726928711, -0.023578643798828125, -0.02254343032836914, -0.021508216857910156, -0.020473003387451172, -0.019437789916992188, -0.018402576446533203, -0.01736736297607422, -0.016332149505615234, -0.01529693603515625, -0.014261722564697266, -0.013226509094238281, -0.012191295623779297, -0.011156082153320312, -0.010120868682861328, -0.009085655212402344, -0.00805044174194336, -0.007015228271484375, -0.005980014801025391, -0.004944801330566406, -0.003909587860107422, -0.0028743743896484375, -0.0018391609191894531, -0.0008039474487304688, 0.00023126602172851562, 0.0012664794921875, 0.0023016929626464844, 0.0033369064331054688, 0.004372119903564453, 0.0054073333740234375, 0.006442546844482422, 0.007477760314941406, 0.00851297378540039, 0.009548187255859375, 0.01058340072631836, 0.011618614196777344, 0.012653827667236328, 0.013689041137695312, 0.014724254608154297, 0.01575946807861328, 0.016794681549072266, 0.01782989501953125, 0.018865108489990234, 0.01990032196044922, 0.020935535430908203, 0.021970748901367188, 0.023005962371826172, 0.024041175842285156, 0.02507638931274414, 0.026111602783203125, 0.02714681625366211, 0.028182029724121094, 0.029217243194580078, 0.030252456665039062, 0.03128767013549805, 0.03232288360595703, 0.033358097076416016, 0.034393310546875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 7.0, 6.0, 12.0, 5.0, 13.0, 18.0, 24.0, 24.0, 32.0, 27.0, 53.0, 50.0, 64.0, 91.0, 109.0, 170.0, 275.0, 471.0, 1941.0, 969628.0, 73482.0, 868.0, 363.0, 212.0, 129.0, 88.0, 79.0, 63.0, 39.0, 44.0, 25.0, 21.0, 16.0, 22.0, 10.0, 15.0, 13.0, 11.0, 6.0, 1.0, 7.0, 6.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.69189453125, -0.670806884765625, -0.64971923828125, -0.628631591796875, -0.6075439453125, -0.586456298828125, -0.56536865234375, -0.544281005859375, -0.523193359375, -0.502105712890625, -0.48101806640625, -0.459930419921875, -0.4388427734375, -0.417755126953125, -0.39666748046875, -0.375579833984375, -0.3544921875, -0.333404541015625, -0.31231689453125, -0.291229248046875, -0.2701416015625, -0.249053955078125, -0.22796630859375, -0.206878662109375, -0.185791015625, -0.164703369140625, -0.14361572265625, -0.122528076171875, -0.1014404296875, -0.080352783203125, -0.05926513671875, -0.038177490234375, -0.01708984375, 0.003997802734375, 0.02508544921875, 0.046173095703125, 0.0672607421875, 0.088348388671875, 0.10943603515625, 0.130523681640625, 0.151611328125, 0.172698974609375, 0.19378662109375, 0.214874267578125, 0.2359619140625, 0.257049560546875, 0.27813720703125, 0.299224853515625, 0.3203125, 0.341400146484375, 0.36248779296875, 0.383575439453125, 0.4046630859375, 0.425750732421875, 0.44683837890625, 0.467926025390625, 0.489013671875, 0.510101318359375, 0.53118896484375, 0.552276611328125, 0.5733642578125, 0.594451904296875, 0.61553955078125, 0.636627197265625, 0.65771484375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 921.0, 93.0], "bins": [-1.8843187093734741, -1.8543654680252075, -1.824412226676941, -1.7944589853286743, -1.7645058631896973, -1.7345526218414307, -1.704599380493164, -1.6746461391448975, -1.6446928977966309, -1.6147396564483643, -1.5847864151000977, -1.554833173751831, -1.524880051612854, -1.4949268102645874, -1.4649735689163208, -1.4350203275680542, -1.4050670862197876, -1.375113844871521, -1.3451606035232544, -1.3152073621749878, -1.2852542400360107, -1.2553009986877441, -1.2253477573394775, -1.195394515991211, -1.1654412746429443, -1.1354880332946777, -1.1055347919464111, -1.0755815505981445, -1.0456284284591675, -1.0156751871109009, -0.9857219457626343, -0.9557687044143677, -0.9258155226707458, -0.8958622813224792, -0.8659090995788574, -0.8359558582305908, -0.8060026168823242, -0.7760493755340576, -0.7460961937904358, -0.7161429524421692, -0.6861897110939026, -0.656236469745636, -0.6262832880020142, -0.5963300466537476, -0.566376805305481, -0.5364235639572144, -0.5064703822135925, -0.4765171408653259, -0.4465639293193817, -0.4166107177734375, -0.3866574764251709, -0.3567042648792267, -0.3267510235309601, -0.29679781198501587, -0.26684457063674927, -0.23689135909080505, -0.20693811774253845, -0.17698489129543304, -0.14703166484832764, -0.11707844585180283, -0.08712521940469742, -0.05717200040817261, -0.0272187739610672, 0.002734452486038208, 0.03268767520785332]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 16.0, 12.0, 17.0, 35.0, 32.0, 46.0, 43.0, 68.0, 56.0, 60.0, 80.0, 75.0, 64.0, 65.0, 61.0, 62.0, 35.0, 50.0, 34.0, 31.0, 23.0, 14.0, 10.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051915884017944336, -0.049700986593961716, -0.047486089169979095, -0.04527118802070618, -0.043056290596723557, -0.040841393172740936, -0.03862649202346802, -0.0364115945994854, -0.03419669717550278, -0.03198179975152016, -0.029766900464892387, -0.027552001178264618, -0.025337103754281998, -0.023122206330299377, -0.020907307043671608, -0.01869240775704384, -0.016477510333061218, -0.014262611977756023, -0.012047713622450829, -0.009832815267145634, -0.007617916911840439, -0.005403018556535244, -0.003188120201230049, -0.0009732218459248543, 0.0012416765093803406, 0.0034565748646855354, 0.00567147321999073, 0.007886371575295925, 0.01010126993060112, 0.012316168285906315, 0.01453106664121151, 0.01674596592783928, 0.0189608633518219, 0.02117576077580452, 0.02339066006243229, 0.02560555934906006, 0.02782045677304268, 0.0300353541970253, 0.03225025534629822, 0.03446515277028084, 0.03668005019426346, 0.03889494761824608, 0.0411098450422287, 0.04332474619150162, 0.04553964361548424, 0.04775454103946686, 0.04996944218873978, 0.0521843396127224, 0.05439923703670502, 0.05661413446068764, 0.05882903188467026, 0.061043933033943176, 0.0632588267326355, 0.06547372788190842, 0.06768862903118134, 0.06990352272987366, 0.07211842387914658, 0.0743333250284195, 0.07654821872711182, 0.07876311987638474, 0.08097802102565765, 0.08319291472434998, 0.0854078158736229, 0.08762270957231522, 0.08983761072158813]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 3.0, 8.0, 3.0, 4.0, 12.0, 7.0, 12.0, 14.0, 25.0, 22.0, 20.0, 21.0, 31.0, 23.0, 26.0, 38.0, 35.0, 42.0, 33.0, 45.0, 51.0, 44.0, 51.0, 42.0, 41.0, 44.0, 36.0, 37.0, 30.0, 33.0, 24.0, 19.0, 25.0, 19.0, 13.0, 16.0, 12.0, 11.0, 7.0, 4.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.0625, -12.6593017578125, -12.256103515625, -11.8529052734375, -11.44970703125, -11.0465087890625, -10.643310546875, -10.2401123046875, -9.8369140625, -9.4337158203125, -9.030517578125, -8.6273193359375, -8.22412109375, -7.8209228515625, -7.417724609375, -7.0145263671875, -6.611328125, -6.2081298828125, -5.804931640625, -5.4017333984375, -4.99853515625, -4.5953369140625, -4.192138671875, -3.7889404296875, -3.3857421875, -2.9825439453125, -2.579345703125, -2.1761474609375, -1.77294921875, -1.3697509765625, -0.966552734375, -0.5633544921875, -0.16015625, 0.2430419921875, 0.646240234375, 1.0494384765625, 1.45263671875, 1.8558349609375, 2.259033203125, 2.6622314453125, 3.0654296875, 3.4686279296875, 3.871826171875, 4.2750244140625, 4.67822265625, 5.0814208984375, 5.484619140625, 5.8878173828125, 6.291015625, 6.6942138671875, 7.097412109375, 7.5006103515625, 7.90380859375, 8.3070068359375, 8.710205078125, 9.1134033203125, 9.5166015625, 9.9197998046875, 10.322998046875, 10.7261962890625, 11.12939453125, 11.5325927734375, 11.935791015625, 12.3389892578125, 12.7421875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 6.0, 8.0, 2.0, 11.0, 12.0, 13.0, 28.0, 20.0, 42.0, 41.0, 91.0, 99.0, 163.0, 224.0, 367.0, 690.0, 1149.0, 2211.0, 4494.0, 9850.0, 24400.0, 64558.0, 195992.0, 453585.0, 186121.0, 61711.0, 23462.0, 9598.0, 4439.0, 2204.0, 1172.0, 622.0, 378.0, 237.0, 170.0, 120.0, 67.0, 60.0, 39.0, 26.0, 20.0, 9.0, 13.0, 11.0, 8.0, 4.0, 6.0, 2.0, 3.0, 0.0, 4.0, 2.0], "bins": [-20.3125, -19.739990234375, -19.16748046875, -18.594970703125, -18.0224609375, -17.449951171875, -16.87744140625, -16.304931640625, -15.732421875, -15.159912109375, -14.58740234375, -14.014892578125, -13.4423828125, -12.869873046875, -12.29736328125, -11.724853515625, -11.15234375, -10.579833984375, -10.00732421875, -9.434814453125, -8.8623046875, -8.289794921875, -7.71728515625, -7.144775390625, -6.572265625, -5.999755859375, -5.42724609375, -4.854736328125, -4.2822265625, -3.709716796875, -3.13720703125, -2.564697265625, -1.9921875, -1.419677734375, -0.84716796875, -0.274658203125, 0.2978515625, 0.870361328125, 1.44287109375, 2.015380859375, 2.587890625, 3.160400390625, 3.73291015625, 4.305419921875, 4.8779296875, 5.450439453125, 6.02294921875, 6.595458984375, 7.16796875, 7.740478515625, 8.31298828125, 8.885498046875, 9.4580078125, 10.030517578125, 10.60302734375, 11.175537109375, 11.748046875, 12.320556640625, 12.89306640625, 13.465576171875, 14.0380859375, 14.610595703125, 15.18310546875, 15.755615234375, 16.328125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 5.0, 6.0, 9.0, 4.0, 6.0, 13.0, 6.0, 19.0, 25.0, 28.0, 32.0, 31.0, 42.0, 58.0, 49.0, 43.0, 70.0, 110.0, 184.0, 1405.0, 311.0, 141.0, 93.0, 61.0, 44.0, 52.0, 34.0, 24.0, 25.0, 25.0, 19.0, 23.0, 12.0, 9.0, 6.0, 11.0, 6.0, 5.0, 1.0, 5.0, 0.0, 5.0, 0.0, 2.0, 2.0, 1.0], "bins": [-44.25, -43.0791015625, -41.908203125, -40.7373046875, -39.56640625, -38.3955078125, -37.224609375, -36.0537109375, -34.8828125, -33.7119140625, -32.541015625, -31.3701171875, -30.19921875, -29.0283203125, -27.857421875, -26.6865234375, -25.515625, -24.3447265625, -23.173828125, -22.0029296875, -20.83203125, -19.6611328125, -18.490234375, -17.3193359375, -16.1484375, -14.9775390625, -13.806640625, -12.6357421875, -11.46484375, -10.2939453125, -9.123046875, -7.9521484375, -6.78125, -5.6103515625, -4.439453125, -3.2685546875, -2.09765625, -0.9267578125, 0.244140625, 1.4150390625, 2.5859375, 3.7568359375, 4.927734375, 6.0986328125, 7.26953125, 8.4404296875, 9.611328125, 10.7822265625, 11.953125, 13.1240234375, 14.294921875, 15.4658203125, 16.63671875, 17.8076171875, 18.978515625, 20.1494140625, 21.3203125, 22.4912109375, 23.662109375, 24.8330078125, 26.00390625, 27.1748046875, 28.345703125, 29.5166015625, 30.6875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 9.0, 7.0, 14.0, 23.0, 17.0, 35.0, 58.0, 75.0, 114.0, 155.0, 322.0, 787.0, 5254.0, 390926.0, 2730443.0, 15193.0, 1129.0, 442.0, 220.0, 152.0, 95.0, 73.0, 42.0, 35.0, 26.0, 16.0, 10.0, 7.0, 9.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-99.5, -96.958984375, -94.41796875, -91.876953125, -89.3359375, -86.794921875, -84.25390625, -81.712890625, -79.171875, -76.630859375, -74.08984375, -71.548828125, -69.0078125, -66.466796875, -63.92578125, -61.384765625, -58.84375, -56.302734375, -53.76171875, -51.220703125, -48.6796875, -46.138671875, -43.59765625, -41.056640625, -38.515625, -35.974609375, -33.43359375, -30.892578125, -28.3515625, -25.810546875, -23.26953125, -20.728515625, -18.1875, -15.646484375, -13.10546875, -10.564453125, -8.0234375, -5.482421875, -2.94140625, -0.400390625, 2.140625, 4.681640625, 7.22265625, 9.763671875, 12.3046875, 14.845703125, 17.38671875, 19.927734375, 22.46875, 25.009765625, 27.55078125, 30.091796875, 32.6328125, 35.173828125, 37.71484375, 40.255859375, 42.796875, 45.337890625, 47.87890625, 50.419921875, 52.9609375, 55.501953125, 58.04296875, 60.583984375, 63.125]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 788.0, 219.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-682.9923706054688, -662.800048828125, -642.6077880859375, -622.41552734375, -602.2232055664062, -582.0308837890625, -561.838623046875, -541.6463623046875, -521.4540405273438, -501.2617492675781, -481.0694580078125, -460.8771667480469, -440.68487548828125, -420.4925842285156, -400.30029296875, -380.1080017089844, -359.91571044921875, -339.7234191894531, -319.5311279296875, -299.3388366699219, -279.14654541015625, -258.9542541503906, -238.761962890625, -218.56967163085938, -198.37738037109375, -178.18508911132812, -157.9927978515625, -137.80050659179688, -117.60821533203125, -97.41592407226562, -77.2236328125, -57.031341552734375, -36.839111328125, -16.646820068359375, 3.54547119140625, 23.737762451171875, 43.9300537109375, 64.12234497070312, 84.31463623046875, 104.50692749023438, 124.69921875, 144.89151000976562, 165.08380126953125, 185.27609252929688, 205.4683837890625, 225.66067504882812, 245.85296630859375, 266.0452575683594, 286.237548828125, 306.4298400878906, 326.62213134765625, 346.8144226074219, 367.0067138671875, 387.1990051269531, 407.39129638671875, 427.5835876464844, 447.77587890625, 467.9681701660156, 488.16046142578125, 508.3527526855469, 528.5450439453125, 548.7373046875, 568.9296264648438, 589.1219482421875, 609.314208984375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 7.0, 10.0, 8.0, 15.0, 10.0, 11.0, 18.0, 19.0, 17.0, 15.0, 24.0, 25.0, 31.0, 30.0, 35.0, 60.0, 44.0, 41.0, 41.0, 31.0, 44.0, 33.0, 49.0, 35.0, 21.0, 31.0, 32.0, 29.0, 30.0, 23.0, 30.0, 25.0, 18.0, 19.0, 14.0, 16.0, 9.0, 9.0, 6.0, 12.0, 2.0, 6.0, 0.0, 3.0, 4.0, 2.0, 4.0, 3.0], "bins": [-88.81170654296875, -86.51644134521484, -84.2211685180664, -81.9259033203125, -79.63063049316406, -77.33536529541016, -75.04009246826172, -72.74482727050781, -70.44955444335938, -68.15428924560547, -65.85901641845703, -63.56374740600586, -61.26847839355469, -58.973209381103516, -56.677940368652344, -54.38267517089844, -52.087406158447266, -49.792137145996094, -47.49686813354492, -45.20159912109375, -42.90633010864258, -40.611061096191406, -38.3157958984375, -36.02052307128906, -33.725257873535156, -31.429988861083984, -29.134719848632812, -26.83945083618164, -24.54418182373047, -22.248912811279297, -19.953645706176758, -17.658376693725586, -15.363101959228516, -13.067832946777344, -10.772563934326172, -8.477295875549316, -6.1820268630981445, -3.8867578506469727, -1.5914897918701172, 0.7037792205810547, 2.9990482330322266, 5.294317245483398, 7.589585781097412, 9.884854316711426, 12.180123329162598, 14.47539234161377, 16.770660400390625, 19.065929412841797, 21.36119842529297, 23.65646743774414, 25.951736450195312, 28.247005462646484, 30.542274475097656, 32.83754348754883, 35.1328125, 37.428077697753906, 39.723350524902344, 42.018619537353516, 44.31388854980469, 46.60915756225586, 48.90442657470703, 51.1996955871582, 53.494964599609375, 55.79022979736328, 58.08549880981445]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 3.0, 5.0, 4.0, 8.0, 9.0, 9.0, 15.0, 23.0, 20.0, 24.0, 20.0, 23.0, 29.0, 41.0, 30.0, 31.0, 39.0, 39.0, 43.0, 66.0, 46.0, 45.0, 50.0, 46.0, 42.0, 36.0, 34.0, 28.0, 27.0, 24.0, 31.0, 24.0, 15.0, 16.0, 12.0, 8.0, 8.0, 9.0, 8.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.53125, -14.107666015625, -13.68408203125, -13.260498046875, -12.8369140625, -12.413330078125, -11.98974609375, -11.566162109375, -11.142578125, -10.718994140625, -10.29541015625, -9.871826171875, -9.4482421875, -9.024658203125, -8.60107421875, -8.177490234375, -7.75390625, -7.330322265625, -6.90673828125, -6.483154296875, -6.0595703125, -5.635986328125, -5.21240234375, -4.788818359375, -4.365234375, -3.941650390625, -3.51806640625, -3.094482421875, -2.6708984375, -2.247314453125, -1.82373046875, -1.400146484375, -0.9765625, -0.552978515625, -0.12939453125, 0.294189453125, 0.7177734375, 1.141357421875, 1.56494140625, 1.988525390625, 2.412109375, 2.835693359375, 3.25927734375, 3.682861328125, 4.1064453125, 4.530029296875, 4.95361328125, 5.377197265625, 5.80078125, 6.224365234375, 6.64794921875, 7.071533203125, 7.4951171875, 7.918701171875, 8.34228515625, 8.765869140625, 9.189453125, 9.613037109375, 10.03662109375, 10.460205078125, 10.8837890625, 11.307373046875, 11.73095703125, 12.154541015625, 12.578125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 10.0, 8.0, 8.0, 12.0, 19.0, 18.0, 15.0, 33.0, 31.0, 46.0, 59.0, 69.0, 102.0, 158.0, 200.0, 251.0, 330.0, 520.0, 17823.0, 4169433.0, 3330.0, 495.0, 354.0, 238.0, 184.0, 139.0, 89.0, 61.0, 49.0, 45.0, 34.0, 26.0, 18.0, 12.0, 10.0, 14.0, 9.0, 8.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.0, -154.15625, -148.3125, -142.46875, -136.625, -130.78125, -124.9375, -119.09375, -113.25, -107.40625, -101.5625, -95.71875, -89.875, -84.03125, -78.1875, -72.34375, -66.5, -60.65625, -54.8125, -48.96875, -43.125, -37.28125, -31.4375, -25.59375, -19.75, -13.90625, -8.0625, -2.21875, 3.625, 9.46875, 15.3125, 21.15625, 27.0, 32.84375, 38.6875, 44.53125, 50.375, 56.21875, 62.0625, 67.90625, 73.75, 79.59375, 85.4375, 91.28125, 97.125, 102.96875, 108.8125, 114.65625, 120.5, 126.34375, 132.1875, 138.03125, 143.875, 149.71875, 155.5625, 161.40625, 167.25, 173.09375, 178.9375, 184.78125, 190.625, 196.46875, 202.3125, 208.15625, 214.0]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 8.0, 14.0, 6.0, 10.0, 15.0, 15.0, 29.0, 28.0, 46.0, 59.0, 77.0, 91.0, 159.0, 241.0, 326.0, 508.0, 583.0, 548.0, 371.0, 290.0, 179.0, 132.0, 94.0, 67.0, 39.0, 38.0, 22.0, 25.0, 5.0, 11.0, 11.0, 8.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.921875, -17.318115234375, -16.71435546875, -16.110595703125, -15.5068359375, -14.903076171875, -14.29931640625, -13.695556640625, -13.091796875, -12.488037109375, -11.88427734375, -11.280517578125, -10.6767578125, -10.072998046875, -9.46923828125, -8.865478515625, -8.26171875, -7.657958984375, -7.05419921875, -6.450439453125, -5.8466796875, -5.242919921875, -4.63916015625, -4.035400390625, -3.431640625, -2.827880859375, -2.22412109375, -1.620361328125, -1.0166015625, -0.412841796875, 0.19091796875, 0.794677734375, 1.3984375, 2.002197265625, 2.60595703125, 3.209716796875, 3.8134765625, 4.417236328125, 5.02099609375, 5.624755859375, 6.228515625, 6.832275390625, 7.43603515625, 8.039794921875, 8.6435546875, 9.247314453125, 9.85107421875, 10.454833984375, 11.05859375, 11.662353515625, 12.26611328125, 12.869873046875, 13.4736328125, 14.077392578125, 14.68115234375, 15.284912109375, 15.888671875, 16.492431640625, 17.09619140625, 17.699951171875, 18.3037109375, 18.907470703125, 19.51123046875, 20.114990234375, 20.71875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 9.0, 10.0, 10.0, 20.0, 34.0, 34.0, 51.0, 70.0, 103.0, 278.0, 3327.0, 2093911.0, 2092449.0, 3322.0, 287.0, 114.0, 62.0, 37.0, 32.0, 33.0, 27.0, 10.0, 11.0, 13.0, 7.0, 7.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.375, -92.359375, -88.34375, -84.328125, -80.3125, -76.296875, -72.28125, -68.265625, -64.25, -60.234375, -56.21875, -52.203125, -48.1875, -44.171875, -40.15625, -36.140625, -32.125, -28.109375, -24.09375, -20.078125, -16.0625, -12.046875, -8.03125, -4.015625, 0.0, 4.015625, 8.03125, 12.046875, 16.0625, 20.078125, 24.09375, 28.109375, 32.125, 36.140625, 40.15625, 44.171875, 48.1875, 52.203125, 56.21875, 60.234375, 64.25, 68.265625, 72.28125, 76.296875, 80.3125, 84.328125, 88.34375, 92.359375, 96.375, 100.390625, 104.40625, 108.421875, 112.4375, 116.453125, 120.46875, 124.484375, 128.5, 132.515625, 136.53125, 140.546875, 144.5625, 148.578125, 152.59375, 156.609375, 160.625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 36.0, 134.0, 329.0, 323.0, 138.0, 41.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-390.4690856933594, -383.1014099121094, -375.7337646484375, -368.3660888671875, -360.9984436035156, -353.6307678222656, -346.26312255859375, -338.89544677734375, -331.52777099609375, -324.16009521484375, -316.7924499511719, -309.4247741699219, -302.05712890625, -294.689453125, -287.32177734375, -279.9541320800781, -272.58648681640625, -265.21881103515625, -257.8511657714844, -250.48348999023438, -243.11582946777344, -235.7481689453125, -228.38050842285156, -221.01284790039062, -213.64517211914062, -206.2775115966797, -198.90985107421875, -191.54217529296875, -184.1745147705078, -176.80685424804688, -169.43919372558594, -162.071533203125, -154.703857421875, -147.33619689941406, -139.96853637695312, -132.60086059570312, -125.23320770263672, -117.86553955078125, -110.49787902832031, -103.13021850585938, -95.76255798339844, -88.3948974609375, -81.02722930908203, -73.6595687866211, -66.29190826416016, -58.92424392700195, -51.55657958984375, -44.18891906738281, -36.821258544921875, -29.453596115112305, -22.085933685302734, -14.718269348144531, -7.350606918334961, 0.017055511474609375, 7.3847198486328125, 14.75238037109375, 22.120044708251953, 29.487707138061523, 36.855369567871094, 44.2230339050293, 51.5906982421875, 58.95835876464844, 66.32601928710938, 73.69367980957031, 81.06134796142578]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 6.0, 11.0, 16.0, 22.0, 14.0, 26.0, 21.0, 28.0, 26.0, 31.0, 46.0, 32.0, 41.0, 45.0, 39.0, 56.0, 52.0, 38.0, 38.0, 32.0, 54.0, 35.0, 41.0, 28.0, 24.0, 22.0, 26.0, 28.0, 23.0, 14.0, 16.0, 11.0, 13.0, 9.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-75.15878295898438, -73.06165313720703, -70.96452331542969, -68.86738586425781, -66.77025604248047, -64.67312622070312, -62.57599639892578, -60.47886657714844, -58.38173294067383, -56.284603118896484, -54.187469482421875, -52.09033966064453, -49.99320983886719, -47.89607620239258, -45.798946380615234, -43.701812744140625, -41.60468292236328, -39.50755310058594, -37.41041946411133, -35.313289642333984, -33.216156005859375, -31.11902618408203, -29.021896362304688, -26.92476463317871, -24.827632904052734, -22.730501174926758, -20.63336944580078, -18.536239624023438, -16.43910789489746, -14.341976165771484, -12.244845390319824, -10.147714614868164, -8.050582885742188, -5.953451633453369, -3.856320381164551, -1.7591891288757324, 0.33794212341308594, 2.4350738525390625, 4.532204627990723, 6.629335403442383, 8.72646713256836, 10.823598861694336, 12.920729637145996, 15.017860412597656, 17.114992141723633, 19.21212387084961, 21.309253692626953, 23.40638542175293, 25.503517150878906, 27.600648880004883, 29.69778060913086, 31.794910430908203, 33.89204406738281, 35.989173889160156, 38.0863037109375, 40.183433532714844, 42.28056716918945, 44.3776969909668, 46.474830627441406, 48.57196044921875, 50.669090270996094, 52.7662239074707, 54.86335372924805, 56.960487365722656, 59.0576171875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 5.0, 6.0, 4.0, 7.0, 6.0, 11.0, 10.0, 9.0, 10.0, 18.0, 19.0, 17.0, 20.0, 28.0, 24.0, 33.0, 37.0, 35.0, 30.0, 44.0, 39.0, 46.0, 47.0, 42.0, 45.0, 41.0, 36.0, 38.0, 33.0, 32.0, 29.0, 32.0, 31.0, 14.0, 25.0, 11.0, 21.0, 12.0, 7.0, 7.0, 7.0, 5.0, 3.0, 5.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-12.5390625, -12.166015625, -11.79296875, -11.419921875, -11.046875, -10.673828125, -10.30078125, -9.927734375, -9.5546875, -9.181640625, -8.80859375, -8.435546875, -8.0625, -7.689453125, -7.31640625, -6.943359375, -6.5703125, -6.197265625, -5.82421875, -5.451171875, -5.078125, -4.705078125, -4.33203125, -3.958984375, -3.5859375, -3.212890625, -2.83984375, -2.466796875, -2.09375, -1.720703125, -1.34765625, -0.974609375, -0.6015625, -0.228515625, 0.14453125, 0.517578125, 0.890625, 1.263671875, 1.63671875, 2.009765625, 2.3828125, 2.755859375, 3.12890625, 3.501953125, 3.875, 4.248046875, 4.62109375, 4.994140625, 5.3671875, 5.740234375, 6.11328125, 6.486328125, 6.859375, 7.232421875, 7.60546875, 7.978515625, 8.3515625, 8.724609375, 9.09765625, 9.470703125, 9.84375, 10.216796875, 10.58984375, 10.962890625, 11.3359375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 16.0, 16.0, 30.0, 40.0, 64.0, 74.0, 103.0, 155.0, 226.0, 358.0, 524.0, 741.0, 1187.0, 1732.0, 2643.0, 4049.0, 6402.0, 10384.0, 16434.0, 26841.0, 44863.0, 78548.0, 139020.0, 214096.0, 201427.0, 123661.0, 69472.0, 40248.0, 24131.0, 14750.0, 9462.0, 5846.0, 3759.0, 2402.0, 1648.0, 1034.0, 700.0, 479.0, 313.0, 212.0, 147.0, 99.0, 70.0, 44.0, 30.0, 24.0, 17.0, 12.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.63671875, -1.583740234375, -1.53076171875, -1.477783203125, -1.4248046875, -1.371826171875, -1.31884765625, -1.265869140625, -1.212890625, -1.159912109375, -1.10693359375, -1.053955078125, -1.0009765625, -0.947998046875, -0.89501953125, -0.842041015625, -0.7890625, -0.736083984375, -0.68310546875, -0.630126953125, -0.5771484375, -0.524169921875, -0.47119140625, -0.418212890625, -0.365234375, -0.312255859375, -0.25927734375, -0.206298828125, -0.1533203125, -0.100341796875, -0.04736328125, 0.005615234375, 0.05859375, 0.111572265625, 0.16455078125, 0.217529296875, 0.2705078125, 0.323486328125, 0.37646484375, 0.429443359375, 0.482421875, 0.535400390625, 0.58837890625, 0.641357421875, 0.6943359375, 0.747314453125, 0.80029296875, 0.853271484375, 0.90625, 0.959228515625, 1.01220703125, 1.065185546875, 1.1181640625, 1.171142578125, 1.22412109375, 1.277099609375, 1.330078125, 1.383056640625, 1.43603515625, 1.489013671875, 1.5419921875, 1.594970703125, 1.64794921875, 1.700927734375, 1.75390625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 8.0, 7.0, 12.0, 13.0, 15.0, 11.0, 21.0, 16.0, 16.0, 15.0, 22.0, 28.0, 27.0, 35.0, 46.0, 24.0, 37.0, 51.0, 29.0, 41.0, 1063.0, 26.0, 33.0, 31.0, 46.0, 33.0, 28.0, 41.0, 37.0, 27.0, 23.0, 26.0, 23.0, 26.0, 19.0, 17.0, 10.0, 12.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.0390625, -7.79412841796875, -7.5491943359375, -7.30426025390625, -7.059326171875, -6.81439208984375, -6.5694580078125, -6.32452392578125, -6.07958984375, -5.83465576171875, -5.5897216796875, -5.34478759765625, -5.099853515625, -4.85491943359375, -4.6099853515625, -4.36505126953125, -4.1201171875, -3.87518310546875, -3.6302490234375, -3.38531494140625, -3.140380859375, -2.89544677734375, -2.6505126953125, -2.40557861328125, -2.16064453125, -1.91571044921875, -1.6707763671875, -1.42584228515625, -1.180908203125, -0.93597412109375, -0.6910400390625, -0.44610595703125, -0.201171875, 0.04376220703125, 0.2886962890625, 0.53363037109375, 0.778564453125, 1.02349853515625, 1.2684326171875, 1.51336669921875, 1.75830078125, 2.00323486328125, 2.2481689453125, 2.49310302734375, 2.738037109375, 2.98297119140625, 3.2279052734375, 3.47283935546875, 3.7177734375, 3.96270751953125, 4.2076416015625, 4.45257568359375, 4.697509765625, 4.94244384765625, 5.1873779296875, 5.43231201171875, 5.67724609375, 5.92218017578125, 6.1671142578125, 6.41204833984375, 6.656982421875, 6.90191650390625, 7.1468505859375, 7.39178466796875, 7.63671875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 7.0, 9.0, 11.0, 15.0, 18.0, 23.0, 40.0, 58.0, 116.0, 139.0, 211.0, 289.0, 438.0, 665.0, 905.0, 1306.0, 2038.0, 3170.0, 4637.0, 7496.0, 11607.0, 18455.0, 30725.0, 50388.0, 84186.0, 134284.0, 919129.0, 490721.0, 129433.0, 79959.0, 48182.0, 29090.0, 17884.0, 10953.0, 7072.0, 4459.0, 2990.0, 1931.0, 1318.0, 894.0, 565.0, 394.0, 303.0, 194.0, 129.0, 84.0, 64.0, 45.0, 30.0, 26.0, 16.0, 13.0, 10.0, 5.0, 5.0, 2.0, 0.0, 3.0], "bins": [-1.1171875, -1.083282470703125, -1.04937744140625, -1.015472412109375, -0.9815673828125, -0.947662353515625, -0.91375732421875, -0.879852294921875, -0.845947265625, -0.812042236328125, -0.77813720703125, -0.744232177734375, -0.7103271484375, -0.676422119140625, -0.64251708984375, -0.608612060546875, -0.57470703125, -0.540802001953125, -0.50689697265625, -0.472991943359375, -0.4390869140625, -0.405181884765625, -0.37127685546875, -0.337371826171875, -0.303466796875, -0.269561767578125, -0.23565673828125, -0.201751708984375, -0.1678466796875, -0.133941650390625, -0.10003662109375, -0.066131591796875, -0.0322265625, 0.001678466796875, 0.03558349609375, 0.069488525390625, 0.1033935546875, 0.137298583984375, 0.17120361328125, 0.205108642578125, 0.239013671875, 0.272918701171875, 0.30682373046875, 0.340728759765625, 0.3746337890625, 0.408538818359375, 0.44244384765625, 0.476348876953125, 0.51025390625, 0.544158935546875, 0.57806396484375, 0.611968994140625, 0.6458740234375, 0.679779052734375, 0.71368408203125, 0.747589111328125, 0.781494140625, 0.815399169921875, 0.84930419921875, 0.883209228515625, 0.9171142578125, 0.951019287109375, 0.98492431640625, 1.018829345703125, 1.052734375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 3.0, 11.0, 8.0, 15.0, 15.0, 21.0, 14.0, 19.0, 24.0, 24.0, 14.0, 28.0, 31.0, 33.0, 34.0, 42.0, 39.0, 36.0, 41.0, 45.0, 55.0, 44.0, 39.0, 33.0, 40.0, 38.0, 42.0, 33.0, 25.0, 19.0, 21.0, 13.0, 12.0, 24.0, 13.0, 17.0, 8.0, 6.0, 5.0, 6.0, 0.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.041290283203125, -0.039877891540527344, -0.03846549987792969, -0.03705310821533203, -0.035640716552734375, -0.03422832489013672, -0.03281593322753906, -0.031403541564941406, -0.02999114990234375, -0.028578758239746094, -0.027166366577148438, -0.02575397491455078, -0.024341583251953125, -0.02292919158935547, -0.021516799926757812, -0.020104408264160156, -0.0186920166015625, -0.017279624938964844, -0.015867233276367188, -0.014454841613769531, -0.013042449951171875, -0.011630058288574219, -0.010217666625976562, -0.008805274963378906, -0.00739288330078125, -0.005980491638183594, -0.0045680999755859375, -0.0031557083129882812, -0.001743316650390625, -0.00033092498779296875, 0.0010814666748046875, 0.0024938583374023438, 0.00390625, 0.005318641662597656, 0.0067310333251953125, 0.008143424987792969, 0.009555816650390625, 0.010968208312988281, 0.012380599975585938, 0.013792991638183594, 0.01520538330078125, 0.016617774963378906, 0.018030166625976562, 0.01944255828857422, 0.020854949951171875, 0.02226734161376953, 0.023679733276367188, 0.025092124938964844, 0.0265045166015625, 0.027916908264160156, 0.029329299926757812, 0.03074169158935547, 0.032154083251953125, 0.03356647491455078, 0.03497886657714844, 0.036391258239746094, 0.03780364990234375, 0.039216041564941406, 0.04062843322753906, 0.04204082489013672, 0.043453216552734375, 0.04486560821533203, 0.04627799987792969, 0.047690391540527344, 0.049102783203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 4.0, 7.0, 16.0, 9.0, 24.0, 21.0, 27.0, 37.0, 24.0, 40.0, 41.0, 50.0, 63.0, 84.0, 100.0, 156.0, 231.0, 335.0, 559.0, 1464.0, 304845.0, 736791.0, 1817.0, 557.0, 357.0, 237.0, 140.0, 86.0, 73.0, 47.0, 42.0, 49.0, 34.0, 35.0, 28.0, 32.0, 27.0, 16.0, 16.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.974609375, -0.94757080078125, -0.9205322265625, -0.89349365234375, -0.866455078125, -0.83941650390625, -0.8123779296875, -0.78533935546875, -0.75830078125, -0.73126220703125, -0.7042236328125, -0.67718505859375, -0.650146484375, -0.62310791015625, -0.5960693359375, -0.56903076171875, -0.5419921875, -0.51495361328125, -0.4879150390625, -0.46087646484375, -0.433837890625, -0.40679931640625, -0.3797607421875, -0.35272216796875, -0.32568359375, -0.29864501953125, -0.2716064453125, -0.24456787109375, -0.217529296875, -0.19049072265625, -0.1634521484375, -0.13641357421875, -0.109375, -0.08233642578125, -0.0552978515625, -0.02825927734375, -0.001220703125, 0.02581787109375, 0.0528564453125, 0.07989501953125, 0.10693359375, 0.13397216796875, 0.1610107421875, 0.18804931640625, 0.215087890625, 0.24212646484375, 0.2691650390625, 0.29620361328125, 0.3232421875, 0.35028076171875, 0.3773193359375, 0.40435791015625, 0.431396484375, 0.45843505859375, 0.4854736328125, 0.51251220703125, 0.53955078125, 0.56658935546875, 0.5936279296875, 0.62066650390625, 0.647705078125, 0.67474365234375, 0.7017822265625, 0.72882080078125, 0.755859375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 309.0, 700.0, 1.0, 1.0], "bins": [-2.3738183975219727, -2.334967851638794, -2.296117067337036, -2.2572665214538574, -2.2184157371520996, -2.179565191268921, -2.140714406967163, -2.1018638610839844, -2.0630130767822266, -2.024162530899048, -1.98531174659729, -1.9464610815048218, -1.9076104164123535, -1.8687598705291748, -1.829909086227417, -1.7910585403442383, -1.7522079944610596, -1.7133573293685913, -1.674506664276123, -1.6356559991836548, -1.5968053340911865, -1.5579547882080078, -1.51910400390625, -1.4802534580230713, -1.4414026737213135, -1.4025520086288452, -1.363701343536377, -1.3248506784439087, -1.2860000133514404, -1.2471494674682617, -1.208298683166504, -1.1694481372833252, -1.1305975914001465, -1.0917469263076782, -1.05289626121521, -1.0140455961227417, -0.9751949906349182, -0.93634432554245, -0.8974936604499817, -0.8586430549621582, -0.8197923302650452, -0.7809416651725769, -0.7420910000801086, -0.7032403945922852, -0.6643897294998169, -0.6255390644073486, -0.5866883993148804, -0.5478377342224121, -0.5089870691299438, -0.4701364040374756, -0.4312857687473297, -0.39243510365486145, -0.3535844683647156, -0.3147338032722473, -0.27588313817977905, -0.23703250288963318, -0.1981818526983261, -0.15933120250701904, -0.12048054486513138, -0.08162988722324371, -0.042779237031936646, -0.003928586840629578, 0.034922078251838684, 0.07377271354198456, 0.11262337863445282]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 10.0, 12.0, 10.0, 13.0, 19.0, 20.0, 22.0, 33.0, 39.0, 42.0, 48.0, 41.0, 67.0, 54.0, 55.0, 52.0, 52.0, 64.0, 59.0, 28.0, 48.0, 44.0, 32.0, 28.0, 27.0, 16.0, 15.0, 13.0, 16.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08121919631958008, -0.07804180681705475, -0.07486440986394882, -0.0716870129108429, -0.06850962340831757, -0.06533223390579224, -0.06215483695268631, -0.05897744372487068, -0.055800050497055054, -0.052622657269239426, -0.0494452640414238, -0.04626787081360817, -0.04309047758579254, -0.03991308435797691, -0.036735691130161285, -0.03355829790234566, -0.03038090467453003, -0.0272035114467144, -0.024026118218898773, -0.020848724991083145, -0.017671331763267517, -0.014493938535451889, -0.011316545307636261, -0.008139152079820633, -0.004961758852005005, -0.0017843656241893768, 0.0013930276036262512, 0.004570420831441879, 0.007747814059257507, 0.010925207287073135, 0.014102600514888763, 0.01727999374270439, 0.02045738697052002, 0.023634780198335648, 0.026812173426151276, 0.029989566653966904, 0.03316695988178253, 0.03634435310959816, 0.03952174633741379, 0.042699139565229416, 0.045876532793045044, 0.04905392602086067, 0.0522313192486763, 0.05540871247649193, 0.058586105704307556, 0.061763498932123184, 0.06494089215993881, 0.06811828911304474, 0.07129567861557007, 0.0744730681180954, 0.07765046507120132, 0.08082786202430725, 0.08400525152683258, 0.08718264102935791, 0.09036003798246384, 0.09353743493556976, 0.09671482443809509, 0.09989221394062042, 0.10306961089372635, 0.10624700784683228, 0.1094243973493576, 0.11260178685188293, 0.11577918380498886, 0.11895658075809479, 0.12213397026062012]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 5.0, 6.0, 4.0, 7.0, 6.0, 11.0, 10.0, 9.0, 10.0, 19.0, 18.0, 17.0, 20.0, 28.0, 23.0, 34.0, 38.0, 34.0, 30.0, 44.0, 38.0, 47.0, 47.0, 42.0, 45.0, 41.0, 36.0, 39.0, 32.0, 32.0, 29.0, 32.0, 31.0, 14.0, 25.0, 10.0, 22.0, 12.0, 7.0, 8.0, 6.0, 5.0, 3.0, 5.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-12.5390625, -12.166015625, -11.79296875, -11.419921875, -11.046875, -10.673828125, -10.30078125, -9.927734375, -9.5546875, -9.181640625, -8.80859375, -8.435546875, -8.0625, -7.689453125, -7.31640625, -6.943359375, -6.5703125, -6.197265625, -5.82421875, -5.451171875, -5.078125, -4.705078125, -4.33203125, -3.958984375, -3.5859375, -3.212890625, -2.83984375, -2.466796875, -2.09375, -1.720703125, -1.34765625, -0.974609375, -0.6015625, -0.228515625, 0.14453125, 0.517578125, 0.890625, 1.263671875, 1.63671875, 2.009765625, 2.3828125, 2.755859375, 3.12890625, 3.501953125, 3.875, 4.248046875, 4.62109375, 4.994140625, 5.3671875, 5.740234375, 6.11328125, 6.486328125, 6.859375, 7.232421875, 7.60546875, 7.978515625, 8.3515625, 8.724609375, 9.09765625, 9.470703125, 9.84375, 10.216796875, 10.58984375, 10.962890625, 11.3359375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 5.0, 13.0, 17.0, 22.0, 39.0, 44.0, 43.0, 73.0, 83.0, 116.0, 126.0, 186.0, 246.0, 323.0, 403.0, 610.0, 773.0, 1188.0, 2061.0, 4185.0, 10760.0, 35421.0, 129804.0, 418385.0, 314228.0, 88014.0, 24365.0, 7992.0, 3351.0, 1740.0, 1084.0, 712.0, 489.0, 391.0, 316.0, 207.0, 176.0, 141.0, 117.0, 77.0, 66.0, 40.0, 27.0, 41.0, 17.0, 15.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-21.421875, -20.7890625, -20.15625, -19.5234375, -18.890625, -18.2578125, -17.625, -16.9921875, -16.359375, -15.7265625, -15.09375, -14.4609375, -13.828125, -13.1953125, -12.5625, -11.9296875, -11.296875, -10.6640625, -10.03125, -9.3984375, -8.765625, -8.1328125, -7.5, -6.8671875, -6.234375, -5.6015625, -4.96875, -4.3359375, -3.703125, -3.0703125, -2.4375, -1.8046875, -1.171875, -0.5390625, 0.09375, 0.7265625, 1.359375, 1.9921875, 2.625, 3.2578125, 3.890625, 4.5234375, 5.15625, 5.7890625, 6.421875, 7.0546875, 7.6875, 8.3203125, 8.953125, 9.5859375, 10.21875, 10.8515625, 11.484375, 12.1171875, 12.75, 13.3828125, 14.015625, 14.6484375, 15.28125, 15.9140625, 16.546875, 17.1796875, 17.8125, 18.4453125, 19.078125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 2.0, 8.0, 3.0, 10.0, 9.0, 7.0, 16.0, 19.0, 20.0, 39.0, 18.0, 24.0, 35.0, 51.0, 49.0, 71.0, 96.0, 194.0, 1501.0, 288.0, 134.0, 83.0, 54.0, 54.0, 43.0, 28.0, 23.0, 28.0, 33.0, 23.0, 16.0, 17.0, 7.0, 6.0, 6.0, 8.0, 7.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-32.125, -31.044921875, -29.96484375, -28.884765625, -27.8046875, -26.724609375, -25.64453125, -24.564453125, -23.484375, -22.404296875, -21.32421875, -20.244140625, -19.1640625, -18.083984375, -17.00390625, -15.923828125, -14.84375, -13.763671875, -12.68359375, -11.603515625, -10.5234375, -9.443359375, -8.36328125, -7.283203125, -6.203125, -5.123046875, -4.04296875, -2.962890625, -1.8828125, -0.802734375, 0.27734375, 1.357421875, 2.4375, 3.517578125, 4.59765625, 5.677734375, 6.7578125, 7.837890625, 8.91796875, 9.998046875, 11.078125, 12.158203125, 13.23828125, 14.318359375, 15.3984375, 16.478515625, 17.55859375, 18.638671875, 19.71875, 20.798828125, 21.87890625, 22.958984375, 24.0390625, 25.119140625, 26.19921875, 27.279296875, 28.359375, 29.439453125, 30.51953125, 31.599609375, 32.6796875, 33.759765625, 34.83984375, 35.919921875, 37.0]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 5.0, 2.0, 8.0, 11.0, 14.0, 12.0, 14.0, 26.0, 38.0, 33.0, 59.0, 80.0, 143.0, 189.0, 410.0, 983.0, 6701.0, 3117331.0, 17357.0, 1132.0, 465.0, 233.0, 152.0, 82.0, 56.0, 31.0, 25.0, 23.0, 17.0, 17.0, 9.0, 10.0, 8.0, 4.0, 8.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.9375, -111.1787109375, -107.419921875, -103.6611328125, -99.90234375, -96.1435546875, -92.384765625, -88.6259765625, -84.8671875, -81.1083984375, -77.349609375, -73.5908203125, -69.83203125, -66.0732421875, -62.314453125, -58.5556640625, -54.796875, -51.0380859375, -47.279296875, -43.5205078125, -39.76171875, -36.0029296875, -32.244140625, -28.4853515625, -24.7265625, -20.9677734375, -17.208984375, -13.4501953125, -9.69140625, -5.9326171875, -2.173828125, 1.5849609375, 5.34375, 9.1025390625, 12.861328125, 16.6201171875, 20.37890625, 24.1376953125, 27.896484375, 31.6552734375, 35.4140625, 39.1728515625, 42.931640625, 46.6904296875, 50.44921875, 54.2080078125, 57.966796875, 61.7255859375, 65.484375, 69.2431640625, 73.001953125, 76.7607421875, 80.51953125, 84.2783203125, 88.037109375, 91.7958984375, 95.5546875, 99.3134765625, 103.072265625, 106.8310546875, 110.58984375, 114.3486328125, 118.107421875, 121.8662109375, 125.625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 16.0, 493.0, 494.0, 14.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-389.60302734375, -375.68768310546875, -361.7723388671875, -347.85699462890625, -333.941650390625, -320.02630615234375, -306.1109313964844, -292.1955871582031, -278.2802429199219, -264.3648986816406, -250.44955444335938, -236.53419494628906, -222.6188507080078, -208.70350646972656, -194.78814697265625, -180.872802734375, -166.95745849609375, -153.0421142578125, -139.12677001953125, -125.21141052246094, -111.29606628417969, -97.38072204589844, -83.46537017822266, -69.55001831054688, -55.634674072265625, -41.71932601928711, -27.803977966308594, -13.888629913330078, 0.0267181396484375, 13.942062377929688, 27.85741424560547, 41.77276611328125, 55.6881103515625, 69.60345458984375, 83.51880645751953, 97.43415832519531, 111.34950256347656, 125.26484680175781, 139.18020629882812, 153.09555053710938, 167.01089477539062, 180.92623901367188, 194.84158325195312, 208.75694274902344, 222.6722869873047, 236.58763122558594, 250.50299072265625, 264.4183349609375, 278.33367919921875, 292.2490234375, 306.16436767578125, 320.0797119140625, 333.99505615234375, 347.910400390625, 361.8257751464844, 375.7411193847656, 389.6564636230469, 403.5718078613281, 417.4871520996094, 431.4024963378906, 445.31787109375, 459.23321533203125, 473.1485595703125, 487.06390380859375, 500.979248046875]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 7.0, 4.0, 7.0, 2.0, 7.0, 11.0, 10.0, 15.0, 18.0, 12.0, 18.0, 18.0, 19.0, 33.0, 28.0, 34.0, 33.0, 41.0, 33.0, 30.0, 38.0, 40.0, 51.0, 42.0, 36.0, 45.0, 39.0, 41.0, 33.0, 22.0, 26.0, 22.0, 21.0, 24.0, 24.0, 25.0, 18.0, 14.0, 16.0, 4.0, 9.0, 6.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0], "bins": [-94.98654174804688, -92.24393463134766, -89.50132751464844, -86.75872039794922, -84.01611328125, -81.27350616455078, -78.53089904785156, -75.78829193115234, -73.04568481445312, -70.3030776977539, -67.56047058105469, -64.81786346435547, -62.07525634765625, -59.33264923095703, -56.59004211425781, -53.847434997558594, -51.104827880859375, -48.362220764160156, -45.61961364746094, -42.87700653076172, -40.1343994140625, -37.39179229736328, -34.64918518066406, -31.906578063964844, -29.163970947265625, -26.421363830566406, -23.678756713867188, -20.93614959716797, -18.19354248046875, -15.450935363769531, -12.708328247070312, -9.965721130371094, -7.223114013671875, -4.480506896972656, -1.7378997802734375, 1.0047073364257812, 3.747314453125, 6.489921569824219, 9.232528686523438, 11.975135803222656, 14.717742919921875, 17.460350036621094, 20.202957153320312, 22.94556427001953, 25.68817138671875, 28.43077850341797, 31.173385620117188, 33.915992736816406, 36.658599853515625, 39.401206970214844, 42.14381408691406, 44.88642120361328, 47.6290283203125, 50.37163543701172, 53.11424255371094, 55.856849670410156, 58.599456787109375, 61.342063903808594, 64.08467102050781, 66.82727813720703, 69.56988525390625, 72.31249237060547, 75.05509948730469, 77.7977066040039, 80.54031372070312]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 7.0, 7.0, 5.0, 7.0, 10.0, 10.0, 8.0, 11.0, 14.0, 11.0, 21.0, 22.0, 16.0, 23.0, 30.0, 32.0, 24.0, 48.0, 38.0, 50.0, 42.0, 49.0, 42.0, 39.0, 53.0, 46.0, 33.0, 42.0, 30.0, 24.0, 34.0, 31.0, 27.0, 10.0, 20.0, 5.0, 14.0, 18.0, 6.0, 7.0, 5.0, 6.0, 9.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.796875, -12.411376953125, -12.02587890625, -11.640380859375, -11.2548828125, -10.869384765625, -10.48388671875, -10.098388671875, -9.712890625, -9.327392578125, -8.94189453125, -8.556396484375, -8.1708984375, -7.785400390625, -7.39990234375, -7.014404296875, -6.62890625, -6.243408203125, -5.85791015625, -5.472412109375, -5.0869140625, -4.701416015625, -4.31591796875, -3.930419921875, -3.544921875, -3.159423828125, -2.77392578125, -2.388427734375, -2.0029296875, -1.617431640625, -1.23193359375, -0.846435546875, -0.4609375, -0.075439453125, 0.31005859375, 0.695556640625, 1.0810546875, 1.466552734375, 1.85205078125, 2.237548828125, 2.623046875, 3.008544921875, 3.39404296875, 3.779541015625, 4.1650390625, 4.550537109375, 4.93603515625, 5.321533203125, 5.70703125, 6.092529296875, 6.47802734375, 6.863525390625, 7.2490234375, 7.634521484375, 8.02001953125, 8.405517578125, 8.791015625, 9.176513671875, 9.56201171875, 9.947509765625, 10.3330078125, 10.718505859375, 11.10400390625, 11.489501953125, 11.875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 7.0, 6.0, 10.0, 11.0, 20.0, 23.0, 34.0, 36.0, 56.0, 72.0, 99.0, 166.0, 256.0, 470.0, 769.0, 1454.0, 3135.0, 7359.0, 22024.0, 104742.0, 740144.0, 2358868.0, 800911.0, 115766.0, 23454.0, 7541.0, 3194.0, 1544.0, 820.0, 474.0, 271.0, 157.0, 115.0, 85.0, 48.0, 36.0, 31.0, 21.0, 20.0, 8.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.875, -21.134033203125, -20.39306640625, -19.652099609375, -18.9111328125, -18.170166015625, -17.42919921875, -16.688232421875, -15.947265625, -15.206298828125, -14.46533203125, -13.724365234375, -12.9833984375, -12.242431640625, -11.50146484375, -10.760498046875, -10.01953125, -9.278564453125, -8.53759765625, -7.796630859375, -7.0556640625, -6.314697265625, -5.57373046875, -4.832763671875, -4.091796875, -3.350830078125, -2.60986328125, -1.868896484375, -1.1279296875, -0.386962890625, 0.35400390625, 1.094970703125, 1.8359375, 2.576904296875, 3.31787109375, 4.058837890625, 4.7998046875, 5.540771484375, 6.28173828125, 7.022705078125, 7.763671875, 8.504638671875, 9.24560546875, 9.986572265625, 10.7275390625, 11.468505859375, 12.20947265625, 12.950439453125, 13.69140625, 14.432373046875, 15.17333984375, 15.914306640625, 16.6552734375, 17.396240234375, 18.13720703125, 18.878173828125, 19.619140625, 20.360107421875, 21.10107421875, 21.842041015625, 22.5830078125, 23.323974609375, 24.06494140625, 24.805908203125, 25.546875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 10.0, 17.0, 25.0, 27.0, 48.0, 53.0, 89.0, 112.0, 146.0, 215.0, 289.0, 391.0, 551.0, 598.0, 456.0, 272.0, 200.0, 150.0, 119.0, 78.0, 72.0, 55.0, 32.0, 14.0, 16.0, 12.0, 13.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-33.09375, -32.3428955078125, -31.592041015625, -30.8411865234375, -30.09033203125, -29.3394775390625, -28.588623046875, -27.8377685546875, -27.0869140625, -26.3360595703125, -25.585205078125, -24.8343505859375, -24.08349609375, -23.3326416015625, -22.581787109375, -21.8309326171875, -21.080078125, -20.3292236328125, -19.578369140625, -18.8275146484375, -18.07666015625, -17.3258056640625, -16.574951171875, -15.8240966796875, -15.0732421875, -14.3223876953125, -13.571533203125, -12.8206787109375, -12.06982421875, -11.3189697265625, -10.568115234375, -9.8172607421875, -9.06640625, -8.3155517578125, -7.564697265625, -6.8138427734375, -6.06298828125, -5.3121337890625, -4.561279296875, -3.8104248046875, -3.0595703125, -2.3087158203125, -1.557861328125, -0.8070068359375, -0.05615234375, 0.6947021484375, 1.445556640625, 2.1964111328125, 2.947265625, 3.6981201171875, 4.448974609375, 5.1998291015625, 5.95068359375, 6.7015380859375, 7.452392578125, 8.2032470703125, 8.9541015625, 9.7049560546875, 10.455810546875, 11.2066650390625, 11.95751953125, 12.7083740234375, 13.459228515625, 14.2100830078125, 14.9609375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 3.0, 6.0, 15.0, 8.0, 20.0, 30.0, 51.0, 94.0, 145.0, 248.0, 440.0, 862.0, 2072.0, 7045.0, 60598.0, 1173247.0, 2798904.0, 133736.0, 11752.0, 2676.0, 1078.0, 546.0, 264.0, 176.0, 94.0, 62.0, 40.0, 28.0, 16.0, 9.0, 6.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.4375, -34.08203125, -32.7265625, -31.37109375, -30.015625, -28.66015625, -27.3046875, -25.94921875, -24.59375, -23.23828125, -21.8828125, -20.52734375, -19.171875, -17.81640625, -16.4609375, -15.10546875, -13.75, -12.39453125, -11.0390625, -9.68359375, -8.328125, -6.97265625, -5.6171875, -4.26171875, -2.90625, -1.55078125, -0.1953125, 1.16015625, 2.515625, 3.87109375, 5.2265625, 6.58203125, 7.9375, 9.29296875, 10.6484375, 12.00390625, 13.359375, 14.71484375, 16.0703125, 17.42578125, 18.78125, 20.13671875, 21.4921875, 22.84765625, 24.203125, 25.55859375, 26.9140625, 28.26953125, 29.625, 30.98046875, 32.3359375, 33.69140625, 35.046875, 36.40234375, 37.7578125, 39.11328125, 40.46875, 41.82421875, 43.1796875, 44.53515625, 45.890625, 47.24609375, 48.6015625, 49.95703125, 51.3125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 131.0, 754.0, 127.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-316.965576171875, -295.1055603027344, -273.2455749511719, -251.38555908203125, -229.5255584716797, -207.66555786132812, -185.8055419921875, -163.94554138183594, -142.08554077148438, -120.22554016113281, -98.36553192138672, -76.50552368164062, -54.64552307128906, -32.7855224609375, -10.925506591796875, 10.934494018554688, 32.79449462890625, 54.65449905395508, 76.5145034790039, 98.37451171875, 120.23451232910156, 142.09451293945312, 163.95452880859375, 185.8145294189453, 207.67453002929688, 229.53453063964844, 251.39453125, 273.2545471191406, 295.11456298828125, 316.97454833984375, 338.8345642089844, 360.694580078125, 382.5545654296875, 404.4145812988281, 426.2745666503906, 448.13458251953125, 469.99456787109375, 491.8545837402344, 513.714599609375, 535.5745849609375, 557.4345703125, 579.2945556640625, 601.1546020507812, 623.0145874023438, 644.8745727539062, 666.734619140625, 688.5946044921875, 710.45458984375, 732.3146362304688, 754.1746215820312, 776.03466796875, 797.8946533203125, 819.754638671875, 841.6146240234375, 863.4746704101562, 885.3346557617188, 907.1947021484375, 929.0546875, 950.9147338867188, 972.7747192382812, 994.6347045898438, 1016.4947509765625, 1038.354736328125, 1060.2147216796875, 1082.07470703125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 4.0, 3.0, 7.0, 7.0, 11.0, 8.0, 25.0, 13.0, 26.0, 31.0, 25.0, 43.0, 29.0, 35.0, 41.0, 59.0, 48.0, 48.0, 61.0, 36.0, 37.0, 63.0, 50.0, 41.0, 29.0, 26.0, 37.0, 26.0, 32.0, 20.0, 15.0, 15.0, 15.0, 10.0, 5.0, 7.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.3106689453125, -88.50206756591797, -85.69346618652344, -82.8848648071289, -80.07626342773438, -77.26765441894531, -74.45905303955078, -71.65045166015625, -68.84185028076172, -66.03324890136719, -63.224647521972656, -60.41604232788086, -57.60744094848633, -54.7988395690918, -51.990234375, -49.18163299560547, -46.37303161621094, -43.564430236816406, -40.755828857421875, -37.94722366333008, -35.13862228393555, -32.330020904541016, -29.52141761779785, -26.712814331054688, -23.904212951660156, -21.095611572265625, -18.28700828552246, -15.478405952453613, -12.669803619384766, -9.861201286315918, -7.05259895324707, -4.243995666503906, -1.435394287109375, 1.3732080459594727, 4.18181037902832, 6.990412712097168, 9.799015045166016, 12.607617378234863, 15.416219711303711, 18.224822998046875, 21.033424377441406, 23.842025756835938, 26.6506290435791, 29.459232330322266, 32.2678337097168, 35.07643508911133, 37.885040283203125, 40.693641662597656, 43.50224304199219, 46.31084442138672, 49.11944580078125, 51.92805099487305, 54.73665237426758, 57.54525375366211, 60.353858947753906, 63.16246032714844, 65.97106170654297, 68.7796630859375, 71.58826446533203, 74.39686584472656, 77.20547485351562, 80.01407623291016, 82.82267761230469, 85.63127899169922, 88.43988037109375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 9.0, 3.0, 8.0, 10.0, 9.0, 7.0, 11.0, 8.0, 17.0, 17.0, 26.0, 21.0, 36.0, 36.0, 33.0, 39.0, 41.0, 44.0, 50.0, 42.0, 53.0, 45.0, 46.0, 47.0, 39.0, 34.0, 41.0, 28.0, 34.0, 36.0, 24.0, 19.0, 15.0, 11.0, 15.0, 14.0, 7.0, 9.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.4765625, -11.1339111328125, -10.791259765625, -10.4486083984375, -10.10595703125, -9.7633056640625, -9.420654296875, -9.0780029296875, -8.7353515625, -8.3927001953125, -8.050048828125, -7.7073974609375, -7.36474609375, -7.0220947265625, -6.679443359375, -6.3367919921875, -5.994140625, -5.6514892578125, -5.308837890625, -4.9661865234375, -4.62353515625, -4.2808837890625, -3.938232421875, -3.5955810546875, -3.2529296875, -2.9102783203125, -2.567626953125, -2.2249755859375, -1.88232421875, -1.5396728515625, -1.197021484375, -0.8543701171875, -0.51171875, -0.1690673828125, 0.173583984375, 0.5162353515625, 0.85888671875, 1.2015380859375, 1.544189453125, 1.8868408203125, 2.2294921875, 2.5721435546875, 2.914794921875, 3.2574462890625, 3.60009765625, 3.9427490234375, 4.285400390625, 4.6280517578125, 4.970703125, 5.3133544921875, 5.656005859375, 5.9986572265625, 6.34130859375, 6.6839599609375, 7.026611328125, 7.3692626953125, 7.7119140625, 8.0545654296875, 8.397216796875, 8.7398681640625, 9.08251953125, 9.4251708984375, 9.767822265625, 10.1104736328125, 10.453125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 8.0, 9.0, 15.0, 23.0, 47.0, 93.0, 108.0, 172.0, 312.0, 454.0, 664.0, 979.0, 1412.0, 2187.0, 3594.0, 5736.0, 9146.0, 15256.0, 24900.0, 43345.0, 76398.0, 139391.0, 225236.0, 209721.0, 123573.0, 68133.0, 38552.0, 22744.0, 13558.0, 8365.0, 5180.0, 3167.0, 2182.0, 1325.0, 875.0, 597.0, 393.0, 233.0, 164.0, 95.0, 70.0, 48.0, 37.0, 21.0, 15.0, 12.0, 5.0, 6.0, 1.0, 2.0, 1.0], "bins": [-1.591796875, -1.547454833984375, -1.50311279296875, -1.458770751953125, -1.4144287109375, -1.370086669921875, -1.32574462890625, -1.281402587890625, -1.237060546875, -1.192718505859375, -1.14837646484375, -1.104034423828125, -1.0596923828125, -1.015350341796875, -0.97100830078125, -0.926666259765625, -0.88232421875, -0.837982177734375, -0.79364013671875, -0.749298095703125, -0.7049560546875, -0.660614013671875, -0.61627197265625, -0.571929931640625, -0.527587890625, -0.483245849609375, -0.43890380859375, -0.394561767578125, -0.3502197265625, -0.305877685546875, -0.26153564453125, -0.217193603515625, -0.1728515625, -0.128509521484375, -0.08416748046875, -0.039825439453125, 0.0045166015625, 0.048858642578125, 0.09320068359375, 0.137542724609375, 0.181884765625, 0.226226806640625, 0.27056884765625, 0.314910888671875, 0.3592529296875, 0.403594970703125, 0.44793701171875, 0.492279052734375, 0.53662109375, 0.580963134765625, 0.62530517578125, 0.669647216796875, 0.7139892578125, 0.758331298828125, 0.80267333984375, 0.847015380859375, 0.891357421875, 0.935699462890625, 0.98004150390625, 1.024383544921875, 1.0687255859375, 1.113067626953125, 1.15740966796875, 1.201751708984375, 1.24609375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 8.0, 5.0, 8.0, 10.0, 10.0, 15.0, 12.0, 11.0, 23.0, 23.0, 19.0, 17.0, 26.0, 29.0, 41.0, 27.0, 38.0, 30.0, 32.0, 29.0, 38.0, 1072.0, 48.0, 26.0, 42.0, 35.0, 34.0, 30.0, 27.0, 32.0, 27.0, 20.0, 19.0, 19.0, 19.0, 24.0, 14.0, 18.0, 11.0, 10.0, 4.0, 7.0, 8.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.98828125, -5.79254150390625, -5.5968017578125, -5.40106201171875, -5.205322265625, -5.00958251953125, -4.8138427734375, -4.61810302734375, -4.42236328125, -4.22662353515625, -4.0308837890625, -3.83514404296875, -3.639404296875, -3.44366455078125, -3.2479248046875, -3.05218505859375, -2.8564453125, -2.66070556640625, -2.4649658203125, -2.26922607421875, -2.073486328125, -1.87774658203125, -1.6820068359375, -1.48626708984375, -1.29052734375, -1.09478759765625, -0.8990478515625, -0.70330810546875, -0.507568359375, -0.31182861328125, -0.1160888671875, 0.07965087890625, 0.275390625, 0.47113037109375, 0.6668701171875, 0.86260986328125, 1.058349609375, 1.25408935546875, 1.4498291015625, 1.64556884765625, 1.84130859375, 2.03704833984375, 2.2327880859375, 2.42852783203125, 2.624267578125, 2.82000732421875, 3.0157470703125, 3.21148681640625, 3.4072265625, 3.60296630859375, 3.7987060546875, 3.99444580078125, 4.190185546875, 4.38592529296875, 4.5816650390625, 4.77740478515625, 4.97314453125, 5.16888427734375, 5.3646240234375, 5.56036376953125, 5.756103515625, 5.95184326171875, 6.1475830078125, 6.34332275390625, 6.5390625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 5.0, 4.0, 17.0, 7.0, 24.0, 26.0, 52.0, 72.0, 127.0, 158.0, 243.0, 383.0, 627.0, 950.0, 1470.0, 2361.0, 3761.0, 6181.0, 10399.0, 17419.0, 30442.0, 52899.0, 92898.0, 156581.0, 1217106.0, 221517.0, 118136.0, 68098.0, 39137.0, 22078.0, 13092.0, 7839.0, 4779.0, 2970.0, 1855.0, 1191.0, 750.0, 500.0, 335.0, 216.0, 137.0, 108.0, 59.0, 41.0, 30.0, 22.0, 14.0, 6.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0], "bins": [-1.095703125, -1.06414794921875, -1.0325927734375, -1.00103759765625, -0.969482421875, -0.93792724609375, -0.9063720703125, -0.87481689453125, -0.84326171875, -0.81170654296875, -0.7801513671875, -0.74859619140625, -0.717041015625, -0.68548583984375, -0.6539306640625, -0.62237548828125, -0.5908203125, -0.55926513671875, -0.5277099609375, -0.49615478515625, -0.464599609375, -0.43304443359375, -0.4014892578125, -0.36993408203125, -0.33837890625, -0.30682373046875, -0.2752685546875, -0.24371337890625, -0.212158203125, -0.18060302734375, -0.1490478515625, -0.11749267578125, -0.0859375, -0.05438232421875, -0.0228271484375, 0.00872802734375, 0.040283203125, 0.07183837890625, 0.1033935546875, 0.13494873046875, 0.16650390625, 0.19805908203125, 0.2296142578125, 0.26116943359375, 0.292724609375, 0.32427978515625, 0.3558349609375, 0.38739013671875, 0.4189453125, 0.45050048828125, 0.4820556640625, 0.51361083984375, 0.545166015625, 0.57672119140625, 0.6082763671875, 0.63983154296875, 0.67138671875, 0.70294189453125, 0.7344970703125, 0.76605224609375, 0.797607421875, 0.82916259765625, 0.8607177734375, 0.89227294921875, 0.923828125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 2.0, 4.0, 5.0, 10.0, 10.0, 4.0, 11.0, 8.0, 16.0, 10.0, 19.0, 17.0, 25.0, 33.0, 36.0, 39.0, 34.0, 57.0, 55.0, 62.0, 53.0, 54.0, 52.0, 47.0, 45.0, 45.0, 27.0, 37.0, 33.0, 26.0, 16.0, 22.0, 20.0, 10.0, 9.0, 8.0, 7.0, 10.0, 2.0, 7.0, 3.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032684326171875, -0.03162574768066406, -0.030567169189453125, -0.029508590698242188, -0.02845001220703125, -0.027391433715820312, -0.026332855224609375, -0.025274276733398438, -0.0242156982421875, -0.023157119750976562, -0.022098541259765625, -0.021039962768554688, -0.01998138427734375, -0.018922805786132812, -0.017864227294921875, -0.016805648803710938, -0.0157470703125, -0.014688491821289062, -0.013629913330078125, -0.012571334838867188, -0.01151275634765625, -0.010454177856445312, -0.009395599365234375, -0.008337020874023438, -0.0072784423828125, -0.0062198638916015625, -0.005161285400390625, -0.0041027069091796875, -0.00304412841796875, -0.0019855499267578125, -0.000926971435546875, 0.0001316070556640625, 0.001190185546875, 0.0022487640380859375, 0.003307342529296875, 0.0043659210205078125, 0.00542449951171875, 0.0064830780029296875, 0.007541656494140625, 0.008600234985351562, 0.0096588134765625, 0.010717391967773438, 0.011775970458984375, 0.012834548950195312, 0.01389312744140625, 0.014951705932617188, 0.016010284423828125, 0.017068862915039062, 0.01812744140625, 0.019186019897460938, 0.020244598388671875, 0.021303176879882812, 0.02236175537109375, 0.023420333862304688, 0.024478912353515625, 0.025537490844726562, 0.0265960693359375, 0.027654647827148438, 0.028713226318359375, 0.029771804809570312, 0.03083038330078125, 0.03188896179199219, 0.032947540283203125, 0.03400611877441406, 0.035064697265625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 9.0, 2.0, 4.0, 13.0, 10.0, 17.0, 15.0, 15.0, 9.0, 24.0, 32.0, 42.0, 45.0, 64.0, 72.0, 105.0, 135.0, 182.0, 276.0, 488.0, 1098.0, 196101.0, 846736.0, 1378.0, 509.0, 324.0, 183.0, 147.0, 118.0, 82.0, 59.0, 44.0, 34.0, 31.0, 21.0, 15.0, 20.0, 18.0, 16.0, 16.0, 10.0, 8.0, 4.0, 12.0, 4.0, 1.0, 4.0, 4.0, 3.0, 5.0, 0.0, 0.0, 3.0], "bins": [-0.64990234375, -0.6302490234375, -0.610595703125, -0.5909423828125, -0.5712890625, -0.5516357421875, -0.531982421875, -0.5123291015625, -0.49267578125, -0.4730224609375, -0.453369140625, -0.4337158203125, -0.4140625, -0.3944091796875, -0.374755859375, -0.3551025390625, -0.33544921875, -0.3157958984375, -0.296142578125, -0.2764892578125, -0.2568359375, -0.2371826171875, -0.217529296875, -0.1978759765625, -0.17822265625, -0.1585693359375, -0.138916015625, -0.1192626953125, -0.099609375, -0.0799560546875, -0.060302734375, -0.0406494140625, -0.02099609375, -0.0013427734375, 0.018310546875, 0.0379638671875, 0.0576171875, 0.0772705078125, 0.096923828125, 0.1165771484375, 0.13623046875, 0.1558837890625, 0.175537109375, 0.1951904296875, 0.21484375, 0.2344970703125, 0.254150390625, 0.2738037109375, 0.29345703125, 0.3131103515625, 0.332763671875, 0.3524169921875, 0.3720703125, 0.3917236328125, 0.411376953125, 0.4310302734375, 0.45068359375, 0.4703369140625, 0.489990234375, 0.5096435546875, 0.529296875, 0.5489501953125, 0.568603515625, 0.5882568359375, 0.60791015625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 10.0, 1001.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4527397155761719, -1.4279417991638184, -1.4031437635421753, -1.3783458471298218, -1.3535479307174683, -1.3287500143051147, -1.3039519786834717, -1.2791540622711182, -1.2543561458587646, -1.2295582294464111, -1.204760193824768, -1.1799622774124146, -1.155164361000061, -1.1303664445877075, -1.1055684089660645, -1.080770492553711, -1.0559725761413574, -1.031174659729004, -1.0063766241073608, -0.9815787076950073, -0.9567807912826538, -0.9319828152656555, -0.907184898853302, -0.8823869228363037, -0.8575889468193054, -0.8327909708023071, -0.8079930543899536, -0.7831950783729553, -0.7583971619606018, -0.7335991859436035, -0.70880126953125, -0.6840032935142517, -0.6592053771018982, -0.6344074010848999, -0.6096094846725464, -0.5848115086555481, -0.5600135922431946, -0.5352156162261963, -0.5104176998138428, -0.4856197237968445, -0.46082180738449097, -0.43602386116981506, -0.41122591495513916, -0.38642796874046326, -0.36163002252578735, -0.33683207631111145, -0.31203413009643555, -0.28723615407943726, -0.26243820786476135, -0.23764026165008545, -0.21284231543540955, -0.18804436922073364, -0.16324642300605774, -0.13844847679138184, -0.11365051567554474, -0.08885256946086884, -0.06405462324619293, -0.03925667703151703, -0.014458727091550827, 0.010339222848415375, 0.03513716906309128, 0.05993511527776718, 0.08473306894302368, 0.10953101515769958, 0.1343289613723755]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 17.0, 25.0, 19.0, 27.0, 44.0, 62.0, 60.0, 65.0, 67.0, 66.0, 80.0, 74.0, 60.0, 63.0, 49.0, 47.0, 47.0, 30.0, 29.0, 29.0, 13.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058796226978302, -0.056676194071769714, -0.05455616116523743, -0.05243612825870514, -0.05031609535217285, -0.048196062445640564, -0.046076029539108276, -0.04395599663257599, -0.0418359637260437, -0.039715930819511414, -0.037595897912979126, -0.03547586500644684, -0.03335583209991455, -0.031235799193382263, -0.029115766286849976, -0.026995733380317688, -0.0248757004737854, -0.022755667567253113, -0.020635634660720825, -0.018515601754188538, -0.01639556884765625, -0.014275535941123962, -0.012155503034591675, -0.010035470128059387, -0.0079154372215271, -0.005795404314994812, -0.0036753714084625244, -0.0015553385019302368, 0.0005646944046020508, 0.0026847273111343384, 0.004804760217666626, 0.006924793124198914, 0.009044826030731201, 0.011164858937263489, 0.013284891843795776, 0.015404924750328064, 0.01752495765686035, 0.01964499056339264, 0.021765023469924927, 0.023885056376457214, 0.026005089282989502, 0.02812512218952179, 0.030245155096054077, 0.032365188002586365, 0.03448522090911865, 0.03660525381565094, 0.03872528672218323, 0.040845319628715515, 0.0429653525352478, 0.04508538544178009, 0.04720541834831238, 0.049325451254844666, 0.05144548416137695, 0.05356551706790924, 0.05568554997444153, 0.057805582880973816, 0.059925615787506104, 0.06204564869403839, 0.06416568160057068, 0.06628571450710297, 0.06840574741363525, 0.07052578032016754, 0.07264581322669983, 0.07476584613323212, 0.0768858790397644]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 9.0, 3.0, 8.0, 10.0, 9.0, 7.0, 11.0, 8.0, 17.0, 17.0, 27.0, 20.0, 36.0, 36.0, 33.0, 39.0, 42.0, 42.0, 51.0, 42.0, 52.0, 46.0, 46.0, 48.0, 38.0, 34.0, 41.0, 27.0, 35.0, 36.0, 24.0, 19.0, 15.0, 11.0, 15.0, 14.0, 7.0, 9.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.4765625, -11.1339111328125, -10.791259765625, -10.4486083984375, -10.10595703125, -9.7633056640625, -9.420654296875, -9.0780029296875, -8.7353515625, -8.3927001953125, -8.050048828125, -7.7073974609375, -7.36474609375, -7.0220947265625, -6.679443359375, -6.3367919921875, -5.994140625, -5.6514892578125, -5.308837890625, -4.9661865234375, -4.62353515625, -4.2808837890625, -3.938232421875, -3.5955810546875, -3.2529296875, -2.9102783203125, -2.567626953125, -2.2249755859375, -1.88232421875, -1.5396728515625, -1.197021484375, -0.8543701171875, -0.51171875, -0.1690673828125, 0.173583984375, 0.5162353515625, 0.85888671875, 1.2015380859375, 1.544189453125, 1.8868408203125, 2.2294921875, 2.5721435546875, 2.914794921875, 3.2574462890625, 3.60009765625, 3.9427490234375, 4.285400390625, 4.6280517578125, 4.970703125, 5.3133544921875, 5.656005859375, 5.9986572265625, 6.34130859375, 6.6839599609375, 7.026611328125, 7.3692626953125, 7.7119140625, 8.0545654296875, 8.397216796875, 8.7398681640625, 9.08251953125, 9.4251708984375, 9.767822265625, 10.1104736328125, 10.453125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 7.0, 7.0, 6.0, 11.0, 20.0, 19.0, 27.0, 46.0, 60.0, 69.0, 109.0, 121.0, 175.0, 294.0, 362.0, 607.0, 796.0, 1294.0, 2109.0, 4257.0, 10836.0, 48457.0, 407584.0, 490111.0, 57998.0, 12111.0, 4582.0, 2344.0, 1349.0, 826.0, 528.0, 396.0, 291.0, 196.0, 162.0, 101.0, 80.0, 58.0, 35.0, 21.0, 22.0, 20.0, 14.0, 12.0, 9.0, 6.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.703125, -23.907470703125, -23.11181640625, -22.316162109375, -21.5205078125, -20.724853515625, -19.92919921875, -19.133544921875, -18.337890625, -17.542236328125, -16.74658203125, -15.950927734375, -15.1552734375, -14.359619140625, -13.56396484375, -12.768310546875, -11.97265625, -11.177001953125, -10.38134765625, -9.585693359375, -8.7900390625, -7.994384765625, -7.19873046875, -6.403076171875, -5.607421875, -4.811767578125, -4.01611328125, -3.220458984375, -2.4248046875, -1.629150390625, -0.83349609375, -0.037841796875, 0.7578125, 1.553466796875, 2.34912109375, 3.144775390625, 3.9404296875, 4.736083984375, 5.53173828125, 6.327392578125, 7.123046875, 7.918701171875, 8.71435546875, 9.510009765625, 10.3056640625, 11.101318359375, 11.89697265625, 12.692626953125, 13.48828125, 14.283935546875, 15.07958984375, 15.875244140625, 16.6708984375, 17.466552734375, 18.26220703125, 19.057861328125, 19.853515625, 20.649169921875, 21.44482421875, 22.240478515625, 23.0361328125, 23.831787109375, 24.62744140625, 25.423095703125, 26.21875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 7.0, 7.0, 6.0, 10.0, 13.0, 12.0, 12.0, 23.0, 20.0, 16.0, 26.0, 31.0, 36.0, 46.0, 40.0, 62.0, 78.0, 145.0, 1467.0, 452.0, 123.0, 51.0, 63.0, 40.0, 35.0, 30.0, 24.0, 33.0, 22.0, 15.0, 15.0, 13.0, 20.0, 6.0, 6.0, 12.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.8125, -26.968994140625, -26.12548828125, -25.281982421875, -24.4384765625, -23.594970703125, -22.75146484375, -21.907958984375, -21.064453125, -20.220947265625, -19.37744140625, -18.533935546875, -17.6904296875, -16.846923828125, -16.00341796875, -15.159912109375, -14.31640625, -13.472900390625, -12.62939453125, -11.785888671875, -10.9423828125, -10.098876953125, -9.25537109375, -8.411865234375, -7.568359375, -6.724853515625, -5.88134765625, -5.037841796875, -4.1943359375, -3.350830078125, -2.50732421875, -1.663818359375, -0.8203125, 0.023193359375, 0.86669921875, 1.710205078125, 2.5537109375, 3.397216796875, 4.24072265625, 5.084228515625, 5.927734375, 6.771240234375, 7.61474609375, 8.458251953125, 9.3017578125, 10.145263671875, 10.98876953125, 11.832275390625, 12.67578125, 13.519287109375, 14.36279296875, 15.206298828125, 16.0498046875, 16.893310546875, 17.73681640625, 18.580322265625, 19.423828125, 20.267333984375, 21.11083984375, 21.954345703125, 22.7978515625, 23.641357421875, 24.48486328125, 25.328369140625, 26.171875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 10.0, 6.0, 10.0, 18.0, 26.0, 42.0, 47.0, 58.0, 92.0, 127.0, 210.0, 414.0, 1191.0, 49420.0, 3090035.0, 2486.0, 637.0, 299.0, 161.0, 118.0, 88.0, 55.0, 39.0, 38.0, 23.0, 23.0, 11.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.625, -91.38671875, -88.1484375, -84.91015625, -81.671875, -78.43359375, -75.1953125, -71.95703125, -68.71875, -65.48046875, -62.2421875, -59.00390625, -55.765625, -52.52734375, -49.2890625, -46.05078125, -42.8125, -39.57421875, -36.3359375, -33.09765625, -29.859375, -26.62109375, -23.3828125, -20.14453125, -16.90625, -13.66796875, -10.4296875, -7.19140625, -3.953125, -0.71484375, 2.5234375, 5.76171875, 9.0, 12.23828125, 15.4765625, 18.71484375, 21.953125, 25.19140625, 28.4296875, 31.66796875, 34.90625, 38.14453125, 41.3828125, 44.62109375, 47.859375, 51.09765625, 54.3359375, 57.57421875, 60.8125, 64.05078125, 67.2890625, 70.52734375, 73.765625, 77.00390625, 80.2421875, 83.48046875, 86.71875, 89.95703125, 93.1953125, 96.43359375, 99.671875, 102.91015625, 106.1484375, 109.38671875, 112.625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 8.0, 9.0, 6.0, 12.0, 28.0, 31.0, 52.0, 61.0, 76.0, 94.0, 90.0, 111.0, 92.0, 91.0, 60.0, 58.0, 46.0, 24.0, 24.0, 11.0, 6.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.12629318237305, -38.76962661743164, -37.412960052490234, -36.056297302246094, -34.69963073730469, -33.34296417236328, -31.986297607421875, -30.6296329498291, -29.272968292236328, -27.916301727294922, -26.55963706970215, -25.202970504760742, -23.84630584716797, -22.489639282226562, -21.132972717285156, -19.776308059692383, -18.419641494750977, -17.06297492980957, -15.706310272216797, -14.34964370727539, -12.992979049682617, -11.636312484741211, -10.279646873474121, -8.922981262207031, -7.566315650939941, -6.209650039672852, -4.852984428405762, -3.4963183403015137, -2.139652729034424, -0.782987117767334, 0.5736789703369141, 1.930344581604004, 3.2870101928710938, 4.643675804138184, 6.000341415405273, 7.3570075035095215, 8.713672637939453, 10.07033920288086, 11.42700481414795, 12.783670425415039, 14.140336036682129, 15.497001647949219, 16.853668212890625, 18.2103328704834, 19.566999435424805, 20.923664093017578, 22.280330657958984, 23.63699722290039, 24.993661880493164, 26.35032844543457, 27.706993103027344, 29.06365966796875, 30.420324325561523, 31.77699089050293, 33.1336555480957, 34.49032211303711, 35.846988677978516, 37.20365524291992, 38.56032180786133, 39.91698455810547, 41.273651123046875, 42.63031768798828, 43.98698425292969, 45.343650817871094, 46.700313568115234]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 14.0, 4.0, 10.0, 13.0, 13.0, 10.0, 23.0, 18.0, 19.0, 24.0, 27.0, 27.0, 36.0, 46.0, 37.0, 33.0, 47.0, 45.0, 35.0, 36.0, 45.0, 38.0, 46.0, 40.0, 45.0, 30.0, 36.0, 28.0, 36.0, 18.0, 21.0, 15.0, 12.0, 13.0, 10.0, 4.0, 7.0, 5.0, 9.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-76.89368438720703, -74.5935287475586, -72.29337310791016, -69.99322509765625, -67.69306945800781, -65.39291381835938, -63.09275817871094, -60.7926025390625, -58.49245071411133, -56.19229507446289, -53.89214324951172, -51.59198760986328, -49.291831970214844, -46.99168014526367, -44.691524505615234, -42.39137268066406, -40.091217041015625, -37.79106140136719, -35.490909576416016, -33.19075393676758, -30.890600204467773, -28.59044647216797, -26.29029083251953, -23.990137100219727, -21.689983367919922, -19.389829635620117, -17.089675903320312, -14.789520263671875, -12.48936653137207, -10.189212799072266, -7.8890581130981445, -5.588903427124023, -3.28875732421875, -0.9886031150817871, 1.3115510940551758, 3.6117053031921387, 5.911859512329102, 8.212013244628906, 10.512167930603027, 12.812322616577148, 15.112476348876953, 17.412630081176758, 19.712783813476562, 22.012939453125, 24.313093185424805, 26.61324691772461, 28.913402557373047, 31.21355628967285, 33.513710021972656, 35.813865661621094, 38.114017486572266, 40.4141731262207, 42.714324951171875, 45.01448059082031, 47.31463623046875, 49.61479187011719, 51.91494369506836, 54.2150993347168, 56.51525115966797, 58.815406799316406, 61.115562438964844, 63.415714263916016, 65.71586608886719, 68.01602172851562, 70.31617736816406]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 7.0, 9.0, 7.0, 6.0, 13.0, 17.0, 16.0, 18.0, 29.0, 17.0, 35.0, 30.0, 32.0, 34.0, 34.0, 54.0, 42.0, 48.0, 47.0, 42.0, 53.0, 50.0, 42.0, 55.0, 36.0, 30.0, 24.0, 23.0, 24.0, 18.0, 24.0, 20.0, 11.0, 11.0, 10.0, 6.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6484375, -10.2764892578125, -9.904541015625, -9.5325927734375, -9.16064453125, -8.7886962890625, -8.416748046875, -8.0447998046875, -7.6728515625, -7.3009033203125, -6.928955078125, -6.5570068359375, -6.18505859375, -5.8131103515625, -5.441162109375, -5.0692138671875, -4.697265625, -4.3253173828125, -3.953369140625, -3.5814208984375, -3.20947265625, -2.8375244140625, -2.465576171875, -2.0936279296875, -1.7216796875, -1.3497314453125, -0.977783203125, -0.6058349609375, -0.23388671875, 0.1380615234375, 0.510009765625, 0.8819580078125, 1.25390625, 1.6258544921875, 1.997802734375, 2.3697509765625, 2.74169921875, 3.1136474609375, 3.485595703125, 3.8575439453125, 4.2294921875, 4.6014404296875, 4.973388671875, 5.3453369140625, 5.71728515625, 6.0892333984375, 6.461181640625, 6.8331298828125, 7.205078125, 7.5770263671875, 7.948974609375, 8.3209228515625, 8.69287109375, 9.0648193359375, 9.436767578125, 9.8087158203125, 10.1806640625, 10.5526123046875, 10.924560546875, 11.2965087890625, 11.66845703125, 12.0404052734375, 12.412353515625, 12.7843017578125, 13.15625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 10.0, 14.0, 16.0, 28.0, 46.0, 50.0, 89.0, 98.0, 158.0, 235.0, 327.0, 480.0, 686.0, 1040.0, 1668.0, 2588.0, 4198.0, 7286.0, 14295.0, 40383.0, 195528.0, 974152.0, 1997983.0, 745013.0, 145333.0, 32408.0, 12694.0, 6645.0, 3810.0, 2326.0, 1506.0, 1051.0, 674.0, 447.0, 307.0, 223.0, 133.0, 99.0, 67.0, 61.0, 34.0, 23.0, 18.0, 17.0, 13.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.359375, -13.87109375, -13.3828125, -12.89453125, -12.40625, -11.91796875, -11.4296875, -10.94140625, -10.453125, -9.96484375, -9.4765625, -8.98828125, -8.5, -8.01171875, -7.5234375, -7.03515625, -6.546875, -6.05859375, -5.5703125, -5.08203125, -4.59375, -4.10546875, -3.6171875, -3.12890625, -2.640625, -2.15234375, -1.6640625, -1.17578125, -0.6875, -0.19921875, 0.2890625, 0.77734375, 1.265625, 1.75390625, 2.2421875, 2.73046875, 3.21875, 3.70703125, 4.1953125, 4.68359375, 5.171875, 5.66015625, 6.1484375, 6.63671875, 7.125, 7.61328125, 8.1015625, 8.58984375, 9.078125, 9.56640625, 10.0546875, 10.54296875, 11.03125, 11.51953125, 12.0078125, 12.49609375, 12.984375, 13.47265625, 13.9609375, 14.44921875, 14.9375, 15.42578125, 15.9140625, 16.40234375, 16.890625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 12.0, 21.0, 27.0, 58.0, 93.0, 165.0, 246.0, 458.0, 641.0, 844.0, 590.0, 373.0, 237.0, 121.0, 77.0, 52.0, 19.0, 13.0, 10.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.0625, -31.181396484375, -30.30029296875, -29.419189453125, -28.5380859375, -27.656982421875, -26.77587890625, -25.894775390625, -25.013671875, -24.132568359375, -23.25146484375, -22.370361328125, -21.4892578125, -20.608154296875, -19.72705078125, -18.845947265625, -17.96484375, -17.083740234375, -16.20263671875, -15.321533203125, -14.4404296875, -13.559326171875, -12.67822265625, -11.797119140625, -10.916015625, -10.034912109375, -9.15380859375, -8.272705078125, -7.3916015625, -6.510498046875, -5.62939453125, -4.748291015625, -3.8671875, -2.986083984375, -2.10498046875, -1.223876953125, -0.3427734375, 0.538330078125, 1.41943359375, 2.300537109375, 3.181640625, 4.062744140625, 4.94384765625, 5.824951171875, 6.7060546875, 7.587158203125, 8.46826171875, 9.349365234375, 10.23046875, 11.111572265625, 11.99267578125, 12.873779296875, 13.7548828125, 14.635986328125, 15.51708984375, 16.398193359375, 17.279296875, 18.160400390625, 19.04150390625, 19.922607421875, 20.8037109375, 21.684814453125, 22.56591796875, 23.447021484375, 24.328125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 16.0, 27.0, 48.0, 81.0, 184.0, 364.0, 856.0, 2837.0, 40858.0, 3978651.0, 164048.0, 4120.0, 1219.0, 478.0, 207.0, 117.0, 67.0, 34.0, 14.0, 15.0, 10.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.125, -54.23046875, -52.3359375, -50.44140625, -48.546875, -46.65234375, -44.7578125, -42.86328125, -40.96875, -39.07421875, -37.1796875, -35.28515625, -33.390625, -31.49609375, -29.6015625, -27.70703125, -25.8125, -23.91796875, -22.0234375, -20.12890625, -18.234375, -16.33984375, -14.4453125, -12.55078125, -10.65625, -8.76171875, -6.8671875, -4.97265625, -3.078125, -1.18359375, 0.7109375, 2.60546875, 4.5, 6.39453125, 8.2890625, 10.18359375, 12.078125, 13.97265625, 15.8671875, 17.76171875, 19.65625, 21.55078125, 23.4453125, 25.33984375, 27.234375, 29.12890625, 31.0234375, 32.91796875, 34.8125, 36.70703125, 38.6015625, 40.49609375, 42.390625, 44.28515625, 46.1796875, 48.07421875, 49.96875, 51.86328125, 53.7578125, 55.65234375, 57.546875, 59.44140625, 61.3359375, 63.23046875, 65.125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 9.0, 248.0, 647.0, 112.0, 2.0], "bins": [-872.9672241210938, -858.7333374023438, -844.4994506835938, -830.2655639648438, -816.0316162109375, -801.7977294921875, -787.5638427734375, -773.3299560546875, -759.0960693359375, -744.8621826171875, -730.6282958984375, -716.3944091796875, -702.1604614257812, -687.9265747070312, -673.6926879882812, -659.4588012695312, -645.2249145507812, -630.9910278320312, -616.7571411132812, -602.5232543945312, -588.289306640625, -574.055419921875, -559.821533203125, -545.587646484375, -531.353759765625, -517.119873046875, -502.8859558105469, -488.6520690917969, -474.4181823730469, -460.18426513671875, -445.95037841796875, -431.71649169921875, -417.48260498046875, -403.24871826171875, -389.0148010253906, -374.7809143066406, -360.5470275878906, -346.3131103515625, -332.0792236328125, -317.8453369140625, -303.6114196777344, -289.3775329589844, -275.14361572265625, -260.90972900390625, -246.67584228515625, -232.4419403076172, -218.20803833007812, -203.97415161132812, -189.74026489257812, -175.50636291503906, -161.27247619628906, -147.03857421875, -132.8046875, -118.57078552246094, -104.3368911743164, -90.10299682617188, -75.86911010742188, -61.635215759277344, -47.40132141113281, -33.167423248291016, -18.933528900146484, -4.6996307373046875, 9.534263610839844, 23.768157958984375, 38.00205612182617]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 8.0, 10.0, 6.0, 6.0, 12.0, 10.0, 13.0, 22.0, 26.0, 35.0, 24.0, 30.0, 31.0, 34.0, 30.0, 37.0, 53.0, 41.0, 39.0, 37.0, 46.0, 39.0, 30.0, 31.0, 37.0, 29.0, 38.0, 27.0, 29.0, 26.0, 32.0, 21.0, 23.0, 23.0, 12.0, 8.0, 5.0, 7.0, 10.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.54561614990234, -66.46924591064453, -64.39287567138672, -62.316505432128906, -60.240135192871094, -58.16376495361328, -56.08739471435547, -54.011024475097656, -51.934654235839844, -49.85828399658203, -47.78191375732422, -45.705543518066406, -43.629173278808594, -41.55280303955078, -39.47643280029297, -37.400062561035156, -35.323692321777344, -33.24732208251953, -31.17095184326172, -29.094581604003906, -27.018211364746094, -24.94184112548828, -22.86547088623047, -20.789100646972656, -18.712730407714844, -16.63636016845703, -14.559989929199219, -12.483619689941406, -10.407249450683594, -8.330879211425781, -6.254508972167969, -4.178138732910156, -2.1017608642578125, -0.025390625, 2.0509796142578125, 4.127349853515625, 6.2037200927734375, 8.28009033203125, 10.356460571289062, 12.432830810546875, 14.509201049804688, 16.5855712890625, 18.661941528320312, 20.738311767578125, 22.814682006835938, 24.89105224609375, 26.967422485351562, 29.043792724609375, 31.120162963867188, 33.196533203125, 35.27290344238281, 37.349273681640625, 39.42564392089844, 41.50201416015625, 43.57838439941406, 45.654754638671875, 47.73112487792969, 49.8074951171875, 51.88386535644531, 53.960235595703125, 56.03660583496094, 58.11297607421875, 60.18934631347656, 62.265716552734375, 64.34208679199219]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 2.0, 6.0, 12.0, 2.0, 11.0, 11.0, 11.0, 15.0, 18.0, 17.0, 13.0, 15.0, 16.0, 23.0, 21.0, 28.0, 29.0, 48.0, 30.0, 35.0, 33.0, 43.0, 41.0, 38.0, 37.0, 47.0, 29.0, 31.0, 38.0, 26.0, 31.0, 35.0, 32.0, 21.0, 22.0, 18.0, 14.0, 19.0, 13.0, 12.0, 6.0, 11.0, 6.0, 6.0, 7.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5703125, -7.3199462890625, -7.069580078125, -6.8192138671875, -6.56884765625, -6.3184814453125, -6.068115234375, -5.8177490234375, -5.5673828125, -5.3170166015625, -5.066650390625, -4.8162841796875, -4.56591796875, -4.3155517578125, -4.065185546875, -3.8148193359375, -3.564453125, -3.3140869140625, -3.063720703125, -2.8133544921875, -2.56298828125, -2.3126220703125, -2.062255859375, -1.8118896484375, -1.5615234375, -1.3111572265625, -1.060791015625, -0.8104248046875, -0.56005859375, -0.3096923828125, -0.059326171875, 0.1910400390625, 0.44140625, 0.6917724609375, 0.942138671875, 1.1925048828125, 1.44287109375, 1.6932373046875, 1.943603515625, 2.1939697265625, 2.4443359375, 2.6947021484375, 2.945068359375, 3.1954345703125, 3.44580078125, 3.6961669921875, 3.946533203125, 4.1968994140625, 4.447265625, 4.6976318359375, 4.947998046875, 5.1983642578125, 5.44873046875, 5.6990966796875, 5.949462890625, 6.1998291015625, 6.4501953125, 6.7005615234375, 6.950927734375, 7.2012939453125, 7.45166015625, 7.7020263671875, 7.952392578125, 8.2027587890625, 8.453125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 9.0, 4.0, 13.0, 16.0, 19.0, 38.0, 49.0, 67.0, 118.0, 112.0, 165.0, 232.0, 374.0, 532.0, 659.0, 1004.0, 1435.0, 2063.0, 3048.0, 4336.0, 6195.0, 9433.0, 13859.0, 21097.0, 32688.0, 51184.0, 80563.0, 127101.0, 176865.0, 172889.0, 121821.0, 77682.0, 48941.0, 31281.0, 20732.0, 13272.0, 8867.0, 6101.0, 4107.0, 2881.0, 1952.0, 1365.0, 1021.0, 669.0, 560.0, 326.0, 242.0, 184.0, 115.0, 79.0, 56.0, 51.0, 33.0, 21.0, 12.0, 14.0, 4.0, 7.0, 3.0, 2.0, 2.0], "bins": [-0.84326171875, -0.8168716430664062, -0.7904815673828125, -0.7640914916992188, -0.737701416015625, -0.7113113403320312, -0.6849212646484375, -0.6585311889648438, -0.63214111328125, -0.6057510375976562, -0.5793609619140625, -0.5529708862304688, -0.526580810546875, -0.5001907348632812, -0.4738006591796875, -0.44741058349609375, -0.4210205078125, -0.39463043212890625, -0.3682403564453125, -0.34185028076171875, -0.315460205078125, -0.28907012939453125, -0.2626800537109375, -0.23628997802734375, -0.20989990234375, -0.18350982666015625, -0.1571197509765625, -0.13072967529296875, -0.104339599609375, -0.07794952392578125, -0.0515594482421875, -0.02516937255859375, 0.001220703125, 0.02761077880859375, 0.0540008544921875, 0.08039093017578125, 0.106781005859375, 0.13317108154296875, 0.1595611572265625, 0.18595123291015625, 0.21234130859375, 0.23873138427734375, 0.2651214599609375, 0.29151153564453125, 0.317901611328125, 0.34429168701171875, 0.3706817626953125, 0.39707183837890625, 0.4234619140625, 0.44985198974609375, 0.4762420654296875, 0.5026321411132812, 0.529022216796875, 0.5554122924804688, 0.5818023681640625, 0.6081924438476562, 0.63458251953125, 0.6609725952148438, 0.6873626708984375, 0.7137527465820312, 0.740142822265625, 0.7665328979492188, 0.7929229736328125, 0.8193130493164062, 0.845703125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 4.0, 8.0, 7.0, 11.0, 16.0, 19.0, 21.0, 20.0, 17.0, 15.0, 25.0, 21.0, 32.0, 40.0, 34.0, 35.0, 27.0, 29.0, 33.0, 42.0, 1070.0, 53.0, 42.0, 43.0, 39.0, 40.0, 34.0, 35.0, 24.0, 23.0, 18.0, 25.0, 22.0, 18.0, 11.0, 17.0, 7.0, 12.0, 4.0, 4.0, 3.0, 5.0, 4.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.875, -5.7003173828125, -5.525634765625, -5.3509521484375, -5.17626953125, -5.0015869140625, -4.826904296875, -4.6522216796875, -4.4775390625, -4.3028564453125, -4.128173828125, -3.9534912109375, -3.77880859375, -3.6041259765625, -3.429443359375, -3.2547607421875, -3.080078125, -2.9053955078125, -2.730712890625, -2.5560302734375, -2.38134765625, -2.2066650390625, -2.031982421875, -1.8572998046875, -1.6826171875, -1.5079345703125, -1.333251953125, -1.1585693359375, -0.98388671875, -0.8092041015625, -0.634521484375, -0.4598388671875, -0.28515625, -0.1104736328125, 0.064208984375, 0.2388916015625, 0.41357421875, 0.5882568359375, 0.762939453125, 0.9376220703125, 1.1123046875, 1.2869873046875, 1.461669921875, 1.6363525390625, 1.81103515625, 1.9857177734375, 2.160400390625, 2.3350830078125, 2.509765625, 2.6844482421875, 2.859130859375, 3.0338134765625, 3.20849609375, 3.3831787109375, 3.557861328125, 3.7325439453125, 3.9072265625, 4.0819091796875, 4.256591796875, 4.4312744140625, 4.60595703125, 4.7806396484375, 4.955322265625, 5.1300048828125, 5.3046875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 10.0, 10.0, 19.0, 29.0, 44.0, 59.0, 94.0, 155.0, 188.0, 324.0, 518.0, 765.0, 1154.0, 1682.0, 2670.0, 4089.0, 6372.0, 9994.0, 15297.0, 24230.0, 38253.0, 60666.0, 93549.0, 137248.0, 1192782.0, 182162.0, 115584.0, 76021.0, 48156.0, 30438.0, 19257.0, 12300.0, 7959.0, 5172.0, 3398.0, 2123.0, 1484.0, 949.0, 634.0, 421.0, 285.0, 188.0, 125.0, 87.0, 73.0, 29.0, 27.0, 19.0, 14.0, 12.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.658203125, -0.6381072998046875, -0.618011474609375, -0.5979156494140625, -0.57781982421875, -0.5577239990234375, -0.537628173828125, -0.5175323486328125, -0.4974365234375, -0.4773406982421875, -0.457244873046875, -0.4371490478515625, -0.41705322265625, -0.3969573974609375, -0.376861572265625, -0.3567657470703125, -0.336669921875, -0.3165740966796875, -0.296478271484375, -0.2763824462890625, -0.25628662109375, -0.2361907958984375, -0.216094970703125, -0.1959991455078125, -0.1759033203125, -0.1558074951171875, -0.135711669921875, -0.1156158447265625, -0.09552001953125, -0.0754241943359375, -0.055328369140625, -0.0352325439453125, -0.01513671875, 0.0049591064453125, 0.025054931640625, 0.0451507568359375, 0.06524658203125, 0.0853424072265625, 0.105438232421875, 0.1255340576171875, 0.1456298828125, 0.1657257080078125, 0.185821533203125, 0.2059173583984375, 0.22601318359375, 0.2461090087890625, 0.266204833984375, 0.2863006591796875, 0.306396484375, 0.3264923095703125, 0.346588134765625, 0.3666839599609375, 0.38677978515625, 0.4068756103515625, 0.426971435546875, 0.4470672607421875, 0.4671630859375, 0.4872589111328125, 0.507354736328125, 0.5274505615234375, 0.54754638671875, 0.5676422119140625, 0.587738037109375, 0.6078338623046875, 0.6279296875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 4.0, 9.0, 15.0, 11.0, 12.0, 9.0, 17.0, 21.0, 30.0, 33.0, 31.0, 33.0, 50.0, 44.0, 55.0, 56.0, 71.0, 58.0, 51.0, 50.0, 55.0, 42.0, 35.0, 38.0, 14.0, 20.0, 21.0, 17.0, 20.0, 17.0, 11.0, 5.0, 5.0, 7.0, 10.0, 5.0, 3.0, 0.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01739501953125, -0.016748428344726562, -0.016101837158203125, -0.015455245971679688, -0.01480865478515625, -0.014162063598632812, -0.013515472412109375, -0.012868881225585938, -0.0122222900390625, -0.011575698852539062, -0.010929107666015625, -0.010282516479492188, -0.00963592529296875, -0.008989334106445312, -0.008342742919921875, -0.0076961517333984375, -0.007049560546875, -0.0064029693603515625, -0.005756378173828125, -0.0051097869873046875, -0.00446319580078125, -0.0038166046142578125, -0.003170013427734375, -0.0025234222412109375, -0.0018768310546875, -0.0012302398681640625, -0.000583648681640625, 6.29425048828125e-05, 0.00070953369140625, 0.0013561248779296875, 0.002002716064453125, 0.0026493072509765625, 0.0032958984375, 0.0039424896240234375, 0.004589080810546875, 0.0052356719970703125, 0.00588226318359375, 0.0065288543701171875, 0.007175445556640625, 0.007822036743164062, 0.0084686279296875, 0.009115219116210938, 0.009761810302734375, 0.010408401489257812, 0.01105499267578125, 0.011701583862304688, 0.012348175048828125, 0.012994766235351562, 0.013641357421875, 0.014287948608398438, 0.014934539794921875, 0.015581130981445312, 0.01622772216796875, 0.016874313354492188, 0.017520904541015625, 0.018167495727539062, 0.0188140869140625, 0.019460678100585938, 0.020107269287109375, 0.020753860473632812, 0.02140045166015625, 0.022047042846679688, 0.022693634033203125, 0.023340225219726562, 0.02398681640625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 10.0, 5.0, 1.0, 5.0, 11.0, 13.0, 12.0, 15.0, 13.0, 18.0, 33.0, 45.0, 43.0, 67.0, 60.0, 85.0, 145.0, 204.0, 223.0, 400.0, 618.0, 1616.0, 955279.0, 86654.0, 1140.0, 583.0, 333.0, 230.0, 156.0, 129.0, 107.0, 59.0, 51.0, 43.0, 31.0, 29.0, 20.0, 21.0, 11.0, 11.0, 8.0, 7.0, 4.0, 6.0, 5.0, 1.0, 0.0, 5.0, 1.0, 3.0], "bins": [-0.387939453125, -0.3774147033691406, -0.36688995361328125, -0.3563652038574219, -0.3458404541015625, -0.3353157043457031, -0.32479095458984375, -0.3142662048339844, -0.303741455078125, -0.2932167053222656, -0.28269195556640625, -0.2721672058105469, -0.2616424560546875, -0.2511177062988281, -0.24059295654296875, -0.23006820678710938, -0.21954345703125, -0.20901870727539062, -0.19849395751953125, -0.18796920776367188, -0.1774444580078125, -0.16691970825195312, -0.15639495849609375, -0.14587020874023438, -0.135345458984375, -0.12482070922851562, -0.11429595947265625, -0.10377120971679688, -0.0932464599609375, -0.08272171020507812, -0.07219696044921875, -0.061672210693359375, -0.0511474609375, -0.040622711181640625, -0.03009796142578125, -0.019573211669921875, -0.0090484619140625, 0.001476287841796875, 0.01200103759765625, 0.022525787353515625, 0.033050537109375, 0.043575286865234375, 0.05410003662109375, 0.06462478637695312, 0.0751495361328125, 0.08567428588867188, 0.09619903564453125, 0.10672378540039062, 0.11724853515625, 0.12777328491210938, 0.13829803466796875, 0.14882278442382812, 0.1593475341796875, 0.16987228393554688, 0.18039703369140625, 0.19092178344726562, 0.201446533203125, 0.21197128295898438, 0.22249603271484375, 0.23302078247070312, 0.2435455322265625, 0.2540702819824219, 0.26459503173828125, 0.2751197814941406, 0.28564453125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1009.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5187245011329651, -0.5080504417419434, -0.49737638235092163, -0.4867023229598999, -0.4760282635688782, -0.46535417437553406, -0.45468011498451233, -0.4440060555934906, -0.43333199620246887, -0.42265793681144714, -0.4119838774204254, -0.4013098180294037, -0.39063572883605957, -0.37996166944503784, -0.3692876100540161, -0.3586135506629944, -0.34793949127197266, -0.3372654318809509, -0.3265913724899292, -0.31591731309890747, -0.30524325370788574, -0.2945691645145416, -0.2838951051235199, -0.27322104573249817, -0.26254698634147644, -0.2518729269504547, -0.24119886755943298, -0.23052479326725006, -0.21985073387622833, -0.2091766744852066, -0.19850260019302368, -0.18782854080200195, -0.17715445160865784, -0.1664803922176361, -0.15580633282661438, -0.14513225853443146, -0.13445819914340973, -0.123784139752388, -0.11311007291078568, -0.10243600606918335, -0.09176194667816162, -0.08108788728713989, -0.07041382044553757, -0.05973975732922554, -0.04906569421291351, -0.038391631096601486, -0.02771756798028946, -0.017043501138687134, -0.006369441747665405, 0.004304621368646622, 0.014978684484958649, 0.025652747601270676, 0.0363268107175827, 0.04700087383389473, 0.05767493695020676, 0.06834900379180908, 0.07902306318283081, 0.08969712257385254, 0.10037118941545486, 0.11104525625705719, 0.12171931564807892, 0.13239337503910065, 0.14306744933128357, 0.1537415087223053, 0.16441556811332703]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 16.0, 9.0, 25.0, 38.0, 45.0, 51.0, 62.0, 87.0, 98.0, 100.0, 99.0, 90.0, 72.0, 72.0, 46.0, 35.0, 25.0, 20.0, 13.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024046778678894043, -0.022699836641550064, -0.021352892741560936, -0.020005948841571808, -0.01865900680422783, -0.01731206476688385, -0.015965120866894722, -0.014618177898228168, -0.013271234929561615, -0.011924291960895061, -0.010577348992228508, -0.009230406023561954, -0.007883463054895401, -0.0065365200862288475, -0.005189577117562294, -0.0038426341488957405, -0.002495691180229187, -0.0011487482115626335, 0.00019819475710391998, 0.0015451377257704735, 0.002892080694437027, 0.0042390236631035805, 0.005585966631770134, 0.0069329096004366875, 0.008279852569103241, 0.009626795537769794, 0.010973738506436348, 0.012320681475102901, 0.013667624443769455, 0.015014567412436008, 0.016361510381102562, 0.01770845428109169, 0.01905539631843567, 0.020402338355779648, 0.021749282255768776, 0.023096226155757904, 0.024443168193101883, 0.025790110230445862, 0.02713705413043499, 0.028483998030424118, 0.029830940067768097, 0.031177882105112076, 0.032524824142456055, 0.03387176990509033, 0.03521871194243431, 0.03656565397977829, 0.03791259974241257, 0.039259541779756546, 0.040606483817100525, 0.041953425854444504, 0.04330036789178848, 0.04464731365442276, 0.04599425569176674, 0.04734119772911072, 0.048688143491744995, 0.050035085529088974, 0.05138202756643295, 0.05272896960377693, 0.05407591164112091, 0.05542285740375519, 0.05676979944109917, 0.058116741478443146, 0.05946368724107742, 0.0608106292784214, 0.06215757131576538]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 2.0, 6.0, 12.0, 2.0, 11.0, 11.0, 11.0, 15.0, 18.0, 17.0, 13.0, 16.0, 15.0, 24.0, 20.0, 28.0, 30.0, 48.0, 29.0, 35.0, 34.0, 42.0, 42.0, 38.0, 36.0, 47.0, 29.0, 32.0, 38.0, 25.0, 31.0, 35.0, 32.0, 21.0, 22.0, 18.0, 14.0, 19.0, 13.0, 12.0, 6.0, 11.0, 6.0, 6.0, 7.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56640625, -7.31610107421875, -7.0657958984375, -6.81549072265625, -6.565185546875, -6.31488037109375, -6.0645751953125, -5.81427001953125, -5.56396484375, -5.31365966796875, -5.0633544921875, -4.81304931640625, -4.562744140625, -4.31243896484375, -4.0621337890625, -3.81182861328125, -3.5615234375, -3.31121826171875, -3.0609130859375, -2.81060791015625, -2.560302734375, -2.30999755859375, -2.0596923828125, -1.80938720703125, -1.55908203125, -1.30877685546875, -1.0584716796875, -0.80816650390625, -0.557861328125, -0.30755615234375, -0.0572509765625, 0.19305419921875, 0.443359375, 0.69366455078125, 0.9439697265625, 1.19427490234375, 1.444580078125, 1.69488525390625, 1.9451904296875, 2.19549560546875, 2.44580078125, 2.69610595703125, 2.9464111328125, 3.19671630859375, 3.447021484375, 3.69732666015625, 3.9476318359375, 4.19793701171875, 4.4482421875, 4.69854736328125, 4.9488525390625, 5.19915771484375, 5.449462890625, 5.69976806640625, 5.9500732421875, 6.20037841796875, 6.45068359375, 6.70098876953125, 6.9512939453125, 7.20159912109375, 7.451904296875, 7.70220947265625, 7.9525146484375, 8.20281982421875, 8.453125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 9.0, 2.0, 3.0, 5.0, 14.0, 12.0, 17.0, 11.0, 23.0, 28.0, 44.0, 33.0, 73.0, 79.0, 123.0, 231.0, 283.0, 378.0, 594.0, 913.0, 1643.0, 3493.0, 9493.0, 35684.0, 207740.0, 620349.0, 127983.0, 25219.0, 7289.0, 2755.0, 1403.0, 891.0, 496.0, 382.0, 222.0, 181.0, 120.0, 88.0, 54.0, 48.0, 39.0, 24.0, 21.0, 22.0, 16.0, 10.0, 11.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.09375, -13.614013671875, -13.13427734375, -12.654541015625, -12.1748046875, -11.695068359375, -11.21533203125, -10.735595703125, -10.255859375, -9.776123046875, -9.29638671875, -8.816650390625, -8.3369140625, -7.857177734375, -7.37744140625, -6.897705078125, -6.41796875, -5.938232421875, -5.45849609375, -4.978759765625, -4.4990234375, -4.019287109375, -3.53955078125, -3.059814453125, -2.580078125, -2.100341796875, -1.62060546875, -1.140869140625, -0.6611328125, -0.181396484375, 0.29833984375, 0.778076171875, 1.2578125, 1.737548828125, 2.21728515625, 2.697021484375, 3.1767578125, 3.656494140625, 4.13623046875, 4.615966796875, 5.095703125, 5.575439453125, 6.05517578125, 6.534912109375, 7.0146484375, 7.494384765625, 7.97412109375, 8.453857421875, 8.93359375, 9.413330078125, 9.89306640625, 10.372802734375, 10.8525390625, 11.332275390625, 11.81201171875, 12.291748046875, 12.771484375, 13.251220703125, 13.73095703125, 14.210693359375, 14.6904296875, 15.170166015625, 15.64990234375, 16.129638671875, 16.609375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 11.0, 12.0, 17.0, 9.0, 21.0, 22.0, 26.0, 41.0, 54.0, 60.0, 61.0, 128.0, 343.0, 1625.0, 168.0, 98.0, 67.0, 67.0, 54.0, 38.0, 26.0, 18.0, 25.0, 9.0, 9.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.921875, -30.898193359375, -29.87451171875, -28.850830078125, -27.8271484375, -26.803466796875, -25.77978515625, -24.756103515625, -23.732421875, -22.708740234375, -21.68505859375, -20.661376953125, -19.6376953125, -18.614013671875, -17.59033203125, -16.566650390625, -15.54296875, -14.519287109375, -13.49560546875, -12.471923828125, -11.4482421875, -10.424560546875, -9.40087890625, -8.377197265625, -7.353515625, -6.329833984375, -5.30615234375, -4.282470703125, -3.2587890625, -2.235107421875, -1.21142578125, -0.187744140625, 0.8359375, 1.859619140625, 2.88330078125, 3.906982421875, 4.9306640625, 5.954345703125, 6.97802734375, 8.001708984375, 9.025390625, 10.049072265625, 11.07275390625, 12.096435546875, 13.1201171875, 14.143798828125, 15.16748046875, 16.191162109375, 17.21484375, 18.238525390625, 19.26220703125, 20.285888671875, 21.3095703125, 22.333251953125, 23.35693359375, 24.380615234375, 25.404296875, 26.427978515625, 27.45166015625, 28.475341796875, 29.4990234375, 30.522705078125, 31.54638671875, 32.570068359375, 33.59375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 8.0, 6.0, 12.0, 13.0, 29.0, 39.0, 55.0, 70.0, 135.0, 312.0, 701.0, 3361.0, 3134301.0, 5243.0, 721.0, 304.0, 131.0, 92.0, 38.0, 38.0, 24.0, 16.0, 16.0, 12.0, 9.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.6875, -93.623046875, -90.55859375, -87.494140625, -84.4296875, -81.365234375, -78.30078125, -75.236328125, -72.171875, -69.107421875, -66.04296875, -62.978515625, -59.9140625, -56.849609375, -53.78515625, -50.720703125, -47.65625, -44.591796875, -41.52734375, -38.462890625, -35.3984375, -32.333984375, -29.26953125, -26.205078125, -23.140625, -20.076171875, -17.01171875, -13.947265625, -10.8828125, -7.818359375, -4.75390625, -1.689453125, 1.375, 4.439453125, 7.50390625, 10.568359375, 13.6328125, 16.697265625, 19.76171875, 22.826171875, 25.890625, 28.955078125, 32.01953125, 35.083984375, 38.1484375, 41.212890625, 44.27734375, 47.341796875, 50.40625, 53.470703125, 56.53515625, 59.599609375, 62.6640625, 65.728515625, 68.79296875, 71.857421875, 74.921875, 77.986328125, 81.05078125, 84.115234375, 87.1796875, 90.244140625, 93.30859375, 96.373046875, 99.4375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 16.0, 258.0, 633.0, 101.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-285.83428955078125, -280.3750305175781, -274.9158020019531, -269.45654296875, -263.9972839355469, -258.53802490234375, -253.07879638671875, -247.61953735351562, -242.1602783203125, -236.70103454589844, -231.2417755126953, -225.78253173828125, -220.32327270507812, -214.86402893066406, -209.40478515625, -203.94552612304688, -198.4862823486328, -193.02703857421875, -187.56777954101562, -182.10853576660156, -176.64927673339844, -171.19003295898438, -165.73077392578125, -160.2715301513672, -154.81228637695312, -149.35304260253906, -143.89378356933594, -138.43453979492188, -132.97528076171875, -127.51603698730469, -122.0567855834961, -116.5975341796875, -111.13826751708984, -105.67901611328125, -100.21976470947266, -94.76051330566406, -89.30126953125, -83.84201049804688, -78.38276672363281, -72.92351531982422, -67.46426391601562, -62.00501251220703, -56.54576110839844, -51.08651351928711, -45.627262115478516, -40.16801071166992, -34.708763122558594, -29.24951171875, -23.790260314941406, -18.331008911132812, -12.871759414672852, -7.412509918212891, -1.9532585144042969, 3.505992889404297, 8.965240478515625, 14.424491882324219, 19.883743286132812, 25.342994689941406, 30.802244186401367, 36.26149368286133, 41.72074508666992, 47.179996490478516, 52.639244079589844, 58.09849548339844, 63.55774688720703]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 3.0, 12.0, 7.0, 12.0, 11.0, 11.0, 15.0, 18.0, 26.0, 28.0, 27.0, 33.0, 41.0, 58.0, 41.0, 50.0, 49.0, 35.0, 52.0, 45.0, 39.0, 49.0, 56.0, 46.0, 28.0, 25.0, 29.0, 27.0, 23.0, 18.0, 21.0, 12.0, 13.0, 6.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.18035125732422, -55.20181655883789, -53.22328186035156, -51.24474334716797, -49.26620864868164, -47.28767395019531, -45.309139251708984, -43.330604553222656, -41.35206604003906, -39.373531341552734, -37.394996643066406, -35.41645812988281, -33.437923431396484, -31.459388732910156, -29.480854034423828, -27.502317428588867, -25.52378273010254, -23.54524803161621, -21.56671142578125, -19.588176727294922, -17.60964012145996, -15.631105422973633, -13.652569770812988, -11.674034118652344, -9.6954984664917, -7.716962814331055, -5.73842716217041, -3.759891986846924, -1.7813563346862793, 0.19717884063720703, 2.1757144927978516, 4.154250144958496, 6.132785797119141, 8.111321449279785, 10.08985710144043, 12.068391799926758, 14.046928405761719, 16.025463104248047, 18.003997802734375, 19.982534408569336, 21.961071014404297, 23.939605712890625, 25.918142318725586, 27.896677017211914, 29.875213623046875, 31.853748321533203, 33.83228302001953, 35.810821533203125, 37.78935241699219, 39.767887115478516, 41.746421813964844, 43.72496032714844, 45.703495025634766, 47.682029724121094, 49.66056442260742, 51.63909912109375, 53.617637634277344, 55.59617233276367, 57.57470703125, 59.553245544433594, 61.53178024291992, 63.51031494140625, 65.48885345458984, 67.4673843383789, 69.4459228515625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 3.0, 10.0, 10.0, 5.0, 14.0, 12.0, 15.0, 17.0, 24.0, 20.0, 26.0, 31.0, 24.0, 39.0, 30.0, 37.0, 38.0, 48.0, 47.0, 38.0, 45.0, 47.0, 34.0, 52.0, 47.0, 38.0, 43.0, 29.0, 24.0, 24.0, 16.0, 28.0, 16.0, 10.0, 14.0, 11.0, 8.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5703125, -9.2359619140625, -8.901611328125, -8.5672607421875, -8.23291015625, -7.8985595703125, -7.564208984375, -7.2298583984375, -6.8955078125, -6.5611572265625, -6.226806640625, -5.8924560546875, -5.55810546875, -5.2237548828125, -4.889404296875, -4.5550537109375, -4.220703125, -3.8863525390625, -3.552001953125, -3.2176513671875, -2.88330078125, -2.5489501953125, -2.214599609375, -1.8802490234375, -1.5458984375, -1.2115478515625, -0.877197265625, -0.5428466796875, -0.20849609375, 0.1258544921875, 0.460205078125, 0.7945556640625, 1.12890625, 1.4632568359375, 1.797607421875, 2.1319580078125, 2.46630859375, 2.8006591796875, 3.135009765625, 3.4693603515625, 3.8037109375, 4.1380615234375, 4.472412109375, 4.8067626953125, 5.14111328125, 5.4754638671875, 5.809814453125, 6.1441650390625, 6.478515625, 6.8128662109375, 7.147216796875, 7.4815673828125, 7.81591796875, 8.1502685546875, 8.484619140625, 8.8189697265625, 9.1533203125, 9.4876708984375, 9.822021484375, 10.1563720703125, 10.49072265625, 10.8250732421875, 11.159423828125, 11.4937744140625, 11.828125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 5.0, 9.0, 14.0, 12.0, 12.0, 17.0, 27.0, 16.0, 29.0, 35.0, 54.0, 55.0, 90.0, 102.0, 145.0, 166.0, 265.0, 319.0, 519.0, 758.0, 1525.0, 5533.0, 95100.0, 3599675.0, 473184.0, 11430.0, 2122.0, 1032.0, 585.0, 363.0, 277.0, 199.0, 137.0, 107.0, 91.0, 66.0, 39.0, 38.0, 27.0, 22.0, 17.0, 14.0, 15.0, 9.0, 11.0, 11.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.71875, -45.02978515625, -43.3408203125, -41.65185546875, -39.962890625, -38.27392578125, -36.5849609375, -34.89599609375, -33.20703125, -31.51806640625, -29.8291015625, -28.14013671875, -26.451171875, -24.76220703125, -23.0732421875, -21.38427734375, -19.6953125, -18.00634765625, -16.3173828125, -14.62841796875, -12.939453125, -11.25048828125, -9.5615234375, -7.87255859375, -6.18359375, -4.49462890625, -2.8056640625, -1.11669921875, 0.572265625, 2.26123046875, 3.9501953125, 5.63916015625, 7.328125, 9.01708984375, 10.7060546875, 12.39501953125, 14.083984375, 15.77294921875, 17.4619140625, 19.15087890625, 20.83984375, 22.52880859375, 24.2177734375, 25.90673828125, 27.595703125, 29.28466796875, 30.9736328125, 32.66259765625, 34.3515625, 36.04052734375, 37.7294921875, 39.41845703125, 41.107421875, 42.79638671875, 44.4853515625, 46.17431640625, 47.86328125, 49.55224609375, 51.2412109375, 52.93017578125, 54.619140625, 56.30810546875, 57.9970703125, 59.68603515625, 61.375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 10.0, 2.0, 11.0, 5.0, 13.0, 12.0, 28.0, 44.0, 58.0, 72.0, 107.0, 151.0, 219.0, 304.0, 432.0, 540.0, 494.0, 420.0, 314.0, 209.0, 167.0, 120.0, 78.0, 64.0, 47.0, 34.0, 24.0, 17.0, 13.0, 11.0, 7.0, 12.0, 10.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.078125, -13.573974609375, -13.06982421875, -12.565673828125, -12.0615234375, -11.557373046875, -11.05322265625, -10.549072265625, -10.044921875, -9.540771484375, -9.03662109375, -8.532470703125, -8.0283203125, -7.524169921875, -7.02001953125, -6.515869140625, -6.01171875, -5.507568359375, -5.00341796875, -4.499267578125, -3.9951171875, -3.490966796875, -2.98681640625, -2.482666015625, -1.978515625, -1.474365234375, -0.97021484375, -0.466064453125, 0.0380859375, 0.542236328125, 1.04638671875, 1.550537109375, 2.0546875, 2.558837890625, 3.06298828125, 3.567138671875, 4.0712890625, 4.575439453125, 5.07958984375, 5.583740234375, 6.087890625, 6.592041015625, 7.09619140625, 7.600341796875, 8.1044921875, 8.608642578125, 9.11279296875, 9.616943359375, 10.12109375, 10.625244140625, 11.12939453125, 11.633544921875, 12.1376953125, 12.641845703125, 13.14599609375, 13.650146484375, 14.154296875, 14.658447265625, 15.16259765625, 15.666748046875, 16.1708984375, 16.675048828125, 17.17919921875, 17.683349609375, 18.1875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 10.0, 19.0, 16.0, 26.0, 43.0, 48.0, 89.0, 115.0, 227.0, 426.0, 819.0, 1692.0, 3974.0, 11146.0, 41013.0, 207800.0, 1617570.0, 1980800.0, 258461.0, 48738.0, 12986.0, 4486.0, 1792.0, 876.0, 425.0, 277.0, 144.0, 73.0, 65.0, 47.0, 25.0, 9.0, 12.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.21875, -15.696533203125, -15.17431640625, -14.652099609375, -14.1298828125, -13.607666015625, -13.08544921875, -12.563232421875, -12.041015625, -11.518798828125, -10.99658203125, -10.474365234375, -9.9521484375, -9.429931640625, -8.90771484375, -8.385498046875, -7.86328125, -7.341064453125, -6.81884765625, -6.296630859375, -5.7744140625, -5.252197265625, -4.72998046875, -4.207763671875, -3.685546875, -3.163330078125, -2.64111328125, -2.118896484375, -1.5966796875, -1.074462890625, -0.55224609375, -0.030029296875, 0.4921875, 1.014404296875, 1.53662109375, 2.058837890625, 2.5810546875, 3.103271484375, 3.62548828125, 4.147705078125, 4.669921875, 5.192138671875, 5.71435546875, 6.236572265625, 6.7587890625, 7.281005859375, 7.80322265625, 8.325439453125, 8.84765625, 9.369873046875, 9.89208984375, 10.414306640625, 10.9365234375, 11.458740234375, 11.98095703125, 12.503173828125, 13.025390625, 13.547607421875, 14.06982421875, 14.592041015625, 15.1142578125, 15.636474609375, 16.15869140625, 16.680908203125, 17.203125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 12.0, 27.0, 37.0, 55.0, 65.0, 85.0, 98.0, 127.0, 109.0, 88.0, 63.0, 57.0, 48.0, 27.0, 27.0, 18.0, 13.0, 9.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.4036865234375, -79.60592651367188, -75.80817413330078, -72.01041412353516, -68.21266174316406, -64.41490173339844, -60.61714553833008, -56.81938934326172, -53.021629333496094, -49.223873138427734, -45.426116943359375, -41.62835693359375, -37.83060073852539, -34.03284454345703, -30.235088348388672, -26.43733024597168, -22.639575958251953, -18.841819763183594, -15.044061660766602, -11.246305465698242, -7.448548316955566, -3.6507911682128906, 0.14696502685546875, 3.944723129272461, 7.74247932434082, 11.540236473083496, 15.337993621826172, 19.13574981689453, 22.93350601196289, 26.731264114379883, 30.529020309448242, 34.326778411865234, 38.124534606933594, 41.92229080200195, 45.72004699707031, 49.51780700683594, 53.3155632019043, 57.113319396972656, 60.911075592041016, 64.70883178710938, 68.506591796875, 72.30435180664062, 76.10210418701172, 79.89986419677734, 83.69761657714844, 87.49537658691406, 91.29313659667969, 95.09088897705078, 98.88864135742188, 102.6864013671875, 106.4841537475586, 110.28191375732422, 114.07966613769531, 117.87742614746094, 121.67518615722656, 125.47293853759766, 129.2707061767578, 133.06846618652344, 136.86622619628906, 140.66397094726562, 144.46173095703125, 148.25949096679688, 152.0572509765625, 155.85501098632812, 159.6527557373047]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 5.0, 7.0, 7.0, 5.0, 10.0, 13.0, 13.0, 20.0, 14.0, 20.0, 18.0, 15.0, 26.0, 29.0, 30.0, 32.0, 19.0, 32.0, 35.0, 41.0, 43.0, 37.0, 23.0, 37.0, 44.0, 36.0, 47.0, 34.0, 33.0, 37.0, 32.0, 23.0, 19.0, 23.0, 32.0, 15.0, 17.0, 16.0, 10.0, 12.0, 5.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-58.68937301635742, -56.8261604309082, -54.96294403076172, -53.0997314453125, -51.23651885986328, -49.37330627441406, -47.51008987426758, -45.64687728881836, -43.783660888671875, -41.920448303222656, -40.05723190307617, -38.19401931762695, -36.330806732177734, -34.46759033203125, -32.60437774658203, -30.741165161132812, -28.877952575683594, -27.014738082885742, -25.151525497436523, -23.288311004638672, -21.425098419189453, -19.5618839263916, -17.69866943359375, -15.835455894470215, -13.97224235534668, -12.109028816223145, -10.24581527709961, -8.382600784301758, -6.519387245178223, -4.6561737060546875, -2.792959213256836, -0.9297456741333008, 0.9334640502929688, 2.796677827835083, 4.659891605377197, 6.523105621337891, 8.386319160461426, 10.249532699584961, 12.112747192382812, 13.975960731506348, 15.839174270629883, 17.702388763427734, 19.565601348876953, 21.428815841674805, 23.292030334472656, 25.155242919921875, 27.018457412719727, 28.881671905517578, 30.744884490966797, 32.608097076416016, 34.4713134765625, 36.33452606201172, 38.19773864746094, 40.060951232910156, 41.92416763305664, 43.78738021850586, 45.650596618652344, 47.51380920410156, 49.37702560424805, 51.240238189697266, 53.103450775146484, 54.96666717529297, 56.82987976074219, 58.693092346191406, 60.556304931640625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 5.0, 4.0, 4.0, 3.0, 15.0, 12.0, 8.0, 17.0, 29.0, 19.0, 27.0, 34.0, 38.0, 28.0, 47.0, 50.0, 66.0, 49.0, 44.0, 52.0, 44.0, 68.0, 39.0, 58.0, 42.0, 27.0, 37.0, 29.0, 22.0, 24.0, 17.0, 17.0, 9.0, 4.0, 4.0, 4.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0], "bins": [-171.0, -166.6064453125, -162.212890625, -157.8193359375, -153.42578125, -149.0322265625, -144.638671875, -140.2451171875, -135.8515625, -131.4580078125, -127.064453125, -122.6708984375, -118.27734375, -113.8837890625, -109.490234375, -105.0966796875, -100.703125, -96.3095703125, -91.916015625, -87.5224609375, -83.12890625, -78.7353515625, -74.341796875, -69.9482421875, -65.5546875, -61.1611328125, -56.767578125, -52.3740234375, -47.98046875, -43.5869140625, -39.193359375, -34.7998046875, -30.40625, -26.0126953125, -21.619140625, -17.2255859375, -12.83203125, -8.4384765625, -4.044921875, 0.3486328125, 4.7421875, 9.1357421875, 13.529296875, 17.9228515625, 22.31640625, 26.7099609375, 31.103515625, 35.4970703125, 39.890625, 44.2841796875, 48.677734375, 53.0712890625, 57.46484375, 61.8583984375, 66.251953125, 70.6455078125, 75.0390625, 79.4326171875, 83.826171875, 88.2197265625, 92.61328125, 97.0068359375, 101.400390625, 105.7939453125, 110.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 7.0, 10.0, 25.0, 26.0, 54.0, 51.0, 113.0, 148.0, 245.0, 405.0, 639.0, 958.0, 1653.0, 2450.0, 4136.0, 6422.0, 10541.0, 16673.0, 27076.0, 43852.0, 69619.0, 104012.0, 142788.0, 162185.0, 146493.0, 110477.0, 73877.0, 46944.0, 29143.0, 17865.0, 11241.0, 6807.0, 4269.0, 2774.0, 1717.0, 1046.0, 660.0, 433.0, 275.0, 167.0, 113.0, 57.0, 32.0, 26.0, 15.0, 16.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0], "bins": [-7.95703125, -7.73333740234375, -7.5096435546875, -7.28594970703125, -7.062255859375, -6.83856201171875, -6.6148681640625, -6.39117431640625, -6.16748046875, -5.94378662109375, -5.7200927734375, -5.49639892578125, -5.272705078125, -5.04901123046875, -4.8253173828125, -4.60162353515625, -4.3779296875, -4.15423583984375, -3.9305419921875, -3.70684814453125, -3.483154296875, -3.25946044921875, -3.0357666015625, -2.81207275390625, -2.58837890625, -2.36468505859375, -2.1409912109375, -1.91729736328125, -1.693603515625, -1.46990966796875, -1.2462158203125, -1.02252197265625, -0.798828125, -0.57513427734375, -0.3514404296875, -0.12774658203125, 0.095947265625, 0.31964111328125, 0.5433349609375, 0.76702880859375, 0.99072265625, 1.21441650390625, 1.4381103515625, 1.66180419921875, 1.885498046875, 2.10919189453125, 2.3328857421875, 2.55657958984375, 2.7802734375, 3.00396728515625, 3.2276611328125, 3.45135498046875, 3.675048828125, 3.89874267578125, 4.1224365234375, 4.34613037109375, 4.56982421875, 4.79351806640625, 5.0172119140625, 5.24090576171875, 5.464599609375, 5.68829345703125, 5.9119873046875, 6.13568115234375, 6.359375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 9.0, 9.0, 11.0, 18.0, 9.0, 20.0, 26.0, 24.0, 29.0, 31.0, 32.0, 41.0, 35.0, 48.0, 47.0, 42.0, 42.0, 1075.0, 50.0, 33.0, 42.0, 33.0, 41.0, 38.0, 39.0, 32.0, 23.0, 20.0, 15.0, 26.0, 17.0, 13.0, 12.0, 7.0, 11.0, 3.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.1875, -79.7236328125, -77.259765625, -74.7958984375, -72.33203125, -69.8681640625, -67.404296875, -64.9404296875, -62.4765625, -60.0126953125, -57.548828125, -55.0849609375, -52.62109375, -50.1572265625, -47.693359375, -45.2294921875, -42.765625, -40.3017578125, -37.837890625, -35.3740234375, -32.91015625, -30.4462890625, -27.982421875, -25.5185546875, -23.0546875, -20.5908203125, -18.126953125, -15.6630859375, -13.19921875, -10.7353515625, -8.271484375, -5.8076171875, -3.34375, -0.8798828125, 1.583984375, 4.0478515625, 6.51171875, 8.9755859375, 11.439453125, 13.9033203125, 16.3671875, 18.8310546875, 21.294921875, 23.7587890625, 26.22265625, 28.6865234375, 31.150390625, 33.6142578125, 36.078125, 38.5419921875, 41.005859375, 43.4697265625, 45.93359375, 48.3974609375, 50.861328125, 53.3251953125, 55.7890625, 58.2529296875, 60.716796875, 63.1806640625, 65.64453125, 68.1083984375, 70.572265625, 73.0361328125, 75.5]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 9.0, 7.0, 17.0, 27.0, 49.0, 80.0, 118.0, 192.0, 279.0, 495.0, 714.0, 1242.0, 1983.0, 3301.0, 5319.0, 8643.0, 14286.0, 22892.0, 36891.0, 57656.0, 86224.0, 119432.0, 219612.0, 1128267.0, 126755.0, 93361.0, 62517.0, 40782.0, 25630.0, 15620.0, 9562.0, 5901.0, 3632.0, 2134.0, 1363.0, 793.0, 514.0, 316.0, 183.0, 126.0, 75.0, 42.0, 30.0, 29.0, 8.0, 13.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.0234375, -5.8358154296875, -5.648193359375, -5.4605712890625, -5.27294921875, -5.0853271484375, -4.897705078125, -4.7100830078125, -4.5224609375, -4.3348388671875, -4.147216796875, -3.9595947265625, -3.77197265625, -3.5843505859375, -3.396728515625, -3.2091064453125, -3.021484375, -2.8338623046875, -2.646240234375, -2.4586181640625, -2.27099609375, -2.0833740234375, -1.895751953125, -1.7081298828125, -1.5205078125, -1.3328857421875, -1.145263671875, -0.9576416015625, -0.77001953125, -0.5823974609375, -0.394775390625, -0.2071533203125, -0.01953125, 0.1680908203125, 0.355712890625, 0.5433349609375, 0.73095703125, 0.9185791015625, 1.106201171875, 1.2938232421875, 1.4814453125, 1.6690673828125, 1.856689453125, 2.0443115234375, 2.23193359375, 2.4195556640625, 2.607177734375, 2.7947998046875, 2.982421875, 3.1700439453125, 3.357666015625, 3.5452880859375, 3.73291015625, 3.9205322265625, 4.108154296875, 4.2957763671875, 4.4833984375, 4.6710205078125, 4.858642578125, 5.0462646484375, 5.23388671875, 5.4215087890625, 5.609130859375, 5.7967529296875, 5.984375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 6.0, 6.0, 8.0, 6.0, 12.0, 12.0, 12.0, 16.0, 20.0, 10.0, 25.0, 23.0, 17.0, 19.0, 23.0, 38.0, 53.0, 55.0, 79.0, 84.0, 86.0, 69.0, 53.0, 36.0, 26.0, 21.0, 19.0, 11.0, 23.0, 27.0, 11.0, 14.0, 13.0, 8.0, 8.0, 15.0, 10.0, 6.0, 5.0, 3.0, 6.0, 5.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10577392578125, -0.10219478607177734, -0.09861564636230469, -0.09503650665283203, -0.09145736694335938, -0.08787822723388672, -0.08429908752441406, -0.0807199478149414, -0.07714080810546875, -0.0735616683959961, -0.06998252868652344, -0.06640338897705078, -0.06282424926757812, -0.05924510955810547, -0.05566596984863281, -0.052086830139160156, -0.0485076904296875, -0.044928550720214844, -0.04134941101074219, -0.03777027130126953, -0.034191131591796875, -0.03061199188232422, -0.027032852172851562, -0.023453712463378906, -0.01987457275390625, -0.016295433044433594, -0.012716293334960938, -0.009137153625488281, -0.005558013916015625, -0.0019788742065429688, 0.0016002655029296875, 0.005179405212402344, 0.008758544921875, 0.012337684631347656, 0.015916824340820312, 0.01949596405029297, 0.023075103759765625, 0.02665424346923828, 0.030233383178710938, 0.033812522888183594, 0.03739166259765625, 0.040970802307128906, 0.04454994201660156, 0.04812908172607422, 0.051708221435546875, 0.05528736114501953, 0.05886650085449219, 0.062445640563964844, 0.0660247802734375, 0.06960391998291016, 0.07318305969238281, 0.07676219940185547, 0.08034133911132812, 0.08392047882080078, 0.08749961853027344, 0.0910787582397461, 0.09465789794921875, 0.0982370376586914, 0.10181617736816406, 0.10539531707763672, 0.10897445678710938, 0.11255359649658203, 0.11613273620605469, 0.11971187591552734, 0.123291015625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 5.0, 6.0, 14.0, 6.0, 21.0, 22.0, 31.0, 30.0, 48.0, 49.0, 65.0, 87.0, 128.0, 130.0, 225.0, 310.0, 527.0, 1154.0, 2600.0, 7148.0, 23433.0, 102715.0, 544910.0, 290304.0, 52270.0, 13791.0, 4489.0, 1730.0, 821.0, 440.0, 247.0, 223.0, 155.0, 96.0, 84.0, 52.0, 34.0, 34.0, 38.0, 19.0, 22.0, 5.0, 13.0, 10.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8046875, -0.7801437377929688, -0.7555999755859375, -0.7310562133789062, -0.706512451171875, -0.6819686889648438, -0.6574249267578125, -0.6328811645507812, -0.60833740234375, -0.5837936401367188, -0.5592498779296875, -0.5347061157226562, -0.510162353515625, -0.48561859130859375, -0.4610748291015625, -0.43653106689453125, -0.4119873046875, -0.38744354248046875, -0.3628997802734375, -0.33835601806640625, -0.313812255859375, -0.28926849365234375, -0.2647247314453125, -0.24018096923828125, -0.21563720703125, -0.19109344482421875, -0.1665496826171875, -0.14200592041015625, -0.117462158203125, -0.09291839599609375, -0.0683746337890625, -0.04383087158203125, -0.019287109375, 0.00525665283203125, 0.0298004150390625, 0.05434417724609375, 0.078887939453125, 0.10343170166015625, 0.1279754638671875, 0.15251922607421875, 0.17706298828125, 0.20160675048828125, 0.2261505126953125, 0.25069427490234375, 0.275238037109375, 0.29978179931640625, 0.3243255615234375, 0.34886932373046875, 0.3734130859375, 0.39795684814453125, 0.4225006103515625, 0.44704437255859375, 0.471588134765625, 0.49613189697265625, 0.5206756591796875, 0.5452194213867188, 0.56976318359375, 0.5943069458007812, 0.6188507080078125, 0.6433944702148438, 0.667938232421875, 0.6924819946289062, 0.7170257568359375, 0.7415695190429688, 0.76611328125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 22.0, 115.0, 417.0, 270.0, 92.0, 39.0, 20.0, 14.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6714964509010315, -0.6480262875556946, -0.6245560646057129, -0.601085901260376, -0.5776157379150391, -0.5541455745697021, -0.5306753516197205, -0.5072051882743835, -0.48373499512672424, -0.46026480197906494, -0.436794638633728, -0.4133244454860687, -0.3898542523384094, -0.3663840889930725, -0.3429138958454132, -0.3194437026977539, -0.295973539352417, -0.2725033462047577, -0.24903318285942078, -0.22556298971176147, -0.20209281146526337, -0.17862263321876526, -0.15515244007110596, -0.13168226182460785, -0.10821208357810974, -0.08474190533161163, -0.06127171963453293, -0.037801533937454224, -0.014331355690956116, 0.009138822555541992, 0.032609015703201294, 0.0560791939496994, 0.07954937219619751, 0.10301955044269562, 0.12648972868919373, 0.14995992183685303, 0.17343010008335114, 0.19690027832984924, 0.22037047147750854, 0.24384064972400665, 0.26731082797050476, 0.29078102111816406, 0.314251184463501, 0.3377213776111603, 0.3611915707588196, 0.3846617341041565, 0.4081319272518158, 0.4316021203994751, 0.455072283744812, 0.4785424768924713, 0.5020126700401306, 0.5254828333854675, 0.5489529967308044, 0.5724232196807861, 0.595893383026123, 0.61936354637146, 0.6428337097167969, 0.6663038730621338, 0.6897740960121155, 0.7132442593574524, 0.7367144227027893, 0.760184645652771, 0.7836548089981079, 0.8071249723434448, 0.8305951952934265]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 6.0, 6.0, 7.0, 11.0, 12.0, 14.0, 18.0, 27.0, 20.0, 22.0, 25.0, 23.0, 35.0, 27.0, 27.0, 31.0, 28.0, 34.0, 36.0, 37.0, 41.0, 40.0, 27.0, 34.0, 43.0, 35.0, 25.0, 26.0, 34.0, 27.0, 32.0, 24.0, 18.0, 21.0, 19.0, 18.0, 16.0, 15.0, 6.0, 9.0, 13.0, 6.0, 4.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.17102372646331787, -0.16614510118961334, -0.1612664759159088, -0.1563878357410431, -0.15150921046733856, -0.14663058519363403, -0.1417519599199295, -0.13687333464622498, -0.13199469447135925, -0.12711606919765472, -0.1222374364733696, -0.11735881119966507, -0.11248017847537994, -0.10760155320167542, -0.10272292792797089, -0.09784430265426636, -0.09296567738056183, -0.0880870521068573, -0.08320841938257217, -0.07832979410886765, -0.07345116138458252, -0.06857253611087799, -0.06369391083717346, -0.058815281838178635, -0.05393665283918381, -0.04905802384018898, -0.04417939484119415, -0.039300769567489624, -0.0344221405684948, -0.02954351156949997, -0.02466488443315029, -0.019786257296800613, -0.014907628297805786, -0.010029000230133533, -0.005150372162461281, -0.00027174409478902817, 0.0046068839728832245, 0.009485512971878052, 0.01436414010822773, 0.019242767244577408, 0.024121396243572235, 0.029000025242567062, 0.03387865424156189, 0.03875727951526642, 0.043635908514261246, 0.04851453751325607, 0.0533931627869606, 0.05827179178595543, 0.06315042078495026, 0.06802904605865479, 0.07290767878293991, 0.07778630405664444, 0.08266493678092957, 0.0875435620546341, 0.09242218732833862, 0.09730081260204315, 0.10217944532632828, 0.1070580706000328, 0.11193670332431793, 0.11681532859802246, 0.12169395387172699, 0.12657257914543152, 0.13145121932029724, 0.13632984459400177, 0.1412084698677063]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 4.0, 5.0, 3.0, 4.0, 13.0, 12.0, 8.0, 19.0, 25.0, 19.0, 28.0, 35.0, 34.0, 28.0, 46.0, 50.0, 67.0, 52.0, 41.0, 54.0, 43.0, 69.0, 40.0, 57.0, 41.0, 27.0, 36.0, 32.0, 22.0, 24.0, 20.0, 14.0, 12.0, 3.0, 4.0, 6.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0], "bins": [-172.0, -167.5927734375, -163.185546875, -158.7783203125, -154.37109375, -149.9638671875, -145.556640625, -141.1494140625, -136.7421875, -132.3349609375, -127.927734375, -123.5205078125, -119.11328125, -114.7060546875, -110.298828125, -105.8916015625, -101.484375, -97.0771484375, -92.669921875, -88.2626953125, -83.85546875, -79.4482421875, -75.041015625, -70.6337890625, -66.2265625, -61.8193359375, -57.412109375, -53.0048828125, -48.59765625, -44.1904296875, -39.783203125, -35.3759765625, -30.96875, -26.5615234375, -22.154296875, -17.7470703125, -13.33984375, -8.9326171875, -4.525390625, -0.1181640625, 4.2890625, 8.6962890625, 13.103515625, 17.5107421875, 21.91796875, 26.3251953125, 30.732421875, 35.1396484375, 39.546875, 43.9541015625, 48.361328125, 52.7685546875, 57.17578125, 61.5830078125, 65.990234375, 70.3974609375, 74.8046875, 79.2119140625, 83.619140625, 88.0263671875, 92.43359375, 96.8408203125, 101.248046875, 105.6552734375, 110.0625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 9.0, 14.0, 19.0, 31.0, 27.0, 46.0, 69.0, 94.0, 141.0, 208.0, 291.0, 482.0, 772.0, 1270.0, 2412.0, 5163.0, 13355.0, 45107.0, 195776.0, 523203.0, 191688.0, 43843.0, 13354.0, 5151.0, 2462.0, 1374.0, 757.0, 483.0, 290.0, 192.0, 135.0, 94.0, 62.0, 50.0, 31.0, 21.0, 14.0, 20.0, 11.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-23.5625, -22.87939453125, -22.1962890625, -21.51318359375, -20.830078125, -20.14697265625, -19.4638671875, -18.78076171875, -18.09765625, -17.41455078125, -16.7314453125, -16.04833984375, -15.365234375, -14.68212890625, -13.9990234375, -13.31591796875, -12.6328125, -11.94970703125, -11.2666015625, -10.58349609375, -9.900390625, -9.21728515625, -8.5341796875, -7.85107421875, -7.16796875, -6.48486328125, -5.8017578125, -5.11865234375, -4.435546875, -3.75244140625, -3.0693359375, -2.38623046875, -1.703125, -1.02001953125, -0.3369140625, 0.34619140625, 1.029296875, 1.71240234375, 2.3955078125, 3.07861328125, 3.76171875, 4.44482421875, 5.1279296875, 5.81103515625, 6.494140625, 7.17724609375, 7.8603515625, 8.54345703125, 9.2265625, 9.90966796875, 10.5927734375, 11.27587890625, 11.958984375, 12.64208984375, 13.3251953125, 14.00830078125, 14.69140625, 15.37451171875, 16.0576171875, 16.74072265625, 17.423828125, 18.10693359375, 18.7900390625, 19.47314453125, 20.15625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 6.0, 14.0, 23.0, 52.0, 60.0, 102.0, 152.0, 2208.0, 140.0, 108.0, 72.0, 52.0, 36.0, 19.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-526.0, -510.828125, -495.65625, -480.484375, -465.3125, -450.140625, -434.96875, -419.796875, -404.625, -389.453125, -374.28125, -359.109375, -343.9375, -328.765625, -313.59375, -298.421875, -283.25, -268.078125, -252.90625, -237.734375, -222.5625, -207.390625, -192.21875, -177.046875, -161.875, -146.703125, -131.53125, -116.359375, -101.1875, -86.015625, -70.84375, -55.671875, -40.5, -25.328125, -10.15625, 5.015625, 20.1875, 35.359375, 50.53125, 65.703125, 80.875, 96.046875, 111.21875, 126.390625, 141.5625, 156.734375, 171.90625, 187.078125, 202.25, 217.421875, 232.59375, 247.765625, 262.9375, 278.109375, 293.28125, 308.453125, 323.625, 338.796875, 353.96875, 369.140625, 384.3125, 399.484375, 414.65625, 429.828125, 445.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 6.0, 8.0, 5.0, 15.0, 33.0, 52.0, 135.0, 261.0, 625.0, 2041.0, 19162.0, 3078045.0, 41481.0, 2509.0, 736.0, 304.0, 132.0, 58.0, 32.0, 17.0, 19.0, 9.0, 4.0, 4.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.5625, -77.8388671875, -75.115234375, -72.3916015625, -69.66796875, -66.9443359375, -64.220703125, -61.4970703125, -58.7734375, -56.0498046875, -53.326171875, -50.6025390625, -47.87890625, -45.1552734375, -42.431640625, -39.7080078125, -36.984375, -34.2607421875, -31.537109375, -28.8134765625, -26.08984375, -23.3662109375, -20.642578125, -17.9189453125, -15.1953125, -12.4716796875, -9.748046875, -7.0244140625, -4.30078125, -1.5771484375, 1.146484375, 3.8701171875, 6.59375, 9.3173828125, 12.041015625, 14.7646484375, 17.48828125, 20.2119140625, 22.935546875, 25.6591796875, 28.3828125, 31.1064453125, 33.830078125, 36.5537109375, 39.27734375, 42.0009765625, 44.724609375, 47.4482421875, 50.171875, 52.8955078125, 55.619140625, 58.3427734375, 61.06640625, 63.7900390625, 66.513671875, 69.2373046875, 71.9609375, 74.6845703125, 77.408203125, 80.1318359375, 82.85546875, 85.5791015625, 88.302734375, 91.0263671875, 93.75]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 11.0, 8.0, 18.0, 17.0, 21.0, 34.0, 53.0, 96.0, 125.0, 142.0, 131.0, 133.0, 75.0, 62.0, 17.0, 18.0, 9.0, 7.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-174.1661834716797, -166.9312744140625, -159.69638061523438, -152.4614715576172, -145.2265625, -137.99166870117188, -130.7567596435547, -123.52185821533203, -116.28695678710938, -109.05205535888672, -101.81715393066406, -94.58224487304688, -87.34734344482422, -80.11244201660156, -72.87753295898438, -65.64263153076172, -58.40773010253906, -51.172828674316406, -43.937923431396484, -36.70301818847656, -29.468116760253906, -22.23321533203125, -14.998310089111328, -7.763404846191406, -0.52850341796875, 6.706399917602539, 13.941303253173828, 21.176206588745117, 28.411109924316406, 35.64601135253906, 42.880916595458984, 50.115821838378906, 57.3507080078125, 64.58560943603516, 71.82051086425781, 79.055419921875, 86.29032135009766, 93.52522277832031, 100.7601318359375, 107.99503326416016, 115.22993469238281, 122.46483612060547, 129.69973754882812, 136.9346466064453, 144.1695556640625, 151.40444946289062, 158.6393585205078, 165.874267578125, 173.10916137695312, 180.3440704345703, 187.57896423339844, 194.81387329101562, 202.04876708984375, 209.28367614746094, 216.51858520507812, 223.75347900390625, 230.98838806152344, 238.22329711914062, 245.45819091796875, 252.69309997558594, 259.9280090332031, 267.16290283203125, 274.3977966308594, 281.6327209472656, 288.86761474609375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 4.0, 1.0, 5.0, 15.0, 10.0, 11.0, 13.0, 18.0, 20.0, 25.0, 27.0, 26.0, 29.0, 37.0, 33.0, 30.0, 35.0, 40.0, 31.0, 47.0, 43.0, 44.0, 45.0, 40.0, 54.0, 40.0, 39.0, 37.0, 23.0, 28.0, 18.0, 22.0, 22.0, 14.0, 8.0, 15.0, 8.0, 10.0, 9.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-207.69728088378906, -201.50135803222656, -195.30543518066406, -189.10951232910156, -182.91358947753906, -176.71766662597656, -170.52174377441406, -164.32582092285156, -158.12989807128906, -151.93397521972656, -145.73805236816406, -139.54212951660156, -133.34620666503906, -127.15028381347656, -120.95436096191406, -114.75843811035156, -108.5625228881836, -102.3666000366211, -96.1706771850586, -89.9747543334961, -83.7788314819336, -77.5829086303711, -71.38699340820312, -65.19107055664062, -58.99514389038086, -52.79922103881836, -46.60329818725586, -40.407379150390625, -34.211456298828125, -28.015531539916992, -21.819610595703125, -15.623687744140625, -9.427764892578125, -3.231842517852783, 2.9640798568725586, 9.160001754760742, 15.355924606323242, 21.551847457885742, 27.74776840209961, 33.94369125366211, 40.13961410522461, 46.33553695678711, 52.53145980834961, 58.727378845214844, 64.92330169677734, 71.11922454833984, 77.31514739990234, 83.51107025146484, 89.70699310302734, 95.90291595458984, 102.09883880615234, 108.29476165771484, 114.49068450927734, 120.68660736083984, 126.88252258300781, 133.0784454345703, 139.2743682861328, 145.4702911376953, 151.6662139892578, 157.8621368408203, 164.0580596923828, 170.2539825439453, 176.4499053955078, 182.6458282470703, 188.8417510986328]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 11.0, 11.0, 25.0, 33.0, 58.0, 87.0, 150.0, 217.0, 308.0, 401.0, 653.0, 990.0, 1702.0, 1040396.0, 1163.0, 776.0, 486.0, 358.0, 261.0, 177.0, 127.0, 77.0, 40.0, 25.0, 12.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.51348876953125, -129.29742431640625, -126.08135986328125, -122.86529541015625, -119.64923095703125, -116.43316650390625, -113.21710968017578, -110.00104522705078, -106.78498077392578, -103.56891632080078, -100.35285186767578, -97.13678741455078, -93.92073059082031, -90.70466613769531, -87.48860168457031, -84.27253723144531, -81.05647277832031, -77.84040832519531, -74.62434387207031, -71.40827941894531, -68.19221496582031, -64.97615051269531, -61.760093688964844, -58.544029235839844, -55.327964782714844, -52.111900329589844, -48.895835876464844, -45.67977523803711, -42.46371078491211, -39.24764633178711, -36.031585693359375, -32.815521240234375, -29.599464416503906, -26.383399963378906, -23.16733741760254, -19.951274871826172, -16.735210418701172, -13.519145965576172, -10.303083419799805, -7.0870208740234375, -3.8709564208984375, -0.6548929214477539, 2.5611705780029297, 5.777234077453613, 8.993297576904297, 12.209362030029297, 15.425424575805664, 18.64148712158203, 21.85755157470703, 25.07361602783203, 28.2896785736084, 31.505741119384766, 34.721805572509766, 37.937870025634766, 41.1539306640625, 44.3699951171875, 47.5860595703125, 50.8021240234375, 54.0181884765625, 57.234249114990234, 60.450313568115234, 63.666378021240234, 66.88243865966797, 70.09850311279297, 73.31456756591797]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 9.0, 8.0, 4.0, 11.0, 18.0, 19.0, 63.0, 163.0, 51462052.0, 643.0, 65.0, 36.0, 14.0, 5.0, 4.0, 2.0, 4.0, 5.0, 3.0, 4.0, 2.0, 8.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6248.0, -5946.72509765625, -5645.45068359375, -5344.17578125, -5042.9013671875, -4741.62646484375, -4440.3515625, -4139.0771484375, -3837.802490234375, -3536.52783203125, -3235.253173828125, -2933.978515625, -2632.70361328125, -2331.42919921875, -2030.154296875, -1728.879638671875, -1427.60498046875, -1126.330322265625, -825.0556030273438, -523.7808837890625, -222.5062255859375, 78.7684326171875, 380.043212890625, 681.31787109375, 982.592529296875, 1283.8671875, 1585.141845703125, 1886.4166259765625, 2187.69140625, 2488.9658203125, 2790.24072265625, 3091.515380859375, 3392.7900390625, 3694.064697265625, 3995.33935546875, 4296.6142578125, 4597.888671875, 4899.16357421875, 5200.4384765625, 5501.712890625, 5802.9873046875, 6104.26220703125, 6405.53662109375, 6706.8115234375, 7008.0859375, 7309.36083984375, 7610.6357421875, 7911.91015625, 8213.185546875, 8514.4599609375, 8815.7353515625, 9117.009765625, 9418.2841796875, 9719.55859375, 10020.833984375, 10322.1083984375, 10623.3828125, 10924.6572265625, 11225.9326171875, 11527.20703125, 11828.4814453125, 12129.755859375, 12431.03125, 12732.3056640625, 13033.580078125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 10.0, 12.0, 26.0, 34.0, 51.0, 88.0, 110.0, 177.0, 277.0, 464.0, 706.0, 1089.0, 1560.0, 2528.0, 4045.0, 6350.0, 10070.0, 15898.0, 25562.0, 41257.0, 65795.0, 103567.0, 157792.0, 231004.0, 318029.0, 459832.0, 3435481.0, 441627.0, 313602.0, 227143.0, 153853.0, 101184.0, 63968.0, 40379.0, 25252.0, 15840.0, 9929.0, 6193.0, 3903.0, 2408.0, 1540.0, 987.0, 651.0, 410.0, 265.0, 178.0, 113.0, 66.0, 43.0, 40.0, 20.0, 11.0, 5.0, 3.0, 7.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0], "bins": [-2.146484375, -2.07366943359375, -2.0008544921875, -1.92803955078125, -1.855224609375, -1.78240966796875, -1.7095947265625, -1.63677978515625, -1.56396484375, -1.49114990234375, -1.4183349609375, -1.34552001953125, -1.272705078125, -1.19989013671875, -1.1270751953125, -1.05426025390625, -0.9814453125, -0.90863037109375, -0.8358154296875, -0.76300048828125, -0.690185546875, -0.61737060546875, -0.5445556640625, -0.47174072265625, -0.39892578125, -0.32611083984375, -0.2532958984375, -0.18048095703125, -0.107666015625, -0.03485107421875, 0.0379638671875, 0.11077880859375, 0.18359375, 0.25640869140625, 0.3292236328125, 0.40203857421875, 0.474853515625, 0.54766845703125, 0.6204833984375, 0.69329833984375, 0.76611328125, 0.83892822265625, 0.9117431640625, 0.98455810546875, 1.057373046875, 1.13018798828125, 1.2030029296875, 1.27581787109375, 1.3486328125, 1.42144775390625, 1.4942626953125, 1.56707763671875, 1.639892578125, 1.71270751953125, 1.7855224609375, 1.85833740234375, 1.93115234375, 2.00396728515625, 2.0767822265625, 2.14959716796875, 2.222412109375, 2.29522705078125, 2.3680419921875, 2.44085693359375, 2.513671875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 5.0, 2.0, 5.0, 6.0, 3.0, 4.0, 13.0, 7.0, 17.0, 20.0, 14.0, 20.0, 29.0, 28.0, 26.0, 41.0, 33.0, 47.0, 32.0, 32.0, 42.0, 59.0, 558.0, 531.0, 28.0, 46.0, 50.0, 36.0, 45.0, 34.0, 28.0, 29.0, 22.0, 26.0, 18.0, 15.0, 15.0, 10.0, 15.0, 9.0, 5.0, 5.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.859375, -25.993896484375, -25.12841796875, -24.262939453125, -23.3974609375, -22.531982421875, -21.66650390625, -20.801025390625, -19.935546875, -19.070068359375, -18.20458984375, -17.339111328125, -16.4736328125, -15.608154296875, -14.74267578125, -13.877197265625, -13.01171875, -12.146240234375, -11.28076171875, -10.415283203125, -9.5498046875, -8.684326171875, -7.81884765625, -6.953369140625, -6.087890625, -5.222412109375, -4.35693359375, -3.491455078125, -2.6259765625, -1.760498046875, -0.89501953125, -0.029541015625, 0.8359375, 1.701416015625, 2.56689453125, 3.432373046875, 4.2978515625, 5.163330078125, 6.02880859375, 6.894287109375, 7.759765625, 8.625244140625, 9.49072265625, 10.356201171875, 11.2216796875, 12.087158203125, 12.95263671875, 13.818115234375, 14.68359375, 15.549072265625, 16.41455078125, 17.280029296875, 18.1455078125, 19.010986328125, 19.87646484375, 20.741943359375, 21.607421875, 22.472900390625, 23.33837890625, 24.203857421875, 25.0693359375, 25.934814453125, 26.80029296875, 27.665771484375, 28.53125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 14.0, 14.0, 33.0, 36.0, 57.0, 76.0, 105.0, 149.0, 229.0, 334.0, 548.0, 768.0, 1180.0, 1856.0, 2923.0, 4560.0, 7147.0, 11552.0, 18610.0, 30353.0, 47955.0, 76524.0, 118872.0, 180937.0, 259634.0, 353130.0, 1009593.0, 2899082.0, 395954.0, 289040.0, 204256.0, 137012.0, 88227.0, 55688.0, 35267.0, 21977.0, 13580.0, 8904.0, 5510.0, 3503.0, 2185.0, 1418.0, 957.0, 616.0, 394.0, 245.0, 171.0, 102.0, 66.0, 48.0, 23.0, 14.0, 6.0, 1.0, 3.0, 4.0, 1.0], "bins": [-2.498046875, -2.4249267578125, -2.351806640625, -2.2786865234375, -2.20556640625, -2.1324462890625, -2.059326171875, -1.9862060546875, -1.9130859375, -1.8399658203125, -1.766845703125, -1.6937255859375, -1.62060546875, -1.5474853515625, -1.474365234375, -1.4012451171875, -1.328125, -1.2550048828125, -1.181884765625, -1.1087646484375, -1.03564453125, -0.9625244140625, -0.889404296875, -0.8162841796875, -0.7431640625, -0.6700439453125, -0.596923828125, -0.5238037109375, -0.45068359375, -0.3775634765625, -0.304443359375, -0.2313232421875, -0.158203125, -0.0850830078125, -0.011962890625, 0.0611572265625, 0.13427734375, 0.2073974609375, 0.280517578125, 0.3536376953125, 0.4267578125, 0.4998779296875, 0.572998046875, 0.6461181640625, 0.71923828125, 0.7923583984375, 0.865478515625, 0.9385986328125, 1.01171875, 1.0848388671875, 1.157958984375, 1.2310791015625, 1.30419921875, 1.3773193359375, 1.450439453125, 1.5235595703125, 1.5966796875, 1.6697998046875, 1.742919921875, 1.8160400390625, 1.88916015625, 1.9622802734375, 2.035400390625, 2.1085205078125, 2.181640625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 16.0, 5.0, 14.0, 23.0, 24.0, 24.0, 26.0, 33.0, 27.0, 31.0, 36.0, 48.0, 48.0, 44.0, 40.0, 183.0, 922.0, 50.0, 58.0, 43.0, 39.0, 45.0, 28.0, 29.0, 31.0, 28.0, 23.0, 19.0, 19.0, 16.0, 7.0, 9.0, 7.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-29.1875, -28.361572265625, -27.53564453125, -26.709716796875, -25.8837890625, -25.057861328125, -24.23193359375, -23.406005859375, -22.580078125, -21.754150390625, -20.92822265625, -20.102294921875, -19.2763671875, -18.450439453125, -17.62451171875, -16.798583984375, -15.97265625, -15.146728515625, -14.32080078125, -13.494873046875, -12.6689453125, -11.843017578125, -11.01708984375, -10.191162109375, -9.365234375, -8.539306640625, -7.71337890625, -6.887451171875, -6.0615234375, -5.235595703125, -4.40966796875, -3.583740234375, -2.7578125, -1.931884765625, -1.10595703125, -0.280029296875, 0.5458984375, 1.371826171875, 2.19775390625, 3.023681640625, 3.849609375, 4.675537109375, 5.50146484375, 6.327392578125, 7.1533203125, 7.979248046875, 8.80517578125, 9.631103515625, 10.45703125, 11.282958984375, 12.10888671875, 12.934814453125, 13.7607421875, 14.586669921875, 15.41259765625, 16.238525390625, 17.064453125, 17.890380859375, 18.71630859375, 19.542236328125, 20.3681640625, 21.194091796875, 22.02001953125, 22.845947265625, 23.671875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 2.0, 5.0, 6.0, 8.0, 8.0, 16.0, 25.0, 34.0, 36.0, 54.0, 72.0, 118.0, 142.0, 181.0, 231.0, 299.0, 446.0, 600.0, 986.0, 1613.0, 2867.0, 5218.0, 10681.0, 23351.0, 54454.0, 132570.0, 5705561.0, 211435.0, 76886.0, 32775.0, 14282.0, 6767.0, 3562.0, 2028.0, 1274.0, 827.0, 572.0, 376.0, 260.0, 186.0, 154.0, 119.0, 84.0, 69.0, 42.0, 33.0, 30.0, 22.0, 23.0, 9.0, 9.0, 5.0, 5.0, 3.0, 5.0, 4.0, 6.0, 2.0], "bins": [-11.109375, -10.7696533203125, -10.429931640625, -10.0902099609375, -9.75048828125, -9.4107666015625, -9.071044921875, -8.7313232421875, -8.3916015625, -8.0518798828125, -7.712158203125, -7.3724365234375, -7.03271484375, -6.6929931640625, -6.353271484375, -6.0135498046875, -5.673828125, -5.3341064453125, -4.994384765625, -4.6546630859375, -4.31494140625, -3.9752197265625, -3.635498046875, -3.2957763671875, -2.9560546875, -2.6163330078125, -2.276611328125, -1.9368896484375, -1.59716796875, -1.2574462890625, -0.917724609375, -0.5780029296875, -0.23828125, 0.1014404296875, 0.441162109375, 0.7808837890625, 1.12060546875, 1.4603271484375, 1.800048828125, 2.1397705078125, 2.4794921875, 2.8192138671875, 3.158935546875, 3.4986572265625, 3.83837890625, 4.1781005859375, 4.517822265625, 4.8575439453125, 5.197265625, 5.5369873046875, 5.876708984375, 6.2164306640625, 6.55615234375, 6.8958740234375, 7.235595703125, 7.5753173828125, 7.9150390625, 8.2547607421875, 8.594482421875, 8.9342041015625, 9.27392578125, 9.6136474609375, 9.953369140625, 10.2930908203125, 10.6328125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 10.0, 11.0, 17.0, 15.0, 22.0, 19.0, 27.0, 17.0, 31.0, 33.0, 49.0, 34.0, 42.0, 44.0, 43.0, 86.0, 894.0, 182.0, 46.0, 54.0, 46.0, 34.0, 33.0, 33.0, 21.0, 27.0, 21.0, 26.0, 13.0, 11.0, 15.0, 18.0, 12.0, 6.0, 11.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.453125, -21.768310546875, -21.08349609375, -20.398681640625, -19.7138671875, -19.029052734375, -18.34423828125, -17.659423828125, -16.974609375, -16.289794921875, -15.60498046875, -14.920166015625, -14.2353515625, -13.550537109375, -12.86572265625, -12.180908203125, -11.49609375, -10.811279296875, -10.12646484375, -9.441650390625, -8.7568359375, -8.072021484375, -7.38720703125, -6.702392578125, -6.017578125, -5.332763671875, -4.64794921875, -3.963134765625, -3.2783203125, -2.593505859375, -1.90869140625, -1.223876953125, -0.5390625, 0.145751953125, 0.83056640625, 1.515380859375, 2.2001953125, 2.885009765625, 3.56982421875, 4.254638671875, 4.939453125, 5.624267578125, 6.30908203125, 6.993896484375, 7.6787109375, 8.363525390625, 9.04833984375, 9.733154296875, 10.41796875, 11.102783203125, 11.78759765625, 12.472412109375, 13.1572265625, 13.842041015625, 14.52685546875, 15.211669921875, 15.896484375, 16.581298828125, 17.26611328125, 17.950927734375, 18.6357421875, 19.320556640625, 20.00537109375, 20.690185546875, 21.375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 10.0, 22.0, 30.0, 59.0, 83.0, 144.0, 230.0, 176.0, 93.0, 63.0, 37.0, 18.0, 6.0, 7.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.35433959960938, -111.6714859008789, -108.98863983154297, -106.3057861328125, -103.62294006347656, -100.9400863647461, -98.25723266601562, -95.57438659667969, -92.89154052734375, -90.20868682861328, -87.52584075927734, -84.84298706054688, -82.16014099121094, -79.47728729248047, -76.79443359375, -74.11158752441406, -71.4287338256836, -68.74588012695312, -66.06303405761719, -63.38018035888672, -60.69733428955078, -58.01448059082031, -55.33163070678711, -52.648780822753906, -49.9659309387207, -47.2830810546875, -44.6002311706543, -41.917381286621094, -39.234527587890625, -36.55168151855469, -33.86882781982422, -31.185977935791016, -28.503131866455078, -25.820281982421875, -23.137432098388672, -20.454580307006836, -17.771730422973633, -15.08888053894043, -12.406028747558594, -9.72317886352539, -7.0403289794921875, -4.357478618621826, -1.6746282577514648, 1.0082225799560547, 3.691072463989258, 6.373922348022461, 9.056774139404297, 11.7396240234375, 14.422473907470703, 17.105323791503906, 19.78817367553711, 22.471025466918945, 25.15387535095215, 27.83672523498535, 30.519577026367188, 33.20242691040039, 35.885276794433594, 38.5681266784668, 41.2509765625, 43.93383026123047, 46.616676330566406, 49.299530029296875, 51.98237991333008, 54.66522979736328, 57.348079681396484]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 6.0, 4.0, 2.0, 13.0, 19.0, 20.0, 28.0, 33.0, 15.0, 22.0, 28.0, 32.0, 25.0, 30.0, 35.0, 32.0, 30.0, 29.0, 32.0, 22.0, 40.0, 26.0, 38.0, 30.0, 42.0, 34.0, 36.0, 45.0, 27.0, 26.0, 24.0, 24.0, 30.0, 28.0, 16.0, 15.0, 22.0, 15.0, 9.0, 8.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.06080627441406, -52.17949295043945, -50.298179626464844, -48.416866302490234, -46.535552978515625, -44.65424346923828, -42.77293014526367, -40.89161682128906, -39.01030349731445, -37.128990173339844, -35.247676849365234, -33.366363525390625, -31.48505210876465, -29.60373878479004, -27.722427368164062, -25.841114044189453, -23.959800720214844, -22.078487396240234, -20.197174072265625, -18.31586265563965, -16.43454933166504, -14.55323600769043, -12.671923637390137, -10.790611267089844, -8.909297943115234, -7.027985095977783, -5.146672248840332, -3.265359401702881, -1.3840465545654297, 0.4972667694091797, 2.3785791397094727, 4.259891510009766, 6.141204833984375, 8.022518157958984, 9.903830528259277, 11.78514289855957, 13.66645622253418, 15.547769546508789, 17.429080963134766, 19.310394287109375, 21.191707611083984, 23.073020935058594, 24.954334259033203, 26.83564567565918, 28.71695899963379, 30.5982723236084, 32.479583740234375, 34.360897064208984, 36.242210388183594, 38.1235237121582, 40.00483703613281, 41.88615036010742, 43.76746368408203, 45.648773193359375, 47.530086517333984, 49.411399841308594, 51.2927131652832, 53.17402648925781, 55.05533981323242, 56.93665313720703, 58.817962646484375, 60.69927978515625, 62.580589294433594, 64.46189880371094, 66.34321594238281]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 1.0, 6.0, 7.0, 7.0, 8.0, 10.0, 21.0, 20.0, 34.0, 45.0, 53.0, 77.0, 109.0, 184.0, 301.0, 481.0, 878.0, 1743.0, 4077.0, 11796.0, 61220.0, 4008749.0, 83493.0, 13324.0, 4141.0, 1671.0, 807.0, 417.0, 225.0, 130.0, 85.0, 66.0, 39.0, 11.0, 15.0, 7.0, 6.0, 7.0, 9.0, 4.0], "bins": [-1.3603515625, -1.3304901123046875, -1.300628662109375, -1.2707672119140625, -1.24090576171875, -1.2110443115234375, -1.181182861328125, -1.1513214111328125, -1.1214599609375, -1.0915985107421875, -1.061737060546875, -1.0318756103515625, -1.00201416015625, -0.9721527099609375, -0.942291259765625, -0.9124298095703125, -0.882568359375, -0.8527069091796875, -0.822845458984375, -0.7929840087890625, -0.76312255859375, -0.7332611083984375, -0.703399658203125, -0.6735382080078125, -0.6436767578125, -0.6138153076171875, -0.583953857421875, -0.5540924072265625, -0.52423095703125, -0.4943695068359375, -0.464508056640625, -0.4346466064453125, -0.40478515625, -0.3749237060546875, -0.345062255859375, -0.3152008056640625, -0.28533935546875, -0.2554779052734375, -0.225616455078125, -0.1957550048828125, -0.1658935546875, -0.1360321044921875, -0.106170654296875, -0.0763092041015625, -0.04644775390625, -0.0165863037109375, 0.013275146484375, 0.0431365966796875, 0.072998046875, 0.1028594970703125, 0.132720947265625, 0.1625823974609375, 0.19244384765625, 0.2223052978515625, 0.252166748046875, 0.2820281982421875, 0.3118896484375, 0.3417510986328125, 0.371612548828125, 0.4014739990234375, 0.43133544921875, 0.4611968994140625, 0.491058349609375, 0.5209197998046875, 0.55078125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 4.0, 3.0, 3.0, 6.0, 7.0, 10.0, 9.0, 12.0, 18.0, 754.0, 38.0, 16.0, 16.0, 14.0, 11.0, 11.0, 4.0, 6.0, 5.0, 6.0, 3.0, 7.0, 0.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2568359375, -0.25002098083496094, -0.24320602416992188, -0.2363910675048828, -0.22957611083984375, -0.2227611541748047, -0.21594619750976562, -0.20913124084472656, -0.2023162841796875, -0.19550132751464844, -0.18868637084960938, -0.1818714141845703, -0.17505645751953125, -0.1682415008544922, -0.16142654418945312, -0.15461158752441406, -0.147796630859375, -0.14098167419433594, -0.13416671752929688, -0.1273517608642578, -0.12053680419921875, -0.11372184753417969, -0.10690689086914062, -0.10009193420410156, -0.0932769775390625, -0.08646202087402344, -0.07964706420898438, -0.07283210754394531, -0.06601715087890625, -0.05920219421386719, -0.052387237548828125, -0.04557228088378906, -0.03875732421875, -0.03194236755371094, -0.025127410888671875, -0.018312454223632812, -0.01149749755859375, -0.0046825408935546875, 0.002132415771484375, 0.008947372436523438, 0.0157623291015625, 0.022577285766601562, 0.029392242431640625, 0.03620719909667969, 0.04302215576171875, 0.04983711242675781, 0.056652069091796875, 0.06346702575683594, 0.070281982421875, 0.07709693908691406, 0.08391189575195312, 0.09072685241699219, 0.09754180908203125, 0.10435676574707031, 0.11117172241210938, 0.11798667907714844, 0.1248016357421875, 0.13161659240722656, 0.13843154907226562, 0.1452465057373047, 0.15206146240234375, 0.1588764190673828, 0.16569137573242188, 0.17250633239746094, 0.1793212890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 3.0, 9.0, 18.0, 19.0, 31.0, 58.0, 82.0, 141.0, 239.0, 470.0, 1052.0, 2316.0, 5757.0, 17675.0, 76978.0, 1333256.0, 2613934.0, 105670.0, 22775.0, 7660.0, 3152.0, 1377.0, 698.0, 364.0, 207.0, 134.0, 72.0, 42.0, 25.0, 25.0, 14.0, 8.0, 7.0, 8.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67431640625, -0.6532974243164062, -0.6322784423828125, -0.6112594604492188, -0.590240478515625, -0.5692214965820312, -0.5482025146484375, -0.5271835327148438, -0.50616455078125, -0.48514556884765625, -0.4641265869140625, -0.44310760498046875, -0.422088623046875, -0.40106964111328125, -0.3800506591796875, -0.35903167724609375, -0.3380126953125, -0.31699371337890625, -0.2959747314453125, -0.27495574951171875, -0.253936767578125, -0.23291778564453125, -0.2118988037109375, -0.19087982177734375, -0.16986083984375, -0.14884185791015625, -0.1278228759765625, -0.10680389404296875, -0.085784912109375, -0.06476593017578125, -0.0437469482421875, -0.02272796630859375, -0.001708984375, 0.01930999755859375, 0.0403289794921875, 0.06134796142578125, 0.082366943359375, 0.10338592529296875, 0.1244049072265625, 0.14542388916015625, 0.16644287109375, 0.18746185302734375, 0.2084808349609375, 0.22949981689453125, 0.250518798828125, 0.27153778076171875, 0.2925567626953125, 0.31357574462890625, 0.3345947265625, 0.35561370849609375, 0.3766326904296875, 0.39765167236328125, 0.418670654296875, 0.43968963623046875, 0.4607086181640625, 0.48172760009765625, 0.50274658203125, 0.5237655639648438, 0.5447845458984375, 0.5658035278320312, 0.586822509765625, 0.6078414916992188, 0.6288604736328125, 0.6498794555664062, 0.6708984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 9.0, 6.0, 7.0, 10.0, 9.0, 16.0, 18.0, 25.0, 39.0, 59.0, 80.0, 170.0, 250.0, 492.0, 1090.0, 824.0, 366.0, 206.0, 97.0, 66.0, 55.0, 35.0, 29.0, 25.0, 14.0, 19.0, 8.0, 6.0, 7.0, 2.0, 4.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2064208984375, -0.19949913024902344, -0.19257736206054688, -0.1856555938720703, -0.17873382568359375, -0.1718120574951172, -0.16489028930664062, -0.15796852111816406, -0.1510467529296875, -0.14412498474121094, -0.13720321655273438, -0.1302814483642578, -0.12335968017578125, -0.11643791198730469, -0.10951614379882812, -0.10259437561035156, -0.095672607421875, -0.08875083923339844, -0.08182907104492188, -0.07490730285644531, -0.06798553466796875, -0.06106376647949219, -0.054141998291015625, -0.04722023010253906, -0.0402984619140625, -0.03337669372558594, -0.026454925537109375, -0.019533157348632812, -0.01261138916015625, -0.0056896209716796875, 0.001232147216796875, 0.008153915405273438, 0.01507568359375, 0.021997451782226562, 0.028919219970703125, 0.03584098815917969, 0.04276275634765625, 0.04968452453613281, 0.056606292724609375, 0.06352806091308594, 0.0704498291015625, 0.07737159729003906, 0.08429336547851562, 0.09121513366699219, 0.09813690185546875, 0.10505867004394531, 0.11198043823242188, 0.11890220642089844, 0.125823974609375, 0.13274574279785156, 0.13966751098632812, 0.1465892791748047, 0.15351104736328125, 0.1604328155517578, 0.16735458374023438, 0.17427635192871094, 0.1811981201171875, 0.18811988830566406, 0.19504165649414062, 0.2019634246826172, 0.20888519287109375, 0.2158069610595703, 0.22272872924804688, 0.22965049743652344, 0.236572265625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 11.0, 124.0, 694.0, 159.0, 12.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.195158004760742, -10.98995590209961, -10.78475284576416, -10.579550743103027, -10.374348640441895, -10.169146537780762, -9.963943481445312, -9.75874137878418, -9.553539276123047, -9.348337173461914, -9.143134117126465, -8.937932014465332, -8.7327299118042, -8.527527809143066, -8.322324752807617, -8.117122650146484, -7.911920070648193, -7.706717491149902, -7.5015153884887695, -7.2963128089904785, -7.091110706329346, -6.885908126831055, -6.680706024169922, -6.475503444671631, -6.27030086517334, -6.065098285675049, -5.859896183013916, -5.654693603515625, -5.449491500854492, -5.244288921356201, -5.03908634185791, -4.833884239196777, -4.628681659698486, -4.423479080200195, -4.2182769775390625, -4.0130743980407715, -3.8078722953796387, -3.6026697158813477, -3.3974673748016357, -3.192265033721924, -2.987062931060791, -2.781860589981079, -2.576658248901367, -2.371455669403076, -2.1662535667419434, -1.961051106452942, -1.7558486461639404, -1.5506463050842285, -1.345443844795227, -1.1402415037155151, -0.9350391030311584, -0.7298367023468018, -0.5246343612670898, -0.31943202018737793, -0.11422955989837646, 0.09097278118133545, 0.29617512226104736, 0.5013774633407593, 0.706579864025116, 0.9117822647094727, 1.1169846057891846, 1.3221869468688965, 1.527389407157898, 1.7325917482376099, 1.9377940893173218]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 9.0, 23.0, 43.0, 61.0, 61.0, 71.0, 104.0, 105.0, 112.0, 88.0, 93.0, 62.0, 56.0, 34.0, 22.0, 17.0, 8.0, 7.0, 3.0, 8.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.951798439025879, -1.8999910354614258, -1.848183512687683, -1.79637610912323, -1.7445687055587769, -1.6927611827850342, -1.640953779220581, -1.589146375656128, -1.5373389720916748, -1.4855315685272217, -1.433724045753479, -1.3819166421890259, -1.3301092386245728, -1.27830171585083, -1.226494312286377, -1.1746869087219238, -1.1228795051574707, -1.0710721015930176, -1.019264578819275, -0.9674571752548218, -0.9156497716903687, -0.8638423085212708, -0.8120348453521729, -0.7602274417877197, -0.708419919013977, -0.6566124558448792, -0.604805052280426, -0.5529975891113281, -0.501190185546875, -0.4493827223777771, -0.3975752890110016, -0.3457678556442261, -0.29396045207977295, -0.24215301871299744, -0.19034558534622192, -0.13853813707828522, -0.0867307037115097, -0.034923255443573, 0.016884177923202515, 0.06869161128997803, 0.12049904465675354, 0.17230647802352905, 0.22411391139030457, 0.2759213447570801, 0.327728807926178, 0.3795362412929535, 0.431343674659729, 0.4831511080265045, 0.53495854139328, 0.5867660045623779, 0.638573408126831, 0.690380871295929, 0.7421882748603821, 0.79399573802948, 0.8458031415939331, 0.897610604763031, 0.9494180679321289, 1.001225471496582, 1.0530329942703247, 1.1048403978347778, 1.156647801399231, 1.2084553241729736, 1.2602627277374268, 1.3120701313018799, 1.363877534866333]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 16.0, 9.0, 14.0, 14.0, 27.0, 53.0, 71.0, 91.0, 143.0, 205.0, 342.0, 532.0, 876.0, 1457.0, 2511.0, 4652.0, 9472.0, 21747.0, 69200.0, 870653.0, 36973.0, 14448.0, 6617.0, 3424.0, 1929.0, 1124.0, 675.0, 409.0, 287.0, 179.0, 121.0, 84.0, 61.0, 45.0, 25.0, 15.0, 15.0, 11.0, 4.0, 4.0, 3.0, 1.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.423828125, -1.3767852783203125, -1.329742431640625, -1.2826995849609375, -1.23565673828125, -1.1886138916015625, -1.141571044921875, -1.0945281982421875, -1.0474853515625, -1.0004425048828125, -0.953399658203125, -0.9063568115234375, -0.85931396484375, -0.8122711181640625, -0.765228271484375, -0.7181854248046875, -0.671142578125, -0.6240997314453125, -0.577056884765625, -0.5300140380859375, -0.48297119140625, -0.4359283447265625, -0.388885498046875, -0.3418426513671875, -0.2947998046875, -0.2477569580078125, -0.200714111328125, -0.1536712646484375, -0.10662841796875, -0.0595855712890625, -0.012542724609375, 0.0345001220703125, 0.08154296875, 0.1285858154296875, 0.175628662109375, 0.2226715087890625, 0.26971435546875, 0.3167572021484375, 0.363800048828125, 0.4108428955078125, 0.4578857421875, 0.5049285888671875, 0.551971435546875, 0.5990142822265625, 0.64605712890625, 0.6930999755859375, 0.740142822265625, 0.7871856689453125, 0.834228515625, 0.8812713623046875, 0.928314208984375, 0.9753570556640625, 1.02239990234375, 1.0694427490234375, 1.116485595703125, 1.1635284423828125, 1.2105712890625, 1.2576141357421875, 1.304656982421875, 1.3516998291015625, 1.39874267578125, 1.4457855224609375, 1.492828369140625, 1.5398712158203125, 1.5869140625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 6.0, 4.0, 4.0, 19.0, 7.0, 14.0, 31.0, 467.0, 297.0, 21.0, 17.0, 11.0, 10.0, 10.0, 5.0, 10.0, 8.0, 2.0, 5.0, 5.0, 3.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.242919921875, -0.23650169372558594, -0.23008346557617188, -0.2236652374267578, -0.21724700927734375, -0.2108287811279297, -0.20441055297851562, -0.19799232482910156, -0.1915740966796875, -0.18515586853027344, -0.17873764038085938, -0.1723194122314453, -0.16590118408203125, -0.1594829559326172, -0.15306472778320312, -0.14664649963378906, -0.140228271484375, -0.13381004333496094, -0.12739181518554688, -0.12097358703613281, -0.11455535888671875, -0.10813713073730469, -0.10171890258789062, -0.09530067443847656, -0.0888824462890625, -0.08246421813964844, -0.07604598999023438, -0.06962776184082031, -0.06320953369140625, -0.05679130554199219, -0.050373077392578125, -0.04395484924316406, -0.03753662109375, -0.031118392944335938, -0.024700164794921875, -0.018281936645507812, -0.01186370849609375, -0.0054454803466796875, 0.000972747802734375, 0.0073909759521484375, 0.0138092041015625, 0.020227432250976562, 0.026645660400390625, 0.03306388854980469, 0.03948211669921875, 0.04590034484863281, 0.052318572998046875, 0.05873680114746094, 0.065155029296875, 0.07157325744628906, 0.07799148559570312, 0.08440971374511719, 0.09082794189453125, 0.09724617004394531, 0.10366439819335938, 0.11008262634277344, 0.1165008544921875, 0.12291908264160156, 0.12933731079101562, 0.1357555389404297, 0.14217376708984375, 0.1485919952392578, 0.15501022338867188, 0.16142845153808594, 0.1678466796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 11.0, 7.0, 12.0, 26.0, 35.0, 37.0, 59.0, 81.0, 89.0, 148.0, 229.0, 360.0, 698.0, 1329.0, 2803.0, 6458.0, 17067.0, 55166.0, 205311.0, 476260.0, 199666.0, 53670.0, 16877.0, 6437.0, 2713.0, 1234.0, 639.0, 396.0, 233.0, 161.0, 90.0, 62.0, 41.0, 35.0, 37.0, 16.0, 10.0, 9.0, 7.0, 7.0, 11.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7568359375, -0.731170654296875, -0.70550537109375, -0.679840087890625, -0.6541748046875, -0.628509521484375, -0.60284423828125, -0.577178955078125, -0.551513671875, -0.525848388671875, -0.50018310546875, -0.474517822265625, -0.4488525390625, -0.423187255859375, -0.39752197265625, -0.371856689453125, -0.34619140625, -0.320526123046875, -0.29486083984375, -0.269195556640625, -0.2435302734375, -0.217864990234375, -0.19219970703125, -0.166534423828125, -0.140869140625, -0.115203857421875, -0.08953857421875, -0.063873291015625, -0.0382080078125, -0.012542724609375, 0.01312255859375, 0.038787841796875, 0.064453125, 0.090118408203125, 0.11578369140625, 0.141448974609375, 0.1671142578125, 0.192779541015625, 0.21844482421875, 0.244110107421875, 0.269775390625, 0.295440673828125, 0.32110595703125, 0.346771240234375, 0.3724365234375, 0.398101806640625, 0.42376708984375, 0.449432373046875, 0.47509765625, 0.500762939453125, 0.52642822265625, 0.552093505859375, 0.5777587890625, 0.603424072265625, 0.62908935546875, 0.654754638671875, 0.680419921875, 0.706085205078125, 0.73175048828125, 0.757415771484375, 0.7830810546875, 0.808746337890625, 0.83441162109375, 0.860076904296875, 0.8857421875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 7.0, 9.0, 6.0, 15.0, 16.0, 18.0, 19.0, 26.0, 30.0, 25.0, 33.0, 30.0, 30.0, 30.0, 44.0, 42.0, 31.0, 45.0, 44.0, 39.0, 48.0, 37.0, 36.0, 35.0, 29.0, 27.0, 33.0, 29.0, 21.0, 19.0, 23.0, 20.0, 12.0, 15.0, 16.0, 9.0, 10.0, 11.0, 8.0, 9.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7451171875, -0.72015380859375, -0.6951904296875, -0.67022705078125, -0.645263671875, -0.62030029296875, -0.5953369140625, -0.57037353515625, -0.54541015625, -0.52044677734375, -0.4954833984375, -0.47052001953125, -0.445556640625, -0.42059326171875, -0.3956298828125, -0.37066650390625, -0.345703125, -0.32073974609375, -0.2957763671875, -0.27081298828125, -0.245849609375, -0.22088623046875, -0.1959228515625, -0.17095947265625, -0.14599609375, -0.12103271484375, -0.0960693359375, -0.07110595703125, -0.046142578125, -0.02117919921875, 0.0037841796875, 0.02874755859375, 0.0537109375, 0.07867431640625, 0.1036376953125, 0.12860107421875, 0.153564453125, 0.17852783203125, 0.2034912109375, 0.22845458984375, 0.25341796875, 0.27838134765625, 0.3033447265625, 0.32830810546875, 0.353271484375, 0.37823486328125, 0.4031982421875, 0.42816162109375, 0.453125, 0.47808837890625, 0.5030517578125, 0.52801513671875, 0.552978515625, 0.57794189453125, 0.6029052734375, 0.62786865234375, 0.65283203125, 0.67779541015625, 0.7027587890625, 0.72772216796875, 0.752685546875, 0.77764892578125, 0.8026123046875, 0.82757568359375, 0.8525390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 9.0, 12.0, 26.0, 38.0, 51.0, 83.0, 147.0, 303.0, 751.0, 2570.0, 14229.0, 614599.0, 399898.0, 12184.0, 2278.0, 723.0, 280.0, 170.0, 69.0, 45.0, 30.0, 19.0, 10.0, 11.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.46875, -2.408477783203125, -2.34820556640625, -2.287933349609375, -2.2276611328125, -2.167388916015625, -2.10711669921875, -2.046844482421875, -1.986572265625, -1.926300048828125, -1.86602783203125, -1.805755615234375, -1.7454833984375, -1.685211181640625, -1.62493896484375, -1.564666748046875, -1.50439453125, -1.444122314453125, -1.38385009765625, -1.323577880859375, -1.2633056640625, -1.203033447265625, -1.14276123046875, -1.082489013671875, -1.022216796875, -0.961944580078125, -0.90167236328125, -0.841400146484375, -0.7811279296875, -0.720855712890625, -0.66058349609375, -0.600311279296875, -0.5400390625, -0.479766845703125, -0.41949462890625, -0.359222412109375, -0.2989501953125, -0.238677978515625, -0.17840576171875, -0.118133544921875, -0.057861328125, 0.002410888671875, 0.06268310546875, 0.122955322265625, 0.1832275390625, 0.243499755859375, 0.30377197265625, 0.364044189453125, 0.42431640625, 0.484588623046875, 0.54486083984375, 0.605133056640625, 0.6654052734375, 0.725677490234375, 0.78594970703125, 0.846221923828125, 0.906494140625, 0.966766357421875, 1.02703857421875, 1.087310791015625, 1.1475830078125, 1.207855224609375, 1.26812744140625, 1.328399658203125, 1.388671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 13.0, 15.0, 32.0, 49.0, 84.0, 106.0, 142.0, 161.0, 143.0, 93.0, 46.0, 41.0, 21.0, 12.0, 11.0, 6.0, 5.0, 4.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012493133544921875, -0.00012107193470001221, -0.00011721253395080566, -0.00011335313320159912, -0.00010949373245239258, -0.00010563433170318604, -0.00010177493095397949, -9.791553020477295e-05, -9.40561294555664e-05, -9.019672870635986e-05, -8.633732795715332e-05, -8.247792720794678e-05, -7.861852645874023e-05, -7.475912570953369e-05, -7.089972496032715e-05, -6.70403242111206e-05, -6.318092346191406e-05, -5.932152271270752e-05, -5.5462121963500977e-05, -5.1602721214294434e-05, -4.774332046508789e-05, -4.388391971588135e-05, -4.0024518966674805e-05, -3.616511821746826e-05, -3.230571746826172e-05, -2.8446316719055176e-05, -2.4586915969848633e-05, -2.072751522064209e-05, -1.6868114471435547e-05, -1.3008713722229004e-05, -9.149312973022461e-06, -5.289912223815918e-06, -1.430511474609375e-06, 2.428889274597168e-06, 6.288290023803711e-06, 1.0147690773010254e-05, 1.4007091522216797e-05, 1.786649227142334e-05, 2.1725893020629883e-05, 2.5585293769836426e-05, 2.944469451904297e-05, 3.330409526824951e-05, 3.7163496017456055e-05, 4.10228967666626e-05, 4.488229751586914e-05, 4.8741698265075684e-05, 5.2601099014282227e-05, 5.646049976348877e-05, 6.031990051269531e-05, 6.417930126190186e-05, 6.80387020111084e-05, 7.189810276031494e-05, 7.575750350952148e-05, 7.961690425872803e-05, 8.347630500793457e-05, 8.733570575714111e-05, 9.119510650634766e-05, 9.50545072555542e-05, 9.891390800476074e-05, 0.00010277330875396729, 0.00010663270950317383, 0.00011049211025238037, 0.00011435151100158691, 0.00011821091175079346, 0.0001220703125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 7.0, 10.0, 13.0, 28.0, 39.0, 43.0, 96.0, 157.0, 271.0, 623.0, 1312.0, 3412.0, 12133.0, 67224.0, 596485.0, 318231.0, 36371.0, 7610.0, 2484.0, 958.0, 429.0, 265.0, 133.0, 89.0, 47.0, 18.0, 17.0, 13.0, 5.0, 5.0, 4.0, 4.0, 7.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88720703125, -0.8541488647460938, -0.8210906982421875, -0.7880325317382812, -0.754974365234375, -0.7219161987304688, -0.6888580322265625, -0.6557998657226562, -0.62274169921875, -0.5896835327148438, -0.5566253662109375, -0.5235671997070312, -0.490509033203125, -0.45745086669921875, -0.4243927001953125, -0.39133453369140625, -0.3582763671875, -0.32521820068359375, -0.2921600341796875, -0.25910186767578125, -0.226043701171875, -0.19298553466796875, -0.1599273681640625, -0.12686920166015625, -0.09381103515625, -0.06075286865234375, -0.0276947021484375, 0.00536346435546875, 0.038421630859375, 0.07147979736328125, 0.1045379638671875, 0.13759613037109375, 0.170654296875, 0.20371246337890625, 0.2367706298828125, 0.26982879638671875, 0.302886962890625, 0.33594512939453125, 0.3690032958984375, 0.40206146240234375, 0.43511962890625, 0.46817779541015625, 0.5012359619140625, 0.5342941284179688, 0.567352294921875, 0.6004104614257812, 0.6334686279296875, 0.6665267944335938, 0.6995849609375, 0.7326431274414062, 0.7657012939453125, 0.7987594604492188, 0.831817626953125, 0.8648757934570312, 0.8979339599609375, 0.9309921264648438, 0.96405029296875, 0.9971084594726562, 1.0301666259765625, 1.0632247924804688, 1.096282958984375, 1.1293411254882812, 1.1623992919921875, 1.1954574584960938, 1.228515625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 15.0, 11.0, 16.0, 16.0, 22.0, 20.0, 30.0, 37.0, 41.0, 78.0, 72.0, 70.0, 88.0, 72.0, 63.0, 47.0, 57.0, 55.0, 44.0, 28.0, 19.0, 28.0, 16.0, 10.0, 12.0, 10.0, 7.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8359375, -0.8077926635742188, -0.7796478271484375, -0.7515029907226562, -0.723358154296875, -0.6952133178710938, -0.6670684814453125, -0.6389236450195312, -0.61077880859375, -0.5826339721679688, -0.5544891357421875, -0.5263442993164062, -0.498199462890625, -0.47005462646484375, -0.4419097900390625, -0.41376495361328125, -0.3856201171875, -0.35747528076171875, -0.3293304443359375, -0.30118560791015625, -0.273040771484375, -0.24489593505859375, -0.2167510986328125, -0.18860626220703125, -0.16046142578125, -0.13231658935546875, -0.1041717529296875, -0.07602691650390625, -0.047882080078125, -0.01973724365234375, 0.0084075927734375, 0.03655242919921875, 0.064697265625, 0.09284210205078125, 0.1209869384765625, 0.14913177490234375, 0.177276611328125, 0.20542144775390625, 0.2335662841796875, 0.26171112060546875, 0.28985595703125, 0.31800079345703125, 0.3461456298828125, 0.37429046630859375, 0.402435302734375, 0.43058013916015625, 0.4587249755859375, 0.48686981201171875, 0.5150146484375, 0.5431594848632812, 0.5713043212890625, 0.5994491577148438, 0.627593994140625, 0.6557388305664062, 0.6838836669921875, 0.7120285034179688, 0.74017333984375, 0.7683181762695312, 0.7964630126953125, 0.8246078491210938, 0.852752685546875, 0.8808975219726562, 0.9090423583984375, 0.9371871948242188, 0.96533203125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 10.0, 13.0, 32.0, 117.0, 414.0, 283.0, 83.0, 25.0, 12.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.543588638305664, -20.887941360473633, -20.23229217529297, -19.576644897460938, -18.920997619628906, -18.265350341796875, -17.60970115661621, -16.95405387878418, -16.29840660095215, -15.6427583694458, -14.98711109161377, -14.331462860107422, -13.67581558227539, -13.020167350769043, -12.364519119262695, -11.708871841430664, -11.053223609924316, -10.397575378417969, -9.741928100585938, -9.08627986907959, -8.430632591247559, -7.774984359741211, -7.1193366050720215, -6.463688850402832, -5.808041095733643, -5.152393341064453, -4.496745586395264, -3.841097593307495, -3.1854498386383057, -2.529802083969116, -1.8741540908813477, -1.2185063362121582, -0.5628585815429688, 0.09278923273086548, 0.7484370470046997, 1.4040849208831787, 2.059732675552368, 2.7153804302215576, 3.371028423309326, 4.026676177978516, 4.682323932647705, 5.3379716873168945, 5.993619441986084, 6.649267196655273, 7.304915428161621, 7.960562705993652, 8.6162109375, 9.271858215332031, 9.927506446838379, 10.583154678344727, 11.238801956176758, 11.894450187683105, 12.550097465515137, 13.205745697021484, 13.861392974853516, 14.517041206359863, 15.172689437866211, 15.828337669372559, 16.483985900878906, 17.139633178710938, 17.79528045654297, 18.450927734375, 19.106576919555664, 19.762224197387695, 20.417871475219727]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 2.0, 8.0, 12.0, 12.0, 17.0, 23.0, 33.0, 55.0, 76.0, 100.0, 128.0, 113.0, 98.0, 78.0, 72.0, 43.0, 23.0, 21.0, 13.0, 10.0, 6.0, 4.0, 4.0, 1.0, 5.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-15.069162368774414, -14.628057479858398, -14.186952590942383, -13.745847702026367, -13.304742813110352, -12.863637924194336, -12.42253303527832, -11.981428146362305, -11.540323257446289, -11.099218368530273, -10.658113479614258, -10.217008590698242, -9.775903701782227, -9.334798812866211, -8.893693923950195, -8.45258903503418, -8.011484146118164, -7.570379257202148, -7.129274368286133, -6.688169479370117, -6.247064590454102, -5.805959701538086, -5.36485481262207, -4.923749923706055, -4.482645034790039, -4.041540145874023, -3.600435256958008, -3.159330368041992, -2.7182254791259766, -2.277120590209961, -1.8360157012939453, -1.3949108123779297, -0.9538059234619141, -0.5127010345458984, -0.07159614562988281, 0.3695087432861328, 0.8106136322021484, 1.251718521118164, 1.6928234100341797, 2.1339282989501953, 2.575033187866211, 3.0161380767822266, 3.457242965698242, 3.898347854614258, 4.339452743530273, 4.780557632446289, 5.221662521362305, 5.66276741027832, 6.103872299194336, 6.544977188110352, 6.986082077026367, 7.427186965942383, 7.868291854858398, 8.309396743774414, 8.75050163269043, 9.191606521606445, 9.632711410522461, 10.073816299438477, 10.514921188354492, 10.956026077270508, 11.397130966186523, 11.838235855102539, 12.279340744018555, 12.72044563293457, 13.161550521850586]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 11.0, 14.0, 22.0, 55.0, 92.0, 206.0, 451.0, 1067.0, 3075.0, 12026.0, 185888.0, 3961732.0, 23954.0, 3960.0, 1072.0, 373.0, 137.0, 56.0, 37.0, 16.0, 14.0, 6.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-6.71875, -6.576385498046875, -6.43402099609375, -6.291656494140625, -6.1492919921875, -6.006927490234375, -5.86456298828125, -5.722198486328125, -5.579833984375, -5.437469482421875, -5.29510498046875, -5.152740478515625, -5.0103759765625, -4.868011474609375, -4.72564697265625, -4.583282470703125, -4.44091796875, -4.298553466796875, -4.15618896484375, -4.013824462890625, -3.8714599609375, -3.729095458984375, -3.58673095703125, -3.444366455078125, -3.302001953125, -3.159637451171875, -3.01727294921875, -2.874908447265625, -2.7325439453125, -2.590179443359375, -2.44781494140625, -2.305450439453125, -2.1630859375, -2.020721435546875, -1.87835693359375, -1.735992431640625, -1.5936279296875, -1.451263427734375, -1.30889892578125, -1.166534423828125, -1.024169921875, -0.881805419921875, -0.73944091796875, -0.597076416015625, -0.4547119140625, -0.312347412109375, -0.16998291015625, -0.027618408203125, 0.11474609375, 0.257110595703125, 0.39947509765625, 0.541839599609375, 0.6842041015625, 0.826568603515625, 0.96893310546875, 1.111297607421875, 1.253662109375, 1.396026611328125, 1.53839111328125, 1.680755615234375, 1.8231201171875, 1.965484619140625, 2.10784912109375, 2.250213623046875, 2.392578125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 0.0, 6.0, 5.0, 5.0, 3.0, 10.0, 8.0, 10.0, 9.0, 14.0, 39.0, 102.0, 273.0, 266.0, 106.0, 39.0, 22.0, 10.0, 12.0, 6.0, 9.0, 4.0, 9.0, 6.0, 4.0, 3.0, 7.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2276611328125, -0.22167015075683594, -0.21567916870117188, -0.2096881866455078, -0.20369720458984375, -0.1977062225341797, -0.19171524047851562, -0.18572425842285156, -0.1797332763671875, -0.17374229431152344, -0.16775131225585938, -0.1617603302001953, -0.15576934814453125, -0.1497783660888672, -0.14378738403320312, -0.13779640197753906, -0.131805419921875, -0.12581443786621094, -0.11982345581054688, -0.11383247375488281, -0.10784149169921875, -0.10185050964355469, -0.09585952758789062, -0.08986854553222656, -0.0838775634765625, -0.07788658142089844, -0.07189559936523438, -0.06590461730957031, -0.05991363525390625, -0.05392265319824219, -0.047931671142578125, -0.04194068908691406, -0.03594970703125, -0.029958724975585938, -0.023967742919921875, -0.017976760864257812, -0.01198577880859375, -0.0059947967529296875, -3.814697265625e-06, 0.0059871673583984375, 0.0119781494140625, 0.017969131469726562, 0.023960113525390625, 0.029951095581054688, 0.03594207763671875, 0.04193305969238281, 0.047924041748046875, 0.05391502380371094, 0.059906005859375, 0.06589698791503906, 0.07188796997070312, 0.07787895202636719, 0.08386993408203125, 0.08986091613769531, 0.09585189819335938, 0.10184288024902344, 0.1078338623046875, 0.11382484436035156, 0.11981582641601562, 0.1258068084716797, 0.13179779052734375, 0.1377887725830078, 0.14377975463867188, 0.14977073669433594, 0.15576171875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 12.0, 11.0, 28.0, 34.0, 70.0, 106.0, 196.0, 405.0, 790.0, 1982.0, 5703.0, 23009.0, 192266.0, 3721349.0, 213370.0, 24645.0, 6101.0, 2148.0, 1006.0, 467.0, 196.0, 121.0, 75.0, 59.0, 40.0, 26.0, 20.0, 11.0, 7.0, 7.0, 7.0, 1.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3984375, -1.3436279296875, -1.288818359375, -1.2340087890625, -1.17919921875, -1.1243896484375, -1.069580078125, -1.0147705078125, -0.9599609375, -0.9051513671875, -0.850341796875, -0.7955322265625, -0.74072265625, -0.6859130859375, -0.631103515625, -0.5762939453125, -0.521484375, -0.4666748046875, -0.411865234375, -0.3570556640625, -0.30224609375, -0.2474365234375, -0.192626953125, -0.1378173828125, -0.0830078125, -0.0281982421875, 0.026611328125, 0.0814208984375, 0.13623046875, 0.1910400390625, 0.245849609375, 0.3006591796875, 0.35546875, 0.4102783203125, 0.465087890625, 0.5198974609375, 0.57470703125, 0.6295166015625, 0.684326171875, 0.7391357421875, 0.7939453125, 0.8487548828125, 0.903564453125, 0.9583740234375, 1.01318359375, 1.0679931640625, 1.122802734375, 1.1776123046875, 1.232421875, 1.2872314453125, 1.342041015625, 1.3968505859375, 1.45166015625, 1.5064697265625, 1.561279296875, 1.6160888671875, 1.6708984375, 1.7257080078125, 1.780517578125, 1.8353271484375, 1.89013671875, 1.9449462890625, 1.999755859375, 2.0545654296875, 2.109375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 7.0, 5.0, 5.0, 12.0, 16.0, 20.0, 32.0, 48.0, 75.0, 108.0, 256.0, 706.0, 1556.0, 598.0, 245.0, 132.0, 73.0, 54.0, 35.0, 23.0, 14.0, 13.0, 10.0, 4.0, 10.0, 3.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2015380859375, -0.19326210021972656, -0.18498611450195312, -0.1767101287841797, -0.16843414306640625, -0.1601581573486328, -0.15188217163085938, -0.14360618591308594, -0.1353302001953125, -0.12705421447753906, -0.11877822875976562, -0.11050224304199219, -0.10222625732421875, -0.09395027160644531, -0.08567428588867188, -0.07739830017089844, -0.069122314453125, -0.06084632873535156, -0.052570343017578125, -0.04429435729980469, -0.03601837158203125, -0.027742385864257812, -0.019466400146484375, -0.011190414428710938, -0.0029144287109375, 0.0053615570068359375, 0.013637542724609375, 0.021913528442382812, 0.03018951416015625, 0.03846549987792969, 0.046741485595703125, 0.05501747131347656, 0.06329345703125, 0.07156944274902344, 0.07984542846679688, 0.08812141418457031, 0.09639739990234375, 0.10467338562011719, 0.11294937133789062, 0.12122535705566406, 0.1295013427734375, 0.13777732849121094, 0.14605331420898438, 0.1543292999267578, 0.16260528564453125, 0.1708812713623047, 0.17915725708007812, 0.18743324279785156, 0.195709228515625, 0.20398521423339844, 0.21226119995117188, 0.2205371856689453, 0.22881317138671875, 0.2370891571044922, 0.24536514282226562, 0.25364112854003906, 0.2619171142578125, 0.27019309997558594, 0.2784690856933594, 0.2867450714111328, 0.29502105712890625, 0.3032970428466797, 0.3115730285644531, 0.31984901428222656, 0.328125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 19.0, 325.0, 517.0, 95.0, 21.0, 6.0, 7.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6770597696304321, -1.5095062255859375, -1.3419526815414429, -1.1743991374969482, -1.0068457126617432, -0.8392921090126038, -0.6717386245727539, -0.5041850805282593, -0.33663153648376465, -0.1690780073404312, -0.0015244781970977783, 0.16602903604507446, 0.3335825800895691, 0.5011361241340637, 0.6686896085739136, 0.8362431526184082, 1.0037966966629028, 1.1713502407073975, 1.338903784751892, 1.5064573287963867, 1.6740107536315918, 1.841564416885376, 2.009117841720581, 2.1766715049743652, 2.3442249298095703, 2.5117783546447754, 2.6793320178985596, 2.8468854427337646, 3.014439105987549, 3.181992530822754, 3.349545955657959, 3.517099618911743, 3.684652805328369, 3.852206230163574, 4.019759654998779, 4.187313556671143, 4.354866981506348, 4.522420406341553, 4.689973831176758, 4.857527732849121, 5.025081157684326, 5.192634582519531, 5.360188007354736, 5.5277419090271, 5.695295333862305, 5.86284875869751, 6.030402183532715, 6.197956085205078, 6.365509033203125, 6.53306245803833, 6.700615882873535, 6.868169784545898, 7.0357232093811035, 7.203276634216309, 7.370830059051514, 7.538383483886719, 7.705937385559082, 7.873490810394287, 8.041044235229492, 8.208598136901855, 8.376151084899902, 8.543704986572266, 8.711258888244629, 8.878811836242676, 9.046365737915039]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 8.0, 14.0, 12.0, 20.0, 22.0, 29.0, 35.0, 57.0, 57.0, 78.0, 81.0, 75.0, 87.0, 94.0, 68.0, 63.0, 53.0, 25.0, 23.0, 21.0, 13.0, 14.0, 4.0, 8.0, 8.0, 5.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3642146587371826, -1.3161721229553223, -1.2681297063827515, -1.2200871706008911, -1.1720446348190308, -1.12400221824646, -1.0759596824645996, -1.0279171466827393, -0.9798746705055237, -0.9318321943283081, -0.8837896585464478, -0.8357471823692322, -0.7877047061920166, -0.7396621704101562, -0.6916196942329407, -0.6435772180557251, -0.5955346822738647, -0.5474922060966492, -0.4994496703147888, -0.45140719413757324, -0.4033646881580353, -0.3553221821784973, -0.30727970600128174, -0.2592372000217438, -0.2111946940422058, -0.16315218806266785, -0.11510969698429108, -0.0670672059059143, -0.019024699926376343, 0.02901780605316162, 0.0770602822303772, 0.12510278820991516, 0.17314529418945312, 0.2211878001689911, 0.26923030614852905, 0.31727278232574463, 0.3653152883052826, 0.41335779428482056, 0.46140027046203613, 0.5094428062438965, 0.5574852824211121, 0.6055277585983276, 0.653570294380188, 0.7016127705574036, 0.7496552467346191, 0.7976977825164795, 0.8457402586936951, 0.8937827348709106, 0.941825270652771, 0.9898677468299866, 1.0379102230072021, 1.0859527587890625, 1.1339952945709229, 1.1820378303527832, 1.230080246925354, 1.2781227827072144, 1.3261651992797852, 1.3742077350616455, 1.4222501516342163, 1.4702926874160767, 1.518335223197937, 1.5663776397705078, 1.6144201755523682, 1.6624627113342285, 1.7105052471160889]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 4.0, 9.0, 20.0, 30.0, 31.0, 72.0, 89.0, 174.0, 365.0, 750.0, 1850.0, 5340.0, 19031.0, 165687.0, 800792.0, 39708.0, 9321.0, 3033.0, 1137.0, 505.0, 227.0, 147.0, 79.0, 55.0, 36.0, 21.0, 8.0, 10.0, 5.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294921875, -2.223724365234375, -2.15252685546875, -2.081329345703125, -2.0101318359375, -1.938934326171875, -1.86773681640625, -1.796539306640625, -1.725341796875, -1.654144287109375, -1.58294677734375, -1.511749267578125, -1.4405517578125, -1.369354248046875, -1.29815673828125, -1.226959228515625, -1.15576171875, -1.084564208984375, -1.01336669921875, -0.942169189453125, -0.8709716796875, -0.799774169921875, -0.72857666015625, -0.657379150390625, -0.586181640625, -0.514984130859375, -0.44378662109375, -0.372589111328125, -0.3013916015625, -0.230194091796875, -0.15899658203125, -0.087799072265625, -0.0166015625, 0.054595947265625, 0.12579345703125, 0.196990966796875, 0.2681884765625, 0.339385986328125, 0.41058349609375, 0.481781005859375, 0.552978515625, 0.624176025390625, 0.69537353515625, 0.766571044921875, 0.8377685546875, 0.908966064453125, 0.98016357421875, 1.051361083984375, 1.12255859375, 1.193756103515625, 1.26495361328125, 1.336151123046875, 1.4073486328125, 1.478546142578125, 1.54974365234375, 1.620941162109375, 1.692138671875, 1.763336181640625, 1.83453369140625, 1.905731201171875, 1.9769287109375, 2.048126220703125, 2.11932373046875, 2.190521240234375, 2.26171875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 8.0, 5.0, 5.0, 15.0, 14.0, 8.0, 28.0, 61.0, 165.0, 222.0, 193.0, 125.0, 49.0, 27.0, 22.0, 7.0, 10.0, 6.0, 6.0, 8.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.250244140625, -0.24395179748535156, -0.23765945434570312, -0.2313671112060547, -0.22507476806640625, -0.2187824249267578, -0.21249008178710938, -0.20619773864746094, -0.1999053955078125, -0.19361305236816406, -0.18732070922851562, -0.1810283660888672, -0.17473602294921875, -0.1684436798095703, -0.16215133666992188, -0.15585899353027344, -0.149566650390625, -0.14327430725097656, -0.13698196411132812, -0.1306896209716797, -0.12439727783203125, -0.11810493469238281, -0.11181259155273438, -0.10552024841308594, -0.0992279052734375, -0.09293556213378906, -0.08664321899414062, -0.08035087585449219, -0.07405853271484375, -0.06776618957519531, -0.061473846435546875, -0.05518150329589844, -0.04888916015625, -0.04259681701660156, -0.036304473876953125, -0.030012130737304688, -0.02371978759765625, -0.017427444458007812, -0.011135101318359375, -0.0048427581787109375, 0.0014495849609375, 0.0077419281005859375, 0.014034271240234375, 0.020326614379882812, 0.02661895751953125, 0.03291130065917969, 0.039203643798828125, 0.04549598693847656, 0.051788330078125, 0.05808067321777344, 0.06437301635742188, 0.07066535949707031, 0.07695770263671875, 0.08325004577636719, 0.08954238891601562, 0.09583473205566406, 0.1021270751953125, 0.10841941833496094, 0.11471176147460938, 0.12100410461425781, 0.12729644775390625, 0.1335887908935547, 0.13988113403320312, 0.14617347717285156, 0.1524658203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 5.0, 3.0, 7.0, 16.0, 63.0, 283.0, 2607.0, 850678.0, 193376.0, 1247.0, 176.0, 32.0, 11.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.3046875, -6.12896728515625, -5.9532470703125, -5.77752685546875, -5.601806640625, -5.42608642578125, -5.2503662109375, -5.07464599609375, -4.89892578125, -4.72320556640625, -4.5474853515625, -4.37176513671875, -4.196044921875, -4.02032470703125, -3.8446044921875, -3.66888427734375, -3.4931640625, -3.31744384765625, -3.1417236328125, -2.96600341796875, -2.790283203125, -2.61456298828125, -2.4388427734375, -2.26312255859375, -2.08740234375, -1.91168212890625, -1.7359619140625, -1.56024169921875, -1.384521484375, -1.20880126953125, -1.0330810546875, -0.85736083984375, -0.681640625, -0.50592041015625, -0.3302001953125, -0.15447998046875, 0.021240234375, 0.19696044921875, 0.3726806640625, 0.54840087890625, 0.72412109375, 0.89984130859375, 1.0755615234375, 1.25128173828125, 1.427001953125, 1.60272216796875, 1.7784423828125, 1.95416259765625, 2.1298828125, 2.30560302734375, 2.4813232421875, 2.65704345703125, 2.832763671875, 3.00848388671875, 3.1842041015625, 3.35992431640625, 3.53564453125, 3.71136474609375, 3.8870849609375, 4.06280517578125, 4.238525390625, 4.41424560546875, 4.5899658203125, 4.76568603515625, 4.94140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 14.0, 17.0, 9.0, 14.0, 11.0, 17.0, 13.0, 16.0, 16.0, 28.0, 18.0, 30.0, 28.0, 26.0, 30.0, 40.0, 34.0, 36.0, 45.0, 38.0, 46.0, 41.0, 38.0, 34.0, 26.0, 29.0, 26.0, 31.0, 24.0, 28.0, 23.0, 24.0, 16.0, 18.0, 20.0, 18.0, 9.0, 7.0, 11.0, 8.0, 11.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.470458984375, -0.4557342529296875, -0.441009521484375, -0.4262847900390625, -0.41156005859375, -0.3968353271484375, -0.382110595703125, -0.3673858642578125, -0.3526611328125, -0.3379364013671875, -0.323211669921875, -0.3084869384765625, -0.29376220703125, -0.2790374755859375, -0.264312744140625, -0.2495880126953125, -0.23486328125, -0.2201385498046875, -0.205413818359375, -0.1906890869140625, -0.17596435546875, -0.1612396240234375, -0.146514892578125, -0.1317901611328125, -0.1170654296875, -0.1023406982421875, -0.087615966796875, -0.0728912353515625, -0.05816650390625, -0.0434417724609375, -0.028717041015625, -0.0139923095703125, 0.000732421875, 0.0154571533203125, 0.030181884765625, 0.0449066162109375, 0.05963134765625, 0.0743560791015625, 0.089080810546875, 0.1038055419921875, 0.1185302734375, 0.1332550048828125, 0.147979736328125, 0.1627044677734375, 0.17742919921875, 0.1921539306640625, 0.206878662109375, 0.2216033935546875, 0.236328125, 0.2510528564453125, 0.265777587890625, 0.2805023193359375, 0.29522705078125, 0.3099517822265625, 0.324676513671875, 0.3394012451171875, 0.3541259765625, 0.3688507080078125, 0.383575439453125, 0.3983001708984375, 0.41302490234375, 0.4277496337890625, 0.442474365234375, 0.4571990966796875, 0.471923828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 11.0, 19.0, 31.0, 100.0, 590.0, 119161.0, 927540.0, 921.0, 105.0, 33.0, 16.0, 10.0, 4.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8515625, -10.50244140625, -10.1533203125, -9.80419921875, -9.455078125, -9.10595703125, -8.7568359375, -8.40771484375, -8.05859375, -7.70947265625, -7.3603515625, -7.01123046875, -6.662109375, -6.31298828125, -5.9638671875, -5.61474609375, -5.265625, -4.91650390625, -4.5673828125, -4.21826171875, -3.869140625, -3.52001953125, -3.1708984375, -2.82177734375, -2.47265625, -2.12353515625, -1.7744140625, -1.42529296875, -1.076171875, -0.72705078125, -0.3779296875, -0.02880859375, 0.3203125, 0.66943359375, 1.0185546875, 1.36767578125, 1.716796875, 2.06591796875, 2.4150390625, 2.76416015625, 3.11328125, 3.46240234375, 3.8115234375, 4.16064453125, 4.509765625, 4.85888671875, 5.2080078125, 5.55712890625, 5.90625, 6.25537109375, 6.6044921875, 6.95361328125, 7.302734375, 7.65185546875, 8.0009765625, 8.35009765625, 8.69921875, 9.04833984375, 9.3974609375, 9.74658203125, 10.095703125, 10.44482421875, 10.7939453125, 11.14306640625, 11.4921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 7.0, 3.0, 15.0, 14.0, 28.0, 46.0, 47.0, 87.0, 102.0, 133.0, 102.0, 126.0, 78.0, 64.0, 42.0, 37.0, 16.0, 10.0, 13.0, 11.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010979175567626953, -0.00010615028440952301, -0.00010250881314277649, -9.886734187602997e-05, -9.522587060928345e-05, -9.158439934253693e-05, -8.79429280757904e-05, -8.430145680904388e-05, -8.065998554229736e-05, -7.701851427555084e-05, -7.337704300880432e-05, -6.97355717420578e-05, -6.609410047531128e-05, -6.245262920856476e-05, -5.881115794181824e-05, -5.5169686675071716e-05, -5.1528215408325195e-05, -4.7886744141578674e-05, -4.424527287483215e-05, -4.060380160808563e-05, -3.696233034133911e-05, -3.332085907459259e-05, -2.967938780784607e-05, -2.603791654109955e-05, -2.2396445274353027e-05, -1.8754974007606506e-05, -1.5113502740859985e-05, -1.1472031474113464e-05, -7.830560207366943e-06, -4.189088940620422e-06, -5.476176738739014e-07, 3.0938535928726196e-06, 6.735324859619141e-06, 1.0376796126365662e-05, 1.4018267393112183e-05, 1.7659738659858704e-05, 2.1301209926605225e-05, 2.4942681193351746e-05, 2.8584152460098267e-05, 3.222562372684479e-05, 3.586709499359131e-05, 3.950856626033783e-05, 4.315003752708435e-05, 4.679150879383087e-05, 5.043298006057739e-05, 5.4074451327323914e-05, 5.7715922594070435e-05, 6.135739386081696e-05, 6.499886512756348e-05, 6.864033639431e-05, 7.228180766105652e-05, 7.592327892780304e-05, 7.956475019454956e-05, 8.320622146129608e-05, 8.68476927280426e-05, 9.048916399478912e-05, 9.413063526153564e-05, 9.777210652828217e-05, 0.00010141357779502869, 0.00010505504906177521, 0.00010869652032852173, 0.00011233799159526825, 0.00011597946286201477, 0.00011962093412876129, 0.0001232624053955078]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 16.0, 21.0, 40.0, 45.0, 106.0, 193.0, 381.0, 842.0, 1914.0, 5754.0, 24199.0, 191191.0, 697741.0, 102295.0, 16180.0, 4355.0, 1693.0, 744.0, 366.0, 176.0, 119.0, 49.0, 38.0, 15.0, 20.0, 8.0, 12.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5908203125, -1.54583740234375, -1.5008544921875, -1.45587158203125, -1.410888671875, -1.36590576171875, -1.3209228515625, -1.27593994140625, -1.23095703125, -1.18597412109375, -1.1409912109375, -1.09600830078125, -1.051025390625, -1.00604248046875, -0.9610595703125, -0.91607666015625, -0.87109375, -0.82611083984375, -0.7811279296875, -0.73614501953125, -0.691162109375, -0.64617919921875, -0.6011962890625, -0.55621337890625, -0.51123046875, -0.46624755859375, -0.4212646484375, -0.37628173828125, -0.331298828125, -0.28631591796875, -0.2413330078125, -0.19635009765625, -0.1513671875, -0.10638427734375, -0.0614013671875, -0.01641845703125, 0.028564453125, 0.07354736328125, 0.1185302734375, 0.16351318359375, 0.20849609375, 0.25347900390625, 0.2984619140625, 0.34344482421875, 0.388427734375, 0.43341064453125, 0.4783935546875, 0.52337646484375, 0.568359375, 0.61334228515625, 0.6583251953125, 0.70330810546875, 0.748291015625, 0.79327392578125, 0.8382568359375, 0.88323974609375, 0.92822265625, 0.97320556640625, 1.0181884765625, 1.06317138671875, 1.108154296875, 1.15313720703125, 1.1981201171875, 1.24310302734375, 1.2880859375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 7.0, 7.0, 19.0, 23.0, 28.0, 48.0, 61.0, 72.0, 87.0, 108.0, 133.0, 97.0, 63.0, 63.0, 52.0, 26.0, 31.0, 13.0, 20.0, 9.0, 9.0, 3.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.037109375, -1.00274658203125, -0.9683837890625, -0.93402099609375, -0.899658203125, -0.86529541015625, -0.8309326171875, -0.79656982421875, -0.76220703125, -0.72784423828125, -0.6934814453125, -0.65911865234375, -0.624755859375, -0.59039306640625, -0.5560302734375, -0.52166748046875, -0.4873046875, -0.45294189453125, -0.4185791015625, -0.38421630859375, -0.349853515625, -0.31549072265625, -0.2811279296875, -0.24676513671875, -0.21240234375, -0.17803955078125, -0.1436767578125, -0.10931396484375, -0.074951171875, -0.04058837890625, -0.0062255859375, 0.02813720703125, 0.0625, 0.09686279296875, 0.1312255859375, 0.16558837890625, 0.199951171875, 0.23431396484375, 0.2686767578125, 0.30303955078125, 0.33740234375, 0.37176513671875, 0.4061279296875, 0.44049072265625, 0.474853515625, 0.50921630859375, 0.5435791015625, 0.57794189453125, 0.6123046875, 0.64666748046875, 0.6810302734375, 0.71539306640625, 0.749755859375, 0.78411865234375, 0.8184814453125, 0.85284423828125, 0.88720703125, 0.92156982421875, 0.9559326171875, 0.99029541015625, 1.024658203125, 1.05902099609375, 1.0933837890625, 1.12774658203125, 1.162109375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 9.0, 28.0, 72.0, 308.0, 392.0, 148.0, 33.0, 7.0, 5.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.756298065185547, -20.25275421142578, -19.749210357666016, -19.245668411254883, -18.742124557495117, -18.23858070373535, -17.73503875732422, -17.231494903564453, -16.727951049804688, -16.224407196044922, -15.720864295959473, -15.217321395874023, -14.713777542114258, -14.210233688354492, -13.706690788269043, -13.203147888183594, -12.699604034423828, -12.196060180664062, -11.692517280578613, -11.188974380493164, -10.685430526733398, -10.181886672973633, -9.678343772888184, -9.174800872802734, -8.671257019042969, -8.167713165283203, -7.664170265197754, -7.1606268882751465, -6.657083511352539, -6.153540134429932, -5.649996757507324, -5.146453380584717, -4.642911911010742, -4.139368534088135, -3.6358251571655273, -3.13228178024292, -2.6287384033203125, -2.125195026397705, -1.6216516494750977, -1.1181082725524902, -0.6145648956298828, -0.11102151870727539, 0.39252185821533203, 0.8960652351379395, 1.3996086120605469, 1.9031519889831543, 2.4066953659057617, 2.910238742828369, 3.4137821197509766, 3.917325496673584, 4.420868873596191, 4.924412250518799, 5.427955627441406, 5.931499004364014, 6.435042381286621, 6.9385857582092285, 7.442129135131836, 7.945672512054443, 8.44921588897705, 8.9527587890625, 9.456302642822266, 9.959846496582031, 10.46338939666748, 10.96693229675293, 11.470476150512695]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 3.0, 4.0, 0.0, 4.0, 3.0, 11.0, 11.0, 15.0, 12.0, 39.0, 45.0, 52.0, 49.0, 86.0, 114.0, 115.0, 93.0, 92.0, 76.0, 48.0, 38.0, 23.0, 15.0, 16.0, 9.0, 4.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.09846305847168, -7.8614397048950195, -7.624416351318359, -7.387392520904541, -7.150369167327881, -6.913345813751221, -6.6763224601745605, -6.439298629760742, -6.202275276184082, -5.965251922607422, -5.728228569030762, -5.491204738616943, -5.254181385040283, -5.017158031463623, -4.780134677886963, -4.5431108474731445, -4.306087493896484, -4.069064140319824, -3.832040548324585, -3.595017194747925, -3.3579936027526855, -3.1209702491760254, -2.8839468955993652, -2.646923303604126, -2.409900188446045, -2.1728768348693848, -1.9358532428741455, -1.6988298892974854, -1.461806297302246, -1.224782943725586, -0.9877594709396362, -0.7507359981536865, -0.5137124061584473, -0.27668893337249756, -0.03966549038887024, 0.19735795259475708, 0.4343814253807068, 0.6714048385620117, 0.9084283113479614, 1.1454517841339111, 1.3824752569198608, 1.6194987297058105, 1.8565222024917603, 2.09354567527771, 2.33056902885437, 2.5675926208496094, 2.8046159744262695, 3.0416393280029297, 3.278662919998169, 3.515686273574829, 3.7527098655700684, 3.9897332191467285, 4.226756572723389, 4.463780403137207, 4.700803756713867, 4.937827110290527, 5.1748504638671875, 5.411873817443848, 5.648897171020508, 5.885921001434326, 6.122944355010986, 6.3599677085876465, 6.596991062164307, 6.834014892578125, 7.071038246154785]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 6.0, 15.0, 9.0, 14.0, 7.0, 14.0, 18.0, 38.0, 27.0, 47.0, 38.0, 66.0, 102.0, 132.0, 180.0, 229.0, 358.0, 547.0, 962.0, 1757.0, 3783.0, 12893.0, 105395.0, 4002422.0, 50020.0, 8954.0, 2888.0, 1392.0, 771.0, 409.0, 286.0, 214.0, 118.0, 59.0, 50.0, 23.0, 13.0, 11.0, 2.0, 5.0, 4.0, 1.0], "bins": [-5.15234375, -5.038787841796875, -4.92523193359375, -4.811676025390625, -4.6981201171875, -4.584564208984375, -4.47100830078125, -4.357452392578125, -4.243896484375, -4.130340576171875, -4.01678466796875, -3.903228759765625, -3.7896728515625, -3.676116943359375, -3.56256103515625, -3.449005126953125, -3.33544921875, -3.221893310546875, -3.10833740234375, -2.994781494140625, -2.8812255859375, -2.767669677734375, -2.65411376953125, -2.540557861328125, -2.427001953125, -2.313446044921875, -2.19989013671875, -2.086334228515625, -1.9727783203125, -1.859222412109375, -1.74566650390625, -1.632110595703125, -1.5185546875, -1.404998779296875, -1.29144287109375, -1.177886962890625, -1.0643310546875, -0.950775146484375, -0.83721923828125, -0.723663330078125, -0.610107421875, -0.496551513671875, -0.38299560546875, -0.269439697265625, -0.1558837890625, -0.042327880859375, 0.07122802734375, 0.184783935546875, 0.29833984375, 0.411895751953125, 0.52545166015625, 0.639007568359375, 0.7525634765625, 0.866119384765625, 0.97967529296875, 1.093231201171875, 1.206787109375, 1.320343017578125, 1.43389892578125, 1.547454833984375, 1.6610107421875, 1.774566650390625, 1.88812255859375, 2.001678466796875, 2.115234375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 1.0, 3.0, 1.0, 7.0, 9.0, 4.0, 12.0, 15.0, 24.0, 55.0, 75.0, 104.0, 133.0, 135.0, 132.0, 94.0, 68.0, 40.0, 23.0, 8.0, 16.0, 9.0, 9.0, 4.0, 6.0, 2.0, 2.0, 6.0, 0.0, 4.0, 4.0], "bins": [-0.2271728515625, -0.22226428985595703, -0.21735572814941406, -0.2124471664428711, -0.20753860473632812, -0.20263004302978516, -0.1977214813232422, -0.19281291961669922, -0.18790435791015625, -0.18299579620361328, -0.1780872344970703, -0.17317867279052734, -0.16827011108398438, -0.1633615493774414, -0.15845298767089844, -0.15354442596435547, -0.1486358642578125, -0.14372730255126953, -0.13881874084472656, -0.1339101791381836, -0.12900161743164062, -0.12409305572509766, -0.11918449401855469, -0.11427593231201172, -0.10936737060546875, -0.10445880889892578, -0.09955024719238281, -0.09464168548583984, -0.08973312377929688, -0.0848245620727539, -0.07991600036621094, -0.07500743865966797, -0.070098876953125, -0.06519031524658203, -0.06028175354003906, -0.055373191833496094, -0.050464630126953125, -0.045556068420410156, -0.04064750671386719, -0.03573894500732422, -0.03083038330078125, -0.02592182159423828, -0.021013259887695312, -0.016104698181152344, -0.011196136474609375, -0.006287574768066406, -0.0013790130615234375, 0.0035295486450195312, 0.0084381103515625, 0.013346672058105469, 0.018255233764648438, 0.023163795471191406, 0.028072357177734375, 0.032980918884277344, 0.03788948059082031, 0.04279804229736328, 0.04770660400390625, 0.05261516571044922, 0.05752372741699219, 0.062432289123535156, 0.06734085083007812, 0.0722494125366211, 0.07715797424316406, 0.08206653594970703, 0.08697509765625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 4.0, 9.0, 7.0, 24.0, 39.0, 77.0, 198.0, 1239.0, 92034.0, 4096814.0, 3307.0, 312.0, 85.0, 44.0, 30.0, 17.0, 11.0, 11.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.171875, -7.871337890625, -7.57080078125, -7.270263671875, -6.9697265625, -6.669189453125, -6.36865234375, -6.068115234375, -5.767578125, -5.467041015625, -5.16650390625, -4.865966796875, -4.5654296875, -4.264892578125, -3.96435546875, -3.663818359375, -3.36328125, -3.062744140625, -2.76220703125, -2.461669921875, -2.1611328125, -1.860595703125, -1.56005859375, -1.259521484375, -0.958984375, -0.658447265625, -0.35791015625, -0.057373046875, 0.2431640625, 0.543701171875, 0.84423828125, 1.144775390625, 1.4453125, 1.745849609375, 2.04638671875, 2.346923828125, 2.6474609375, 2.947998046875, 3.24853515625, 3.549072265625, 3.849609375, 4.150146484375, 4.45068359375, 4.751220703125, 5.0517578125, 5.352294921875, 5.65283203125, 5.953369140625, 6.25390625, 6.554443359375, 6.85498046875, 7.155517578125, 7.4560546875, 7.756591796875, 8.05712890625, 8.357666015625, 8.658203125, 8.958740234375, 9.25927734375, 9.559814453125, 9.8603515625, 10.160888671875, 10.46142578125, 10.761962890625, 11.0625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 1.0, 4.0, 5.0, 9.0, 7.0, 19.0, 13.0, 27.0, 30.0, 49.0, 82.0, 178.0, 562.0, 1849.0, 693.0, 260.0, 106.0, 63.0, 46.0, 19.0, 12.0, 11.0, 7.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.493896484375, -0.4830589294433594, -0.47222137451171875, -0.4613838195800781, -0.4505462646484375, -0.4397087097167969, -0.42887115478515625, -0.4180335998535156, -0.407196044921875, -0.3963584899902344, -0.38552093505859375, -0.3746833801269531, -0.3638458251953125, -0.3530082702636719, -0.34217071533203125, -0.3313331604003906, -0.32049560546875, -0.3096580505371094, -0.29882049560546875, -0.2879829406738281, -0.2771453857421875, -0.2663078308105469, -0.25547027587890625, -0.24463272094726562, -0.233795166015625, -0.22295761108398438, -0.21212005615234375, -0.20128250122070312, -0.1904449462890625, -0.17960739135742188, -0.16876983642578125, -0.15793228149414062, -0.1470947265625, -0.13625717163085938, -0.12541961669921875, -0.11458206176757812, -0.1037445068359375, -0.09290695190429688, -0.08206939697265625, -0.07123184204101562, -0.060394287109375, -0.049556732177734375, -0.03871917724609375, -0.027881622314453125, -0.0170440673828125, -0.006206512451171875, 0.00463104248046875, 0.015468597412109375, 0.02630615234375, 0.037143707275390625, 0.04798126220703125, 0.058818817138671875, 0.0696563720703125, 0.08049392700195312, 0.09133148193359375, 0.10216903686523438, 0.113006591796875, 0.12384414672851562, 0.13468170166015625, 0.14551925659179688, 0.1563568115234375, 0.16719436645507812, 0.17803192138671875, 0.18886947631835938, 0.19970703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 39.0, 637.0, 315.0, 16.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.277685165405273, -18.905841827392578, -18.533998489379883, -18.162155151367188, -17.790311813354492, -17.418468475341797, -17.0466251373291, -16.674781799316406, -16.30293846130371, -15.931095123291016, -15.55925178527832, -15.187408447265625, -14.81556510925293, -14.443721771240234, -14.071878433227539, -13.700035095214844, -13.328192710876465, -12.95634937286377, -12.584506034851074, -12.212662696838379, -11.840819358825684, -11.468976020812988, -11.09713363647461, -10.725290298461914, -10.353446960449219, -9.981603622436523, -9.609760284423828, -9.237916946411133, -8.866073608398438, -8.494230270385742, -8.122386932373047, -7.75054407119751, -7.37869930267334, -7.0068559646606445, -6.635012626647949, -6.263169288635254, -5.891325950622559, -5.519482612609863, -5.147639751434326, -4.775796413421631, -4.4039530754089355, -4.03210973739624, -3.660266399383545, -3.2884232997894287, -2.9165799617767334, -2.544736623764038, -2.172893524169922, -1.8010501861572266, -1.4292068481445312, -1.057363510131836, -0.6855202913284302, -0.3136770725250244, 0.0581662654876709, 0.4300096035003662, 0.8018527030944824, 1.1736960411071777, 1.545539379119873, 1.9173827171325684, 2.2892260551452637, 2.66106915473938, 3.032912492752075, 3.4047558307647705, 3.7765989303588867, 4.148442268371582, 4.520285606384277]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 11.0, 20.0, 41.0, 105.0, 137.0, 190.0, 163.0, 143.0, 91.0, 44.0, 37.0, 13.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.974608421325684, -4.855602741241455, -4.736596584320068, -4.61759090423584, -4.498584747314453, -4.379579067230225, -4.260573387145996, -4.141567230224609, -4.022561550140381, -3.9035556316375732, -3.7845497131347656, -3.665544033050537, -3.5465381145477295, -3.427532196044922, -3.3085265159606934, -3.1895205974578857, -3.070514678955078, -2.9515087604522705, -2.832502841949463, -2.7134971618652344, -2.5944912433624268, -2.475485324859619, -2.3564796447753906, -2.237473726272583, -2.1184678077697754, -1.9994618892669678, -1.8804560899734497, -1.7614502906799316, -1.642444372177124, -1.5234384536743164, -1.4044326543807983, -1.2854268550872803, -1.1664209365844727, -1.047415018081665, -0.928409218788147, -0.8094033598899841, -0.6903975009918213, -0.5713916420936584, -0.4523857831954956, -0.33337992429733276, -0.21437406539916992, -0.09536820650100708, 0.02363765239715576, 0.1426435112953186, 0.26164937019348145, 0.3806552290916443, 0.49966108798980713, 0.61866694688797, 0.7376728057861328, 0.8566786646842957, 0.9756845235824585, 1.0946903228759766, 1.2136962413787842, 1.3327021598815918, 1.4517079591751099, 1.570713758468628, 1.6897196769714355, 1.8087255954742432, 1.9277313947677612, 2.0467371940612793, 2.165743112564087, 2.2847490310668945, 2.403754711151123, 2.5227606296539307, 2.6417665481567383]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 8.0, 5.0, 11.0, 9.0, 12.0, 11.0, 18.0, 29.0, 26.0, 32.0, 32.0, 46.0, 47.0, 75.0, 120.0, 1350.0, 1013665.0, 32360.0, 295.0, 78.0, 64.0, 41.0, 37.0, 29.0, 25.0, 19.0, 18.0, 26.0, 12.0, 16.0, 6.0, 9.0, 5.0, 12.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.8671875, -9.5465087890625, -9.225830078125, -8.9051513671875, -8.58447265625, -8.2637939453125, -7.943115234375, -7.6224365234375, -7.3017578125, -6.9810791015625, -6.660400390625, -6.3397216796875, -6.01904296875, -5.6983642578125, -5.377685546875, -5.0570068359375, -4.736328125, -4.4156494140625, -4.094970703125, -3.7742919921875, -3.45361328125, -3.1329345703125, -2.812255859375, -2.4915771484375, -2.1708984375, -1.8502197265625, -1.529541015625, -1.2088623046875, -0.88818359375, -0.5675048828125, -0.246826171875, 0.0738525390625, 0.39453125, 0.7152099609375, 1.035888671875, 1.3565673828125, 1.67724609375, 1.9979248046875, 2.318603515625, 2.6392822265625, 2.9599609375, 3.2806396484375, 3.601318359375, 3.9219970703125, 4.24267578125, 4.5633544921875, 4.884033203125, 5.2047119140625, 5.525390625, 5.8460693359375, 6.166748046875, 6.4874267578125, 6.80810546875, 7.1287841796875, 7.449462890625, 7.7701416015625, 8.0908203125, 8.4114990234375, 8.732177734375, 9.0528564453125, 9.37353515625, 9.6942138671875, 10.014892578125, 10.3355712890625, 10.65625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 66.0, 313.0, 490.0, 112.0, 18.0, 8.0], "bins": [-1.2265625, -1.2061548233032227, -1.1857471466064453, -1.165339469909668, -1.1449317932128906, -1.1245241165161133, -1.104116439819336, -1.0837087631225586, -1.0633010864257812, -1.042893409729004, -1.0224857330322266, -1.0020780563354492, -0.9816703796386719, -0.9612627029418945, -0.9408550262451172, -0.9204473495483398, -0.9000396728515625, -0.8796319961547852, -0.8592243194580078, -0.8388166427612305, -0.8184089660644531, -0.7980012893676758, -0.7775936126708984, -0.7571859359741211, -0.7367782592773438, -0.7163705825805664, -0.6959629058837891, -0.6755552291870117, -0.6551475524902344, -0.634739875793457, -0.6143321990966797, -0.5939245223999023, -0.573516845703125, -0.5531091690063477, -0.5327014923095703, -0.512293815612793, -0.4918861389160156, -0.4714784622192383, -0.45107078552246094, -0.4306631088256836, -0.41025543212890625, -0.3898477554321289, -0.36944007873535156, -0.3490324020385742, -0.3286247253417969, -0.30821704864501953, -0.2878093719482422, -0.26740169525146484, -0.2469940185546875, -0.22658634185791016, -0.2061786651611328, -0.18577098846435547, -0.16536331176757812, -0.14495563507080078, -0.12454795837402344, -0.1041402816772461, -0.08373260498046875, -0.0633249282836914, -0.04291725158691406, -0.02250957489013672, -0.002101898193359375, 0.01830577850341797, 0.03871345520019531, 0.059121131896972656, 0.07952880859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 15.0, 7.0, 23.0, 23.0, 30.0, 42.0, 93.0, 129.0, 257.0, 625.0, 2211.0, 14256.0, 386842.0, 616509.0, 23143.0, 2804.0, 795.0, 307.0, 148.0, 78.0, 56.0, 39.0, 33.0, 21.0, 10.0, 9.0, 11.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.576171875, -3.457305908203125, -3.33843994140625, -3.219573974609375, -3.1007080078125, -2.981842041015625, -2.86297607421875, -2.744110107421875, -2.625244140625, -2.506378173828125, -2.38751220703125, -2.268646240234375, -2.1497802734375, -2.030914306640625, -1.91204833984375, -1.793182373046875, -1.67431640625, -1.555450439453125, -1.43658447265625, -1.317718505859375, -1.1988525390625, -1.079986572265625, -0.96112060546875, -0.842254638671875, -0.723388671875, -0.604522705078125, -0.48565673828125, -0.366790771484375, -0.2479248046875, -0.129058837890625, -0.01019287109375, 0.108673095703125, 0.2275390625, 0.346405029296875, 0.46527099609375, 0.584136962890625, 0.7030029296875, 0.821868896484375, 0.94073486328125, 1.059600830078125, 1.178466796875, 1.297332763671875, 1.41619873046875, 1.535064697265625, 1.6539306640625, 1.772796630859375, 1.89166259765625, 2.010528564453125, 2.12939453125, 2.248260498046875, 2.36712646484375, 2.485992431640625, 2.6048583984375, 2.723724365234375, 2.84259033203125, 2.961456298828125, 3.080322265625, 3.199188232421875, 3.31805419921875, 3.436920166015625, 3.5557861328125, 3.674652099609375, 3.79351806640625, 3.912384033203125, 4.03125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 15.0, 12.0, 13.0, 21.0, 28.0, 29.0, 41.0, 42.0, 41.0, 49.0, 55.0, 58.0, 69.0, 48.0, 49.0, 70.0, 56.0, 38.0, 43.0, 35.0, 23.0, 28.0, 23.0, 18.0, 15.0, 13.0, 12.0, 10.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86474609375, -0.8339004516601562, -0.8030548095703125, -0.7722091674804688, -0.741363525390625, -0.7105178833007812, -0.6796722412109375, -0.6488265991210938, -0.61798095703125, -0.5871353149414062, -0.5562896728515625, -0.5254440307617188, -0.494598388671875, -0.46375274658203125, -0.4329071044921875, -0.40206146240234375, -0.3712158203125, -0.34037017822265625, -0.3095245361328125, -0.27867889404296875, -0.247833251953125, -0.21698760986328125, -0.1861419677734375, -0.15529632568359375, -0.12445068359375, -0.09360504150390625, -0.0627593994140625, -0.03191375732421875, -0.001068115234375, 0.02977752685546875, 0.0606231689453125, 0.09146881103515625, 0.122314453125, 0.15316009521484375, 0.1840057373046875, 0.21485137939453125, 0.245697021484375, 0.27654266357421875, 0.3073883056640625, 0.33823394775390625, 0.36907958984375, 0.39992523193359375, 0.4307708740234375, 0.46161651611328125, 0.492462158203125, 0.5233078002929688, 0.5541534423828125, 0.5849990844726562, 0.6158447265625, 0.6466903686523438, 0.6775360107421875, 0.7083816528320312, 0.739227294921875, 0.7700729370117188, 0.8009185791015625, 0.8317642211914062, 0.86260986328125, 0.8934555053710938, 0.9243011474609375, 0.9551467895507812, 0.985992431640625, 1.0168380737304688, 1.0476837158203125, 1.0785293579101562, 1.109375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 8.0, 10.0, 12.0, 32.0, 52.0, 90.0, 179.0, 497.0, 1784.0, 10820.0, 609127.0, 414496.0, 8994.0, 1571.0, 471.0, 199.0, 84.0, 50.0, 20.0, 13.0, 5.0, 7.0, 4.0, 6.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.72265625, -3.609710693359375, -3.49676513671875, -3.383819580078125, -3.2708740234375, -3.157928466796875, -3.04498291015625, -2.932037353515625, -2.819091796875, -2.706146240234375, -2.59320068359375, -2.480255126953125, -2.3673095703125, -2.254364013671875, -2.14141845703125, -2.028472900390625, -1.91552734375, -1.802581787109375, -1.68963623046875, -1.576690673828125, -1.4637451171875, -1.350799560546875, -1.23785400390625, -1.124908447265625, -1.011962890625, -0.899017333984375, -0.78607177734375, -0.673126220703125, -0.5601806640625, -0.447235107421875, -0.33428955078125, -0.221343994140625, -0.1083984375, 0.004547119140625, 0.11749267578125, 0.230438232421875, 0.3433837890625, 0.456329345703125, 0.56927490234375, 0.682220458984375, 0.795166015625, 0.908111572265625, 1.02105712890625, 1.134002685546875, 1.2469482421875, 1.359893798828125, 1.47283935546875, 1.585784912109375, 1.69873046875, 1.811676025390625, 1.92462158203125, 2.037567138671875, 2.1505126953125, 2.263458251953125, 2.37640380859375, 2.489349365234375, 2.602294921875, 2.715240478515625, 2.82818603515625, 2.941131591796875, 3.0540771484375, 3.167022705078125, 3.27996826171875, 3.392913818359375, 3.505859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 8.0, 4.0, 9.0, 9.0, 19.0, 29.0, 39.0, 55.0, 85.0, 103.0, 122.0, 132.0, 120.0, 89.0, 52.0, 38.0, 28.0, 18.0, 10.0, 9.0, 9.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019228458404541016, -0.0001863129436969757, -0.00018034130334854126, -0.0001743696630001068, -0.00016839802265167236, -0.00016242638230323792, -0.00015645474195480347, -0.00015048310160636902, -0.00014451146125793457, -0.00013853982090950012, -0.00013256818056106567, -0.00012659654021263123, -0.00012062489986419678, -0.00011465325951576233, -0.00010868161916732788, -0.00010270997881889343, -9.673833847045898e-05, -9.076669812202454e-05, -8.479505777359009e-05, -7.882341742515564e-05, -7.285177707672119e-05, -6.688013672828674e-05, -6.0908496379852295e-05, -5.493685603141785e-05, -4.89652156829834e-05, -4.299357533454895e-05, -3.70219349861145e-05, -3.1050294637680054e-05, -2.5078654289245605e-05, -1.9107013940811157e-05, -1.3135373592376709e-05, -7.163733243942261e-06, -1.1920928955078125e-06, 4.779547452926636e-06, 1.0751187801361084e-05, 1.6722828149795532e-05, 2.269446849822998e-05, 2.866610884666443e-05, 3.463774919509888e-05, 4.0609389543533325e-05, 4.6581029891967773e-05, 5.255267024040222e-05, 5.852431058883667e-05, 6.449595093727112e-05, 7.046759128570557e-05, 7.643923163414001e-05, 8.241087198257446e-05, 8.838251233100891e-05, 9.435415267944336e-05, 0.00010032579302787781, 0.00010629743337631226, 0.0001122690737247467, 0.00011824071407318115, 0.0001242123544216156, 0.00013018399477005005, 0.0001361556351184845, 0.00014212727546691895, 0.0001480989158153534, 0.00015407055616378784, 0.0001600421965122223, 0.00016601383686065674, 0.0001719854772090912, 0.00017795711755752563, 0.00018392875790596008, 0.00018990039825439453]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 5.0, 14.0, 21.0, 25.0, 51.0, 76.0, 142.0, 315.0, 815.0, 2616.0, 17818.0, 873637.0, 143643.0, 6887.0, 1501.0, 514.0, 183.0, 112.0, 47.0, 35.0, 15.0, 18.0, 13.0, 4.0, 6.0, 5.0, 4.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.740234375, -3.6326904296875, -3.525146484375, -3.4176025390625, -3.31005859375, -3.2025146484375, -3.094970703125, -2.9874267578125, -2.8798828125, -2.7723388671875, -2.664794921875, -2.5572509765625, -2.44970703125, -2.3421630859375, -2.234619140625, -2.1270751953125, -2.01953125, -1.9119873046875, -1.804443359375, -1.6968994140625, -1.58935546875, -1.4818115234375, -1.374267578125, -1.2667236328125, -1.1591796875, -1.0516357421875, -0.944091796875, -0.8365478515625, -0.72900390625, -0.6214599609375, -0.513916015625, -0.4063720703125, -0.298828125, -0.1912841796875, -0.083740234375, 0.0238037109375, 0.13134765625, 0.2388916015625, 0.346435546875, 0.4539794921875, 0.5615234375, 0.6690673828125, 0.776611328125, 0.8841552734375, 0.99169921875, 1.0992431640625, 1.206787109375, 1.3143310546875, 1.421875, 1.5294189453125, 1.636962890625, 1.7445068359375, 1.85205078125, 1.9595947265625, 2.067138671875, 2.1746826171875, 2.2822265625, 2.3897705078125, 2.497314453125, 2.6048583984375, 2.71240234375, 2.8199462890625, 2.927490234375, 3.0350341796875, 3.142578125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 3.0, 4.0, 11.0, 16.0, 18.0, 29.0, 38.0, 57.0, 111.0, 143.0, 164.0, 154.0, 71.0, 59.0, 51.0, 18.0, 16.0, 12.0, 8.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.2509765625, -1.2191619873046875, -1.187347412109375, -1.1555328369140625, -1.12371826171875, -1.0919036865234375, -1.060089111328125, -1.0282745361328125, -0.9964599609375, -0.9646453857421875, -0.932830810546875, -0.9010162353515625, -0.86920166015625, -0.8373870849609375, -0.805572509765625, -0.7737579345703125, -0.741943359375, -0.7101287841796875, -0.678314208984375, -0.6464996337890625, -0.61468505859375, -0.5828704833984375, -0.551055908203125, -0.5192413330078125, -0.4874267578125, -0.4556121826171875, -0.423797607421875, -0.3919830322265625, -0.36016845703125, -0.3283538818359375, -0.296539306640625, -0.2647247314453125, -0.23291015625, -0.2010955810546875, -0.169281005859375, -0.1374664306640625, -0.10565185546875, -0.0738372802734375, -0.042022705078125, -0.0102081298828125, 0.0216064453125, 0.0534210205078125, 0.085235595703125, 0.1170501708984375, 0.14886474609375, 0.1806793212890625, 0.212493896484375, 0.2443084716796875, 0.276123046875, 0.3079376220703125, 0.339752197265625, 0.3715667724609375, 0.40338134765625, 0.4351959228515625, 0.467010498046875, 0.4988250732421875, 0.5306396484375, 0.5624542236328125, 0.594268798828125, 0.6260833740234375, 0.65789794921875, 0.6897125244140625, 0.721527099609375, 0.7533416748046875, 0.78515625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 30.0, 433.0, 446.0, 83.0, 10.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-64.10663604736328, -62.76987838745117, -61.43312072753906, -60.09636306762695, -58.759605407714844, -57.422847747802734, -56.086090087890625, -54.74933624267578, -53.412574768066406, -52.0758171081543, -50.73905944824219, -49.40230178833008, -48.06554412841797, -46.72878646850586, -45.39202880859375, -44.055274963378906, -42.7185173034668, -41.38175964355469, -40.04500198364258, -38.70824432373047, -37.37148666381836, -36.03472900390625, -34.697975158691406, -33.36121368408203, -32.02445983886719, -30.687702178955078, -29.35094451904297, -28.01418685913086, -26.67742919921875, -25.34067153930664, -24.003915786743164, -22.667158126831055, -21.330400466918945, -19.993642807006836, -18.656885147094727, -17.32012939453125, -15.983370780944824, -14.646613121032715, -13.309856414794922, -11.973098754882812, -10.636341094970703, -9.299583435058594, -7.962826251983643, -6.626069068908691, -5.289311408996582, -3.9525537490844727, -2.6157970428466797, -1.2790393829345703, 0.05771827697753906, 1.3944756984710693, 2.7312331199645996, 4.067990303039551, 5.40474796295166, 6.7415056228637695, 8.078262329101562, 9.415019989013672, 10.751777648925781, 12.08853530883789, 13.42529296875, 14.762049674987793, 16.09880828857422, 17.435565948486328, 18.772321701049805, 20.109079360961914, 21.445837020874023]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 11.0, 12.0, 14.0, 25.0, 24.0, 33.0, 28.0, 45.0, 60.0, 62.0, 77.0, 66.0, 72.0, 58.0, 63.0, 64.0, 52.0, 50.0, 50.0, 41.0, 26.0, 21.0, 14.0, 7.0, 8.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-11.261678695678711, -11.014328002929688, -10.766977310180664, -10.519627571105957, -10.272276878356934, -10.02492618560791, -9.777576446533203, -9.53022575378418, -9.282875061035156, -9.035524368286133, -8.78817367553711, -8.540823936462402, -8.293473243713379, -8.046122550964355, -7.79877233505249, -7.551422119140625, -7.304071426391602, -7.056720733642578, -6.809370517730713, -6.562020301818848, -6.314669609069824, -6.067318916320801, -5.8199687004089355, -5.57261848449707, -5.325267791748047, -5.077917098999023, -4.830566883087158, -4.583216667175293, -4.3358659744262695, -4.088515281677246, -3.841165065765381, -3.5938146114349365, -3.3464646339416504, -3.099114179611206, -2.8517637252807617, -2.6044132709503174, -2.357062816619873, -2.1097123622894287, -1.8623619079589844, -1.61501145362854, -1.3676609992980957, -1.1203105449676514, -0.872960090637207, -0.6256096363067627, -0.37825918197631836, -0.13090872764587402, 0.11644172668457031, 0.36379218101501465, 0.611142635345459, 0.8584930896759033, 1.1058435440063477, 1.353193998336792, 1.6005444526672363, 1.8478949069976807, 2.095245361328125, 2.3425958156585693, 2.5899462699890137, 2.837296724319458, 3.0846471786499023, 3.3319976329803467, 3.579348087310791, 3.8266985416412354, 4.07404899597168, 4.321399688720703, 4.568749904632568]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 7.0, 8.0, 8.0, 22.0, 20.0, 34.0, 38.0, 79.0, 128.0, 259.0, 1171.0, 4106470.0, 85646.0, 278.0, 72.0, 26.0, 15.0, 5.0], "bins": [-41.78125, -41.0594482421875, -40.337646484375, -39.6158447265625, -38.89404296875, -38.1722412109375, -37.450439453125, -36.7286376953125, -36.0068359375, -35.2850341796875, -34.563232421875, -33.8414306640625, -33.11962890625, -32.3978271484375, -31.676025390625, -30.9542236328125, -30.232421875, -29.5106201171875, -28.788818359375, -28.0670166015625, -27.34521484375, -26.6234130859375, -25.901611328125, -25.1798095703125, -24.4580078125, -23.7362060546875, -23.014404296875, -22.2926025390625, -21.57080078125, -20.8489990234375, -20.127197265625, -19.4053955078125, -18.68359375, -17.9617919921875, -17.239990234375, -16.5181884765625, -15.79638671875, -15.0745849609375, -14.352783203125, -13.6309814453125, -12.9091796875, -12.1873779296875, -11.465576171875, -10.7437744140625, -10.02197265625, -9.3001708984375, -8.578369140625, -7.8565673828125, -7.134765625, -6.4129638671875, -5.691162109375, -4.9693603515625, -4.24755859375, -3.5257568359375, -2.803955078125, -2.0821533203125, -1.3603515625, -0.6385498046875, 0.083251953125, 0.8050537109375, 1.52685546875, 2.2486572265625, 2.970458984375, 3.6922607421875, 4.4140625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 13.0, 43.0, 124.0, 243.0, 308.0, 180.0, 62.0, 26.0, 10.0], "bins": [-1.2763671875, -1.2547712326049805, -1.233175277709961, -1.2115793228149414, -1.1899833679199219, -1.1683874130249023, -1.1467914581298828, -1.1251955032348633, -1.1035995483398438, -1.0820035934448242, -1.0604076385498047, -1.0388116836547852, -1.0172157287597656, -0.9956197738647461, -0.9740238189697266, -0.952427864074707, -0.9308319091796875, -0.909235954284668, -0.8876399993896484, -0.8660440444946289, -0.8444480895996094, -0.8228521347045898, -0.8012561798095703, -0.7796602249145508, -0.7580642700195312, -0.7364683151245117, -0.7148723602294922, -0.6932764053344727, -0.6716804504394531, -0.6500844955444336, -0.6284885406494141, -0.6068925857543945, -0.585296630859375, -0.5637006759643555, -0.5421047210693359, -0.5205087661743164, -0.4989128112792969, -0.47731685638427734, -0.4557209014892578, -0.4341249465942383, -0.41252899169921875, -0.3909330368041992, -0.3693370819091797, -0.34774112701416016, -0.3261451721191406, -0.3045492172241211, -0.28295326232910156, -0.26135730743408203, -0.2397613525390625, -0.21816539764404297, -0.19656944274902344, -0.1749734878540039, -0.15337753295898438, -0.13178157806396484, -0.11018562316894531, -0.08858966827392578, -0.06699371337890625, -0.04539775848388672, -0.023801803588867188, -0.0022058486938476562, 0.019390106201171875, 0.040986061096191406, 0.06258201599121094, 0.08417797088623047, 0.10577392578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 14.0, 25.0, 52.0, 88.0, 160.0, 302.0, 1996.0, 4190529.0, 713.0, 216.0, 103.0, 51.0, 19.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.9375, -78.134765625, -76.33203125, -74.529296875, -72.7265625, -70.923828125, -69.12109375, -67.318359375, -65.515625, -63.712890625, -61.91015625, -60.107421875, -58.3046875, -56.501953125, -54.69921875, -52.896484375, -51.09375, -49.291015625, -47.48828125, -45.685546875, -43.8828125, -42.080078125, -40.27734375, -38.474609375, -36.671875, -34.869140625, -33.06640625, -31.263671875, -29.4609375, -27.658203125, -25.85546875, -24.052734375, -22.25, -20.447265625, -18.64453125, -16.841796875, -15.0390625, -13.236328125, -11.43359375, -9.630859375, -7.828125, -6.025390625, -4.22265625, -2.419921875, -0.6171875, 1.185546875, 2.98828125, 4.791015625, 6.59375, 8.396484375, 10.19921875, 12.001953125, 13.8046875, 15.607421875, 17.41015625, 19.212890625, 21.015625, 22.818359375, 24.62109375, 26.423828125, 28.2265625, 30.029296875, 31.83203125, 33.634765625, 35.4375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 54.0, 453.0, 3419.0, 114.0, 24.0, 12.0, 7.0, 1.0, 3.0], "bins": [-6.484375, -6.371040344238281, -6.2577056884765625, -6.144371032714844, -6.031036376953125, -5.917701721191406, -5.8043670654296875, -5.691032409667969, -5.57769775390625, -5.464363098144531, -5.3510284423828125, -5.237693786621094, -5.124359130859375, -5.011024475097656, -4.8976898193359375, -4.784355163574219, -4.6710205078125, -4.557685852050781, -4.4443511962890625, -4.331016540527344, -4.217681884765625, -4.104347229003906, -3.9910125732421875, -3.8776779174804688, -3.76434326171875, -3.6510086059570312, -3.5376739501953125, -3.4243392944335938, -3.311004638671875, -3.1976699829101562, -3.0843353271484375, -2.9710006713867188, -2.857666015625, -2.7443313598632812, -2.6309967041015625, -2.5176620483398438, -2.404327392578125, -2.2909927368164062, -2.1776580810546875, -2.0643234252929688, -1.95098876953125, -1.8376541137695312, -1.7243194580078125, -1.6109848022460938, -1.497650146484375, -1.3843154907226562, -1.2709808349609375, -1.1576461791992188, -1.0443115234375, -0.9309768676757812, -0.8176422119140625, -0.7043075561523438, -0.590972900390625, -0.47763824462890625, -0.3643035888671875, -0.25096893310546875, -0.13763427734375, -0.02429962158203125, 0.0890350341796875, 0.20236968994140625, 0.315704345703125, 0.42903900146484375, 0.5423736572265625, 0.6557083129882812, 0.76904296875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 12.0, 187.0, 773.0, 32.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.92539978027344, -73.57017517089844, -71.2149429321289, -68.8597183227539, -66.50448608398438, -64.14926147460938, -61.79403305053711, -59.438804626464844, -57.083580017089844, -54.72835159301758, -52.37312316894531, -50.01789855957031, -47.66267013549805, -45.30744171142578, -42.952213287353516, -40.59698486328125, -38.241756439208984, -35.88652801513672, -33.53129959106445, -31.17607307434082, -28.820846557617188, -26.465618133544922, -24.110389709472656, -21.755163192749023, -19.399934768676758, -17.044706344604492, -14.68947982788086, -12.334251403808594, -9.979023933410645, -7.623796463012695, -5.26856803894043, -2.913341522216797, -0.5581130981445312, 1.797114610671997, 4.152342319488525, 6.507570266723633, 8.862797737121582, 11.218025207519531, 13.573253631591797, 15.92848014831543, 18.283708572387695, 20.63893699645996, 22.994163513183594, 25.34939193725586, 27.704620361328125, 30.059846878051758, 32.415077209472656, 34.770301818847656, 37.12553024291992, 39.48075866699219, 41.83598709106445, 44.19121551513672, 46.54644012451172, 48.901668548583984, 51.25689697265625, 53.61212158203125, 55.96735382080078, 58.32258224487305, 60.67781066894531, 63.03303527832031, 65.38826751708984, 67.74349212646484, 70.09872436523438, 72.45394897460938, 74.80917358398438]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 11.0, 26.0, 34.0, 68.0, 111.0, 151.0, 150.0, 156.0, 110.0, 80.0, 45.0, 39.0, 11.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.098915100097656, -19.478059768676758, -18.857202529907227, -18.236347198486328, -17.615489959716797, -16.9946346282959, -16.373777389526367, -15.752922058105469, -15.132065773010254, -14.511209487915039, -13.890353202819824, -13.26949691772461, -12.648641586303711, -12.02778434753418, -11.406929016113281, -10.786072731018066, -10.165216445922852, -9.544360160827637, -8.923503875732422, -8.302647590637207, -7.68179178237915, -7.0609354972839355, -6.440079689025879, -5.819223403930664, -5.198367118835449, -4.577510833740234, -3.9566547870635986, -3.335798740386963, -2.714942455291748, -2.094086170196533, -1.4732301235198975, -0.8523740768432617, -0.2315196990966797, 0.3893364667892456, 1.010192632675171, 1.6310487985610962, 2.2519049644470215, 2.8727612495422363, 3.493617296218872, 4.114473342895508, 4.735329627990723, 5.3561859130859375, 5.977042198181152, 6.597898006439209, 7.218754291534424, 7.839610576629639, 8.460466384887695, 9.08132266998291, 9.702178955078125, 10.32303524017334, 10.943891525268555, 11.56474781036377, 12.185604095458984, 12.806459426879883, 13.427315711975098, 14.048171997070312, 14.669028282165527, 15.289884567260742, 15.910740852355957, 16.531597137451172, 17.15245246887207, 17.7733097076416, 18.3941650390625, 19.01502227783203, 19.63587760925293]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 10.0, 14.0, 13.0, 25.0, 34.0, 43.0, 59.0, 90.0, 175.0, 432.0, 1260.0, 5395.0, 108479.0, 901377.0, 26835.0, 2809.0, 835.0, 290.0, 121.0, 86.0, 55.0, 33.0, 18.0, 19.0, 11.0, 13.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.0078125, -12.628662109375, -12.24951171875, -11.870361328125, -11.4912109375, -11.112060546875, -10.73291015625, -10.353759765625, -9.974609375, -9.595458984375, -9.21630859375, -8.837158203125, -8.4580078125, -8.078857421875, -7.69970703125, -7.320556640625, -6.94140625, -6.562255859375, -6.18310546875, -5.803955078125, -5.4248046875, -5.045654296875, -4.66650390625, -4.287353515625, -3.908203125, -3.529052734375, -3.14990234375, -2.770751953125, -2.3916015625, -2.012451171875, -1.63330078125, -1.254150390625, -0.875, -0.495849609375, -0.11669921875, 0.262451171875, 0.6416015625, 1.020751953125, 1.39990234375, 1.779052734375, 2.158203125, 2.537353515625, 2.91650390625, 3.295654296875, 3.6748046875, 4.053955078125, 4.43310546875, 4.812255859375, 5.19140625, 5.570556640625, 5.94970703125, 6.328857421875, 6.7080078125, 7.087158203125, 7.46630859375, 7.845458984375, 8.224609375, 8.603759765625, 8.98291015625, 9.362060546875, 9.7412109375, 10.120361328125, 10.49951171875, 10.878662109375, 11.2578125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 21.0, 27.0, 69.0, 100.0, 156.0, 156.0, 185.0, 103.0, 85.0, 54.0, 27.0, 12.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7373046875, -1.7008209228515625, -1.664337158203125, -1.6278533935546875, -1.59136962890625, -1.5548858642578125, -1.518402099609375, -1.4819183349609375, -1.4454345703125, -1.4089508056640625, -1.372467041015625, -1.3359832763671875, -1.29949951171875, -1.2630157470703125, -1.226531982421875, -1.1900482177734375, -1.153564453125, -1.1170806884765625, -1.080596923828125, -1.0441131591796875, -1.00762939453125, -0.9711456298828125, -0.934661865234375, -0.8981781005859375, -0.8616943359375, -0.8252105712890625, -0.788726806640625, -0.7522430419921875, -0.71575927734375, -0.6792755126953125, -0.642791748046875, -0.6063079833984375, -0.56982421875, -0.5333404541015625, -0.496856689453125, -0.4603729248046875, -0.42388916015625, -0.3874053955078125, -0.350921630859375, -0.3144378662109375, -0.2779541015625, -0.2414703369140625, -0.204986572265625, -0.1685028076171875, -0.13201904296875, -0.0955352783203125, -0.059051513671875, -0.0225677490234375, 0.013916015625, 0.0503997802734375, 0.086883544921875, 0.1233673095703125, 0.15985107421875, 0.1963348388671875, 0.232818603515625, 0.2693023681640625, 0.3057861328125, 0.3422698974609375, 0.378753662109375, 0.4152374267578125, 0.45172119140625, 0.4882049560546875, 0.524688720703125, 0.5611724853515625, 0.59765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 7.0, 12.0, 10.0, 8.0, 8.0, 18.0, 23.0, 23.0, 40.0, 61.0, 80.0, 139.0, 207.0, 453.0, 1003.0, 3476.0, 26988.0, 695273.0, 302689.0, 14061.0, 2310.0, 761.0, 357.0, 184.0, 107.0, 77.0, 53.0, 28.0, 24.0, 24.0, 10.0, 9.0, 6.0, 6.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6640625, -6.478271484375, -6.29248046875, -6.106689453125, -5.9208984375, -5.735107421875, -5.54931640625, -5.363525390625, -5.177734375, -4.991943359375, -4.80615234375, -4.620361328125, -4.4345703125, -4.248779296875, -4.06298828125, -3.877197265625, -3.69140625, -3.505615234375, -3.31982421875, -3.134033203125, -2.9482421875, -2.762451171875, -2.57666015625, -2.390869140625, -2.205078125, -2.019287109375, -1.83349609375, -1.647705078125, -1.4619140625, -1.276123046875, -1.09033203125, -0.904541015625, -0.71875, -0.532958984375, -0.34716796875, -0.161376953125, 0.0244140625, 0.210205078125, 0.39599609375, 0.581787109375, 0.767578125, 0.953369140625, 1.13916015625, 1.324951171875, 1.5107421875, 1.696533203125, 1.88232421875, 2.068115234375, 2.25390625, 2.439697265625, 2.62548828125, 2.811279296875, 2.9970703125, 3.182861328125, 3.36865234375, 3.554443359375, 3.740234375, 3.926025390625, 4.11181640625, 4.297607421875, 4.4833984375, 4.669189453125, 4.85498046875, 5.040771484375, 5.2265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 10.0, 4.0, 9.0, 7.0, 10.0, 13.0, 24.0, 27.0, 30.0, 28.0, 35.0, 41.0, 45.0, 75.0, 67.0, 59.0, 76.0, 66.0, 65.0, 46.0, 55.0, 36.0, 34.0, 25.0, 24.0, 19.0, 11.0, 15.0, 8.0, 13.0, 7.0, 5.0, 8.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26953125, -2.199554443359375, -2.12957763671875, -2.059600830078125, -1.9896240234375, -1.919647216796875, -1.84967041015625, -1.779693603515625, -1.709716796875, -1.639739990234375, -1.56976318359375, -1.499786376953125, -1.4298095703125, -1.359832763671875, -1.28985595703125, -1.219879150390625, -1.14990234375, -1.079925537109375, -1.00994873046875, -0.939971923828125, -0.8699951171875, -0.800018310546875, -0.73004150390625, -0.660064697265625, -0.590087890625, -0.520111083984375, -0.45013427734375, -0.380157470703125, -0.3101806640625, -0.240203857421875, -0.17022705078125, -0.100250244140625, -0.0302734375, 0.039703369140625, 0.10968017578125, 0.179656982421875, 0.2496337890625, 0.319610595703125, 0.38958740234375, 0.459564208984375, 0.529541015625, 0.599517822265625, 0.66949462890625, 0.739471435546875, 0.8094482421875, 0.879425048828125, 0.94940185546875, 1.019378662109375, 1.08935546875, 1.159332275390625, 1.22930908203125, 1.299285888671875, 1.3692626953125, 1.439239501953125, 1.50921630859375, 1.579193115234375, 1.649169921875, 1.719146728515625, 1.78912353515625, 1.859100341796875, 1.9290771484375, 1.999053955078125, 2.06903076171875, 2.139007568359375, 2.208984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 5.0, 15.0, 27.0, 72.0, 127.0, 401.0, 1893.0, 128594.0, 912980.0, 3553.0, 538.0, 194.0, 77.0, 32.0, 25.0, 9.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.1796875, -12.8875732421875, -12.595458984375, -12.3033447265625, -12.01123046875, -11.7191162109375, -11.427001953125, -11.1348876953125, -10.8427734375, -10.5506591796875, -10.258544921875, -9.9664306640625, -9.67431640625, -9.3822021484375, -9.090087890625, -8.7979736328125, -8.505859375, -8.2137451171875, -7.921630859375, -7.6295166015625, -7.33740234375, -7.0452880859375, -6.753173828125, -6.4610595703125, -6.1689453125, -5.8768310546875, -5.584716796875, -5.2926025390625, -5.00048828125, -4.7083740234375, -4.416259765625, -4.1241455078125, -3.83203125, -3.5399169921875, -3.247802734375, -2.9556884765625, -2.66357421875, -2.3714599609375, -2.079345703125, -1.7872314453125, -1.4951171875, -1.2030029296875, -0.910888671875, -0.6187744140625, -0.32666015625, -0.0345458984375, 0.257568359375, 0.5496826171875, 0.841796875, 1.1339111328125, 1.426025390625, 1.7181396484375, 2.01025390625, 2.3023681640625, 2.594482421875, 2.8865966796875, 3.1787109375, 3.4708251953125, 3.762939453125, 4.0550537109375, 4.34716796875, 4.6392822265625, 4.931396484375, 5.2235107421875, 5.515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 1.0, 11.0, 17.0, 14.0, 21.0, 44.0, 66.0, 128.0, 204.0, 208.0, 117.0, 42.0, 32.0, 25.0, 12.0, 12.0, 7.0, 5.0, 5.0, 3.0, 2.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0004940032958984375, -0.0004819035530090332, -0.0004698038101196289, -0.0004577040672302246, -0.0004456043243408203, -0.000433504581451416, -0.0004214048385620117, -0.0004093050956726074, -0.0003972053527832031, -0.00038510560989379883, -0.00037300586700439453, -0.00036090612411499023, -0.00034880638122558594, -0.00033670663833618164, -0.00032460689544677734, -0.00031250715255737305, -0.00030040740966796875, -0.00028830766677856445, -0.00027620792388916016, -0.00026410818099975586, -0.00025200843811035156, -0.00023990869522094727, -0.00022780895233154297, -0.00021570920944213867, -0.00020360946655273438, -0.00019150972366333008, -0.00017940998077392578, -0.00016731023788452148, -0.0001552104949951172, -0.0001431107521057129, -0.0001310110092163086, -0.0001189112663269043, -0.0001068115234375, -9.47117805480957e-05, -8.26120376586914e-05, -7.051229476928711e-05, -5.841255187988281e-05, -4.6312808990478516e-05, -3.421306610107422e-05, -2.2113323211669922e-05, -1.0013580322265625e-05, 2.086162567138672e-06, 1.4185905456542969e-05, 2.6285648345947266e-05, 3.838539123535156e-05, 5.048513412475586e-05, 6.258487701416016e-05, 7.468461990356445e-05, 8.678436279296875e-05, 9.888410568237305e-05, 0.00011098384857177734, 0.00012308359146118164, 0.00013518333435058594, 0.00014728307723999023, 0.00015938282012939453, 0.00017148256301879883, 0.00018358230590820312, 0.00019568204879760742, 0.00020778179168701172, 0.00021988153457641602, 0.0002319812774658203, 0.0002440810203552246, 0.0002561807632446289, 0.0002682805061340332, 0.0002803802490234375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 6.0, 25.0, 46.0, 77.0, 149.0, 394.0, 1563.0, 16094.0, 981670.0, 44957.0, 2676.0, 511.0, 178.0, 69.0, 55.0, 28.0, 16.0, 12.0, 6.0, 8.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-8.5, -8.313751220703125, -8.12750244140625, -7.941253662109375, -7.7550048828125, -7.568756103515625, -7.38250732421875, -7.196258544921875, -7.010009765625, -6.823760986328125, -6.63751220703125, -6.451263427734375, -6.2650146484375, -6.078765869140625, -5.89251708984375, -5.706268310546875, -5.52001953125, -5.333770751953125, -5.14752197265625, -4.961273193359375, -4.7750244140625, -4.588775634765625, -4.40252685546875, -4.216278076171875, -4.030029296875, -3.843780517578125, -3.65753173828125, -3.471282958984375, -3.2850341796875, -3.098785400390625, -2.91253662109375, -2.726287841796875, -2.5400390625, -2.353790283203125, -2.16754150390625, -1.981292724609375, -1.7950439453125, -1.608795166015625, -1.42254638671875, -1.236297607421875, -1.050048828125, -0.863800048828125, -0.67755126953125, -0.491302490234375, -0.3050537109375, -0.118804931640625, 0.06744384765625, 0.253692626953125, 0.43994140625, 0.626190185546875, 0.81243896484375, 0.998687744140625, 1.1849365234375, 1.371185302734375, 1.55743408203125, 1.743682861328125, 1.929931640625, 2.116180419921875, 2.30242919921875, 2.488677978515625, 2.6749267578125, 2.861175537109375, 3.04742431640625, 3.233673095703125, 3.419921875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 10.0, 15.0, 18.0, 26.0, 49.0, 79.0, 158.0, 206.0, 168.0, 110.0, 49.0, 30.0, 22.0, 14.0, 6.0, 13.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.9462890625, -1.8945770263671875, -1.842864990234375, -1.7911529541015625, -1.73944091796875, -1.6877288818359375, -1.636016845703125, -1.5843048095703125, -1.5325927734375, -1.4808807373046875, -1.429168701171875, -1.3774566650390625, -1.32574462890625, -1.2740325927734375, -1.222320556640625, -1.1706085205078125, -1.118896484375, -1.0671844482421875, -1.015472412109375, -0.9637603759765625, -0.91204833984375, -0.8603363037109375, -0.808624267578125, -0.7569122314453125, -0.7052001953125, -0.6534881591796875, -0.601776123046875, -0.5500640869140625, -0.49835205078125, -0.4466400146484375, -0.394927978515625, -0.3432159423828125, -0.29150390625, -0.2397918701171875, -0.188079833984375, -0.1363677978515625, -0.08465576171875, -0.0329437255859375, 0.018768310546875, 0.0704803466796875, 0.1221923828125, 0.1739044189453125, 0.225616455078125, 0.2773284912109375, 0.32904052734375, 0.3807525634765625, 0.432464599609375, 0.4841766357421875, 0.535888671875, 0.5876007080078125, 0.639312744140625, 0.6910247802734375, 0.74273681640625, 0.7944488525390625, 0.846160888671875, 0.8978729248046875, 0.9495849609375, 1.0012969970703125, 1.053009033203125, 1.1047210693359375, 1.15643310546875, 1.2081451416015625, 1.259857177734375, 1.3115692138671875, 1.36328125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 33.0, 508.0, 426.0, 32.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.5018081665039, -114.94254302978516, -112.38328552246094, -109.82402038574219, -107.26475524902344, -104.70549011230469, -102.14623260498047, -99.58696746826172, -97.0277099609375, -94.46844482421875, -91.90918731689453, -89.34992218017578, -86.79065704345703, -84.23139953613281, -81.67213439941406, -79.11286926269531, -76.55360412597656, -73.99433898925781, -71.4350814819336, -68.87581634521484, -66.3165512084961, -63.75728988647461, -61.198028564453125, -58.638763427734375, -56.07950210571289, -53.520240783691406, -50.960975646972656, -48.40171432495117, -45.84245300292969, -43.28318786621094, -40.72392654418945, -38.16466522216797, -35.60540008544922, -33.046138763427734, -30.486873626708984, -27.9276123046875, -25.368349075317383, -22.809085845947266, -20.24982452392578, -17.690561294555664, -15.131298065185547, -12.57203483581543, -10.012772560119629, -7.45350980758667, -4.894247055053711, -2.3349838256835938, 0.22427845001220703, 2.783540725708008, 5.342803955078125, 7.902066707611084, 10.461329460144043, 13.020591735839844, 15.579854965209961, 18.139118194580078, 20.698379516601562, 23.25764274597168, 25.816905975341797, 28.376169204711914, 30.93543243408203, 33.494693756103516, 36.053955078125, 38.61322021484375, 41.172481536865234, 43.73174285888672, 46.29100799560547]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 14.0, 8.0, 17.0, 30.0, 24.0, 37.0, 34.0, 47.0, 52.0, 63.0, 66.0, 50.0, 68.0, 59.0, 67.0, 55.0, 58.0, 44.0, 34.0, 31.0, 30.0, 22.0, 24.0, 17.0, 16.0, 9.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.444101333618164, -12.952472686767578, -12.460844039916992, -11.969215393066406, -11.477587699890137, -10.98595905303955, -10.494330406188965, -10.002701759338379, -9.511073112487793, -9.019444465637207, -8.527815818786621, -8.036188125610352, -7.544559001922607, -7.05293083190918, -6.561302185058594, -6.069673538208008, -5.57804536819458, -5.086416721343994, -4.594788551330566, -4.1031599044799805, -3.6115312576293945, -3.1199028491973877, -2.628274440765381, -2.136645793914795, -1.645017385482788, -1.1533888578414917, -0.6617603898048401, -0.17013192176818848, 0.3214966058731079, 0.8131251335144043, 1.3047535419464111, 1.796382188796997, 2.288010597229004, 2.7796390056610107, 3.2712676525115967, 3.7628960609436035, 4.2545247077941895, 4.746152877807617, 5.237781524658203, 5.729410171508789, 6.221038818359375, 6.712667465209961, 7.204295635223389, 7.695924282073975, 8.187552452087402, 8.679181098937988, 9.170809745788574, 9.66243839263916, 10.15406608581543, 10.645694732666016, 11.137323379516602, 11.628952026367188, 12.120579719543457, 12.612208366394043, 13.103837013244629, 13.595465660095215, 14.0870943069458, 14.578722953796387, 15.070351600646973, 15.561979293823242, 16.053607940673828, 16.545236587524414, 17.036865234375, 17.528493881225586, 18.020122528076172]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 1.0, 4.0, 5.0, 6.0, 3.0, 7.0, 8.0, 7.0, 4.0, 12.0, 6.0, 10.0, 14.0, 12.0, 20.0, 10.0, 18.0, 36.0, 47.0, 65.0, 81.0, 129.0, 196.0, 320.0, 722.0, 1920.0, 6627.0, 30660.0, 3705365.0, 418133.0, 21716.0, 5394.0, 1637.0, 582.0, 217.0, 126.0, 76.0, 37.0, 21.0, 14.0, 4.0, 3.0, 3.0, 1.0, 2.0], "bins": [-10.96875, -10.739715576171875, -10.51068115234375, -10.281646728515625, -10.0526123046875, -9.823577880859375, -9.59454345703125, -9.365509033203125, -9.136474609375, -8.907440185546875, -8.67840576171875, -8.449371337890625, -8.2203369140625, -7.991302490234375, -7.76226806640625, -7.533233642578125, -7.30419921875, -7.075164794921875, -6.84613037109375, -6.617095947265625, -6.3880615234375, -6.159027099609375, -5.92999267578125, -5.700958251953125, -5.471923828125, -5.242889404296875, -5.01385498046875, -4.784820556640625, -4.5557861328125, -4.326751708984375, -4.09771728515625, -3.868682861328125, -3.6396484375, -3.410614013671875, -3.18157958984375, -2.952545166015625, -2.7235107421875, -2.494476318359375, -2.26544189453125, -2.036407470703125, -1.807373046875, -1.578338623046875, -1.34930419921875, -1.120269775390625, -0.8912353515625, -0.662200927734375, -0.43316650390625, -0.204132080078125, 0.02490234375, 0.253936767578125, 0.48297119140625, 0.712005615234375, 0.9410400390625, 1.170074462890625, 1.39910888671875, 1.628143310546875, 1.857177734375, 2.086212158203125, 2.31524658203125, 2.544281005859375, 2.7733154296875, 3.002349853515625, 3.23138427734375, 3.460418701171875, 3.689453125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 10.0, 17.0, 33.0, 49.0, 68.0, 104.0, 136.0, 152.0, 129.0, 108.0, 76.0, 47.0, 36.0, 21.0, 10.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.6806640625, -1.6473770141601562, -1.6140899658203125, -1.5808029174804688, -1.547515869140625, -1.5142288208007812, -1.4809417724609375, -1.4476547241210938, -1.41436767578125, -1.3810806274414062, -1.3477935791015625, -1.3145065307617188, -1.281219482421875, -1.2479324340820312, -1.2146453857421875, -1.1813583374023438, -1.1480712890625, -1.1147842407226562, -1.0814971923828125, -1.0482101440429688, -1.014923095703125, -0.9816360473632812, -0.9483489990234375, -0.9150619506835938, -0.88177490234375, -0.8484878540039062, -0.8152008056640625, -0.7819137573242188, -0.748626708984375, -0.7153396606445312, -0.6820526123046875, -0.6487655639648438, -0.615478515625, -0.5821914672851562, -0.5489044189453125, -0.5156173706054688, -0.482330322265625, -0.44904327392578125, -0.4157562255859375, -0.38246917724609375, -0.34918212890625, -0.31589508056640625, -0.2826080322265625, -0.24932098388671875, -0.216033935546875, -0.18274688720703125, -0.1494598388671875, -0.11617279052734375, -0.0828857421875, -0.04959869384765625, -0.0163116455078125, 0.01697540283203125, 0.050262451171875, 0.08354949951171875, 0.1168365478515625, 0.15012359619140625, 0.18341064453125, 0.21669769287109375, 0.2499847412109375, 0.28327178955078125, 0.316558837890625, 0.34984588623046875, 0.3831329345703125, 0.41641998291015625, 0.44970703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 18.0, 23.0, 54.0, 136.0, 289.0, 736.0, 7975.0, 4182008.0, 2322.0, 455.0, 156.0, 52.0, 30.0, 11.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.65625, -60.381103515625, -59.10595703125, -57.830810546875, -56.5556640625, -55.280517578125, -54.00537109375, -52.730224609375, -51.455078125, -50.179931640625, -48.90478515625, -47.629638671875, -46.3544921875, -45.079345703125, -43.80419921875, -42.529052734375, -41.25390625, -39.978759765625, -38.70361328125, -37.428466796875, -36.1533203125, -34.878173828125, -33.60302734375, -32.327880859375, -31.052734375, -29.777587890625, -28.50244140625, -27.227294921875, -25.9521484375, -24.677001953125, -23.40185546875, -22.126708984375, -20.8515625, -19.576416015625, -18.30126953125, -17.026123046875, -15.7509765625, -14.475830078125, -13.20068359375, -11.925537109375, -10.650390625, -9.375244140625, -8.10009765625, -6.824951171875, -5.5498046875, -4.274658203125, -2.99951171875, -1.724365234375, -0.44921875, 0.825927734375, 2.10107421875, 3.376220703125, 4.6513671875, 5.926513671875, 7.20166015625, 8.476806640625, 9.751953125, 11.027099609375, 12.30224609375, 13.577392578125, 14.8525390625, 16.127685546875, 17.40283203125, 18.677978515625, 19.953125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 9.0, 16.0, 48.0, 115.0, 3134.0, 639.0, 68.0, 24.0, 13.0, 7.0, 3.0, 1.0, 1.0, 3.0], "bins": [-6.40625, -6.2894439697265625, -6.172637939453125, -6.0558319091796875, -5.93902587890625, -5.8222198486328125, -5.705413818359375, -5.5886077880859375, -5.4718017578125, -5.3549957275390625, -5.238189697265625, -5.1213836669921875, -5.00457763671875, -4.8877716064453125, -4.770965576171875, -4.6541595458984375, -4.537353515625, -4.4205474853515625, -4.303741455078125, -4.1869354248046875, -4.07012939453125, -3.9533233642578125, -3.836517333984375, -3.7197113037109375, -3.6029052734375, -3.4860992431640625, -3.369293212890625, -3.2524871826171875, -3.13568115234375, -3.0188751220703125, -2.902069091796875, -2.7852630615234375, -2.66845703125, -2.5516510009765625, -2.434844970703125, -2.3180389404296875, -2.20123291015625, -2.0844268798828125, -1.967620849609375, -1.8508148193359375, -1.7340087890625, -1.6172027587890625, -1.500396728515625, -1.3835906982421875, -1.26678466796875, -1.1499786376953125, -1.033172607421875, -0.9163665771484375, -0.799560546875, -0.6827545166015625, -0.565948486328125, -0.4491424560546875, -0.33233642578125, -0.2155303955078125, -0.098724365234375, 0.0180816650390625, 0.1348876953125, 0.2516937255859375, 0.368499755859375, 0.4853057861328125, 0.60211181640625, 0.7189178466796875, 0.835723876953125, 0.9525299072265625, 1.0693359375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 9.0, 43.0, 831.0, 119.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.366512298583984, -55.1344108581543, -52.90230941772461, -50.67020797729492, -48.4381103515625, -46.20600891113281, -43.973907470703125, -41.74180603027344, -39.50970458984375, -37.27760314941406, -35.045501708984375, -32.81340026855469, -30.581300735473633, -28.349199295043945, -26.11709976196289, -23.884998321533203, -21.652896881103516, -19.420795440673828, -17.18869400024414, -14.956594467163086, -12.724493026733398, -10.492391586303711, -8.26029109954834, -6.028190612792969, -3.7960891723632812, -1.563988208770752, 0.6681127548217773, 2.9002137184143066, 5.132314682006836, 7.364416122436523, 9.596516609191895, 11.828617095947266, 14.060714721679688, 16.292816162109375, 18.524917602539062, 20.757017135620117, 22.989118576049805, 25.221220016479492, 27.453319549560547, 29.685420989990234, 31.917522430419922, 34.14962387084961, 36.3817253112793, 38.613826751708984, 40.845924377441406, 43.078025817871094, 45.31012725830078, 47.54222869873047, 49.774330139160156, 52.006431579589844, 54.23853302001953, 56.47063446044922, 58.702735900878906, 60.934837341308594, 63.166934967041016, 65.39903259277344, 67.63113403320312, 69.86323547363281, 72.0953369140625, 74.32743835449219, 76.55953979492188, 78.79164123535156, 81.02374267578125, 83.25584411621094, 85.48794555664062]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 8.0, 5.0, 15.0, 27.0, 35.0, 45.0, 68.0, 89.0, 103.0, 100.0, 96.0, 90.0, 81.0, 82.0, 48.0, 42.0, 26.0, 9.0, 17.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.444375991821289, -12.057659149169922, -11.670942306518555, -11.284225463867188, -10.89750862121582, -10.510791778564453, -10.124074935913086, -9.737358093261719, -9.350641250610352, -8.963924407958984, -8.577207565307617, -8.19049072265625, -7.803773880004883, -7.417057037353516, -7.030340671539307, -6.6436238288879395, -6.2569074630737305, -5.870190620422363, -5.483473777770996, -5.096756935119629, -4.710040092468262, -4.3233232498168945, -3.9366068840026855, -3.5498900413513184, -3.163173198699951, -2.776456356048584, -2.389739513397217, -2.0030229091644287, -1.6163060665130615, -1.2295892238616943, -0.8428726196289062, -0.45615577697753906, -0.06943893432617188, 0.31727784872055054, 0.703994631767273, 1.0907113552093506, 1.4774281978607178, 1.864145040512085, 2.250861644744873, 2.6375784873962402, 3.0242953300476074, 3.4110121726989746, 3.797729015350342, 4.184445381164551, 4.571162223815918, 4.957879066467285, 5.344595909118652, 5.7313127517700195, 6.118029594421387, 6.504746437072754, 6.891463279724121, 7.278180122375488, 7.6648969650268555, 8.051613807678223, 8.438329696655273, 8.82504653930664, 9.211763381958008, 9.598480224609375, 9.985197067260742, 10.37191390991211, 10.758630752563477, 11.145347595214844, 11.532064437866211, 11.918781280517578, 12.305498123168945]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 9.0, 24.0, 20.0, 32.0, 25.0, 52.0, 59.0, 118.0, 137.0, 189.0, 289.0, 463.0, 764.0, 1494.0, 3689.0, 11513.0, 51667.0, 372884.0, 512611.0, 69535.0, 14568.0, 4245.0, 1746.0, 831.0, 500.0, 300.0, 209.0, 151.0, 125.0, 68.0, 45.0, 44.0, 30.0, 16.0, 24.0, 19.0, 8.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.91015625, -4.7469482421875, -4.583740234375, -4.4205322265625, -4.25732421875, -4.0941162109375, -3.930908203125, -3.7677001953125, -3.6044921875, -3.4412841796875, -3.278076171875, -3.1148681640625, -2.95166015625, -2.7884521484375, -2.625244140625, -2.4620361328125, -2.298828125, -2.1356201171875, -1.972412109375, -1.8092041015625, -1.64599609375, -1.4827880859375, -1.319580078125, -1.1563720703125, -0.9931640625, -0.8299560546875, -0.666748046875, -0.5035400390625, -0.34033203125, -0.1771240234375, -0.013916015625, 0.1492919921875, 0.3125, 0.4757080078125, 0.638916015625, 0.8021240234375, 0.96533203125, 1.1285400390625, 1.291748046875, 1.4549560546875, 1.6181640625, 1.7813720703125, 1.944580078125, 2.1077880859375, 2.27099609375, 2.4342041015625, 2.597412109375, 2.7606201171875, 2.923828125, 3.0870361328125, 3.250244140625, 3.4134521484375, 3.57666015625, 3.7398681640625, 3.903076171875, 4.0662841796875, 4.2294921875, 4.3927001953125, 4.555908203125, 4.7191162109375, 4.88232421875, 5.0455322265625, 5.208740234375, 5.3719482421875, 5.53515625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 8.0, 17.0, 37.0, 45.0, 58.0, 80.0, 108.0, 112.0, 104.0, 125.0, 99.0, 78.0, 50.0, 29.0, 20.0, 9.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7666015625, -1.7255706787109375, -1.684539794921875, -1.6435089111328125, -1.60247802734375, -1.5614471435546875, -1.520416259765625, -1.4793853759765625, -1.4383544921875, -1.3973236083984375, -1.356292724609375, -1.3152618408203125, -1.27423095703125, -1.2332000732421875, -1.192169189453125, -1.1511383056640625, -1.110107421875, -1.0690765380859375, -1.028045654296875, -0.9870147705078125, -0.94598388671875, -0.9049530029296875, -0.863922119140625, -0.8228912353515625, -0.7818603515625, -0.7408294677734375, -0.699798583984375, -0.6587677001953125, -0.61773681640625, -0.5767059326171875, -0.535675048828125, -0.4946441650390625, -0.45361328125, -0.4125823974609375, -0.371551513671875, -0.3305206298828125, -0.28948974609375, -0.2484588623046875, -0.207427978515625, -0.1663970947265625, -0.1253662109375, -0.0843353271484375, -0.043304443359375, -0.0022735595703125, 0.03875732421875, 0.0797882080078125, 0.120819091796875, 0.1618499755859375, 0.202880859375, 0.2439117431640625, 0.284942626953125, 0.3259735107421875, 0.36700439453125, 0.4080352783203125, 0.449066162109375, 0.4900970458984375, 0.5311279296875, 0.5721588134765625, 0.613189697265625, 0.6542205810546875, 0.69525146484375, 0.7362823486328125, 0.777313232421875, 0.8183441162109375, 0.859375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 9.0, 9.0, 7.0, 16.0, 13.0, 26.0, 30.0, 43.0, 60.0, 92.0, 183.0, 480.0, 1204.0, 5408.0, 49424.0, 817942.0, 159028.0, 11296.0, 2010.0, 601.0, 249.0, 151.0, 78.0, 48.0, 22.0, 27.0, 23.0, 15.0, 6.0, 7.0, 7.0, 7.0, 2.0, 5.0, 6.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.62890625, -6.41290283203125, -6.1968994140625, -5.98089599609375, -5.764892578125, -5.54888916015625, -5.3328857421875, -5.11688232421875, -4.90087890625, -4.68487548828125, -4.4688720703125, -4.25286865234375, -4.036865234375, -3.82086181640625, -3.6048583984375, -3.38885498046875, -3.1728515625, -2.95684814453125, -2.7408447265625, -2.52484130859375, -2.308837890625, -2.09283447265625, -1.8768310546875, -1.66082763671875, -1.44482421875, -1.22882080078125, -1.0128173828125, -0.79681396484375, -0.580810546875, -0.36480712890625, -0.1488037109375, 0.06719970703125, 0.283203125, 0.49920654296875, 0.7152099609375, 0.93121337890625, 1.147216796875, 1.36322021484375, 1.5792236328125, 1.79522705078125, 2.01123046875, 2.22723388671875, 2.4432373046875, 2.65924072265625, 2.875244140625, 3.09124755859375, 3.3072509765625, 3.52325439453125, 3.7392578125, 3.95526123046875, 4.1712646484375, 4.38726806640625, 4.603271484375, 4.81927490234375, 5.0352783203125, 5.25128173828125, 5.46728515625, 5.68328857421875, 5.8992919921875, 6.11529541015625, 6.331298828125, 6.54730224609375, 6.7633056640625, 6.97930908203125, 7.1953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 6.0, 8.0, 12.0, 12.0, 11.0, 14.0, 17.0, 16.0, 31.0, 31.0, 32.0, 35.0, 36.0, 49.0, 54.0, 52.0, 49.0, 53.0, 58.0, 56.0, 56.0, 34.0, 44.0, 41.0, 36.0, 42.0, 21.0, 19.0, 18.0, 11.0, 10.0, 7.0, 6.0, 9.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.005859375, -2.917999267578125, -2.83013916015625, -2.742279052734375, -2.6544189453125, -2.566558837890625, -2.47869873046875, -2.390838623046875, -2.302978515625, -2.215118408203125, -2.12725830078125, -2.039398193359375, -1.9515380859375, -1.863677978515625, -1.77581787109375, -1.687957763671875, -1.60009765625, -1.512237548828125, -1.42437744140625, -1.336517333984375, -1.2486572265625, -1.160797119140625, -1.07293701171875, -0.985076904296875, -0.897216796875, -0.809356689453125, -0.72149658203125, -0.633636474609375, -0.5457763671875, -0.457916259765625, -0.37005615234375, -0.282196044921875, -0.1943359375, -0.106475830078125, -0.01861572265625, 0.069244384765625, 0.1571044921875, 0.244964599609375, 0.33282470703125, 0.420684814453125, 0.508544921875, 0.596405029296875, 0.68426513671875, 0.772125244140625, 0.8599853515625, 0.947845458984375, 1.03570556640625, 1.123565673828125, 1.21142578125, 1.299285888671875, 1.38714599609375, 1.475006103515625, 1.5628662109375, 1.650726318359375, 1.73858642578125, 1.826446533203125, 1.914306640625, 2.002166748046875, 2.09002685546875, 2.177886962890625, 2.2657470703125, 2.353607177734375, 2.44146728515625, 2.529327392578125, 2.6171875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 6.0, 6.0, 6.0, 10.0, 10.0, 16.0, 22.0, 28.0, 49.0, 67.0, 129.0, 216.0, 466.0, 940.0, 2610.0, 8523.0, 44132.0, 644644.0, 310930.0, 26252.0, 6046.0, 1879.0, 711.0, 346.0, 184.0, 110.0, 71.0, 48.0, 26.0, 17.0, 22.0, 13.0, 8.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6328125, -1.56439208984375, -1.4959716796875, -1.42755126953125, -1.359130859375, -1.29071044921875, -1.2222900390625, -1.15386962890625, -1.08544921875, -1.01702880859375, -0.9486083984375, -0.88018798828125, -0.811767578125, -0.74334716796875, -0.6749267578125, -0.60650634765625, -0.5380859375, -0.46966552734375, -0.4012451171875, -0.33282470703125, -0.264404296875, -0.19598388671875, -0.1275634765625, -0.05914306640625, 0.00927734375, 0.07769775390625, 0.1461181640625, 0.21453857421875, 0.282958984375, 0.35137939453125, 0.4197998046875, 0.48822021484375, 0.556640625, 0.62506103515625, 0.6934814453125, 0.76190185546875, 0.830322265625, 0.89874267578125, 0.9671630859375, 1.03558349609375, 1.10400390625, 1.17242431640625, 1.2408447265625, 1.30926513671875, 1.377685546875, 1.44610595703125, 1.5145263671875, 1.58294677734375, 1.6513671875, 1.71978759765625, 1.7882080078125, 1.85662841796875, 1.925048828125, 1.99346923828125, 2.0618896484375, 2.13031005859375, 2.19873046875, 2.26715087890625, 2.3355712890625, 2.40399169921875, 2.472412109375, 2.54083251953125, 2.6092529296875, 2.67767333984375, 2.74609375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 6.0, 16.0, 18.0, 14.0, 25.0, 33.0, 45.0, 76.0, 118.0, 140.0, 128.0, 92.0, 82.0, 43.0, 39.0, 25.0, 24.0, 14.0, 11.0, 5.0, 12.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020051002502441406, -0.00019279494881629944, -0.00018507987260818481, -0.0001773647964000702, -0.00016964972019195557, -0.00016193464398384094, -0.00015421956777572632, -0.0001465044915676117, -0.00013878941535949707, -0.00013107433915138245, -0.00012335926294326782, -0.0001156441867351532, -0.00010792911052703857, -0.00010021403431892395, -9.249895811080933e-05, -8.47838819026947e-05, -7.706880569458008e-05, -6.935372948646545e-05, -6.163865327835083e-05, -5.3923577070236206e-05, -4.620850086212158e-05, -3.849342465400696e-05, -3.0778348445892334e-05, -2.306327223777771e-05, -1.5348196029663086e-05, -7.633119821548462e-06, 8.195638656616211e-08, 7.797032594680786e-06, 1.551210880279541e-05, 2.3227185010910034e-05, 3.094226121902466e-05, 3.865733742713928e-05, 4.6372413635253906e-05, 5.408748984336853e-05, 6.180256605148315e-05, 6.951764225959778e-05, 7.72327184677124e-05, 8.494779467582703e-05, 9.266287088394165e-05, 0.00010037794709205627, 0.0001080930233001709, 0.00011580809950828552, 0.00012352317571640015, 0.00013123825192451477, 0.0001389533281326294, 0.00014666840434074402, 0.00015438348054885864, 0.00016209855675697327, 0.0001698136329650879, 0.00017752870917320251, 0.00018524378538131714, 0.00019295886158943176, 0.0002006739377975464, 0.000208389014005661, 0.00021610409021377563, 0.00022381916642189026, 0.00023153424263000488, 0.0002392493188381195, 0.00024696439504623413, 0.00025467947125434875, 0.0002623945474624634, 0.000270109623670578, 0.0002778246998786926, 0.00028553977608680725, 0.0002932548522949219]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 7.0, 6.0, 7.0, 6.0, 16.0, 22.0, 48.0, 56.0, 112.0, 280.0, 711.0, 2600.0, 13213.0, 205118.0, 789083.0, 30744.0, 4694.0, 1125.0, 358.0, 142.0, 82.0, 37.0, 32.0, 18.0, 15.0, 3.0, 6.0, 1.0, 2.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.203125, -3.1036376953125, -3.004150390625, -2.9046630859375, -2.80517578125, -2.7056884765625, -2.606201171875, -2.5067138671875, -2.4072265625, -2.3077392578125, -2.208251953125, -2.1087646484375, -2.00927734375, -1.9097900390625, -1.810302734375, -1.7108154296875, -1.611328125, -1.5118408203125, -1.412353515625, -1.3128662109375, -1.21337890625, -1.1138916015625, -1.014404296875, -0.9149169921875, -0.8154296875, -0.7159423828125, -0.616455078125, -0.5169677734375, -0.41748046875, -0.3179931640625, -0.218505859375, -0.1190185546875, -0.01953125, 0.0799560546875, 0.179443359375, 0.2789306640625, 0.37841796875, 0.4779052734375, 0.577392578125, 0.6768798828125, 0.7763671875, 0.8758544921875, 0.975341796875, 1.0748291015625, 1.17431640625, 1.2738037109375, 1.373291015625, 1.4727783203125, 1.572265625, 1.6717529296875, 1.771240234375, 1.8707275390625, 1.97021484375, 2.0697021484375, 2.169189453125, 2.2686767578125, 2.3681640625, 2.4676513671875, 2.567138671875, 2.6666259765625, 2.76611328125, 2.8656005859375, 2.965087890625, 3.0645751953125, 3.1640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 2.0, 9.0, 4.0, 7.0, 17.0, 23.0, 37.0, 23.0, 37.0, 52.0, 65.0, 102.0, 112.0, 115.0, 88.0, 59.0, 57.0, 46.0, 28.0, 28.0, 27.0, 11.0, 11.0, 7.0, 5.0, 2.0, 7.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0849609375, -1.052215576171875, -1.01947021484375, -0.986724853515625, -0.9539794921875, -0.921234130859375, -0.88848876953125, -0.855743408203125, -0.822998046875, -0.790252685546875, -0.75750732421875, -0.724761962890625, -0.6920166015625, -0.659271240234375, -0.62652587890625, -0.593780517578125, -0.56103515625, -0.528289794921875, -0.49554443359375, -0.462799072265625, -0.4300537109375, -0.397308349609375, -0.36456298828125, -0.331817626953125, -0.299072265625, -0.266326904296875, -0.23358154296875, -0.200836181640625, -0.1680908203125, -0.135345458984375, -0.10260009765625, -0.069854736328125, -0.037109375, -0.004364013671875, 0.02838134765625, 0.061126708984375, 0.0938720703125, 0.126617431640625, 0.15936279296875, 0.192108154296875, 0.224853515625, 0.257598876953125, 0.29034423828125, 0.323089599609375, 0.3558349609375, 0.388580322265625, 0.42132568359375, 0.454071044921875, 0.48681640625, 0.519561767578125, 0.55230712890625, 0.585052490234375, 0.6177978515625, 0.650543212890625, 0.68328857421875, 0.716033935546875, 0.748779296875, 0.781524658203125, 0.81427001953125, 0.847015380859375, 0.8797607421875, 0.912506103515625, 0.94525146484375, 0.977996826171875, 1.0107421875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 84.0, 708.0, 186.0, 20.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.61773681640625, -158.48463439941406, -155.35153198242188, -152.2184295654297, -149.0853271484375, -145.9522247314453, -142.81912231445312, -139.68601989746094, -136.55291748046875, -133.41981506347656, -130.28671264648438, -127.15361022949219, -124.0205078125, -120.88740539550781, -117.75430297851562, -114.62120056152344, -111.48809814453125, -108.35499572753906, -105.22189331054688, -102.08879089355469, -98.9556884765625, -95.82258605957031, -92.68948364257812, -89.55638122558594, -86.42327880859375, -83.29017639160156, -80.15707397460938, -77.02397155761719, -73.890869140625, -70.75776672363281, -67.62466430664062, -64.49156188964844, -61.35846710205078, -58.225364685058594, -55.092262268066406, -51.95915985107422, -48.82605743408203, -45.692955017089844, -42.559852600097656, -39.42675018310547, -36.29364776611328, -33.160545349121094, -30.027442932128906, -26.89434051513672, -23.76123809814453, -20.628135681152344, -17.495033264160156, -14.361930847167969, -11.228828430175781, -8.095726013183594, -4.962623596191406, -1.8295211791992188, 1.3035812377929688, 4.436683654785156, 7.569786071777344, 10.702888488769531, 13.835990905761719, 16.969093322753906, 20.102195739746094, 23.23529815673828, 26.36840057373047, 29.501502990722656, 32.634605407714844, 35.76770782470703, 38.90081024169922]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 6.0, 2.0, 11.0, 7.0, 17.0, 15.0, 17.0, 31.0, 32.0, 27.0, 26.0, 29.0, 25.0, 35.0, 33.0, 49.0, 40.0, 39.0, 57.0, 69.0, 39.0, 44.0, 38.0, 43.0, 34.0, 40.0, 34.0, 28.0, 18.0, 13.0, 15.0, 12.0, 14.0, 12.0, 10.0, 8.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.173456192016602, -13.752357482910156, -13.331258773803711, -12.910160064697266, -12.48906135559082, -12.067962646484375, -11.64686393737793, -11.225765228271484, -10.804666519165039, -10.383567810058594, -9.962469100952148, -9.541370391845703, -9.120271682739258, -8.699172973632812, -8.278074264526367, -7.856975555419922, -7.435877323150635, -7.0147786140441895, -6.593679904937744, -6.172581195831299, -5.7514824867248535, -5.330384254455566, -4.909285545349121, -4.488186836242676, -4.0670881271362305, -3.645989418029785, -3.22489070892334, -2.8037919998168945, -2.382693290710449, -1.961594820022583, -1.5404961109161377, -1.1193974018096924, -0.698298454284668, -0.27719977498054504, 0.14389890432357788, 0.5649975538253784, 0.9860962629318237, 1.4071948528289795, 1.8282935619354248, 2.24939227104187, 2.6704909801483154, 3.0915896892547607, 3.512688398361206, 3.9337868690490723, 4.354885578155518, 4.775984287261963, 5.197082996368408, 5.6181817054748535, 6.039280414581299, 6.460379123687744, 6.8814778327941895, 7.302576541900635, 7.72367525100708, 8.144773483276367, 8.565872192382812, 8.986970901489258, 9.408069610595703, 9.829168319702148, 10.250267028808594, 10.671365737915039, 11.092464447021484, 11.51356315612793, 11.934661865234375, 12.35576057434082, 12.776859283447266]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 2.0, 0.0, 3.0, 3.0, 5.0, 9.0, 10.0, 16.0, 16.0, 18.0, 15.0, 26.0, 37.0, 56.0, 64.0, 102.0, 149.0, 277.0, 530.0, 1347.0, 4232.0, 20239.0, 4063130.0, 90950.0, 8877.0, 2432.0, 912.0, 392.0, 160.0, 91.0, 69.0, 37.0, 20.0, 21.0, 13.0, 5.0, 7.0, 0.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.6953125, -11.385498046875, -11.07568359375, -10.765869140625, -10.4560546875, -10.146240234375, -9.83642578125, -9.526611328125, -9.216796875, -8.906982421875, -8.59716796875, -8.287353515625, -7.9775390625, -7.667724609375, -7.35791015625, -7.048095703125, -6.73828125, -6.428466796875, -6.11865234375, -5.808837890625, -5.4990234375, -5.189208984375, -4.87939453125, -4.569580078125, -4.259765625, -3.949951171875, -3.64013671875, -3.330322265625, -3.0205078125, -2.710693359375, -2.40087890625, -2.091064453125, -1.78125, -1.471435546875, -1.16162109375, -0.851806640625, -0.5419921875, -0.232177734375, 0.07763671875, 0.387451171875, 0.697265625, 1.007080078125, 1.31689453125, 1.626708984375, 1.9365234375, 2.246337890625, 2.55615234375, 2.865966796875, 3.17578125, 3.485595703125, 3.79541015625, 4.105224609375, 4.4150390625, 4.724853515625, 5.03466796875, 5.344482421875, 5.654296875, 5.964111328125, 6.27392578125, 6.583740234375, 6.8935546875, 7.203369140625, 7.51318359375, 7.822998046875, 8.1328125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 9.0, 10.0, 13.0, 28.0, 39.0, 50.0, 69.0, 93.0, 104.0, 118.0, 94.0, 110.0, 88.0, 45.0, 51.0, 33.0, 25.0, 11.0, 6.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7021484375, -1.6603469848632812, -1.6185455322265625, -1.5767440795898438, -1.534942626953125, -1.4931411743164062, -1.4513397216796875, -1.4095382690429688, -1.36773681640625, -1.3259353637695312, -1.2841339111328125, -1.2423324584960938, -1.200531005859375, -1.1587295532226562, -1.1169281005859375, -1.0751266479492188, -1.0333251953125, -0.9915237426757812, -0.9497222900390625, -0.9079208374023438, -0.866119384765625, -0.8243179321289062, -0.7825164794921875, -0.7407150268554688, -0.69891357421875, -0.6571121215820312, -0.6153106689453125, -0.5735092163085938, -0.531707763671875, -0.48990631103515625, -0.4481048583984375, -0.40630340576171875, -0.364501953125, -0.32270050048828125, -0.2808990478515625, -0.23909759521484375, -0.197296142578125, -0.15549468994140625, -0.1136932373046875, -0.07189178466796875, -0.03009033203125, 0.01171112060546875, 0.0535125732421875, 0.09531402587890625, 0.137115478515625, 0.17891693115234375, 0.2207183837890625, 0.26251983642578125, 0.3043212890625, 0.34612274169921875, 0.3879241943359375, 0.42972564697265625, 0.471527099609375, 0.5133285522460938, 0.5551300048828125, 0.5969314575195312, 0.63873291015625, 0.6805343627929688, 0.7223358154296875, 0.7641372680664062, 0.805938720703125, 0.8477401733398438, 0.8895416259765625, 0.9313430786132812, 0.97314453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 13.0, 31.0, 41.0, 125.0, 320.0, 1085.0, 10294.0, 4160232.0, 20150.0, 1400.0, 351.0, 135.0, 50.0, 22.0, 17.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.359375, -21.731201171875, -21.10302734375, -20.474853515625, -19.8466796875, -19.218505859375, -18.59033203125, -17.962158203125, -17.333984375, -16.705810546875, -16.07763671875, -15.449462890625, -14.8212890625, -14.193115234375, -13.56494140625, -12.936767578125, -12.30859375, -11.680419921875, -11.05224609375, -10.424072265625, -9.7958984375, -9.167724609375, -8.53955078125, -7.911376953125, -7.283203125, -6.655029296875, -6.02685546875, -5.398681640625, -4.7705078125, -4.142333984375, -3.51416015625, -2.885986328125, -2.2578125, -1.629638671875, -1.00146484375, -0.373291015625, 0.2548828125, 0.883056640625, 1.51123046875, 2.139404296875, 2.767578125, 3.395751953125, 4.02392578125, 4.652099609375, 5.2802734375, 5.908447265625, 6.53662109375, 7.164794921875, 7.79296875, 8.421142578125, 9.04931640625, 9.677490234375, 10.3056640625, 10.933837890625, 11.56201171875, 12.190185546875, 12.818359375, 13.446533203125, 14.07470703125, 14.702880859375, 15.3310546875, 15.959228515625, 16.58740234375, 17.215576171875, 17.84375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 9.0, 7.0, 21.0, 61.0, 217.0, 3223.0, 382.0, 67.0, 25.0, 24.0, 4.0, 13.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.662109375, -2.585235595703125, -2.50836181640625, -2.431488037109375, -2.3546142578125, -2.277740478515625, -2.20086669921875, -2.123992919921875, -2.047119140625, -1.970245361328125, -1.89337158203125, -1.816497802734375, -1.7396240234375, -1.662750244140625, -1.58587646484375, -1.509002685546875, -1.43212890625, -1.355255126953125, -1.27838134765625, -1.201507568359375, -1.1246337890625, -1.047760009765625, -0.97088623046875, -0.894012451171875, -0.817138671875, -0.740264892578125, -0.66339111328125, -0.586517333984375, -0.5096435546875, -0.432769775390625, -0.35589599609375, -0.279022216796875, -0.2021484375, -0.125274658203125, -0.04840087890625, 0.028472900390625, 0.1053466796875, 0.182220458984375, 0.25909423828125, 0.335968017578125, 0.412841796875, 0.489715576171875, 0.56658935546875, 0.643463134765625, 0.7203369140625, 0.797210693359375, 0.87408447265625, 0.950958251953125, 1.02783203125, 1.104705810546875, 1.18157958984375, 1.258453369140625, 1.3353271484375, 1.412200927734375, 1.48907470703125, 1.565948486328125, 1.642822265625, 1.719696044921875, 1.79656982421875, 1.873443603515625, 1.9503173828125, 2.027191162109375, 2.10406494140625, 2.180938720703125, 2.2578125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 23.0, 91.0, 355.0, 399.0, 100.0, 24.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.43174171447754, -26.849515914916992, -26.267290115356445, -25.6850643157959, -25.10283851623535, -24.520612716674805, -23.938386917114258, -23.356163024902344, -22.773937225341797, -22.19171142578125, -21.609485626220703, -21.027259826660156, -20.44503402709961, -19.862808227539062, -19.280582427978516, -18.69835662841797, -18.116130828857422, -17.533905029296875, -16.951679229736328, -16.36945343017578, -15.787227630615234, -15.205001831054688, -14.622776985168457, -14.04055118560791, -13.458325386047363, -12.876099586486816, -12.29387378692627, -11.711647987365723, -11.129423141479492, -10.547197341918945, -9.964971542358398, -9.382745742797852, -8.800521850585938, -8.21829605102539, -7.636070251464844, -7.053844928741455, -6.471619129180908, -5.889393329620361, -5.307168006896973, -4.724942207336426, -4.142716407775879, -3.560490608215332, -2.9782650470733643, -2.3960394859313965, -1.8138136863708496, -1.2315878868103027, -0.649362325668335, -0.06713676452636719, 0.5150890350341797, 1.097314715385437, 1.6795403957366943, 2.261765956878662, 2.843991756439209, 3.426217555999756, 4.0084428787231445, 4.590668678283691, 5.172894477844238, 5.755120277404785, 6.337346076965332, 6.919571399688721, 7.501797199249268, 8.084022521972656, 8.666248321533203, 9.24847412109375, 9.830699920654297]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 6.0, 12.0, 12.0, 15.0, 17.0, 14.0, 26.0, 31.0, 39.0, 27.0, 47.0, 48.0, 52.0, 55.0, 64.0, 52.0, 61.0, 45.0, 52.0, 50.0, 42.0, 46.0, 41.0, 24.0, 23.0, 26.0, 21.0, 8.0, 13.0, 13.0, 10.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.078470230102539, -3.934617042541504, -3.7907638549804688, -3.6469109058380127, -3.5030577182769775, -3.3592045307159424, -3.2153515815734863, -3.071498394012451, -2.927645206451416, -2.783792018890381, -2.6399388313293457, -2.4960858821868896, -2.3522326946258545, -2.2083795070648193, -2.0645265579223633, -1.9206733703613281, -1.776820182800293, -1.6329669952392578, -1.4891139268875122, -1.3452608585357666, -1.2014076709747314, -1.0575544834136963, -0.9137014150619507, -0.7698483467102051, -0.6259951591491699, -0.48214203119277954, -0.33828890323638916, -0.19443577527999878, -0.0505826473236084, 0.09327048063278198, 0.23712360858917236, 0.38097667694091797, 0.5248293876647949, 0.6686825156211853, 0.8125356435775757, 0.9563887715339661, 1.1002418994903564, 1.2440950870513916, 1.3879481554031372, 1.5318012237548828, 1.675654411315918, 1.8195075988769531, 1.9633606672286987, 2.1072137355804443, 2.2510669231414795, 2.3949201107025146, 2.5387730598449707, 2.682626247406006, 2.826479434967041, 2.970332622528076, 3.1141858100891113, 3.2580387592315674, 3.4018919467926025, 3.5457451343536377, 3.6895980834960938, 3.833451271057129, 3.977304458618164, 4.121157646179199, 4.265010833740234, 4.4088640213012695, 4.552717208862305, 4.696569919586182, 4.840423107147217, 4.984276294708252, 5.128129482269287]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 5.0, 15.0, 14.0, 11.0, 16.0, 24.0, 27.0, 41.0, 77.0, 109.0, 127.0, 191.0, 322.0, 491.0, 820.0, 1573.0, 3966.0, 13597.0, 65018.0, 501687.0, 390036.0, 51880.0, 11293.0, 3642.0, 1470.0, 789.0, 442.0, 301.0, 169.0, 116.0, 87.0, 64.0, 38.0, 28.0, 21.0, 20.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.16796875, -5.9862060546875, -5.804443359375, -5.6226806640625, -5.44091796875, -5.2591552734375, -5.077392578125, -4.8956298828125, -4.7138671875, -4.5321044921875, -4.350341796875, -4.1685791015625, -3.98681640625, -3.8050537109375, -3.623291015625, -3.4415283203125, -3.259765625, -3.0780029296875, -2.896240234375, -2.7144775390625, -2.53271484375, -2.3509521484375, -2.169189453125, -1.9874267578125, -1.8056640625, -1.6239013671875, -1.442138671875, -1.2603759765625, -1.07861328125, -0.8968505859375, -0.715087890625, -0.5333251953125, -0.3515625, -0.1697998046875, 0.011962890625, 0.1937255859375, 0.37548828125, 0.5572509765625, 0.739013671875, 0.9207763671875, 1.1025390625, 1.2843017578125, 1.466064453125, 1.6478271484375, 1.82958984375, 2.0113525390625, 2.193115234375, 2.3748779296875, 2.556640625, 2.7384033203125, 2.920166015625, 3.1019287109375, 3.28369140625, 3.4654541015625, 3.647216796875, 3.8289794921875, 4.0107421875, 4.1925048828125, 4.374267578125, 4.5560302734375, 4.73779296875, 4.9195556640625, 5.101318359375, 5.2830810546875, 5.46484375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 7.0, 16.0, 22.0, 29.0, 56.0, 52.0, 83.0, 87.0, 95.0, 120.0, 102.0, 91.0, 74.0, 55.0, 35.0, 25.0, 24.0, 8.0, 8.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.73046875, -1.6874847412109375, -1.644500732421875, -1.6015167236328125, -1.55853271484375, -1.5155487060546875, -1.472564697265625, -1.4295806884765625, -1.3865966796875, -1.3436126708984375, -1.300628662109375, -1.2576446533203125, -1.21466064453125, -1.1716766357421875, -1.128692626953125, -1.0857086181640625, -1.042724609375, -0.9997406005859375, -0.956756591796875, -0.9137725830078125, -0.87078857421875, -0.8278045654296875, -0.784820556640625, -0.7418365478515625, -0.6988525390625, -0.6558685302734375, -0.612884521484375, -0.5699005126953125, -0.52691650390625, -0.4839324951171875, -0.440948486328125, -0.3979644775390625, -0.35498046875, -0.3119964599609375, -0.269012451171875, -0.2260284423828125, -0.18304443359375, -0.1400604248046875, -0.097076416015625, -0.0540924072265625, -0.0111083984375, 0.0318756103515625, 0.074859619140625, 0.1178436279296875, 0.16082763671875, 0.2038116455078125, 0.246795654296875, 0.2897796630859375, 0.332763671875, 0.3757476806640625, 0.418731689453125, 0.4617156982421875, 0.50469970703125, 0.5476837158203125, 0.590667724609375, 0.6336517333984375, 0.6766357421875, 0.7196197509765625, 0.762603759765625, 0.8055877685546875, 0.84857177734375, 0.8915557861328125, 0.934539794921875, 0.9775238037109375, 1.0205078125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 7.0, 8.0, 9.0, 17.0, 17.0, 27.0, 39.0, 67.0, 124.0, 262.0, 729.0, 2921.0, 26365.0, 807156.0, 198969.0, 9320.0, 1579.0, 464.0, 183.0, 91.0, 61.0, 36.0, 22.0, 16.0, 14.0, 11.0, 5.0, 5.0, 4.0, 7.0, 0.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.1328125, -11.811767578125, -11.49072265625, -11.169677734375, -10.8486328125, -10.527587890625, -10.20654296875, -9.885498046875, -9.564453125, -9.243408203125, -8.92236328125, -8.601318359375, -8.2802734375, -7.959228515625, -7.63818359375, -7.317138671875, -6.99609375, -6.675048828125, -6.35400390625, -6.032958984375, -5.7119140625, -5.390869140625, -5.06982421875, -4.748779296875, -4.427734375, -4.106689453125, -3.78564453125, -3.464599609375, -3.1435546875, -2.822509765625, -2.50146484375, -2.180419921875, -1.859375, -1.538330078125, -1.21728515625, -0.896240234375, -0.5751953125, -0.254150390625, 0.06689453125, 0.387939453125, 0.708984375, 1.030029296875, 1.35107421875, 1.672119140625, 1.9931640625, 2.314208984375, 2.63525390625, 2.956298828125, 3.27734375, 3.598388671875, 3.91943359375, 4.240478515625, 4.5615234375, 4.882568359375, 5.20361328125, 5.524658203125, 5.845703125, 6.166748046875, 6.48779296875, 6.808837890625, 7.1298828125, 7.450927734375, 7.77197265625, 8.093017578125, 8.4140625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 5.0, 8.0, 4.0, 5.0, 15.0, 15.0, 13.0, 13.0, 19.0, 36.0, 31.0, 42.0, 48.0, 65.0, 55.0, 71.0, 70.0, 78.0, 58.0, 66.0, 48.0, 52.0, 34.0, 32.0, 32.0, 23.0, 14.0, 12.0, 7.0, 7.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.2109375, -5.075836181640625, -4.94073486328125, -4.805633544921875, -4.6705322265625, -4.535430908203125, -4.40032958984375, -4.265228271484375, -4.130126953125, -3.995025634765625, -3.85992431640625, -3.724822998046875, -3.5897216796875, -3.454620361328125, -3.31951904296875, -3.184417724609375, -3.04931640625, -2.914215087890625, -2.77911376953125, -2.644012451171875, -2.5089111328125, -2.373809814453125, -2.23870849609375, -2.103607177734375, -1.968505859375, -1.833404541015625, -1.69830322265625, -1.563201904296875, -1.4281005859375, -1.292999267578125, -1.15789794921875, -1.022796630859375, -0.8876953125, -0.752593994140625, -0.61749267578125, -0.482391357421875, -0.3472900390625, -0.212188720703125, -0.07708740234375, 0.058013916015625, 0.193115234375, 0.328216552734375, 0.46331787109375, 0.598419189453125, 0.7335205078125, 0.868621826171875, 1.00372314453125, 1.138824462890625, 1.27392578125, 1.409027099609375, 1.54412841796875, 1.679229736328125, 1.8143310546875, 1.949432373046875, 2.08453369140625, 2.219635009765625, 2.354736328125, 2.489837646484375, 2.62493896484375, 2.760040283203125, 2.8951416015625, 3.030242919921875, 3.16534423828125, 3.300445556640625, 3.435546875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 6.0, 15.0, 18.0, 26.0, 48.0, 82.0, 139.0, 309.0, 718.0, 1920.0, 6719.0, 38496.0, 801313.0, 177097.0, 15837.0, 3596.0, 1172.0, 513.0, 235.0, 114.0, 60.0, 35.0, 29.0, 14.0, 13.0, 4.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.47265625, -3.35980224609375, -3.2469482421875, -3.13409423828125, -3.021240234375, -2.90838623046875, -2.7955322265625, -2.68267822265625, -2.56982421875, -2.45697021484375, -2.3441162109375, -2.23126220703125, -2.118408203125, -2.00555419921875, -1.8927001953125, -1.77984619140625, -1.6669921875, -1.55413818359375, -1.4412841796875, -1.32843017578125, -1.215576171875, -1.10272216796875, -0.9898681640625, -0.87701416015625, -0.76416015625, -0.65130615234375, -0.5384521484375, -0.42559814453125, -0.312744140625, -0.19989013671875, -0.0870361328125, 0.02581787109375, 0.138671875, 0.25152587890625, 0.3643798828125, 0.47723388671875, 0.590087890625, 0.70294189453125, 0.8157958984375, 0.92864990234375, 1.04150390625, 1.15435791015625, 1.2672119140625, 1.38006591796875, 1.492919921875, 1.60577392578125, 1.7186279296875, 1.83148193359375, 1.9443359375, 2.05718994140625, 2.1700439453125, 2.28289794921875, 2.395751953125, 2.50860595703125, 2.6214599609375, 2.73431396484375, 2.84716796875, 2.96002197265625, 3.0728759765625, 3.18572998046875, 3.298583984375, 3.41143798828125, 3.5242919921875, 3.63714599609375, 3.75]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 0.0, 4.0, 8.0, 8.0, 14.0, 15.0, 17.0, 22.0, 34.0, 69.0, 105.0, 151.0, 172.0, 106.0, 88.0, 52.0, 38.0, 23.0, 11.0, 17.0, 9.0, 10.0, 8.0, 4.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004134178161621094, -0.0004016794264316559, -0.0003899410367012024, -0.0003782026469707489, -0.0003664642572402954, -0.0003547258675098419, -0.00034298747777938843, -0.00033124908804893494, -0.00031951069831848145, -0.00030777230858802795, -0.00029603391885757446, -0.00028429552912712097, -0.0002725571393966675, -0.000260818749666214, -0.0002490803599357605, -0.000237341970205307, -0.00022560358047485352, -0.00021386519074440002, -0.00020212680101394653, -0.00019038841128349304, -0.00017865002155303955, -0.00016691163182258606, -0.00015517324209213257, -0.00014343485236167908, -0.00013169646263122559, -0.0001199580729007721, -0.0001082196831703186, -9.648129343986511e-05, -8.474290370941162e-05, -7.300451397895813e-05, -6.126612424850464e-05, -4.952773451805115e-05, -3.7789344787597656e-05, -2.6050955057144165e-05, -1.4312565326690674e-05, -2.5741755962371826e-06, 9.164214134216309e-06, 2.09026038646698e-05, 3.264099359512329e-05, 4.437938332557678e-05, 5.6117773056030273e-05, 6.785616278648376e-05, 7.959455251693726e-05, 9.133294224739075e-05, 0.00010307133197784424, 0.00011480972170829773, 0.00012654811143875122, 0.0001382865011692047, 0.0001500248908996582, 0.0001617632806301117, 0.00017350167036056519, 0.00018524006009101868, 0.00019697844982147217, 0.00020871683955192566, 0.00022045522928237915, 0.00023219361901283264, 0.00024393200874328613, 0.0002556703984737396, 0.0002674087882041931, 0.0002791471779346466, 0.0002908855676651001, 0.0003026239573955536, 0.0003143623471260071, 0.00032610073685646057, 0.00033783912658691406]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 8.0, 3.0, 10.0, 6.0, 12.0, 24.0, 64.0, 154.0, 474.0, 2766.0, 69980.0, 960258.0, 13118.0, 1125.0, 322.0, 111.0, 52.0, 29.0, 14.0, 8.0, 15.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.74609375, -4.52313232421875, -4.3001708984375, -4.07720947265625, -3.854248046875, -3.63128662109375, -3.4083251953125, -3.18536376953125, -2.96240234375, -2.73944091796875, -2.5164794921875, -2.29351806640625, -2.070556640625, -1.84759521484375, -1.6246337890625, -1.40167236328125, -1.1787109375, -0.95574951171875, -0.7327880859375, -0.50982666015625, -0.286865234375, -0.06390380859375, 0.1590576171875, 0.38201904296875, 0.60498046875, 0.82794189453125, 1.0509033203125, 1.27386474609375, 1.496826171875, 1.71978759765625, 1.9427490234375, 2.16571044921875, 2.388671875, 2.61163330078125, 2.8345947265625, 3.05755615234375, 3.280517578125, 3.50347900390625, 3.7264404296875, 3.94940185546875, 4.17236328125, 4.39532470703125, 4.6182861328125, 4.84124755859375, 5.064208984375, 5.28717041015625, 5.5101318359375, 5.73309326171875, 5.9560546875, 6.17901611328125, 6.4019775390625, 6.62493896484375, 6.847900390625, 7.07086181640625, 7.2938232421875, 7.51678466796875, 7.73974609375, 7.96270751953125, 8.1856689453125, 8.40863037109375, 8.631591796875, 8.85455322265625, 9.0775146484375, 9.30047607421875, 9.5234375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 6.0, 7.0, 6.0, 19.0, 21.0, 39.0, 70.0, 119.0, 214.0, 186.0, 103.0, 75.0, 50.0, 24.0, 19.0, 18.0, 8.0, 6.0, 9.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5478515625, -1.4659576416015625, -1.384063720703125, -1.3021697998046875, -1.22027587890625, -1.1383819580078125, -1.056488037109375, -0.9745941162109375, -0.8927001953125, -0.8108062744140625, -0.728912353515625, -0.6470184326171875, -0.56512451171875, -0.4832305908203125, -0.401336669921875, -0.3194427490234375, -0.237548828125, -0.1556549072265625, -0.073760986328125, 0.0081329345703125, 0.09002685546875, 0.1719207763671875, 0.253814697265625, 0.3357086181640625, 0.4176025390625, 0.4994964599609375, 0.581390380859375, 0.6632843017578125, 0.74517822265625, 0.8270721435546875, 0.908966064453125, 0.9908599853515625, 1.07275390625, 1.1546478271484375, 1.236541748046875, 1.3184356689453125, 1.40032958984375, 1.4822235107421875, 1.564117431640625, 1.6460113525390625, 1.7279052734375, 1.8097991943359375, 1.891693115234375, 1.9735870361328125, 2.05548095703125, 2.1373748779296875, 2.219268798828125, 2.3011627197265625, 2.383056640625, 2.4649505615234375, 2.546844482421875, 2.6287384033203125, 2.71063232421875, 2.7925262451171875, 2.874420166015625, 2.9563140869140625, 3.0382080078125, 3.1201019287109375, 3.201995849609375, 3.2838897705078125, 3.36578369140625, 3.4476776123046875, 3.529571533203125, 3.6114654541015625, 3.693359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 24.0, 144.0, 544.0, 243.0, 36.0, 7.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-154.6659698486328, -151.7776641845703, -148.88937377929688, -146.00106811523438, -143.11276245117188, -140.22447204589844, -137.33616638183594, -134.4478759765625, -131.5595703125, -128.6712646484375, -125.78296661376953, -122.89466857910156, -120.0063705444336, -117.11807250976562, -114.22976684570312, -111.34146881103516, -108.45317077636719, -105.56487274169922, -102.67656707763672, -99.78826904296875, -96.89997100830078, -94.01167297363281, -91.12336730957031, -88.23506927490234, -85.34676361083984, -82.45846557617188, -79.57015991210938, -76.6818618774414, -73.79356384277344, -70.90526580810547, -68.01696014404297, -65.128662109375, -62.240360260009766, -59.35205841064453, -56.46376037597656, -53.57545852661133, -50.68716049194336, -47.798858642578125, -44.910560607910156, -42.02225875854492, -39.13395690917969, -36.24565505981445, -33.357357025146484, -30.46905517578125, -27.58075714111328, -24.692455291748047, -21.804155349731445, -18.915855407714844, -16.027557373046875, -13.139257431030273, -10.250957489013672, -7.362656593322754, -4.474356651306152, -1.5860567092895508, 1.3022441864013672, 4.190544128417969, 7.07884407043457, 9.967144012451172, 12.855443954467773, 15.743744850158691, 18.63204574584961, 21.520343780517578, 24.408645629882812, 27.296945571899414, 30.185245513916016]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 7.0, 7.0, 13.0, 15.0, 27.0, 24.0, 20.0, 18.0, 26.0, 29.0, 35.0, 33.0, 35.0, 60.0, 47.0, 47.0, 40.0, 44.0, 40.0, 48.0, 44.0, 51.0, 42.0, 35.0, 46.0, 25.0, 19.0, 22.0, 19.0, 11.0, 16.0, 8.0, 8.0, 9.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.404150009155273, -18.829570770263672, -18.254993438720703, -17.6804141998291, -17.105836868286133, -16.53125762939453, -15.956679344177246, -15.382101058959961, -14.807522773742676, -14.23294448852539, -13.658366203308105, -13.08378791809082, -12.509208679199219, -11.93463134765625, -11.360052108764648, -10.785473823547363, -10.210895538330078, -9.636317253112793, -9.061738967895508, -8.487160682678223, -7.912581920623779, -7.338003635406494, -6.763424873352051, -6.188846588134766, -5.6142683029174805, -5.039690017700195, -4.46511173248291, -3.890532970428467, -3.3159546852111816, -2.7413763999938965, -2.1667978763580322, -1.592219352722168, -1.01763916015625, -0.4430607557296753, 0.13151764869689941, 0.7060960531234741, 1.2806744575500488, 1.855252742767334, 2.4298312664031982, 3.0044097900390625, 3.5789880752563477, 4.153566360473633, 4.728144645690918, 5.302723407745361, 5.8773016929626465, 6.451879978179932, 7.026458740234375, 7.60103702545166, 8.175615310668945, 8.75019359588623, 9.324771881103516, 9.8993501663208, 10.473928451538086, 11.048507690429688, 11.623085975646973, 12.197664260864258, 12.772242546081543, 13.346820831298828, 13.921399116516113, 14.495977401733398, 15.070556640625, 15.645133972167969, 16.21971321105957, 16.794292449951172, 17.36886978149414]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 9.0, 13.0, 5.0, 19.0, 16.0, 27.0, 33.0, 33.0, 42.0, 66.0, 80.0, 97.0, 132.0, 205.0, 313.0, 571.0, 1080.0, 2786.0, 7463.0, 26759.0, 612747.0, 3491064.0, 35393.0, 9022.0, 3230.0, 1402.0, 686.0, 364.0, 186.0, 143.0, 103.0, 53.0, 41.0, 24.0, 16.0, 13.0, 12.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-9.828125, -9.5828857421875, -9.337646484375, -9.0924072265625, -8.84716796875, -8.6019287109375, -8.356689453125, -8.1114501953125, -7.8662109375, -7.6209716796875, -7.375732421875, -7.1304931640625, -6.88525390625, -6.6400146484375, -6.394775390625, -6.1495361328125, -5.904296875, -5.6590576171875, -5.413818359375, -5.1685791015625, -4.92333984375, -4.6781005859375, -4.432861328125, -4.1876220703125, -3.9423828125, -3.6971435546875, -3.451904296875, -3.2066650390625, -2.96142578125, -2.7161865234375, -2.470947265625, -2.2257080078125, -1.98046875, -1.7352294921875, -1.489990234375, -1.2447509765625, -0.99951171875, -0.7542724609375, -0.509033203125, -0.2637939453125, -0.0185546875, 0.2266845703125, 0.471923828125, 0.7171630859375, 0.96240234375, 1.2076416015625, 1.452880859375, 1.6981201171875, 1.943359375, 2.1885986328125, 2.433837890625, 2.6790771484375, 2.92431640625, 3.1695556640625, 3.414794921875, 3.6600341796875, 3.9052734375, 4.1505126953125, 4.395751953125, 4.6409912109375, 4.88623046875, 5.1314697265625, 5.376708984375, 5.6219482421875, 5.8671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 17.0, 19.0, 28.0, 31.0, 53.0, 67.0, 67.0, 86.0, 87.0, 85.0, 108.0, 76.0, 67.0, 68.0, 41.0, 28.0, 19.0, 19.0, 11.0, 6.0, 6.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.7041015625, -1.6628646850585938, -1.6216278076171875, -1.5803909301757812, -1.539154052734375, -1.4979171752929688, -1.4566802978515625, -1.4154434204101562, -1.37420654296875, -1.3329696655273438, -1.2917327880859375, -1.2504959106445312, -1.209259033203125, -1.1680221557617188, -1.1267852783203125, -1.0855484008789062, -1.0443115234375, -1.0030746459960938, -0.9618377685546875, -0.9206008911132812, -0.879364013671875, -0.8381271362304688, -0.7968902587890625, -0.7556533813476562, -0.71441650390625, -0.6731796264648438, -0.6319427490234375, -0.5907058715820312, -0.549468994140625, -0.5082321166992188, -0.4669952392578125, -0.42575836181640625, -0.384521484375, -0.34328460693359375, -0.3020477294921875, -0.26081085205078125, -0.219573974609375, -0.17833709716796875, -0.1371002197265625, -0.09586334228515625, -0.05462646484375, -0.01338958740234375, 0.0278472900390625, 0.06908416748046875, 0.110321044921875, 0.15155792236328125, 0.1927947998046875, 0.23403167724609375, 0.2752685546875, 0.31650543212890625, 0.3577423095703125, 0.39897918701171875, 0.440216064453125, 0.48145294189453125, 0.5226898193359375, 0.5639266967773438, 0.60516357421875, 0.6464004516601562, 0.6876373291015625, 0.7288742065429688, 0.770111083984375, 0.8113479614257812, 0.8525848388671875, 0.8938217163085938, 0.93505859375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 9.0, 4.0, 4.0, 6.0, 17.0, 54.0, 90.0, 197.0, 415.0, 1350.0, 15464.0, 4154060.0, 20545.0, 1390.0, 362.0, 156.0, 74.0, 36.0, 25.0, 12.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.5, -35.6983642578125, -34.896728515625, -34.0950927734375, -33.29345703125, -32.4918212890625, -31.690185546875, -30.8885498046875, -30.0869140625, -29.2852783203125, -28.483642578125, -27.6820068359375, -26.88037109375, -26.0787353515625, -25.277099609375, -24.4754638671875, -23.673828125, -22.8721923828125, -22.070556640625, -21.2689208984375, -20.46728515625, -19.6656494140625, -18.864013671875, -18.0623779296875, -17.2607421875, -16.4591064453125, -15.657470703125, -14.8558349609375, -14.05419921875, -13.2525634765625, -12.450927734375, -11.6492919921875, -10.84765625, -10.0460205078125, -9.244384765625, -8.4427490234375, -7.64111328125, -6.8394775390625, -6.037841796875, -5.2362060546875, -4.4345703125, -3.6329345703125, -2.831298828125, -2.0296630859375, -1.22802734375, -0.4263916015625, 0.375244140625, 1.1768798828125, 1.978515625, 2.7801513671875, 3.581787109375, 4.3834228515625, 5.18505859375, 5.9866943359375, 6.788330078125, 7.5899658203125, 8.3916015625, 9.1932373046875, 9.994873046875, 10.7965087890625, 11.59814453125, 12.3997802734375, 13.201416015625, 14.0030517578125, 14.8046875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 8.0, 7.0, 9.0, 21.0, 28.0, 40.0, 134.0, 545.0, 2789.0, 249.0, 94.0, 48.0, 28.0, 26.0, 18.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.015625, -4.9074249267578125, -4.799224853515625, -4.6910247802734375, -4.58282470703125, -4.4746246337890625, -4.366424560546875, -4.2582244873046875, -4.1500244140625, -4.0418243408203125, -3.933624267578125, -3.8254241943359375, -3.71722412109375, -3.6090240478515625, -3.500823974609375, -3.3926239013671875, -3.284423828125, -3.1762237548828125, -3.068023681640625, -2.9598236083984375, -2.85162353515625, -2.7434234619140625, -2.635223388671875, -2.5270233154296875, -2.4188232421875, -2.3106231689453125, -2.202423095703125, -2.0942230224609375, -1.98602294921875, -1.8778228759765625, -1.769622802734375, -1.6614227294921875, -1.55322265625, -1.4450225830078125, -1.336822509765625, -1.2286224365234375, -1.12042236328125, -1.0122222900390625, -0.904022216796875, -0.7958221435546875, -0.6876220703125, -0.5794219970703125, -0.471221923828125, -0.3630218505859375, -0.25482177734375, -0.1466217041015625, -0.038421630859375, 0.0697784423828125, 0.177978515625, 0.2861785888671875, 0.394378662109375, 0.5025787353515625, 0.61077880859375, 0.7189788818359375, 0.827178955078125, 0.9353790283203125, 1.0435791015625, 1.1517791748046875, 1.259979248046875, 1.3681793212890625, 1.47637939453125, 1.5845794677734375, 1.692779541015625, 1.8009796142578125, 1.9091796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 9.0, 16.0, 108.0, 611.0, 223.0, 35.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.953716278076172, -21.270702362060547, -19.587688446044922, -17.904674530029297, -16.221660614013672, -14.538646697998047, -12.855632781982422, -11.172618865966797, -9.489604949951172, -7.806591033935547, -6.123577117919922, -4.440563201904297, -2.757549285888672, -1.0745353698730469, 0.6084785461425781, 2.291492462158203, 3.974506378173828, 5.657520294189453, 7.340534210205078, 9.023548126220703, 10.706562042236328, 12.389575958251953, 14.072589874267578, 15.755603790283203, 17.438617706298828, 19.121631622314453, 20.804645538330078, 22.487659454345703, 24.170673370361328, 25.853687286376953, 27.536701202392578, 29.219715118408203, 30.902725219726562, 32.58573913574219, 34.26875305175781, 35.95176696777344, 37.63478088378906, 39.31779479980469, 41.00080871582031, 42.68382263183594, 44.36683654785156, 46.04985046386719, 47.73286437988281, 49.41587829589844, 51.09889221191406, 52.78190612792969, 54.46492004394531, 56.14793395996094, 57.83094787597656, 59.51396179199219, 61.19697570800781, 62.87998962402344, 64.56300354003906, 66.24601745605469, 67.92903137207031, 69.61204528808594, 71.29505920410156, 72.97807312011719, 74.66108703613281, 76.34410095214844, 78.02711486816406, 79.71012878417969, 81.39314270019531, 83.07615661621094, 84.75917053222656]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 13.0, 22.0, 27.0, 41.0, 54.0, 56.0, 73.0, 69.0, 85.0, 74.0, 89.0, 80.0, 64.0, 59.0, 49.0, 37.0, 26.0, 28.0, 16.0, 12.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.73967456817627, -12.371551513671875, -12.003429412841797, -11.635306358337402, -11.267183303833008, -10.89906120300293, -10.530938148498535, -10.16281509399414, -9.794692993164062, -9.426569938659668, -9.05844783782959, -8.690324783325195, -8.322202682495117, -7.954079627990723, -7.585956573486328, -7.217833995819092, -6.8497114181518555, -6.481588840484619, -6.113466262817383, -5.745343208312988, -5.377220630645752, -5.009098052978516, -4.640974998474121, -4.272852420806885, -3.9047298431396484, -3.536607265472412, -3.1684844493865967, -2.8003616333007812, -2.432239055633545, -2.0641164779663086, -1.6959936618804932, -1.3278708457946777, -0.959747314453125, -0.5916246175765991, -0.22350192070007324, 0.14462077617645264, 0.5127434730529785, 0.8808661699295044, 1.2489888668060303, 1.6171116828918457, 1.985234260559082, 2.3533568382263184, 2.721479654312134, 3.089602470397949, 3.4577250480651855, 3.825847625732422, 4.193970680236816, 4.562093257904053, 4.930215835571289, 5.298338413238525, 5.666460990905762, 6.034584045410156, 6.402706623077393, 6.770829200744629, 7.138952255249023, 7.50707483291626, 7.875197410583496, 8.24332046508789, 8.611442565917969, 8.979565620422363, 9.347688674926758, 9.715810775756836, 10.08393383026123, 10.452056884765625, 10.820178985595703]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 4.0, 7.0, 6.0, 10.0, 20.0, 14.0, 31.0, 37.0, 46.0, 67.0, 80.0, 111.0, 159.0, 199.0, 287.0, 443.0, 776.0, 1642.0, 4176.0, 14325.0, 66234.0, 491919.0, 395049.0, 53686.0, 11776.0, 3768.0, 1554.0, 761.0, 379.0, 272.0, 190.0, 126.0, 101.0, 85.0, 51.0, 39.0, 30.0, 26.0, 16.0, 11.0, 13.0, 6.0, 6.0, 4.0, 5.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01953125, -5.8310546875, -5.642578125, -5.4541015625, -5.265625, -5.0771484375, -4.888671875, -4.7001953125, -4.51171875, -4.3232421875, -4.134765625, -3.9462890625, -3.7578125, -3.5693359375, -3.380859375, -3.1923828125, -3.00390625, -2.8154296875, -2.626953125, -2.4384765625, -2.25, -2.0615234375, -1.873046875, -1.6845703125, -1.49609375, -1.3076171875, -1.119140625, -0.9306640625, -0.7421875, -0.5537109375, -0.365234375, -0.1767578125, 0.01171875, 0.2001953125, 0.388671875, 0.5771484375, 0.765625, 0.9541015625, 1.142578125, 1.3310546875, 1.51953125, 1.7080078125, 1.896484375, 2.0849609375, 2.2734375, 2.4619140625, 2.650390625, 2.8388671875, 3.02734375, 3.2158203125, 3.404296875, 3.5927734375, 3.78125, 3.9697265625, 4.158203125, 4.3466796875, 4.53515625, 4.7236328125, 4.912109375, 5.1005859375, 5.2890625, 5.4775390625, 5.666015625, 5.8544921875, 6.04296875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 13.0, 20.0, 33.0, 35.0, 70.0, 91.0, 87.0, 120.0, 117.0, 120.0, 99.0, 70.0, 54.0, 29.0, 14.0, 8.0, 8.0, 8.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.9479827880859375, -1.894012451171875, -1.8400421142578125, -1.78607177734375, -1.7321014404296875, -1.678131103515625, -1.6241607666015625, -1.5701904296875, -1.5162200927734375, -1.462249755859375, -1.4082794189453125, -1.35430908203125, -1.3003387451171875, -1.246368408203125, -1.1923980712890625, -1.138427734375, -1.0844573974609375, -1.030487060546875, -0.9765167236328125, -0.92254638671875, -0.8685760498046875, -0.814605712890625, -0.7606353759765625, -0.7066650390625, -0.6526947021484375, -0.598724365234375, -0.5447540283203125, -0.49078369140625, -0.4368133544921875, -0.382843017578125, -0.3288726806640625, -0.27490234375, -0.2209320068359375, -0.166961669921875, -0.1129913330078125, -0.05902099609375, -0.0050506591796875, 0.048919677734375, 0.1028900146484375, 0.1568603515625, 0.2108306884765625, 0.264801025390625, 0.3187713623046875, 0.37274169921875, 0.4267120361328125, 0.480682373046875, 0.5346527099609375, 0.588623046875, 0.6425933837890625, 0.696563720703125, 0.7505340576171875, 0.80450439453125, 0.8584747314453125, 0.912445068359375, 0.9664154052734375, 1.0203857421875, 1.0743560791015625, 1.128326416015625, 1.1822967529296875, 1.23626708984375, 1.2902374267578125, 1.344207763671875, 1.3981781005859375, 1.4521484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 6.0, 10.0, 5.0, 3.0, 8.0, 12.0, 14.0, 19.0, 16.0, 26.0, 25.0, 48.0, 39.0, 64.0, 120.0, 274.0, 681.0, 2682.0, 13977.0, 132629.0, 741866.0, 137433.0, 14571.0, 2662.0, 695.0, 245.0, 128.0, 74.0, 50.0, 46.0, 23.0, 18.0, 14.0, 15.0, 8.0, 6.0, 6.0, 11.0, 4.0, 4.0, 9.0, 2.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.98828125, -5.7982177734375, -5.608154296875, -5.4180908203125, -5.22802734375, -5.0379638671875, -4.847900390625, -4.6578369140625, -4.4677734375, -4.2777099609375, -4.087646484375, -3.8975830078125, -3.70751953125, -3.5174560546875, -3.327392578125, -3.1373291015625, -2.947265625, -2.7572021484375, -2.567138671875, -2.3770751953125, -2.18701171875, -1.9969482421875, -1.806884765625, -1.6168212890625, -1.4267578125, -1.2366943359375, -1.046630859375, -0.8565673828125, -0.66650390625, -0.4764404296875, -0.286376953125, -0.0963134765625, 0.09375, 0.2838134765625, 0.473876953125, 0.6639404296875, 0.85400390625, 1.0440673828125, 1.234130859375, 1.4241943359375, 1.6142578125, 1.8043212890625, 1.994384765625, 2.1844482421875, 2.37451171875, 2.5645751953125, 2.754638671875, 2.9447021484375, 3.134765625, 3.3248291015625, 3.514892578125, 3.7049560546875, 3.89501953125, 4.0850830078125, 4.275146484375, 4.4652099609375, 4.6552734375, 4.8453369140625, 5.035400390625, 5.2254638671875, 5.41552734375, 5.6055908203125, 5.795654296875, 5.9857177734375, 6.17578125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 6.0, 4.0, 10.0, 7.0, 9.0, 15.0, 19.0, 14.0, 24.0, 24.0, 40.0, 32.0, 43.0, 33.0, 33.0, 45.0, 49.0, 52.0, 34.0, 56.0, 49.0, 33.0, 35.0, 53.0, 41.0, 33.0, 37.0, 33.0, 32.0, 20.0, 17.0, 18.0, 16.0, 8.0, 3.0, 8.0, 6.0, 2.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.279296875, -3.1798095703125, -3.080322265625, -2.9808349609375, -2.88134765625, -2.7818603515625, -2.682373046875, -2.5828857421875, -2.4833984375, -2.3839111328125, -2.284423828125, -2.1849365234375, -2.08544921875, -1.9859619140625, -1.886474609375, -1.7869873046875, -1.6875, -1.5880126953125, -1.488525390625, -1.3890380859375, -1.28955078125, -1.1900634765625, -1.090576171875, -0.9910888671875, -0.8916015625, -0.7921142578125, -0.692626953125, -0.5931396484375, -0.49365234375, -0.3941650390625, -0.294677734375, -0.1951904296875, -0.095703125, 0.0037841796875, 0.103271484375, 0.2027587890625, 0.30224609375, 0.4017333984375, 0.501220703125, 0.6007080078125, 0.7001953125, 0.7996826171875, 0.899169921875, 0.9986572265625, 1.09814453125, 1.1976318359375, 1.297119140625, 1.3966064453125, 1.49609375, 1.5955810546875, 1.695068359375, 1.7945556640625, 1.89404296875, 1.9935302734375, 2.093017578125, 2.1925048828125, 2.2919921875, 2.3914794921875, 2.490966796875, 2.5904541015625, 2.68994140625, 2.7894287109375, 2.888916015625, 2.9884033203125, 3.087890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 9.0, 15.0, 33.0, 38.0, 75.0, 196.0, 528.0, 1962.0, 13032.0, 285253.0, 718794.0, 24453.0, 2965.0, 736.0, 246.0, 91.0, 51.0, 28.0, 12.0, 13.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.400390625, -3.275054931640625, -3.14971923828125, -3.024383544921875, -2.8990478515625, -2.773712158203125, -2.64837646484375, -2.523040771484375, -2.397705078125, -2.272369384765625, -2.14703369140625, -2.021697998046875, -1.8963623046875, -1.771026611328125, -1.64569091796875, -1.520355224609375, -1.39501953125, -1.269683837890625, -1.14434814453125, -1.019012451171875, -0.8936767578125, -0.768341064453125, -0.64300537109375, -0.517669677734375, -0.392333984375, -0.266998291015625, -0.14166259765625, -0.016326904296875, 0.1090087890625, 0.234344482421875, 0.35968017578125, 0.485015869140625, 0.6103515625, 0.735687255859375, 0.86102294921875, 0.986358642578125, 1.1116943359375, 1.237030029296875, 1.36236572265625, 1.487701416015625, 1.613037109375, 1.738372802734375, 1.86370849609375, 1.989044189453125, 2.1143798828125, 2.239715576171875, 2.36505126953125, 2.490386962890625, 2.61572265625, 2.741058349609375, 2.86639404296875, 2.991729736328125, 3.1170654296875, 3.242401123046875, 3.36773681640625, 3.493072509765625, 3.618408203125, 3.743743896484375, 3.86907958984375, 3.994415283203125, 4.1197509765625, 4.245086669921875, 4.37042236328125, 4.495758056640625, 4.62109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 8.0, 2.0, 12.0, 4.0, 11.0, 27.0, 26.0, 44.0, 83.0, 123.0, 156.0, 169.0, 128.0, 74.0, 43.0, 27.0, 28.0, 11.0, 10.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000461578369140625, -0.00044872239232063293, -0.00043586641550064087, -0.0004230104386806488, -0.00041015446186065674, -0.00039729848504066467, -0.0003844425082206726, -0.00037158653140068054, -0.0003587305545806885, -0.0003458745777606964, -0.00033301860094070435, -0.0003201626241207123, -0.0003073066473007202, -0.00029445067048072815, -0.0002815946936607361, -0.000268738716840744, -0.00025588274002075195, -0.0002430267632007599, -0.00023017078638076782, -0.00021731480956077576, -0.0002044588327407837, -0.00019160285592079163, -0.00017874687910079956, -0.0001658909022808075, -0.00015303492546081543, -0.00014017894864082336, -0.0001273229718208313, -0.00011446699500083923, -0.00010161101818084717, -8.87550413608551e-05, -7.589906454086304e-05, -6.304308772087097e-05, -5.0187110900878906e-05, -3.733113408088684e-05, -2.4475157260894775e-05, -1.161918044090271e-05, 1.2367963790893555e-06, 1.4092773199081421e-05, 2.6948750019073486e-05, 3.980472683906555e-05, 5.266070365905762e-05, 6.551668047904968e-05, 7.837265729904175e-05, 9.122863411903381e-05, 0.00010408461093902588, 0.00011694058775901794, 0.00012979656457901, 0.00014265254139900208, 0.00015550851821899414, 0.0001683644950389862, 0.00018122047185897827, 0.00019407644867897034, 0.0002069324254989624, 0.00021978840231895447, 0.00023264437913894653, 0.0002455003559589386, 0.00025835633277893066, 0.00027121230959892273, 0.0002840682864189148, 0.00029692426323890686, 0.0003097802400588989, 0.000322636216878891, 0.00033549219369888306, 0.0003483481705188751, 0.0003612041473388672]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 7.0, 2.0, 12.0, 6.0, 4.0, 12.0, 14.0, 19.0, 38.0, 59.0, 117.0, 238.0, 534.0, 1707.0, 8864.0, 90144.0, 863132.0, 73542.0, 7592.0, 1533.0, 473.0, 204.0, 106.0, 61.0, 32.0, 32.0, 13.0, 16.0, 10.0, 9.0, 6.0, 2.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.484375, -3.377044677734375, -3.26971435546875, -3.162384033203125, -3.0550537109375, -2.947723388671875, -2.84039306640625, -2.733062744140625, -2.625732421875, -2.518402099609375, -2.41107177734375, -2.303741455078125, -2.1964111328125, -2.089080810546875, -1.98175048828125, -1.874420166015625, -1.76708984375, -1.659759521484375, -1.55242919921875, -1.445098876953125, -1.3377685546875, -1.230438232421875, -1.12310791015625, -1.015777587890625, -0.908447265625, -0.801116943359375, -0.69378662109375, -0.586456298828125, -0.4791259765625, -0.371795654296875, -0.26446533203125, -0.157135009765625, -0.0498046875, 0.057525634765625, 0.16485595703125, 0.272186279296875, 0.3795166015625, 0.486846923828125, 0.59417724609375, 0.701507568359375, 0.808837890625, 0.916168212890625, 1.02349853515625, 1.130828857421875, 1.2381591796875, 1.345489501953125, 1.45281982421875, 1.560150146484375, 1.66748046875, 1.774810791015625, 1.88214111328125, 1.989471435546875, 2.0968017578125, 2.204132080078125, 2.31146240234375, 2.418792724609375, 2.526123046875, 2.633453369140625, 2.74078369140625, 2.848114013671875, 2.9554443359375, 3.062774658203125, 3.17010498046875, 3.277435302734375, 3.384765625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 4.0, 7.0, 7.0, 15.0, 17.0, 13.0, 21.0, 24.0, 33.0, 46.0, 50.0, 67.0, 58.0, 94.0, 77.0, 85.0, 81.0, 47.0, 55.0, 33.0, 34.0, 25.0, 20.0, 19.0, 12.0, 8.0, 6.0, 3.0, 7.0, 8.0, 1.0, 4.0, 3.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1748046875, -1.137451171875, -1.10009765625, -1.062744140625, -1.025390625, -0.988037109375, -0.95068359375, -0.913330078125, -0.8759765625, -0.838623046875, -0.80126953125, -0.763916015625, -0.7265625, -0.689208984375, -0.65185546875, -0.614501953125, -0.5771484375, -0.539794921875, -0.50244140625, -0.465087890625, -0.427734375, -0.390380859375, -0.35302734375, -0.315673828125, -0.2783203125, -0.240966796875, -0.20361328125, -0.166259765625, -0.12890625, -0.091552734375, -0.05419921875, -0.016845703125, 0.0205078125, 0.057861328125, 0.09521484375, 0.132568359375, 0.169921875, 0.207275390625, 0.24462890625, 0.281982421875, 0.3193359375, 0.356689453125, 0.39404296875, 0.431396484375, 0.46875, 0.506103515625, 0.54345703125, 0.580810546875, 0.6181640625, 0.655517578125, 0.69287109375, 0.730224609375, 0.767578125, 0.804931640625, 0.84228515625, 0.879638671875, 0.9169921875, 0.954345703125, 0.99169921875, 1.029052734375, 1.06640625, 1.103759765625, 1.14111328125, 1.178466796875, 1.2158203125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 12.0, 44.0, 284.0, 502.0, 136.0, 26.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.98316192626953, -95.41917419433594, -92.85519409179688, -90.29120635986328, -87.72721862792969, -85.16323852539062, -82.59925079345703, -80.03526306152344, -77.47128295898438, -74.90729522705078, -72.34331512451172, -69.77932739257812, -67.21533966064453, -64.65135192871094, -62.087371826171875, -59.52338409423828, -56.95939636230469, -54.39541244506836, -51.831424713134766, -49.26744079589844, -46.703453063964844, -44.139469146728516, -41.57548522949219, -39.011497497558594, -36.447513580322266, -33.88352966308594, -31.319541931152344, -28.755558013916016, -26.191572189331055, -23.627586364746094, -21.063602447509766, -18.499616622924805, -15.935623168945312, -13.371637344360352, -10.807652473449707, -8.243667602539062, -5.679681777954102, -3.1156959533691406, -0.5517110824584961, 2.0122737884521484, 4.576259613037109, 7.140244960784912, 9.704230308532715, 12.26821517944336, 14.83220100402832, 17.39618682861328, 19.96017074584961, 22.52415657043457, 25.08814239501953, 27.652128219604492, 30.216114044189453, 32.78009796142578, 35.344085693359375, 37.9080696105957, 40.47205352783203, 43.036041259765625, 45.60002517700195, 48.16400909423828, 50.727996826171875, 53.2919807434082, 55.85596466064453, 58.419952392578125, 60.98393630981445, 63.54792022705078, 66.11190795898438]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 2.0, 1.0, 2.0, 2.0, 4.0, 13.0, 8.0, 12.0, 6.0, 11.0, 18.0, 16.0, 23.0, 20.0, 19.0, 23.0, 26.0, 34.0, 42.0, 36.0, 43.0, 39.0, 35.0, 36.0, 46.0, 43.0, 53.0, 54.0, 44.0, 33.0, 35.0, 35.0, 24.0, 15.0, 25.0, 26.0, 22.0, 17.0, 8.0, 8.0, 9.0, 7.0, 5.0, 6.0, 7.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.820239067077637, -15.33089828491211, -14.841558456420898, -14.352217674255371, -13.862876892089844, -13.373537063598633, -12.884196281433105, -12.394855499267578, -11.905515670776367, -11.41617488861084, -10.926835060119629, -10.437494277954102, -9.948153495788574, -9.458812713623047, -8.969472885131836, -8.480132102966309, -7.990791320800781, -7.501451015472412, -7.012110233306885, -6.522769927978516, -6.033429145812988, -5.544088840484619, -5.05474853515625, -4.565407752990723, -4.0760674476623535, -3.5867269039154053, -3.097386360168457, -2.608046054840088, -2.1187055110931396, -1.6293649673461914, -1.1400246620178223, -0.650684118270874, -0.1613445281982422, 0.3279959559440613, 0.8173364400863647, 1.3066768646240234, 1.7960174083709717, 2.28535795211792, 2.774698257446289, 3.2640388011932373, 3.7533793449401855, 4.242719650268555, 4.732060432434082, 5.221400737762451, 5.71074104309082, 6.200081825256348, 6.689422130584717, 7.178762435913086, 7.668103218078613, 8.15744400024414, 8.646783828735352, 9.136124610900879, 9.625465393066406, 10.114805221557617, 10.604146003723145, 11.093486785888672, 11.582826614379883, 12.07216739654541, 12.561507225036621, 13.050848007202148, 13.540188789367676, 14.029529571533203, 14.518869400024414, 15.008210182189941, 15.497550964355469]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 8.0, 5.0, 3.0, 8.0, 11.0, 16.0, 10.0, 28.0, 31.0, 29.0, 36.0, 48.0, 85.0, 109.0, 217.0, 430.0, 1075.0, 3246.0, 13315.0, 2864649.0, 1291933.0, 13777.0, 3258.0, 1065.0, 441.0, 186.0, 99.0, 59.0, 35.0, 24.0, 13.0, 7.0, 4.0, 8.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.379150390625, -11.06298828125, -10.746826171875, -10.4306640625, -10.114501953125, -9.79833984375, -9.482177734375, -9.166015625, -8.849853515625, -8.53369140625, -8.217529296875, -7.9013671875, -7.585205078125, -7.26904296875, -6.952880859375, -6.63671875, -6.320556640625, -6.00439453125, -5.688232421875, -5.3720703125, -5.055908203125, -4.73974609375, -4.423583984375, -4.107421875, -3.791259765625, -3.47509765625, -3.158935546875, -2.8427734375, -2.526611328125, -2.21044921875, -1.894287109375, -1.578125, -1.261962890625, -0.94580078125, -0.629638671875, -0.3134765625, 0.002685546875, 0.31884765625, 0.635009765625, 0.951171875, 1.267333984375, 1.58349609375, 1.899658203125, 2.2158203125, 2.531982421875, 2.84814453125, 3.164306640625, 3.48046875, 3.796630859375, 4.11279296875, 4.428955078125, 4.7451171875, 5.061279296875, 5.37744140625, 5.693603515625, 6.009765625, 6.325927734375, 6.64208984375, 6.958251953125, 7.2744140625, 7.590576171875, 7.90673828125, 8.222900390625, 8.5390625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 9.0, 15.0, 25.0, 32.0, 47.0, 59.0, 76.0, 98.0, 93.0, 97.0, 76.0, 107.0, 78.0, 60.0, 40.0, 32.0, 22.0, 10.0, 4.0, 7.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.89453125, -1.8436737060546875, -1.792816162109375, -1.7419586181640625, -1.69110107421875, -1.6402435302734375, -1.589385986328125, -1.5385284423828125, -1.4876708984375, -1.4368133544921875, -1.385955810546875, -1.3350982666015625, -1.28424072265625, -1.2333831787109375, -1.182525634765625, -1.1316680908203125, -1.080810546875, -1.0299530029296875, -0.979095458984375, -0.9282379150390625, -0.87738037109375, -0.8265228271484375, -0.775665283203125, -0.7248077392578125, -0.6739501953125, -0.6230926513671875, -0.572235107421875, -0.5213775634765625, -0.47052001953125, -0.4196624755859375, -0.368804931640625, -0.3179473876953125, -0.26708984375, -0.2162322998046875, -0.165374755859375, -0.1145172119140625, -0.06365966796875, -0.0128021240234375, 0.038055419921875, 0.0889129638671875, 0.1397705078125, 0.1906280517578125, 0.241485595703125, 0.2923431396484375, 0.34320068359375, 0.3940582275390625, 0.444915771484375, 0.4957733154296875, 0.546630859375, 0.5974884033203125, 0.648345947265625, 0.6992034912109375, 0.75006103515625, 0.8009185791015625, 0.851776123046875, 0.9026336669921875, 0.9534912109375, 1.0043487548828125, 1.055206298828125, 1.1060638427734375, 1.15692138671875, 1.2077789306640625, 1.258636474609375, 1.3094940185546875, 1.3603515625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 5.0, 9.0, 12.0, 22.0, 36.0, 96.0, 180.0, 509.0, 2210.0, 20837.0, 4097707.0, 67030.0, 4228.0, 836.0, 297.0, 134.0, 56.0, 32.0, 15.0, 11.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.2392578125, -9.806640625, -9.3740234375, -8.94140625, -8.5087890625, -8.076171875, -7.6435546875, -7.2109375, -6.7783203125, -6.345703125, -5.9130859375, -5.48046875, -5.0478515625, -4.615234375, -4.1826171875, -3.75, -3.3173828125, -2.884765625, -2.4521484375, -2.01953125, -1.5869140625, -1.154296875, -0.7216796875, -0.2890625, 0.1435546875, 0.576171875, 1.0087890625, 1.44140625, 1.8740234375, 2.306640625, 2.7392578125, 3.171875, 3.6044921875, 4.037109375, 4.4697265625, 4.90234375, 5.3349609375, 5.767578125, 6.2001953125, 6.6328125, 7.0654296875, 7.498046875, 7.9306640625, 8.36328125, 8.7958984375, 9.228515625, 9.6611328125, 10.09375, 10.5263671875, 10.958984375, 11.3916015625, 11.82421875, 12.2568359375, 12.689453125, 13.1220703125, 13.5546875, 13.9873046875, 14.419921875, 14.8525390625, 15.28515625, 15.7177734375, 16.150390625, 16.5830078125, 17.015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 7.0, 6.0, 8.0, 17.0, 30.0, 25.0, 40.0, 93.0, 485.0, 2706.0, 365.0, 105.0, 51.0, 35.0, 23.0, 15.0, 12.0, 11.0, 9.0, 3.0, 2.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6904296875, -1.6264190673828125, -1.562408447265625, -1.4983978271484375, -1.43438720703125, -1.3703765869140625, -1.306365966796875, -1.2423553466796875, -1.1783447265625, -1.1143341064453125, -1.050323486328125, -0.9863128662109375, -0.92230224609375, -0.8582916259765625, -0.794281005859375, -0.7302703857421875, -0.666259765625, -0.6022491455078125, -0.538238525390625, -0.4742279052734375, -0.41021728515625, -0.3462066650390625, -0.282196044921875, -0.2181854248046875, -0.1541748046875, -0.0901641845703125, -0.026153564453125, 0.0378570556640625, 0.10186767578125, 0.1658782958984375, 0.229888916015625, 0.2938995361328125, 0.35791015625, 0.4219207763671875, 0.485931396484375, 0.5499420166015625, 0.61395263671875, 0.6779632568359375, 0.741973876953125, 0.8059844970703125, 0.8699951171875, 0.9340057373046875, 0.998016357421875, 1.0620269775390625, 1.12603759765625, 1.1900482177734375, 1.254058837890625, 1.3180694580078125, 1.382080078125, 1.4460906982421875, 1.510101318359375, 1.5741119384765625, 1.63812255859375, 1.7021331787109375, 1.766143798828125, 1.8301544189453125, 1.8941650390625, 1.9581756591796875, 2.022186279296875, 2.0861968994140625, 2.15020751953125, 2.2142181396484375, 2.278228759765625, 2.3422393798828125, 2.40625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 18.0, 57.0, 209.0, 365.0, 212.0, 87.0, 29.0, 11.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.73103141784668, -9.055800437927246, -8.380568504333496, -7.7053375244140625, -7.030106067657471, -6.354874610900879, -5.679643630981445, -5.0044121742248535, -4.329180717468262, -3.65394926071167, -2.9787180423736572, -2.3034868240356445, -1.6282553672790527, -0.9530239105224609, -0.27779293060302734, 0.39743852615356445, 1.0726699829101562, 1.7479013204574585, 2.4231326580047607, 3.0983638763427734, 3.7735953330993652, 4.448826789855957, 5.124057769775391, 5.799289226531982, 6.474520683288574, 7.149752140045166, 7.824983596801758, 8.500214576721191, 9.175445556640625, 9.850677490234375, 10.525908470153809, 11.201139450073242, 11.87636947631836, 12.551600456237793, 13.226832389831543, 13.902063369750977, 14.577295303344727, 15.25252628326416, 15.927757263183594, 16.602989196777344, 17.278221130371094, 17.953453063964844, 18.62868309020996, 19.30391502380371, 19.97914695739746, 20.654376983642578, 21.329608917236328, 22.004840850830078, 22.680070877075195, 23.355302810668945, 24.030532836914062, 24.705764770507812, 25.380996704101562, 26.056228637695312, 26.73145866394043, 27.40669059753418, 28.081920623779297, 28.757152557373047, 29.432382583618164, 30.107614517211914, 30.782846450805664, 31.45807647705078, 32.13330841064453, 32.80854034423828, 33.48377227783203]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 15.0, 17.0, 11.0, 25.0, 25.0, 21.0, 22.0, 21.0, 22.0, 35.0, 32.0, 34.0, 34.0, 39.0, 44.0, 37.0, 44.0, 47.0, 46.0, 42.0, 36.0, 37.0, 30.0, 24.0, 36.0, 28.0, 38.0, 25.0, 18.0, 21.0, 13.0, 13.0, 12.0, 10.0, 6.0, 6.0, 3.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.519067764282227, -5.352389812469482, -5.185711860656738, -5.019033908843994, -4.85235595703125, -4.685677528381348, -4.519000053405762, -4.352321624755859, -4.185643672943115, -4.018965721130371, -3.852287769317627, -3.685609817504883, -3.5189316272735596, -3.3522536754608154, -3.1855757236480713, -3.018897533416748, -2.852219820022583, -2.685541868209839, -2.5188639163970947, -2.3521857261657715, -2.1855077743530273, -2.018829822540283, -1.852151870727539, -1.6854737997055054, -1.5187958478927612, -1.352117896080017, -1.1854398250579834, -1.0187618732452393, -0.8520838618278503, -0.6854058504104614, -0.5187278985977173, -0.3520498275756836, -0.18537187576293945, -0.01869387924671173, 0.147984117269516, 0.3146620988845825, 0.48134011030197144, 0.6480181217193604, 0.8146960735321045, 0.9813741445541382, 1.1480520963668823, 1.3147300481796265, 1.4814081192016602, 1.6480860710144043, 1.8147640228271484, 1.9814420938491821, 2.1481199264526367, 2.31479811668396, 2.481476068496704, 2.6481540203094482, 2.8148319721221924, 2.9815101623535156, 3.1481881141662598, 3.314866065979004, 3.481544017791748, 3.648221969604492, 3.8148999214172363, 3.9815778732299805, 4.148255825042725, 4.314933776855469, 4.481611728668213, 4.648289680480957, 4.814968109130859, 4.9816460609436035, 5.148324012756348]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 16.0, 18.0, 17.0, 23.0, 35.0, 48.0, 84.0, 90.0, 127.0, 212.0, 285.0, 551.0, 1012.0, 2232.0, 5871.0, 19795.0, 88845.0, 498586.0, 348853.0, 58986.0, 14322.0, 4567.0, 1773.0, 833.0, 446.0, 287.0, 163.0, 130.0, 78.0, 76.0, 44.0, 27.0, 29.0, 21.0, 15.0, 9.0, 12.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.61297607421875, -5.4368896484375, -5.26080322265625, -5.084716796875, -4.90863037109375, -4.7325439453125, -4.55645751953125, -4.38037109375, -4.20428466796875, -4.0281982421875, -3.85211181640625, -3.676025390625, -3.49993896484375, -3.3238525390625, -3.14776611328125, -2.9716796875, -2.79559326171875, -2.6195068359375, -2.44342041015625, -2.267333984375, -2.09124755859375, -1.9151611328125, -1.73907470703125, -1.56298828125, -1.38690185546875, -1.2108154296875, -1.03472900390625, -0.858642578125, -0.68255615234375, -0.5064697265625, -0.33038330078125, -0.154296875, 0.02178955078125, 0.1978759765625, 0.37396240234375, 0.550048828125, 0.72613525390625, 0.9022216796875, 1.07830810546875, 1.25439453125, 1.43048095703125, 1.6065673828125, 1.78265380859375, 1.958740234375, 2.13482666015625, 2.3109130859375, 2.48699951171875, 2.6630859375, 2.83917236328125, 3.0152587890625, 3.19134521484375, 3.367431640625, 3.54351806640625, 3.7196044921875, 3.89569091796875, 4.07177734375, 4.24786376953125, 4.4239501953125, 4.60003662109375, 4.776123046875, 4.95220947265625, 5.1282958984375, 5.30438232421875, 5.48046875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 9.0, 9.0, 12.0, 23.0, 37.0, 39.0, 56.0, 74.0, 104.0, 93.0, 91.0, 82.0, 96.0, 86.0, 65.0, 41.0, 31.0, 20.0, 11.0, 9.0, 8.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.91015625, -1.8591156005859375, -1.808074951171875, -1.7570343017578125, -1.70599365234375, -1.6549530029296875, -1.603912353515625, -1.5528717041015625, -1.5018310546875, -1.4507904052734375, -1.399749755859375, -1.3487091064453125, -1.29766845703125, -1.2466278076171875, -1.195587158203125, -1.1445465087890625, -1.093505859375, -1.0424652099609375, -0.991424560546875, -0.9403839111328125, -0.88934326171875, -0.8383026123046875, -0.787261962890625, -0.7362213134765625, -0.6851806640625, -0.6341400146484375, -0.583099365234375, -0.5320587158203125, -0.48101806640625, -0.4299774169921875, -0.378936767578125, -0.3278961181640625, -0.27685546875, -0.2258148193359375, -0.174774169921875, -0.1237335205078125, -0.07269287109375, -0.0216522216796875, 0.029388427734375, 0.0804290771484375, 0.1314697265625, 0.1825103759765625, 0.233551025390625, 0.2845916748046875, 0.33563232421875, 0.3866729736328125, 0.437713623046875, 0.4887542724609375, 0.539794921875, 0.5908355712890625, 0.641876220703125, 0.6929168701171875, 0.74395751953125, 0.7949981689453125, 0.846038818359375, 0.8970794677734375, 0.9481201171875, 0.9991607666015625, 1.050201416015625, 1.1012420654296875, 1.15228271484375, 1.2033233642578125, 1.254364013671875, 1.3054046630859375, 1.3564453125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 9.0, 12.0, 6.0, 10.0, 18.0, 14.0, 21.0, 29.0, 34.0, 61.0, 86.0, 118.0, 229.0, 571.0, 1788.0, 7464.0, 44955.0, 417277.0, 507854.0, 55720.0, 8844.0, 2046.0, 652.0, 272.0, 130.0, 87.0, 56.0, 42.0, 23.0, 19.0, 10.0, 14.0, 21.0, 15.0, 5.0, 7.0, 1.0, 6.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.07421875, -5.88470458984375, -5.6951904296875, -5.50567626953125, -5.316162109375, -5.12664794921875, -4.9371337890625, -4.74761962890625, -4.55810546875, -4.36859130859375, -4.1790771484375, -3.98956298828125, -3.800048828125, -3.61053466796875, -3.4210205078125, -3.23150634765625, -3.0419921875, -2.85247802734375, -2.6629638671875, -2.47344970703125, -2.283935546875, -2.09442138671875, -1.9049072265625, -1.71539306640625, -1.52587890625, -1.33636474609375, -1.1468505859375, -0.95733642578125, -0.767822265625, -0.57830810546875, -0.3887939453125, -0.19927978515625, -0.009765625, 0.17974853515625, 0.3692626953125, 0.55877685546875, 0.748291015625, 0.93780517578125, 1.1273193359375, 1.31683349609375, 1.50634765625, 1.69586181640625, 1.8853759765625, 2.07489013671875, 2.264404296875, 2.45391845703125, 2.6434326171875, 2.83294677734375, 3.0224609375, 3.21197509765625, 3.4014892578125, 3.59100341796875, 3.780517578125, 3.97003173828125, 4.1595458984375, 4.34906005859375, 4.53857421875, 4.72808837890625, 4.9176025390625, 5.10711669921875, 5.296630859375, 5.48614501953125, 5.6756591796875, 5.86517333984375, 6.0546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 8.0, 6.0, 5.0, 10.0, 7.0, 11.0, 18.0, 17.0, 19.0, 21.0, 18.0, 27.0, 25.0, 38.0, 29.0, 33.0, 30.0, 28.0, 31.0, 27.0, 44.0, 40.0, 33.0, 34.0, 52.0, 36.0, 42.0, 37.0, 27.0, 25.0, 28.0, 22.0, 11.0, 15.0, 29.0, 21.0, 12.0, 13.0, 17.0, 8.0, 6.0, 13.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-3.14453125, -3.046051025390625, -2.94757080078125, -2.849090576171875, -2.7506103515625, -2.652130126953125, -2.55364990234375, -2.455169677734375, -2.356689453125, -2.258209228515625, -2.15972900390625, -2.061248779296875, -1.9627685546875, -1.864288330078125, -1.76580810546875, -1.667327880859375, -1.56884765625, -1.470367431640625, -1.37188720703125, -1.273406982421875, -1.1749267578125, -1.076446533203125, -0.97796630859375, -0.879486083984375, -0.781005859375, -0.682525634765625, -0.58404541015625, -0.485565185546875, -0.3870849609375, -0.288604736328125, -0.19012451171875, -0.091644287109375, 0.0068359375, 0.105316162109375, 0.20379638671875, 0.302276611328125, 0.4007568359375, 0.499237060546875, 0.59771728515625, 0.696197509765625, 0.794677734375, 0.893157958984375, 0.99163818359375, 1.090118408203125, 1.1885986328125, 1.287078857421875, 1.38555908203125, 1.484039306640625, 1.58251953125, 1.680999755859375, 1.77947998046875, 1.877960205078125, 1.9764404296875, 2.074920654296875, 2.17340087890625, 2.271881103515625, 2.370361328125, 2.468841552734375, 2.56732177734375, 2.665802001953125, 2.7642822265625, 2.862762451171875, 2.96124267578125, 3.059722900390625, 3.158203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 3.0, 6.0, 6.0, 15.0, 20.0, 27.0, 61.0, 113.0, 270.0, 690.0, 2204.0, 10653.0, 120537.0, 847838.0, 56576.0, 6894.0, 1617.0, 561.0, 202.0, 127.0, 53.0, 22.0, 18.0, 10.0, 8.0, 6.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4609375, -5.332061767578125, -5.20318603515625, -5.074310302734375, -4.9454345703125, -4.816558837890625, -4.68768310546875, -4.558807373046875, -4.429931640625, -4.301055908203125, -4.17218017578125, -4.043304443359375, -3.9144287109375, -3.785552978515625, -3.65667724609375, -3.527801513671875, -3.39892578125, -3.270050048828125, -3.14117431640625, -3.012298583984375, -2.8834228515625, -2.754547119140625, -2.62567138671875, -2.496795654296875, -2.367919921875, -2.239044189453125, -2.11016845703125, -1.981292724609375, -1.8524169921875, -1.723541259765625, -1.59466552734375, -1.465789794921875, -1.3369140625, -1.208038330078125, -1.07916259765625, -0.950286865234375, -0.8214111328125, -0.692535400390625, -0.56365966796875, -0.434783935546875, -0.305908203125, -0.177032470703125, -0.04815673828125, 0.080718994140625, 0.2095947265625, 0.338470458984375, 0.46734619140625, 0.596221923828125, 0.72509765625, 0.853973388671875, 0.98284912109375, 1.111724853515625, 1.2406005859375, 1.369476318359375, 1.49835205078125, 1.627227783203125, 1.756103515625, 1.884979248046875, 2.01385498046875, 2.142730712890625, 2.2716064453125, 2.400482177734375, 2.52935791015625, 2.658233642578125, 2.787109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 9.0, 4.0, 6.0, 14.0, 21.0, 19.0, 37.0, 35.0, 56.0, 67.0, 97.0, 133.0, 128.0, 96.0, 82.0, 52.0, 34.0, 32.0, 13.0, 17.0, 12.0, 9.0, 0.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0004000663757324219, -0.00038975104689598083, -0.0003794357180595398, -0.00036912038922309875, -0.0003588050603866577, -0.0003484897315502167, -0.00033817440271377563, -0.0003278590738773346, -0.00031754374504089355, -0.0003072284162044525, -0.0002969130873680115, -0.00028659775853157043, -0.0002762824296951294, -0.00026596710085868835, -0.0002556517720222473, -0.0002453364431858063, -0.00023502111434936523, -0.0002247057855129242, -0.00021439045667648315, -0.00020407512784004211, -0.00019375979900360107, -0.00018344447016716003, -0.000173129141330719, -0.00016281381249427795, -0.00015249848365783691, -0.00014218315482139587, -0.00013186782598495483, -0.0001215524971485138, -0.00011123716831207275, -0.00010092183947563171, -9.060651063919067e-05, -8.029118180274963e-05, -6.99758529663086e-05, -5.9660524129867554e-05, -4.9345195293426514e-05, -3.9029866456985474e-05, -2.8714537620544434e-05, -1.8399208784103394e-05, -8.083879947662354e-06, 2.2314488887786865e-06, 1.2546777725219727e-05, 2.2862106561660767e-05, 3.317743539810181e-05, 4.349276423454285e-05, 5.380809307098389e-05, 6.412342190742493e-05, 7.443875074386597e-05, 8.475407958030701e-05, 9.506940841674805e-05, 0.00010538473725318909, 0.00011570006608963013, 0.00012601539492607117, 0.0001363307237625122, 0.00014664605259895325, 0.0001569613814353943, 0.00016727671027183533, 0.00017759203910827637, 0.0001879073679447174, 0.00019822269678115845, 0.0002085380256175995, 0.00021885335445404053, 0.00022916868329048157, 0.0002394840121269226, 0.00024979934096336365, 0.0002601146697998047]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 7.0, 4.0, 13.0, 12.0, 29.0, 42.0, 72.0, 140.0, 373.0, 1266.0, 6748.0, 87640.0, 898210.0, 47631.0, 4782.0, 984.0, 302.0, 137.0, 62.0, 32.0, 14.0, 18.0, 10.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.08203125, -5.935150146484375, -5.78826904296875, -5.641387939453125, -5.4945068359375, -5.347625732421875, -5.20074462890625, -5.053863525390625, -4.906982421875, -4.760101318359375, -4.61322021484375, -4.466339111328125, -4.3194580078125, -4.172576904296875, -4.02569580078125, -3.878814697265625, -3.73193359375, -3.585052490234375, -3.43817138671875, -3.291290283203125, -3.1444091796875, -2.997528076171875, -2.85064697265625, -2.703765869140625, -2.556884765625, -2.410003662109375, -2.26312255859375, -2.116241455078125, -1.9693603515625, -1.822479248046875, -1.67559814453125, -1.528717041015625, -1.3818359375, -1.234954833984375, -1.08807373046875, -0.941192626953125, -0.7943115234375, -0.647430419921875, -0.50054931640625, -0.353668212890625, -0.206787109375, -0.059906005859375, 0.08697509765625, 0.233856201171875, 0.3807373046875, 0.527618408203125, 0.67449951171875, 0.821380615234375, 0.96826171875, 1.115142822265625, 1.26202392578125, 1.408905029296875, 1.5557861328125, 1.702667236328125, 1.84954833984375, 1.996429443359375, 2.143310546875, 2.290191650390625, 2.43707275390625, 2.583953857421875, 2.7308349609375, 2.877716064453125, 3.02459716796875, 3.171478271484375, 3.318359375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 4.0, 14.0, 17.0, 28.0, 26.0, 45.0, 64.0, 82.0, 118.0, 118.0, 125.0, 86.0, 78.0, 59.0, 40.0, 31.0, 11.0, 9.0, 13.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.79296875, -2.725860595703125, -2.65875244140625, -2.591644287109375, -2.5245361328125, -2.457427978515625, -2.39031982421875, -2.323211669921875, -2.256103515625, -2.188995361328125, -2.12188720703125, -2.054779052734375, -1.9876708984375, -1.920562744140625, -1.85345458984375, -1.786346435546875, -1.71923828125, -1.652130126953125, -1.58502197265625, -1.517913818359375, -1.4508056640625, -1.383697509765625, -1.31658935546875, -1.249481201171875, -1.182373046875, -1.115264892578125, -1.04815673828125, -0.981048583984375, -0.9139404296875, -0.846832275390625, -0.77972412109375, -0.712615966796875, -0.6455078125, -0.578399658203125, -0.51129150390625, -0.444183349609375, -0.3770751953125, -0.309967041015625, -0.24285888671875, -0.175750732421875, -0.108642578125, -0.041534423828125, 0.02557373046875, 0.092681884765625, 0.1597900390625, 0.226898193359375, 0.29400634765625, 0.361114501953125, 0.42822265625, 0.495330810546875, 0.56243896484375, 0.629547119140625, 0.6966552734375, 0.763763427734375, 0.83087158203125, 0.897979736328125, 0.965087890625, 1.032196044921875, 1.09930419921875, 1.166412353515625, 1.2335205078125, 1.300628662109375, 1.36773681640625, 1.434844970703125, 1.501953125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 44.0, 279.0, 519.0, 137.0, 21.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-172.2296142578125, -168.93008422851562, -165.63055419921875, -162.33102416992188, -159.031494140625, -155.73196411132812, -152.4324493408203, -149.13291931152344, -145.83338928222656, -142.5338592529297, -139.2343292236328, -135.93479919433594, -132.63526916503906, -129.33575439453125, -126.03621673583984, -122.7366943359375, -119.43716430664062, -116.13763427734375, -112.83810424804688, -109.53858184814453, -106.23905181884766, -102.93952178955078, -99.6399917602539, -96.34046936035156, -93.04093170166016, -89.74140167236328, -86.4418716430664, -83.14234924316406, -79.84281921386719, -76.54328918457031, -73.24375915527344, -69.94422912597656, -66.64469909667969, -63.34516906738281, -60.0456428527832, -56.74611282348633, -53.44658660888672, -50.147056579589844, -46.84752655029297, -43.54800033569336, -40.24847412109375, -36.948944091796875, -33.649417877197266, -30.34988784790039, -27.05036163330078, -23.750831604003906, -20.451303482055664, -17.151775360107422, -13.852249145507812, -10.55272102355957, -7.25319242477417, -3.9536638259887695, -0.6541357040405273, 2.6453933715820312, 5.944921493530273, 9.244449615478516, 12.543977737426758, 15.843505859375, 19.143033981323242, 22.442562103271484, 25.74209213256836, 29.0416202545166, 32.341148376464844, 35.64067840576172, 38.94020462036133]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 8.0, 5.0, 8.0, 8.0, 8.0, 9.0, 14.0, 13.0, 18.0, 9.0, 21.0, 25.0, 23.0, 26.0, 37.0, 39.0, 40.0, 38.0, 40.0, 26.0, 46.0, 44.0, 43.0, 42.0, 40.0, 48.0, 37.0, 32.0, 27.0, 33.0, 23.0, 23.0, 24.0, 23.0, 12.0, 16.0, 10.0, 15.0, 8.0, 6.0, 6.0, 2.0, 7.0, 3.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-20.68939971923828, -20.064788818359375, -19.440176010131836, -18.81556510925293, -18.19095230102539, -17.566341400146484, -16.941730499267578, -16.317119598388672, -15.692506790161133, -15.06789493560791, -14.443283081054688, -13.818672180175781, -13.194060325622559, -12.569448471069336, -11.94483757019043, -11.320225715637207, -10.695613861083984, -10.071002006530762, -9.446390151977539, -8.821779251098633, -8.19716739654541, -7.5725555419921875, -6.947944164276123, -6.323332786560059, -5.698720932006836, -5.074109077453613, -4.449497699737549, -3.8248860836029053, -3.2002744674682617, -2.575662851333618, -1.9510512351989746, -1.3264398574829102, -0.7018280029296875, -0.07721638679504395, 0.5473952293395996, 1.1720068454742432, 1.7966184616088867, 2.4212300777435303, 3.045841693878174, 3.6704530715942383, 4.295064926147461, 4.919676780700684, 5.544288158416748, 6.1688995361328125, 6.793511390686035, 7.418123245239258, 8.042734146118164, 8.667346000671387, 9.29195785522461, 9.916569709777832, 10.541181564331055, 11.165792465209961, 11.790404319763184, 12.415016174316406, 13.039627075195312, 13.664238929748535, 14.288850784301758, 14.91346263885498, 15.538074493408203, 16.16268539428711, 16.787296295166016, 17.411909103393555, 18.03652000427246, 18.6611328125, 19.285743713378906]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 7.0, 4.0, 4.0, 6.0, 8.0, 2.0, 13.0, 9.0, 12.0, 15.0, 21.0, 18.0, 26.0, 35.0, 47.0, 78.0, 112.0, 194.0, 302.0, 525.0, 1058.0, 2384.0, 5833.0, 20810.0, 374604.0, 3738514.0, 35774.0, 8179.0, 2997.0, 1260.0, 607.0, 303.0, 197.0, 113.0, 61.0, 46.0, 28.0, 23.0, 21.0, 10.0, 13.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.76171875, -7.552734375, -7.34375, -7.134765625, -6.92578125, -6.716796875, -6.5078125, -6.298828125, -6.08984375, -5.880859375, -5.671875, -5.462890625, -5.25390625, -5.044921875, -4.8359375, -4.626953125, -4.41796875, -4.208984375, -4.0, -3.791015625, -3.58203125, -3.373046875, -3.1640625, -2.955078125, -2.74609375, -2.537109375, -2.328125, -2.119140625, -1.91015625, -1.701171875, -1.4921875, -1.283203125, -1.07421875, -0.865234375, -0.65625, -0.447265625, -0.23828125, -0.029296875, 0.1796875, 0.388671875, 0.59765625, 0.806640625, 1.015625, 1.224609375, 1.43359375, 1.642578125, 1.8515625, 2.060546875, 2.26953125, 2.478515625, 2.6875, 2.896484375, 3.10546875, 3.314453125, 3.5234375, 3.732421875, 3.94140625, 4.150390625, 4.359375, 4.568359375, 4.77734375, 4.986328125, 5.1953125, 5.404296875, 5.61328125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 14.0, 11.0, 13.0, 19.0, 18.0, 37.0, 23.0, 49.0, 48.0, 47.0, 63.0, 80.0, 74.0, 83.0, 72.0, 53.0, 60.0, 48.0, 49.0, 45.0, 27.0, 19.0, 14.0, 13.0, 5.0, 9.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7431640625, -1.6959381103515625, -1.648712158203125, -1.6014862060546875, -1.55426025390625, -1.5070343017578125, -1.459808349609375, -1.4125823974609375, -1.3653564453125, -1.3181304931640625, -1.270904541015625, -1.2236785888671875, -1.17645263671875, -1.1292266845703125, -1.082000732421875, -1.0347747802734375, -0.987548828125, -0.9403228759765625, -0.893096923828125, -0.8458709716796875, -0.79864501953125, -0.7514190673828125, -0.704193115234375, -0.6569671630859375, -0.6097412109375, -0.5625152587890625, -0.515289306640625, -0.4680633544921875, -0.42083740234375, -0.3736114501953125, -0.326385498046875, -0.2791595458984375, -0.23193359375, -0.1847076416015625, -0.137481689453125, -0.0902557373046875, -0.04302978515625, 0.0041961669921875, 0.051422119140625, 0.0986480712890625, 0.1458740234375, 0.1930999755859375, 0.240325927734375, 0.2875518798828125, 0.33477783203125, 0.3820037841796875, 0.429229736328125, 0.4764556884765625, 0.523681640625, 0.5709075927734375, 0.618133544921875, 0.6653594970703125, 0.71258544921875, 0.7598114013671875, 0.807037353515625, 0.8542633056640625, 0.9014892578125, 0.9487152099609375, 0.995941162109375, 1.0431671142578125, 1.09039306640625, 1.1376190185546875, 1.184844970703125, 1.2320709228515625, 1.279296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 3.0, 3.0, 11.0, 10.0, 6.0, 9.0, 19.0, 29.0, 77.0, 283.0, 1039.0, 5175.0, 50376.0, 4082051.0, 48800.0, 4975.0, 976.0, 257.0, 90.0, 32.0, 22.0, 5.0, 8.0, 9.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3828125, -11.9896240234375, -11.596435546875, -11.2032470703125, -10.81005859375, -10.4168701171875, -10.023681640625, -9.6304931640625, -9.2373046875, -8.8441162109375, -8.450927734375, -8.0577392578125, -7.66455078125, -7.2713623046875, -6.878173828125, -6.4849853515625, -6.091796875, -5.6986083984375, -5.305419921875, -4.9122314453125, -4.51904296875, -4.1258544921875, -3.732666015625, -3.3394775390625, -2.9462890625, -2.5531005859375, -2.159912109375, -1.7667236328125, -1.37353515625, -0.9803466796875, -0.587158203125, -0.1939697265625, 0.19921875, 0.5924072265625, 0.985595703125, 1.3787841796875, 1.77197265625, 2.1651611328125, 2.558349609375, 2.9515380859375, 3.3447265625, 3.7379150390625, 4.131103515625, 4.5242919921875, 4.91748046875, 5.3106689453125, 5.703857421875, 6.0970458984375, 6.490234375, 6.8834228515625, 7.276611328125, 7.6697998046875, 8.06298828125, 8.4561767578125, 8.849365234375, 9.2425537109375, 9.6357421875, 10.0289306640625, 10.422119140625, 10.8153076171875, 11.20849609375, 11.6016845703125, 11.994873046875, 12.3880615234375, 12.78125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 5.0, 7.0, 11.0, 12.0, 14.0, 23.0, 61.0, 126.0, 356.0, 2527.0, 570.0, 164.0, 57.0, 42.0, 19.0, 12.0, 12.0, 15.0, 6.0, 6.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.66796875, -2.574798583984375, -2.48162841796875, -2.388458251953125, -2.2952880859375, -2.202117919921875, -2.10894775390625, -2.015777587890625, -1.922607421875, -1.829437255859375, -1.73626708984375, -1.643096923828125, -1.5499267578125, -1.456756591796875, -1.36358642578125, -1.270416259765625, -1.17724609375, -1.084075927734375, -0.99090576171875, -0.897735595703125, -0.8045654296875, -0.711395263671875, -0.61822509765625, -0.525054931640625, -0.431884765625, -0.338714599609375, -0.24554443359375, -0.152374267578125, -0.0592041015625, 0.033966064453125, 0.12713623046875, 0.220306396484375, 0.3134765625, 0.406646728515625, 0.49981689453125, 0.592987060546875, 0.6861572265625, 0.779327392578125, 0.87249755859375, 0.965667724609375, 1.058837890625, 1.152008056640625, 1.24517822265625, 1.338348388671875, 1.4315185546875, 1.524688720703125, 1.61785888671875, 1.711029052734375, 1.80419921875, 1.897369384765625, 1.99053955078125, 2.083709716796875, 2.1768798828125, 2.270050048828125, 2.36322021484375, 2.456390380859375, 2.549560546875, 2.642730712890625, 2.73590087890625, 2.829071044921875, 2.9222412109375, 3.015411376953125, 3.10858154296875, 3.201751708984375, 3.294921875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 11.0, 29.0, 95.0, 224.0, 307.0, 197.0, 81.0, 28.0, 7.0, 14.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.588905334472656, -21.891502380371094, -21.1940975189209, -20.496694564819336, -19.79928970336914, -19.101886749267578, -18.404483795166016, -17.70707893371582, -17.009674072265625, -16.312271118164062, -15.614866256713867, -14.917463302612305, -14.22005844116211, -13.522655487060547, -12.825251579284668, -12.127847671508789, -11.430444717407227, -10.733040809631348, -10.035636901855469, -9.338233947753906, -8.640829086303711, -7.94342565536499, -7.2460222244262695, -6.548618316650391, -5.851214408874512, -5.153810501098633, -4.456406593322754, -3.759003162384033, -3.0615992546081543, -2.3641953468322754, -1.6667919158935547, -0.9693880081176758, -0.2719860076904297, 0.42541778087615967, 1.122821569442749, 1.8202252388000488, 2.5176291465759277, 3.2150330543518066, 3.9124364852905273, 4.609840393066406, 5.307244300842285, 6.004648208618164, 6.702052116394043, 7.399455547332764, 8.096858978271484, 8.79426383972168, 9.491666793823242, 10.189070701599121, 10.886474609375, 11.583878517150879, 12.281282424926758, 12.97868537902832, 13.676090240478516, 14.373493194580078, 15.070897102355957, 15.768301010131836, 16.46570587158203, 17.163108825683594, 17.86051368713379, 18.55791664123535, 19.255321502685547, 19.95272445678711, 20.650127410888672, 21.347532272338867, 22.04493522644043]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 7.0, 15.0, 17.0, 15.0, 21.0, 32.0, 32.0, 23.0, 30.0, 30.0, 37.0, 37.0, 48.0, 48.0, 48.0, 43.0, 54.0, 46.0, 49.0, 47.0, 34.0, 31.0, 35.0, 31.0, 25.0, 28.0, 21.0, 19.0, 16.0, 15.0, 17.0, 17.0, 5.0, 6.0, 7.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.762662887573242, -6.536893844604492, -6.311124801635742, -6.085355758666992, -5.859586715698242, -5.633817672729492, -5.408048629760742, -5.182279586791992, -4.956510543823242, -4.730741500854492, -4.504972457885742, -4.279203414916992, -4.053434371948242, -3.827665328979492, -3.601896286010742, -3.376127243041992, -3.150358200073242, -2.924589157104492, -2.698820114135742, -2.473051071166992, -2.247282028198242, -2.021512985229492, -1.7957439422607422, -1.5699748992919922, -1.3442058563232422, -1.1184368133544922, -0.8926677703857422, -0.6668987274169922, -0.4411296844482422, -0.2153606414794922, 0.010408401489257812, 0.2361774444580078, 0.4619464874267578, 0.6877155303955078, 0.9134845733642578, 1.1392536163330078, 1.3650226593017578, 1.5907917022705078, 1.8165607452392578, 2.042329788208008, 2.268098831176758, 2.493867874145508, 2.719636917114258, 2.945405960083008, 3.171175003051758, 3.396944046020508, 3.622713088989258, 3.848482131958008, 4.074251174926758, 4.300020217895508, 4.525789260864258, 4.751558303833008, 4.977327346801758, 5.203096389770508, 5.428865432739258, 5.654634475708008, 5.880403518676758, 6.106172561645508, 6.331941604614258, 6.557710647583008, 6.783479690551758, 7.009248733520508, 7.235017776489258, 7.460786819458008, 7.686555862426758]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 3.0, 4.0, 7.0, 15.0, 15.0, 43.0, 49.0, 106.0, 200.0, 445.0, 1043.0, 2793.0, 9840.0, 58167.0, 631374.0, 303346.0, 31113.0, 6542.0, 1966.0, 730.0, 323.0, 167.0, 83.0, 74.0, 32.0, 27.0, 4.0, 9.0, 13.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.890625, -7.626220703125, -7.36181640625, -7.097412109375, -6.8330078125, -6.568603515625, -6.30419921875, -6.039794921875, -5.775390625, -5.510986328125, -5.24658203125, -4.982177734375, -4.7177734375, -4.453369140625, -4.18896484375, -3.924560546875, -3.66015625, -3.395751953125, -3.13134765625, -2.866943359375, -2.6025390625, -2.338134765625, -2.07373046875, -1.809326171875, -1.544921875, -1.280517578125, -1.01611328125, -0.751708984375, -0.4873046875, -0.222900390625, 0.04150390625, 0.305908203125, 0.5703125, 0.834716796875, 1.09912109375, 1.363525390625, 1.6279296875, 1.892333984375, 2.15673828125, 2.421142578125, 2.685546875, 2.949951171875, 3.21435546875, 3.478759765625, 3.7431640625, 4.007568359375, 4.27197265625, 4.536376953125, 4.80078125, 5.065185546875, 5.32958984375, 5.593994140625, 5.8583984375, 6.122802734375, 6.38720703125, 6.651611328125, 6.916015625, 7.180419921875, 7.44482421875, 7.709228515625, 7.9736328125, 8.238037109375, 8.50244140625, 8.766845703125, 9.03125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 9.0, 11.0, 20.0, 19.0, 21.0, 23.0, 35.0, 39.0, 38.0, 73.0, 60.0, 83.0, 77.0, 78.0, 64.0, 72.0, 67.0, 42.0, 41.0, 36.0, 27.0, 17.0, 16.0, 10.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8447265625, -1.7958984375, -1.7470703125, -1.6982421875, -1.6494140625, -1.6005859375, -1.5517578125, -1.5029296875, -1.4541015625, -1.4052734375, -1.3564453125, -1.3076171875, -1.2587890625, -1.2099609375, -1.1611328125, -1.1123046875, -1.0634765625, -1.0146484375, -0.9658203125, -0.9169921875, -0.8681640625, -0.8193359375, -0.7705078125, -0.7216796875, -0.6728515625, -0.6240234375, -0.5751953125, -0.5263671875, -0.4775390625, -0.4287109375, -0.3798828125, -0.3310546875, -0.2822265625, -0.2333984375, -0.1845703125, -0.1357421875, -0.0869140625, -0.0380859375, 0.0107421875, 0.0595703125, 0.1083984375, 0.1572265625, 0.2060546875, 0.2548828125, 0.3037109375, 0.3525390625, 0.4013671875, 0.4501953125, 0.4990234375, 0.5478515625, 0.5966796875, 0.6455078125, 0.6943359375, 0.7431640625, 0.7919921875, 0.8408203125, 0.8896484375, 0.9384765625, 0.9873046875, 1.0361328125, 1.0849609375, 1.1337890625, 1.1826171875, 1.2314453125, 1.2802734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 13.0, 10.0, 29.0, 23.0, 38.0, 68.0, 94.0, 130.0, 337.0, 925.0, 4213.0, 41808.0, 819150.0, 168844.0, 10078.0, 1670.0, 531.0, 215.0, 102.0, 69.0, 53.0, 40.0, 26.0, 18.0, 9.0, 10.0, 6.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.671875, -10.345703125, -10.01953125, -9.693359375, -9.3671875, -9.041015625, -8.71484375, -8.388671875, -8.0625, -7.736328125, -7.41015625, -7.083984375, -6.7578125, -6.431640625, -6.10546875, -5.779296875, -5.453125, -5.126953125, -4.80078125, -4.474609375, -4.1484375, -3.822265625, -3.49609375, -3.169921875, -2.84375, -2.517578125, -2.19140625, -1.865234375, -1.5390625, -1.212890625, -0.88671875, -0.560546875, -0.234375, 0.091796875, 0.41796875, 0.744140625, 1.0703125, 1.396484375, 1.72265625, 2.048828125, 2.375, 2.701171875, 3.02734375, 3.353515625, 3.6796875, 4.005859375, 4.33203125, 4.658203125, 4.984375, 5.310546875, 5.63671875, 5.962890625, 6.2890625, 6.615234375, 6.94140625, 7.267578125, 7.59375, 7.919921875, 8.24609375, 8.572265625, 8.8984375, 9.224609375, 9.55078125, 9.876953125, 10.203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 11.0, 8.0, 7.0, 16.0, 11.0, 23.0, 23.0, 20.0, 37.0, 42.0, 46.0, 36.0, 47.0, 54.0, 45.0, 47.0, 71.0, 63.0, 48.0, 49.0, 38.0, 40.0, 43.0, 23.0, 40.0, 19.0, 13.0, 18.0, 17.0, 8.0, 9.0, 5.0, 3.0, 5.0, 3.0, 4.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.45703125, -5.29229736328125, -5.1275634765625, -4.96282958984375, -4.798095703125, -4.63336181640625, -4.4686279296875, -4.30389404296875, -4.13916015625, -3.97442626953125, -3.8096923828125, -3.64495849609375, -3.480224609375, -3.31549072265625, -3.1507568359375, -2.98602294921875, -2.8212890625, -2.65655517578125, -2.4918212890625, -2.32708740234375, -2.162353515625, -1.99761962890625, -1.8328857421875, -1.66815185546875, -1.50341796875, -1.33868408203125, -1.1739501953125, -1.00921630859375, -0.844482421875, -0.67974853515625, -0.5150146484375, -0.35028076171875, -0.185546875, -0.02081298828125, 0.1439208984375, 0.30865478515625, 0.473388671875, 0.63812255859375, 0.8028564453125, 0.96759033203125, 1.13232421875, 1.29705810546875, 1.4617919921875, 1.62652587890625, 1.791259765625, 1.95599365234375, 2.1207275390625, 2.28546142578125, 2.4501953125, 2.61492919921875, 2.7796630859375, 2.94439697265625, 3.109130859375, 3.27386474609375, 3.4385986328125, 3.60333251953125, 3.76806640625, 3.93280029296875, 4.0975341796875, 4.26226806640625, 4.427001953125, 4.59173583984375, 4.7564697265625, 4.92120361328125, 5.0859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 10.0, 14.0, 18.0, 30.0, 51.0, 69.0, 152.0, 280.0, 627.0, 1945.0, 9452.0, 201436.0, 809329.0, 20225.0, 3243.0, 898.0, 359.0, 148.0, 91.0, 61.0, 31.0, 18.0, 20.0, 13.0, 6.0, 3.0, 0.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.8671875, -4.732635498046875, -4.59808349609375, -4.463531494140625, -4.3289794921875, -4.194427490234375, -4.05987548828125, -3.925323486328125, -3.790771484375, -3.656219482421875, -3.52166748046875, -3.387115478515625, -3.2525634765625, -3.118011474609375, -2.98345947265625, -2.848907470703125, -2.71435546875, -2.579803466796875, -2.44525146484375, -2.310699462890625, -2.1761474609375, -2.041595458984375, -1.90704345703125, -1.772491455078125, -1.637939453125, -1.503387451171875, -1.36883544921875, -1.234283447265625, -1.0997314453125, -0.965179443359375, -0.83062744140625, -0.696075439453125, -0.5615234375, -0.426971435546875, -0.29241943359375, -0.157867431640625, -0.0233154296875, 0.111236572265625, 0.24578857421875, 0.380340576171875, 0.514892578125, 0.649444580078125, 0.78399658203125, 0.918548583984375, 1.0531005859375, 1.187652587890625, 1.32220458984375, 1.456756591796875, 1.59130859375, 1.725860595703125, 1.86041259765625, 1.994964599609375, 2.1295166015625, 2.264068603515625, 2.39862060546875, 2.533172607421875, 2.667724609375, 2.802276611328125, 2.93682861328125, 3.071380615234375, 3.2059326171875, 3.340484619140625, 3.47503662109375, 3.609588623046875, 3.744140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 5.0, 19.0, 12.0, 22.0, 48.0, 62.0, 110.0, 193.0, 202.0, 114.0, 74.0, 35.0, 21.0, 19.0, 14.0, 6.0, 7.0, 6.0, 3.0, 6.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003371238708496094, -0.000324152410030365, -0.0003111809492111206, -0.0002982094883918762, -0.00028523802757263184, -0.00027226656675338745, -0.00025929510593414307, -0.0002463236451148987, -0.0002333521842956543, -0.0002203807234764099, -0.00020740926265716553, -0.00019443780183792114, -0.00018146634101867676, -0.00016849488019943237, -0.000155523419380188, -0.0001425519585609436, -0.00012958049774169922, -0.00011660903692245483, -0.00010363757610321045, -9.066611528396606e-05, -7.769465446472168e-05, -6.47231936454773e-05, -5.175173282623291e-05, -3.8780272006988525e-05, -2.580881118774414e-05, -1.2837350368499756e-05, 1.341104507446289e-07, 1.3105571269989014e-05, 2.60770320892334e-05, 3.904849290847778e-05, 5.201995372772217e-05, 6.499141454696655e-05, 7.796287536621094e-05, 9.093433618545532e-05, 0.00010390579700469971, 0.00011687725782394409, 0.00012984871864318848, 0.00014282017946243286, 0.00015579164028167725, 0.00016876310110092163, 0.00018173456192016602, 0.0001947060227394104, 0.00020767748355865479, 0.00022064894437789917, 0.00023362040519714355, 0.00024659186601638794, 0.0002595633268356323, 0.0002725347876548767, 0.0002855062484741211, 0.0002984777092933655, 0.00031144917011260986, 0.00032442063093185425, 0.00033739209175109863, 0.000350363552570343, 0.0003633350133895874, 0.0003763064742088318, 0.00038927793502807617, 0.00040224939584732056, 0.00041522085666656494, 0.0004281923174858093, 0.0004411637783050537, 0.0004541352391242981, 0.0004671066999435425, 0.00048007816076278687, 0.0004930496215820312]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 5.0, 7.0, 14.0, 16.0, 39.0, 97.0, 181.0, 780.0, 6025.0, 493801.0, 540267.0, 6152.0, 756.0, 204.0, 96.0, 44.0, 33.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-8.515625, -8.326416015625, -8.13720703125, -7.947998046875, -7.7587890625, -7.569580078125, -7.38037109375, -7.191162109375, -7.001953125, -6.812744140625, -6.62353515625, -6.434326171875, -6.2451171875, -6.055908203125, -5.86669921875, -5.677490234375, -5.48828125, -5.299072265625, -5.10986328125, -4.920654296875, -4.7314453125, -4.542236328125, -4.35302734375, -4.163818359375, -3.974609375, -3.785400390625, -3.59619140625, -3.406982421875, -3.2177734375, -3.028564453125, -2.83935546875, -2.650146484375, -2.4609375, -2.271728515625, -2.08251953125, -1.893310546875, -1.7041015625, -1.514892578125, -1.32568359375, -1.136474609375, -0.947265625, -0.758056640625, -0.56884765625, -0.379638671875, -0.1904296875, -0.001220703125, 0.18798828125, 0.377197265625, 0.56640625, 0.755615234375, 0.94482421875, 1.134033203125, 1.3232421875, 1.512451171875, 1.70166015625, 1.890869140625, 2.080078125, 2.269287109375, 2.45849609375, 2.647705078125, 2.8369140625, 3.026123046875, 3.21533203125, 3.404541015625, 3.59375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 10.0, 7.0, 16.0, 41.0, 70.0, 149.0, 199.0, 230.0, 112.0, 67.0, 43.0, 18.0, 12.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.974609375, -3.87762451171875, -3.7806396484375, -3.68365478515625, -3.586669921875, -3.48968505859375, -3.3927001953125, -3.29571533203125, -3.19873046875, -3.10174560546875, -3.0047607421875, -2.90777587890625, -2.810791015625, -2.71380615234375, -2.6168212890625, -2.51983642578125, -2.4228515625, -2.32586669921875, -2.2288818359375, -2.13189697265625, -2.034912109375, -1.93792724609375, -1.8409423828125, -1.74395751953125, -1.64697265625, -1.54998779296875, -1.4530029296875, -1.35601806640625, -1.259033203125, -1.16204833984375, -1.0650634765625, -0.96807861328125, -0.87109375, -0.77410888671875, -0.6771240234375, -0.58013916015625, -0.483154296875, -0.38616943359375, -0.2891845703125, -0.19219970703125, -0.09521484375, 0.00177001953125, 0.0987548828125, 0.19573974609375, 0.292724609375, 0.38970947265625, 0.4866943359375, 0.58367919921875, 0.6806640625, 0.77764892578125, 0.8746337890625, 0.97161865234375, 1.068603515625, 1.16558837890625, 1.2625732421875, 1.35955810546875, 1.45654296875, 1.55352783203125, 1.6505126953125, 1.74749755859375, 1.844482421875, 1.94146728515625, 2.0384521484375, 2.13543701171875, 2.232421875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 45.0, 331.0, 491.0, 107.0, 23.0, 7.0, 3.0, 0.0, 2.0], "bins": [-202.78085327148438, -199.2318572998047, -195.682861328125, -192.1338653564453, -188.58486938476562, -185.03585815429688, -181.48687744140625, -177.9378662109375, -174.3888702392578, -170.83987426757812, -167.29087829589844, -163.74188232421875, -160.19288635253906, -156.64389038085938, -153.09487915039062, -149.54588317871094, -145.99688720703125, -142.44789123535156, -138.89889526367188, -135.3498992919922, -131.8009033203125, -128.25189208984375, -124.7029037475586, -121.1539077758789, -117.60491943359375, -114.05592346191406, -110.50692749023438, -106.95793151855469, -103.40892791748047, -99.85993194580078, -96.3109359741211, -92.7619400024414, -89.21293640136719, -85.6639404296875, -82.11494445800781, -78.56594848632812, -75.0169448852539, -71.46794891357422, -67.91895294189453, -64.36995697021484, -60.820953369140625, -57.27195739746094, -53.722957611083984, -50.1739616394043, -46.624961853027344, -43.075965881347656, -39.52696990966797, -35.97797393798828, -32.42897415161133, -28.879976272583008, -25.330978393554688, -21.781982421875, -18.23298454284668, -14.68398666381836, -11.134990692138672, -7.585992813110352, -4.036994934082031, -0.48799753189086914, 3.060999870300293, 6.609996795654297, 10.158994674682617, 13.707992553710938, 17.256988525390625, 20.805986404418945, 24.354984283447266]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 3.0, 8.0, 8.0, 9.0, 12.0, 18.0, 10.0, 19.0, 17.0, 12.0, 22.0, 25.0, 25.0, 40.0, 26.0, 31.0, 35.0, 37.0, 45.0, 30.0, 41.0, 37.0, 45.0, 50.0, 33.0, 32.0, 24.0, 26.0, 34.0, 36.0, 24.0, 19.0, 26.0, 19.0, 20.0, 24.0, 13.0, 6.0, 13.0, 4.0, 6.0, 3.0, 10.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0], "bins": [-21.572227478027344, -20.940044403076172, -20.307861328125, -19.675678253173828, -19.043495178222656, -18.411312103271484, -17.779129028320312, -17.14694595336914, -16.51476287841797, -15.882579803466797, -15.250396728515625, -14.618213653564453, -13.986030578613281, -13.35384750366211, -12.721664428710938, -12.089481353759766, -11.457298278808594, -10.825115203857422, -10.19293212890625, -9.560749053955078, -8.928565979003906, -8.296382904052734, -7.6641998291015625, -7.032016754150391, -6.399833679199219, -5.767650604248047, -5.135467529296875, -4.503284454345703, -3.8711013793945312, -3.2389183044433594, -2.6067352294921875, -1.9745521545410156, -1.3423690795898438, -0.7101860046386719, -0.0780029296875, 0.5541801452636719, 1.1863632202148438, 1.8185462951660156, 2.4507293701171875, 3.0829124450683594, 3.7150955200195312, 4.347278594970703, 4.979461669921875, 5.611644744873047, 6.243827819824219, 6.876010894775391, 7.5081939697265625, 8.140377044677734, 8.772560119628906, 9.404743194580078, 10.03692626953125, 10.669109344482422, 11.301292419433594, 11.933475494384766, 12.565658569335938, 13.19784164428711, 13.830024719238281, 14.462207794189453, 15.094390869140625, 15.726573944091797, 16.35875701904297, 16.99094009399414, 17.623123168945312, 18.255306243896484, 18.887489318847656]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 8.0, 4.0, 3.0, 11.0, 7.0, 6.0, 11.0, 9.0, 16.0, 19.0, 19.0, 41.0, 41.0, 74.0, 93.0, 144.0, 228.0, 420.0, 833.0, 1607.0, 3647.0, 10067.0, 46542.0, 3887759.0, 210971.0, 20562.0, 6190.0, 2466.0, 1163.0, 563.0, 284.0, 183.0, 100.0, 63.0, 36.0, 25.0, 17.0, 12.0, 9.0, 11.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-6.5390625, -6.37457275390625, -6.2100830078125, -6.04559326171875, -5.881103515625, -5.71661376953125, -5.5521240234375, -5.38763427734375, -5.22314453125, -5.05865478515625, -4.8941650390625, -4.72967529296875, -4.565185546875, -4.40069580078125, -4.2362060546875, -4.07171630859375, -3.9072265625, -3.74273681640625, -3.5782470703125, -3.41375732421875, -3.249267578125, -3.08477783203125, -2.9202880859375, -2.75579833984375, -2.59130859375, -2.42681884765625, -2.2623291015625, -2.09783935546875, -1.933349609375, -1.76885986328125, -1.6043701171875, -1.43988037109375, -1.275390625, -1.11090087890625, -0.9464111328125, -0.78192138671875, -0.617431640625, -0.45294189453125, -0.2884521484375, -0.12396240234375, 0.04052734375, 0.20501708984375, 0.3695068359375, 0.53399658203125, 0.698486328125, 0.86297607421875, 1.0274658203125, 1.19195556640625, 1.3564453125, 1.52093505859375, 1.6854248046875, 1.84991455078125, 2.014404296875, 2.17889404296875, 2.3433837890625, 2.50787353515625, 2.67236328125, 2.83685302734375, 3.0013427734375, 3.16583251953125, 3.330322265625, 3.49481201171875, 3.6593017578125, 3.82379150390625, 3.98828125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 13.0, 5.0, 13.0, 18.0, 15.0, 26.0, 30.0, 46.0, 32.0, 39.0, 46.0, 57.0, 61.0, 54.0, 78.0, 70.0, 57.0, 70.0, 47.0, 31.0, 33.0, 46.0, 26.0, 27.0, 22.0, 8.0, 5.0, 6.0, 7.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.810546875, -1.763031005859375, -1.71551513671875, -1.667999267578125, -1.6204833984375, -1.572967529296875, -1.52545166015625, -1.477935791015625, -1.430419921875, -1.382904052734375, -1.33538818359375, -1.287872314453125, -1.2403564453125, -1.192840576171875, -1.14532470703125, -1.097808837890625, -1.05029296875, -1.002777099609375, -0.95526123046875, -0.907745361328125, -0.8602294921875, -0.812713623046875, -0.76519775390625, -0.717681884765625, -0.670166015625, -0.622650146484375, -0.57513427734375, -0.527618408203125, -0.4801025390625, -0.432586669921875, -0.38507080078125, -0.337554931640625, -0.2900390625, -0.242523193359375, -0.19500732421875, -0.147491455078125, -0.0999755859375, -0.052459716796875, -0.00494384765625, 0.042572021484375, 0.090087890625, 0.137603759765625, 0.18511962890625, 0.232635498046875, 0.2801513671875, 0.327667236328125, 0.37518310546875, 0.422698974609375, 0.47021484375, 0.517730712890625, 0.56524658203125, 0.612762451171875, 0.6602783203125, 0.707794189453125, 0.75531005859375, 0.802825927734375, 0.850341796875, 0.897857666015625, 0.94537353515625, 0.992889404296875, 1.0404052734375, 1.087921142578125, 1.13543701171875, 1.182952880859375, 1.23046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 8.0, 15.0, 17.0, 48.0, 123.0, 381.0, 1116.0, 4369.0, 25221.0, 4007301.0, 141752.0, 10535.0, 2361.0, 635.0, 224.0, 77.0, 41.0, 14.0, 9.0, 6.0, 3.0, 3.0, 3.0, 0.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.390625, -9.064208984375, -8.73779296875, -8.411376953125, -8.0849609375, -7.758544921875, -7.43212890625, -7.105712890625, -6.779296875, -6.452880859375, -6.12646484375, -5.800048828125, -5.4736328125, -5.147216796875, -4.82080078125, -4.494384765625, -4.16796875, -3.841552734375, -3.51513671875, -3.188720703125, -2.8623046875, -2.535888671875, -2.20947265625, -1.883056640625, -1.556640625, -1.230224609375, -0.90380859375, -0.577392578125, -0.2509765625, 0.075439453125, 0.40185546875, 0.728271484375, 1.0546875, 1.381103515625, 1.70751953125, 2.033935546875, 2.3603515625, 2.686767578125, 3.01318359375, 3.339599609375, 3.666015625, 3.992431640625, 4.31884765625, 4.645263671875, 4.9716796875, 5.298095703125, 5.62451171875, 5.950927734375, 6.27734375, 6.603759765625, 6.93017578125, 7.256591796875, 7.5830078125, 7.909423828125, 8.23583984375, 8.562255859375, 8.888671875, 9.215087890625, 9.54150390625, 9.867919921875, 10.1943359375, 10.520751953125, 10.84716796875, 11.173583984375, 11.5]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 11.0, 9.0, 18.0, 22.0, 24.0, 58.0, 147.0, 407.0, 2639.0, 420.0, 109.0, 54.0, 36.0, 23.0, 14.0, 10.0, 10.0, 8.0, 7.0, 3.0, 4.0, 3.0, 2.0, 7.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7490234375, -1.6876373291015625, -1.626251220703125, -1.5648651123046875, -1.50347900390625, -1.4420928955078125, -1.380706787109375, -1.3193206787109375, -1.2579345703125, -1.1965484619140625, -1.135162353515625, -1.0737762451171875, -1.01239013671875, -0.9510040283203125, -0.889617919921875, -0.8282318115234375, -0.766845703125, -0.7054595947265625, -0.644073486328125, -0.5826873779296875, -0.52130126953125, -0.4599151611328125, -0.398529052734375, -0.3371429443359375, -0.2757568359375, -0.2143707275390625, -0.152984619140625, -0.0915985107421875, -0.03021240234375, 0.0311737060546875, 0.092559814453125, 0.1539459228515625, 0.21533203125, 0.2767181396484375, 0.338104248046875, 0.3994903564453125, 0.46087646484375, 0.5222625732421875, 0.583648681640625, 0.6450347900390625, 0.7064208984375, 0.7678070068359375, 0.829193115234375, 0.8905792236328125, 0.95196533203125, 1.0133514404296875, 1.074737548828125, 1.1361236572265625, 1.197509765625, 1.2588958740234375, 1.320281982421875, 1.3816680908203125, 1.44305419921875, 1.5044403076171875, 1.565826416015625, 1.6272125244140625, 1.6885986328125, 1.7499847412109375, 1.811370849609375, 1.8727569580078125, 1.93414306640625, 1.9955291748046875, 2.056915283203125, 2.1183013916015625, 2.1796875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 4.0, 7.0, 4.0, 27.0, 116.0, 382.0, 340.0, 96.0, 16.0, 10.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.919740676879883, -9.094311714172363, -8.268882751464844, -7.443453311920166, -6.6180243492126465, -5.792595386505127, -4.967165946960449, -4.14173698425293, -3.31630802154541, -2.4908790588378906, -1.665449857711792, -0.8400206565856934, -0.014591693878173828, 0.8108372688293457, 1.6362667083740234, 2.461695671081543, 3.2871246337890625, 4.112553596496582, 4.937982559204102, 5.763411998748779, 6.588840961456299, 7.414269924163818, 8.239699363708496, 9.065128326416016, 9.890557289123535, 10.715986251831055, 11.541415214538574, 12.366844177246094, 13.19227409362793, 14.017702102661133, 14.843132019042969, 15.668560981750488, 16.49399185180664, 17.319421768188477, 18.14484977722168, 18.970279693603516, 19.79570770263672, 20.621137619018555, 21.44656753540039, 22.271995544433594, 23.097423553466797, 23.922853469848633, 24.748281478881836, 25.573711395263672, 26.399139404296875, 27.22456932067871, 28.049999237060547, 28.87542724609375, 29.700857162475586, 30.526287078857422, 31.351715087890625, 32.17714309692383, 33.0025749206543, 33.8280029296875, 34.6534309387207, 35.478858947753906, 36.304290771484375, 37.12971878051758, 37.95515060424805, 38.78057861328125, 39.60600662231445, 40.431434631347656, 41.256866455078125, 42.08229446411133, 42.90772247314453]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 3.0, 8.0, 14.0, 10.0, 15.0, 12.0, 26.0, 33.0, 27.0, 48.0, 46.0, 44.0, 50.0, 48.0, 48.0, 47.0, 47.0, 52.0, 53.0, 50.0, 37.0, 37.0, 31.0, 37.0, 31.0, 30.0, 19.0, 9.0, 16.0, 16.0, 12.0, 12.0, 7.0, 4.0, 4.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.004368782043457, -4.826638221740723, -4.6489081382751465, -4.471177577972412, -4.293447494506836, -4.115716934204102, -3.9379866123199463, -3.760256290435791, -3.5825257301330566, -3.4047954082489014, -3.227065086364746, -3.0493345260620117, -2.8716042041778564, -2.693873882293701, -2.516143560409546, -2.3384132385253906, -2.1606829166412354, -1.98295259475708, -1.8052221536636353, -1.62749183177948, -1.4497613906860352, -1.2720310688018799, -1.0943007469177246, -0.9165703058242798, -0.7388399839401245, -0.5611096024513245, -0.3833792507648468, -0.20564889907836914, -0.027918517589569092, 0.14981186389923096, 0.32754218578338623, 0.505272626876831, 0.6830029487609863, 0.8607333302497864, 1.0384637117385864, 1.2161940336227417, 1.3939244747161865, 1.5716547966003418, 1.749385118484497, 1.927115559577942, 2.1048460006713867, 2.282576322555542, 2.4603066444396973, 2.6380372047424316, 2.815767526626587, 2.993497848510742, 3.1712281703948975, 3.3489584922790527, 3.526688814163208, 3.7044191360473633, 3.8821494579315186, 4.059879779815674, 4.237610340118408, 4.415340423583984, 4.593070983886719, 4.770801544189453, 4.948531627655029, 5.126262187957764, 5.30399227142334, 5.481722831726074, 5.65945291519165, 5.837183475494385, 6.014913558959961, 6.192644119262695, 6.37037467956543]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 16.0, 13.0, 17.0, 27.0, 28.0, 62.0, 66.0, 84.0, 166.0, 260.0, 476.0, 952.0, 1816.0, 4052.0, 10197.0, 31457.0, 120246.0, 505832.0, 279080.0, 63216.0, 18158.0, 6640.0, 2795.0, 1256.0, 669.0, 361.0, 193.0, 131.0, 77.0, 67.0, 33.0, 34.0, 18.0, 15.0, 5.0, 4.0, 7.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83984375, -4.68255615234375, -4.5252685546875, -4.36798095703125, -4.210693359375, -4.05340576171875, -3.8961181640625, -3.73883056640625, -3.58154296875, -3.42425537109375, -3.2669677734375, -3.10968017578125, -2.952392578125, -2.79510498046875, -2.6378173828125, -2.48052978515625, -2.3232421875, -2.16595458984375, -2.0086669921875, -1.85137939453125, -1.694091796875, -1.53680419921875, -1.3795166015625, -1.22222900390625, -1.06494140625, -0.90765380859375, -0.7503662109375, -0.59307861328125, -0.435791015625, -0.27850341796875, -0.1212158203125, 0.03607177734375, 0.193359375, 0.35064697265625, 0.5079345703125, 0.66522216796875, 0.822509765625, 0.97979736328125, 1.1370849609375, 1.29437255859375, 1.45166015625, 1.60894775390625, 1.7662353515625, 1.92352294921875, 2.080810546875, 2.23809814453125, 2.3953857421875, 2.55267333984375, 2.7099609375, 2.86724853515625, 3.0245361328125, 3.18182373046875, 3.339111328125, 3.49639892578125, 3.6536865234375, 3.81097412109375, 3.96826171875, 4.12554931640625, 4.2828369140625, 4.44012451171875, 4.597412109375, 4.75469970703125, 4.9119873046875, 5.06927490234375, 5.2265625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 9.0, 14.0, 10.0, 22.0, 24.0, 25.0, 30.0, 36.0, 45.0, 51.0, 40.0, 72.0, 57.0, 69.0, 70.0, 76.0, 58.0, 53.0, 53.0, 39.0, 35.0, 25.0, 22.0, 22.0, 11.0, 5.0, 8.0, 2.0, 3.0, 0.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.892578125, -1.84332275390625, -1.7940673828125, -1.74481201171875, -1.695556640625, -1.64630126953125, -1.5970458984375, -1.54779052734375, -1.49853515625, -1.44927978515625, -1.4000244140625, -1.35076904296875, -1.301513671875, -1.25225830078125, -1.2030029296875, -1.15374755859375, -1.1044921875, -1.05523681640625, -1.0059814453125, -0.95672607421875, -0.907470703125, -0.85821533203125, -0.8089599609375, -0.75970458984375, -0.71044921875, -0.66119384765625, -0.6119384765625, -0.56268310546875, -0.513427734375, -0.46417236328125, -0.4149169921875, -0.36566162109375, -0.31640625, -0.26715087890625, -0.2178955078125, -0.16864013671875, -0.119384765625, -0.07012939453125, -0.0208740234375, 0.02838134765625, 0.07763671875, 0.12689208984375, 0.1761474609375, 0.22540283203125, 0.274658203125, 0.32391357421875, 0.3731689453125, 0.42242431640625, 0.4716796875, 0.52093505859375, 0.5701904296875, 0.61944580078125, 0.668701171875, 0.71795654296875, 0.7672119140625, 0.81646728515625, 0.86572265625, 0.91497802734375, 0.9642333984375, 1.01348876953125, 1.062744140625, 1.11199951171875, 1.1612548828125, 1.21051025390625, 1.259765625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 5.0, 4.0, 14.0, 8.0, 8.0, 16.0, 22.0, 36.0, 32.0, 47.0, 88.0, 133.0, 282.0, 679.0, 2228.0, 11486.0, 96365.0, 770096.0, 146967.0, 15636.0, 2851.0, 743.0, 297.0, 162.0, 93.0, 72.0, 32.0, 38.0, 21.0, 23.0, 16.0, 8.0, 8.0, 8.0, 7.0, 2.0, 5.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.87890625, -7.62127685546875, -7.3636474609375, -7.10601806640625, -6.848388671875, -6.59075927734375, -6.3331298828125, -6.07550048828125, -5.81787109375, -5.56024169921875, -5.3026123046875, -5.04498291015625, -4.787353515625, -4.52972412109375, -4.2720947265625, -4.01446533203125, -3.7568359375, -3.49920654296875, -3.2415771484375, -2.98394775390625, -2.726318359375, -2.46868896484375, -2.2110595703125, -1.95343017578125, -1.69580078125, -1.43817138671875, -1.1805419921875, -0.92291259765625, -0.665283203125, -0.40765380859375, -0.1500244140625, 0.10760498046875, 0.365234375, 0.62286376953125, 0.8804931640625, 1.13812255859375, 1.395751953125, 1.65338134765625, 1.9110107421875, 2.16864013671875, 2.42626953125, 2.68389892578125, 2.9415283203125, 3.19915771484375, 3.456787109375, 3.71441650390625, 3.9720458984375, 4.22967529296875, 4.4873046875, 4.74493408203125, 5.0025634765625, 5.26019287109375, 5.517822265625, 5.77545166015625, 6.0330810546875, 6.29071044921875, 6.54833984375, 6.80596923828125, 7.0635986328125, 7.32122802734375, 7.578857421875, 7.83648681640625, 8.0941162109375, 8.35174560546875, 8.609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 8.0, 9.0, 7.0, 6.0, 11.0, 12.0, 19.0, 18.0, 19.0, 31.0, 32.0, 33.0, 25.0, 32.0, 37.0, 41.0, 37.0, 43.0, 51.0, 42.0, 43.0, 46.0, 42.0, 45.0, 43.0, 20.0, 43.0, 27.0, 21.0, 26.0, 18.0, 19.0, 14.0, 21.0, 5.0, 12.0, 6.0, 7.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.21484375, -4.0704345703125, -3.926025390625, -3.7816162109375, -3.63720703125, -3.4927978515625, -3.348388671875, -3.2039794921875, -3.0595703125, -2.9151611328125, -2.770751953125, -2.6263427734375, -2.48193359375, -2.3375244140625, -2.193115234375, -2.0487060546875, -1.904296875, -1.7598876953125, -1.615478515625, -1.4710693359375, -1.32666015625, -1.1822509765625, -1.037841796875, -0.8934326171875, -0.7490234375, -0.6046142578125, -0.460205078125, -0.3157958984375, -0.17138671875, -0.0269775390625, 0.117431640625, 0.2618408203125, 0.40625, 0.5506591796875, 0.695068359375, 0.8394775390625, 0.98388671875, 1.1282958984375, 1.272705078125, 1.4171142578125, 1.5615234375, 1.7059326171875, 1.850341796875, 1.9947509765625, 2.13916015625, 2.2835693359375, 2.427978515625, 2.5723876953125, 2.716796875, 2.8612060546875, 3.005615234375, 3.1500244140625, 3.29443359375, 3.4388427734375, 3.583251953125, 3.7276611328125, 3.8720703125, 4.0164794921875, 4.160888671875, 4.3052978515625, 4.44970703125, 4.5941162109375, 4.738525390625, 4.8829345703125, 5.02734375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 11.0, 6.0, 12.0, 12.0, 26.0, 22.0, 43.0, 53.0, 92.0, 138.0, 239.0, 458.0, 854.0, 1810.0, 4252.0, 12426.0, 57262.0, 592759.0, 326968.0, 35685.0, 8965.0, 3253.0, 1432.0, 719.0, 383.0, 232.0, 150.0, 89.0, 67.0, 33.0, 22.0, 13.0, 16.0, 10.0, 6.0, 3.0, 9.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.087890625, -2.022369384765625, -1.95684814453125, -1.891326904296875, -1.8258056640625, -1.760284423828125, -1.69476318359375, -1.629241943359375, -1.563720703125, -1.498199462890625, -1.43267822265625, -1.367156982421875, -1.3016357421875, -1.236114501953125, -1.17059326171875, -1.105072021484375, -1.03955078125, -0.974029541015625, -0.90850830078125, -0.842987060546875, -0.7774658203125, -0.711944580078125, -0.64642333984375, -0.580902099609375, -0.515380859375, -0.449859619140625, -0.38433837890625, -0.318817138671875, -0.2532958984375, -0.187774658203125, -0.12225341796875, -0.056732177734375, 0.0087890625, 0.074310302734375, 0.13983154296875, 0.205352783203125, 0.2708740234375, 0.336395263671875, 0.40191650390625, 0.467437744140625, 0.532958984375, 0.598480224609375, 0.66400146484375, 0.729522705078125, 0.7950439453125, 0.860565185546875, 0.92608642578125, 0.991607666015625, 1.05712890625, 1.122650146484375, 1.18817138671875, 1.253692626953125, 1.3192138671875, 1.384735107421875, 1.45025634765625, 1.515777587890625, 1.581298828125, 1.646820068359375, 1.71234130859375, 1.777862548828125, 1.8433837890625, 1.908905029296875, 1.97442626953125, 2.039947509765625, 2.10546875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 6.0, 9.0, 8.0, 7.0, 14.0, 30.0, 32.0, 46.0, 84.0, 98.0, 156.0, 137.0, 102.0, 86.0, 54.0, 28.0, 24.0, 19.0, 15.0, 10.0, 8.0, 9.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003566741943359375, -0.00034677237272262573, -0.00033687055110931396, -0.0003269687294960022, -0.00031706690788269043, -0.00030716508626937866, -0.0002972632646560669, -0.0002873614430427551, -0.00027745962142944336, -0.0002675577998161316, -0.0002576559782028198, -0.00024775415658950806, -0.0002378523349761963, -0.00022795051336288452, -0.00021804869174957275, -0.00020814687013626099, -0.00019824504852294922, -0.00018834322690963745, -0.00017844140529632568, -0.00016853958368301392, -0.00015863776206970215, -0.00014873594045639038, -0.0001388341188430786, -0.00012893229722976685, -0.00011903047561645508, -0.00010912865400314331, -9.922683238983154e-05, -8.932501077651978e-05, -7.942318916320801e-05, -6.952136754989624e-05, -5.961954593658447e-05, -4.9717724323272705e-05, -3.981590270996094e-05, -2.991408109664917e-05, -2.0012259483337402e-05, -1.0110437870025635e-05, -2.086162567138672e-07, 9.6932053565979e-06, 1.9595026969909668e-05, 2.9496848583221436e-05, 3.93986701965332e-05, 4.930049180984497e-05, 5.920231342315674e-05, 6.91041350364685e-05, 7.900595664978027e-05, 8.890777826309204e-05, 9.880959987640381e-05, 0.00010871142148971558, 0.00011861324310302734, 0.0001285150647163391, 0.00013841688632965088, 0.00014831870794296265, 0.00015822052955627441, 0.00016812235116958618, 0.00017802417278289795, 0.00018792599439620972, 0.00019782781600952148, 0.00020772963762283325, 0.00021763145923614502, 0.0002275332808494568, 0.00023743510246276855, 0.0002473369240760803, 0.0002572387456893921, 0.00026714056730270386, 0.0002770423889160156]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 6.0, 3.0, 5.0, 14.0, 16.0, 26.0, 65.0, 132.0, 441.0, 1905.0, 17065.0, 961015.0, 63185.0, 3610.0, 686.0, 205.0, 86.0, 34.0, 20.0, 10.0, 12.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2578125, -5.091796875, -4.92578125, -4.759765625, -4.59375, -4.427734375, -4.26171875, -4.095703125, -3.9296875, -3.763671875, -3.59765625, -3.431640625, -3.265625, -3.099609375, -2.93359375, -2.767578125, -2.6015625, -2.435546875, -2.26953125, -2.103515625, -1.9375, -1.771484375, -1.60546875, -1.439453125, -1.2734375, -1.107421875, -0.94140625, -0.775390625, -0.609375, -0.443359375, -0.27734375, -0.111328125, 0.0546875, 0.220703125, 0.38671875, 0.552734375, 0.71875, 0.884765625, 1.05078125, 1.216796875, 1.3828125, 1.548828125, 1.71484375, 1.880859375, 2.046875, 2.212890625, 2.37890625, 2.544921875, 2.7109375, 2.876953125, 3.04296875, 3.208984375, 3.375, 3.541015625, 3.70703125, 3.873046875, 4.0390625, 4.205078125, 4.37109375, 4.537109375, 4.703125, 4.869140625, 5.03515625, 5.201171875, 5.3671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 3.0, 3.0, 7.0, 5.0, 12.0, 13.0, 20.0, 22.0, 43.0, 48.0, 97.0, 130.0, 189.0, 125.0, 93.0, 62.0, 31.0, 24.0, 15.0, 20.0, 8.0, 10.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8623046875, -1.7987518310546875, -1.735198974609375, -1.6716461181640625, -1.60809326171875, -1.5445404052734375, -1.480987548828125, -1.4174346923828125, -1.3538818359375, -1.2903289794921875, -1.226776123046875, -1.1632232666015625, -1.09967041015625, -1.0361175537109375, -0.972564697265625, -0.9090118408203125, -0.845458984375, -0.7819061279296875, -0.718353271484375, -0.6548004150390625, -0.59124755859375, -0.5276947021484375, -0.464141845703125, -0.4005889892578125, -0.3370361328125, -0.2734832763671875, -0.209930419921875, -0.1463775634765625, -0.08282470703125, -0.0192718505859375, 0.044281005859375, 0.1078338623046875, 0.17138671875, 0.2349395751953125, 0.298492431640625, 0.3620452880859375, 0.42559814453125, 0.4891510009765625, 0.552703857421875, 0.6162567138671875, 0.6798095703125, 0.7433624267578125, 0.806915283203125, 0.8704681396484375, 0.93402099609375, 0.9975738525390625, 1.061126708984375, 1.1246795654296875, 1.188232421875, 1.2517852783203125, 1.315338134765625, 1.3788909912109375, 1.44244384765625, 1.5059967041015625, 1.569549560546875, 1.6331024169921875, 1.6966552734375, 1.7602081298828125, 1.823760986328125, 1.8873138427734375, 1.95086669921875, 2.0144195556640625, 2.077972412109375, 2.1415252685546875, 2.205078125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 18.0, 46.0, 161.0, 332.0, 272.0, 103.0, 42.0, 15.0, 8.0, 12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.45199584960938, -74.37818145751953, -72.30435943603516, -70.23054504394531, -68.15672302246094, -66.0829086303711, -64.00908660888672, -61.935272216796875, -59.8614501953125, -57.78763198852539, -55.71381378173828, -53.63999557495117, -51.56617736816406, -49.49235916137695, -47.418540954589844, -45.3447265625, -43.27090835571289, -41.19709014892578, -39.12327194213867, -37.04945373535156, -34.97563552856445, -32.901817321777344, -30.828001022338867, -28.754182815551758, -26.68036460876465, -24.60654640197754, -22.53272819519043, -20.458911895751953, -18.385093688964844, -16.311275482177734, -14.237457275390625, -12.163639068603516, -10.089824676513672, -8.016006469726562, -5.942188739776611, -3.86837100982666, -1.7945528030395508, 0.2792654037475586, 2.3530826568603516, 4.426900863647461, 6.50071907043457, 8.57453727722168, 10.648355484008789, 12.722172737121582, 14.795990943908691, 16.869808197021484, 18.943626403808594, 21.017444610595703, 23.091262817382812, 25.165081024169922, 27.23889923095703, 29.31271743774414, 31.38653564453125, 33.46035385131836, 35.53417205810547, 37.60798645019531, 39.68180847167969, 41.7556266784668, 43.829444885253906, 45.903263092041016, 47.977081298828125, 50.050899505615234, 52.124717712402344, 54.19853210449219, 56.2723503112793]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 9.0, 1.0, 10.0, 4.0, 14.0, 19.0, 10.0, 16.0, 22.0, 28.0, 15.0, 29.0, 22.0, 29.0, 30.0, 36.0, 40.0, 27.0, 30.0, 40.0, 33.0, 35.0, 37.0, 42.0, 47.0, 27.0, 31.0, 26.0, 35.0, 34.0, 35.0, 35.0, 20.0, 22.0, 19.0, 13.0, 12.0, 10.0, 12.0, 9.0, 8.0, 7.0, 4.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-21.207210540771484, -20.573505401611328, -19.939802169799805, -19.30609703063965, -18.672393798828125, -18.03868865966797, -17.404985427856445, -16.77128028869629, -16.137577056884766, -15.503872871398926, -14.870168685913086, -14.236464500427246, -13.602760314941406, -12.969056129455566, -12.335351943969727, -11.70164680480957, -11.06794261932373, -10.43423843383789, -9.80053424835205, -9.166830062866211, -8.533125877380371, -7.899421691894531, -7.265717029571533, -6.632012844085693, -5.9983086585998535, -5.364604473114014, -4.730900287628174, -4.097195625305176, -3.463491678237915, -2.829787492752075, -2.1960830688476562, -1.5623788833618164, -0.9286746978759766, -0.29497045278549194, 0.3387337923049927, 0.9724380970001221, 1.606142282485962, 2.2398464679718018, 2.8735508918762207, 3.5072550773620605, 4.1409592628479, 4.77466344833374, 5.40836763381958, 6.042072296142578, 6.675776481628418, 7.309480667114258, 7.943184852600098, 8.576889038085938, 9.210593223571777, 9.844297409057617, 10.478001594543457, 11.111705780029297, 11.745409965515137, 12.379114151000977, 13.012819290161133, 13.646522521972656, 14.280227661132812, 14.913931846618652, 15.547636032104492, 16.18134117126465, 16.815044403076172, 17.448749542236328, 18.08245277404785, 18.716157913208008, 19.34986114501953]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 3.0, 7.0, 6.0, 5.0, 10.0, 12.0, 9.0, 23.0, 21.0, 33.0, 48.0, 75.0, 131.0, 182.0, 281.0, 444.0, 932.0, 2070.0, 4901.0, 15822.0, 122341.0, 3984959.0, 45859.0, 9866.0, 3295.0, 1434.0, 639.0, 353.0, 212.0, 108.0, 73.0, 45.0, 31.0, 20.0, 14.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.828125, -13.501220703125, -13.17431640625, -12.847412109375, -12.5205078125, -12.193603515625, -11.86669921875, -11.539794921875, -11.212890625, -10.885986328125, -10.55908203125, -10.232177734375, -9.9052734375, -9.578369140625, -9.25146484375, -8.924560546875, -8.59765625, -8.270751953125, -7.94384765625, -7.616943359375, -7.2900390625, -6.963134765625, -6.63623046875, -6.309326171875, -5.982421875, -5.655517578125, -5.32861328125, -5.001708984375, -4.6748046875, -4.347900390625, -4.02099609375, -3.694091796875, -3.3671875, -3.040283203125, -2.71337890625, -2.386474609375, -2.0595703125, -1.732666015625, -1.40576171875, -1.078857421875, -0.751953125, -0.425048828125, -0.09814453125, 0.228759765625, 0.5556640625, 0.882568359375, 1.20947265625, 1.536376953125, 1.86328125, 2.190185546875, 2.51708984375, 2.843994140625, 3.1708984375, 3.497802734375, 3.82470703125, 4.151611328125, 4.478515625, 4.805419921875, 5.13232421875, 5.459228515625, 5.7861328125, 6.113037109375, 6.43994140625, 6.766845703125, 7.09375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 6.0, 5.0, 13.0, 14.0, 12.0, 13.0, 29.0, 27.0, 29.0, 28.0, 49.0, 31.0, 37.0, 51.0, 55.0, 65.0, 66.0, 54.0, 57.0, 56.0, 60.0, 42.0, 42.0, 31.0, 24.0, 20.0, 35.0, 12.0, 9.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-1.8974609375, -1.8478240966796875, -1.798187255859375, -1.7485504150390625, -1.69891357421875, -1.6492767333984375, -1.599639892578125, -1.5500030517578125, -1.5003662109375, -1.4507293701171875, -1.401092529296875, -1.3514556884765625, -1.30181884765625, -1.2521820068359375, -1.202545166015625, -1.1529083251953125, -1.103271484375, -1.0536346435546875, -1.003997802734375, -0.9543609619140625, -0.90472412109375, -0.8550872802734375, -0.805450439453125, -0.7558135986328125, -0.7061767578125, -0.6565399169921875, -0.606903076171875, -0.5572662353515625, -0.50762939453125, -0.4579925537109375, -0.408355712890625, -0.3587188720703125, -0.30908203125, -0.2594451904296875, -0.209808349609375, -0.1601715087890625, -0.11053466796875, -0.0608978271484375, -0.011260986328125, 0.0383758544921875, 0.0880126953125, 0.1376495361328125, 0.187286376953125, 0.2369232177734375, 0.28656005859375, 0.3361968994140625, 0.385833740234375, 0.4354705810546875, 0.485107421875, 0.5347442626953125, 0.584381103515625, 0.6340179443359375, 0.68365478515625, 0.7332916259765625, 0.782928466796875, 0.8325653076171875, 0.8822021484375, 0.9318389892578125, 0.981475830078125, 1.0311126708984375, 1.08074951171875, 1.1303863525390625, 1.180023193359375, 1.2296600341796875, 1.279296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 11.0, 16.0, 17.0, 46.0, 67.0, 146.0, 392.0, 1230.0, 4676.0, 26628.0, 3632386.0, 501567.0, 21072.0, 4136.0, 1103.0, 403.0, 162.0, 92.0, 44.0, 33.0, 12.0, 12.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9921875, -8.5823974609375, -8.172607421875, -7.7628173828125, -7.35302734375, -6.9432373046875, -6.533447265625, -6.1236572265625, -5.7138671875, -5.3040771484375, -4.894287109375, -4.4844970703125, -4.07470703125, -3.6649169921875, -3.255126953125, -2.8453369140625, -2.435546875, -2.0257568359375, -1.615966796875, -1.2061767578125, -0.79638671875, -0.3865966796875, 0.023193359375, 0.4329833984375, 0.8427734375, 1.2525634765625, 1.662353515625, 2.0721435546875, 2.48193359375, 2.8917236328125, 3.301513671875, 3.7113037109375, 4.12109375, 4.5308837890625, 4.940673828125, 5.3504638671875, 5.76025390625, 6.1700439453125, 6.579833984375, 6.9896240234375, 7.3994140625, 7.8092041015625, 8.218994140625, 8.6287841796875, 9.03857421875, 9.4483642578125, 9.858154296875, 10.2679443359375, 10.677734375, 11.0875244140625, 11.497314453125, 11.9071044921875, 12.31689453125, 12.7266845703125, 13.136474609375, 13.5462646484375, 13.9560546875, 14.3658447265625, 14.775634765625, 15.1854248046875, 15.59521484375, 16.0050048828125, 16.414794921875, 16.8245849609375, 17.234375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 7.0, 10.0, 9.0, 13.0, 11.0, 29.0, 48.0, 67.0, 206.0, 2780.0, 555.0, 122.0, 55.0, 38.0, 22.0, 17.0, 20.0, 21.0, 10.0, 7.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9912109375, -1.8854522705078125, -1.779693603515625, -1.6739349365234375, -1.56817626953125, -1.4624176025390625, -1.356658935546875, -1.2509002685546875, -1.1451416015625, -1.0393829345703125, -0.933624267578125, -0.8278656005859375, -0.72210693359375, -0.6163482666015625, -0.510589599609375, -0.4048309326171875, -0.299072265625, -0.1933135986328125, -0.087554931640625, 0.0182037353515625, 0.12396240234375, 0.2297210693359375, 0.335479736328125, 0.4412384033203125, 0.5469970703125, 0.6527557373046875, 0.758514404296875, 0.8642730712890625, 0.97003173828125, 1.0757904052734375, 1.181549072265625, 1.2873077392578125, 1.39306640625, 1.4988250732421875, 1.604583740234375, 1.7103424072265625, 1.81610107421875, 1.9218597412109375, 2.027618408203125, 2.1333770751953125, 2.2391357421875, 2.3448944091796875, 2.450653076171875, 2.5564117431640625, 2.66217041015625, 2.7679290771484375, 2.873687744140625, 2.9794464111328125, 3.085205078125, 3.1909637451171875, 3.296722412109375, 3.4024810791015625, 3.50823974609375, 3.6139984130859375, 3.719757080078125, 3.8255157470703125, 3.9312744140625, 4.0370330810546875, 4.142791748046875, 4.2485504150390625, 4.35430908203125, 4.4600677490234375, 4.565826416015625, 4.6715850830078125, 4.77734375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 16.0, 141.0, 549.0, 234.0, 49.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.888368606567383, -17.388874053955078, -15.889381408691406, -14.389886856079102, -12.890393257141113, -11.390899658203125, -9.89140510559082, -8.391911506652832, -6.892417907714844, -5.3929243087768555, -3.893430233001709, -2.3939361572265625, -0.8944425582885742, 0.6050510406494141, 2.1045455932617188, 3.604039192199707, 5.103532791137695, 6.603026390075684, 8.102519989013672, 9.602014541625977, 11.101508140563965, 12.601001739501953, 14.100496292114258, 15.599989891052246, 17.099483489990234, 18.59897804260254, 20.09847068786621, 21.597965240478516, 23.097457885742188, 24.596952438354492, 26.096446990966797, 27.59593963623047, 29.095436096191406, 30.59493064880371, 32.094425201416016, 33.59391784667969, 35.09341049194336, 36.59290313720703, 38.09239959716797, 39.59189224243164, 41.09138488769531, 42.590877532958984, 44.09037399291992, 45.589866638183594, 47.089359283447266, 48.58885192871094, 50.088348388671875, 51.58784103393555, 53.087337493896484, 54.586830139160156, 56.086326599121094, 57.585819244384766, 59.08531188964844, 60.584808349609375, 62.08430099487305, 63.58379364013672, 65.08329010009766, 66.5827865600586, 68.082275390625, 69.58177185058594, 71.08126831054688, 72.58075714111328, 74.08025360107422, 75.57975006103516, 77.07923889160156]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 10.0, 17.0, 29.0, 21.0, 35.0, 34.0, 51.0, 49.0, 52.0, 60.0, 72.0, 59.0, 66.0, 69.0, 58.0, 56.0, 48.0, 53.0, 40.0, 36.0, 15.0, 25.0, 15.0, 3.0, 7.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.459957122802734, -11.08094596862793, -10.701934814453125, -10.322922706604004, -9.9439115524292, -9.564900398254395, -9.185888290405273, -8.806877136230469, -8.427865982055664, -8.04885482788086, -7.6698431968688965, -7.290831565856934, -6.911820411682129, -6.532809257507324, -6.153797626495361, -5.774785995483398, -5.395774841308594, -5.016763687133789, -4.637752056121826, -4.258740425109863, -3.8797292709350586, -3.500717878341675, -3.121706485748291, -2.7426950931549072, -2.3636837005615234, -1.9846723079681396, -1.6056609153747559, -1.226649522781372, -0.8476381301879883, -0.4686267375946045, -0.0896153450012207, 0.2893960475921631, 0.6684074401855469, 1.0474188327789307, 1.4264302253723145, 1.8054416179656982, 2.184453010559082, 2.563464403152466, 2.9424757957458496, 3.3214871883392334, 3.700498580932617, 4.079509735107422, 4.458521366119385, 4.837532997131348, 5.216544151306152, 5.595555305480957, 5.97456693649292, 6.353578567504883, 6.7325897216796875, 7.111600875854492, 7.490612506866455, 7.869624137878418, 8.248635292053223, 8.627646446228027, 9.006658554077148, 9.385669708251953, 9.764680862426758, 10.143692016601562, 10.522703170776367, 10.901715278625488, 11.280726432800293, 11.659737586975098, 12.038749694824219, 12.417760848999023, 12.796772003173828]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 5.0, 8.0, 8.0, 6.0, 13.0, 18.0, 30.0, 32.0, 56.0, 87.0, 148.0, 240.0, 423.0, 774.0, 1693.0, 3551.0, 8483.0, 22823.0, 72149.0, 282353.0, 467582.0, 128276.0, 37042.0, 12871.0, 5088.0, 2294.0, 1102.0, 590.0, 287.0, 189.0, 117.0, 71.0, 41.0, 33.0, 19.0, 12.0, 12.0, 5.0, 3.0, 9.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.6036376953125, -5.418212890625, -5.2327880859375, -5.04736328125, -4.8619384765625, -4.676513671875, -4.4910888671875, -4.3056640625, -4.1202392578125, -3.934814453125, -3.7493896484375, -3.56396484375, -3.3785400390625, -3.193115234375, -3.0076904296875, -2.822265625, -2.6368408203125, -2.451416015625, -2.2659912109375, -2.08056640625, -1.8951416015625, -1.709716796875, -1.5242919921875, -1.3388671875, -1.1534423828125, -0.968017578125, -0.7825927734375, -0.59716796875, -0.4117431640625, -0.226318359375, -0.0408935546875, 0.14453125, 0.3299560546875, 0.515380859375, 0.7008056640625, 0.88623046875, 1.0716552734375, 1.257080078125, 1.4425048828125, 1.6279296875, 1.8133544921875, 1.998779296875, 2.1842041015625, 2.36962890625, 2.5550537109375, 2.740478515625, 2.9259033203125, 3.111328125, 3.2967529296875, 3.482177734375, 3.6676025390625, 3.85302734375, 4.0384521484375, 4.223876953125, 4.4093017578125, 4.5947265625, 4.7801513671875, 4.965576171875, 5.1510009765625, 5.33642578125, 5.5218505859375, 5.707275390625, 5.8927001953125, 6.078125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 16.0, 20.0, 21.0, 21.0, 26.0, 28.0, 36.0, 42.0, 47.0, 53.0, 54.0, 46.0, 68.0, 74.0, 56.0, 66.0, 62.0, 57.0, 39.0, 34.0, 29.0, 30.0, 25.0, 12.0, 7.0, 5.0, 4.0, 5.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0078125, -1.9501190185546875, -1.892425537109375, -1.8347320556640625, -1.77703857421875, -1.7193450927734375, -1.661651611328125, -1.6039581298828125, -1.5462646484375, -1.4885711669921875, -1.430877685546875, -1.3731842041015625, -1.31549072265625, -1.2577972412109375, -1.200103759765625, -1.1424102783203125, -1.084716796875, -1.0270233154296875, -0.969329833984375, -0.9116363525390625, -0.85394287109375, -0.7962493896484375, -0.738555908203125, -0.6808624267578125, -0.6231689453125, -0.5654754638671875, -0.507781982421875, -0.4500885009765625, -0.39239501953125, -0.3347015380859375, -0.277008056640625, -0.2193145751953125, -0.16162109375, -0.1039276123046875, -0.046234130859375, 0.0114593505859375, 0.06915283203125, 0.1268463134765625, 0.184539794921875, 0.2422332763671875, 0.2999267578125, 0.3576202392578125, 0.415313720703125, 0.4730072021484375, 0.53070068359375, 0.5883941650390625, 0.646087646484375, 0.7037811279296875, 0.761474609375, 0.8191680908203125, 0.876861572265625, 0.9345550537109375, 0.99224853515625, 1.0499420166015625, 1.107635498046875, 1.1653289794921875, 1.2230224609375, 1.2807159423828125, 1.338409423828125, 1.3961029052734375, 1.45379638671875, 1.5114898681640625, 1.569183349609375, 1.6268768310546875, 1.6845703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 3.0, 5.0, 4.0, 7.0, 9.0, 12.0, 6.0, 10.0, 22.0, 38.0, 39.0, 58.0, 78.0, 149.0, 252.0, 573.0, 1319.0, 3759.0, 13578.0, 67147.0, 503760.0, 388514.0, 52259.0, 11156.0, 3404.0, 1212.0, 462.0, 248.0, 161.0, 96.0, 57.0, 41.0, 34.0, 20.0, 14.0, 8.0, 9.0, 5.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.68359375, -6.45257568359375, -6.2215576171875, -5.99053955078125, -5.759521484375, -5.52850341796875, -5.2974853515625, -5.06646728515625, -4.83544921875, -4.60443115234375, -4.3734130859375, -4.14239501953125, -3.911376953125, -3.68035888671875, -3.4493408203125, -3.21832275390625, -2.9873046875, -2.75628662109375, -2.5252685546875, -2.29425048828125, -2.063232421875, -1.83221435546875, -1.6011962890625, -1.37017822265625, -1.13916015625, -0.90814208984375, -0.6771240234375, -0.44610595703125, -0.215087890625, 0.01593017578125, 0.2469482421875, 0.47796630859375, 0.708984375, 0.94000244140625, 1.1710205078125, 1.40203857421875, 1.633056640625, 1.86407470703125, 2.0950927734375, 2.32611083984375, 2.55712890625, 2.78814697265625, 3.0191650390625, 3.25018310546875, 3.481201171875, 3.71221923828125, 3.9432373046875, 4.17425537109375, 4.4052734375, 4.63629150390625, 4.8673095703125, 5.09832763671875, 5.329345703125, 5.56036376953125, 5.7913818359375, 6.02239990234375, 6.25341796875, 6.48443603515625, 6.7154541015625, 6.94647216796875, 7.177490234375, 7.40850830078125, 7.6395263671875, 7.87054443359375, 8.1015625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 15.0, 7.0, 14.0, 23.0, 19.0, 22.0, 44.0, 51.0, 59.0, 47.0, 66.0, 54.0, 51.0, 59.0, 61.0, 45.0, 47.0, 39.0, 53.0, 29.0, 32.0, 35.0, 19.0, 22.0, 23.0, 7.0, 11.0, 5.0, 5.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.18359375, -6.90997314453125, -6.6363525390625, -6.36273193359375, -6.089111328125, -5.81549072265625, -5.5418701171875, -5.26824951171875, -4.99462890625, -4.72100830078125, -4.4473876953125, -4.17376708984375, -3.900146484375, -3.62652587890625, -3.3529052734375, -3.07928466796875, -2.8056640625, -2.53204345703125, -2.2584228515625, -1.98480224609375, -1.711181640625, -1.43756103515625, -1.1639404296875, -0.89031982421875, -0.61669921875, -0.34307861328125, -0.0694580078125, 0.20416259765625, 0.477783203125, 0.75140380859375, 1.0250244140625, 1.29864501953125, 1.572265625, 1.84588623046875, 2.1195068359375, 2.39312744140625, 2.666748046875, 2.94036865234375, 3.2139892578125, 3.48760986328125, 3.76123046875, 4.03485107421875, 4.3084716796875, 4.58209228515625, 4.855712890625, 5.12933349609375, 5.4029541015625, 5.67657470703125, 5.9501953125, 6.22381591796875, 6.4974365234375, 6.77105712890625, 7.044677734375, 7.31829833984375, 7.5919189453125, 7.86553955078125, 8.13916015625, 8.41278076171875, 8.6864013671875, 8.96002197265625, 9.233642578125, 9.50726318359375, 9.7808837890625, 10.05450439453125, 10.328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 11.0, 7.0, 24.0, 45.0, 80.0, 161.0, 610.0, 2160.0, 12687.0, 408990.0, 605883.0, 14414.0, 2436.0, 629.0, 210.0, 81.0, 51.0, 27.0, 10.0, 9.0, 6.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.13671875, -4.88031005859375, -4.6239013671875, -4.36749267578125, -4.111083984375, -3.85467529296875, -3.5982666015625, -3.34185791015625, -3.08544921875, -2.82904052734375, -2.5726318359375, -2.31622314453125, -2.059814453125, -1.80340576171875, -1.5469970703125, -1.29058837890625, -1.0341796875, -0.77777099609375, -0.5213623046875, -0.26495361328125, -0.008544921875, 0.24786376953125, 0.5042724609375, 0.76068115234375, 1.01708984375, 1.27349853515625, 1.5299072265625, 1.78631591796875, 2.042724609375, 2.29913330078125, 2.5555419921875, 2.81195068359375, 3.068359375, 3.32476806640625, 3.5811767578125, 3.83758544921875, 4.093994140625, 4.35040283203125, 4.6068115234375, 4.86322021484375, 5.11962890625, 5.37603759765625, 5.6324462890625, 5.88885498046875, 6.145263671875, 6.40167236328125, 6.6580810546875, 6.91448974609375, 7.1708984375, 7.42730712890625, 7.6837158203125, 7.94012451171875, 8.196533203125, 8.45294189453125, 8.7093505859375, 8.96575927734375, 9.22216796875, 9.47857666015625, 9.7349853515625, 9.99139404296875, 10.247802734375, 10.50421142578125, 10.7606201171875, 11.01702880859375, 11.2734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 3.0, 5.0, 12.0, 25.0, 26.0, 49.0, 81.0, 114.0, 191.0, 193.0, 103.0, 62.0, 39.0, 31.0, 18.0, 15.0, 11.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007390975952148438, -0.0007210709154605865, -0.0007030442357063293, -0.0006850175559520721, -0.0006669908761978149, -0.0006489641964435577, -0.0006309375166893005, -0.0006129108369350433, -0.0005948841571807861, -0.0005768574774265289, -0.0005588307976722717, -0.0005408041179180145, -0.0005227774381637573, -0.0005047507584095001, -0.0004867240786552429, -0.0004686973989009857, -0.0004506707191467285, -0.0004326440393924713, -0.0004146173596382141, -0.0003965906798839569, -0.0003785640001296997, -0.0003605373203754425, -0.0003425106406211853, -0.0003244839608669281, -0.0003064572811126709, -0.0002884306013584137, -0.0002704039216041565, -0.0002523772418498993, -0.0002343505620956421, -0.0002163238823413849, -0.00019829720258712769, -0.00018027052283287048, -0.00016224384307861328, -0.00014421716332435608, -0.00012619048357009888, -0.00010816380381584167, -9.013712406158447e-05, -7.211044430732727e-05, -5.408376455307007e-05, -3.6057084798812866e-05, -1.8030405044555664e-05, -3.725290298461914e-09, 1.802295446395874e-05, 3.604963421821594e-05, 5.4076313972473145e-05, 7.210299372673035e-05, 9.012967348098755e-05, 0.00010815635323524475, 0.00012618303298950195, 0.00014420971274375916, 0.00016223639249801636, 0.00018026307225227356, 0.00019828975200653076, 0.00021631643176078796, 0.00023434311151504517, 0.00025236979126930237, 0.00027039647102355957, 0.00028842315077781677, 0.000306449830532074, 0.0003244765102863312, 0.0003425031900405884, 0.0003605298697948456, 0.0003785565495491028, 0.00039658322930336, 0.0004146099090576172]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 3.0, 14.0, 18.0, 26.0, 66.0, 145.0, 314.0, 827.0, 2516.0, 10932.0, 595724.0, 424268.0, 9900.0, 2400.0, 823.0, 318.0, 104.0, 63.0, 40.0, 22.0, 12.0, 9.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.875, -11.5538330078125, -11.232666015625, -10.9114990234375, -10.59033203125, -10.2691650390625, -9.947998046875, -9.6268310546875, -9.3056640625, -8.9844970703125, -8.663330078125, -8.3421630859375, -8.02099609375, -7.6998291015625, -7.378662109375, -7.0574951171875, -6.736328125, -6.4151611328125, -6.093994140625, -5.7728271484375, -5.45166015625, -5.1304931640625, -4.809326171875, -4.4881591796875, -4.1669921875, -3.8458251953125, -3.524658203125, -3.2034912109375, -2.88232421875, -2.5611572265625, -2.239990234375, -1.9188232421875, -1.59765625, -1.2764892578125, -0.955322265625, -0.6341552734375, -0.31298828125, 0.0081787109375, 0.329345703125, 0.6505126953125, 0.9716796875, 1.2928466796875, 1.614013671875, 1.9351806640625, 2.25634765625, 2.5775146484375, 2.898681640625, 3.2198486328125, 3.541015625, 3.8621826171875, 4.183349609375, 4.5045166015625, 4.82568359375, 5.1468505859375, 5.468017578125, 5.7891845703125, 6.1103515625, 6.4315185546875, 6.752685546875, 7.0738525390625, 7.39501953125, 7.7161865234375, 8.037353515625, 8.3585205078125, 8.6796875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 7.0, 8.0, 17.0, 25.0, 42.0, 104.0, 197.0, 212.0, 175.0, 90.0, 46.0, 20.0, 12.0, 9.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.046875, -7.84210205078125, -7.6373291015625, -7.43255615234375, -7.227783203125, -7.02301025390625, -6.8182373046875, -6.61346435546875, -6.40869140625, -6.20391845703125, -5.9991455078125, -5.79437255859375, -5.589599609375, -5.38482666015625, -5.1800537109375, -4.97528076171875, -4.7705078125, -4.56573486328125, -4.3609619140625, -4.15618896484375, -3.951416015625, -3.74664306640625, -3.5418701171875, -3.33709716796875, -3.13232421875, -2.92755126953125, -2.7227783203125, -2.51800537109375, -2.313232421875, -2.10845947265625, -1.9036865234375, -1.69891357421875, -1.494140625, -1.28936767578125, -1.0845947265625, -0.87982177734375, -0.675048828125, -0.47027587890625, -0.2655029296875, -0.06072998046875, 0.14404296875, 0.34881591796875, 0.5535888671875, 0.75836181640625, 0.963134765625, 1.16790771484375, 1.3726806640625, 1.57745361328125, 1.7822265625, 1.98699951171875, 2.1917724609375, 2.39654541015625, 2.601318359375, 2.80609130859375, 3.0108642578125, 3.21563720703125, 3.42041015625, 3.62518310546875, 3.8299560546875, 4.03472900390625, 4.239501953125, 4.44427490234375, 4.6490478515625, 4.85382080078125, 5.05859375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 7.0, 27.0, 112.0, 376.0, 350.0, 104.0, 22.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-273.4786376953125, -268.4112854003906, -263.3439636230469, -258.276611328125, -253.20928955078125, -248.14193725585938, -243.07460021972656, -238.00726318359375, -232.93992614746094, -227.87258911132812, -222.8052520751953, -217.7379150390625, -212.67056274414062, -207.6032257080078, -202.535888671875, -197.4685516357422, -192.40121459960938, -187.33387756347656, -182.26654052734375, -177.19920349121094, -172.13186645507812, -167.06451416015625, -161.99717712402344, -156.92984008789062, -151.8625030517578, -146.795166015625, -141.7278289794922, -136.66049194335938, -131.5931396484375, -126.52581024169922, -121.45846557617188, -116.39112854003906, -111.32379150390625, -106.25645446777344, -101.18911743164062, -96.12177276611328, -91.05443572998047, -85.98709869384766, -80.91975402832031, -75.8524169921875, -70.78507995605469, -65.71774291992188, -60.6504020690918, -55.58306121826172, -50.515724182128906, -45.448387145996094, -40.381046295166016, -35.31370544433594, -30.24637222290039, -25.179033279418945, -20.1116943359375, -15.044355392456055, -9.97701644897461, -4.909677505493164, 0.15766143798828125, 5.225002288818359, 10.292339324951172, 15.359678268432617, 20.427017211914062, 25.494356155395508, 30.561695098876953, 35.62903594970703, 40.696372985839844, 45.76371383666992, 50.831050872802734]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 6.0, 5.0, 6.0, 10.0, 6.0, 15.0, 13.0, 9.0, 17.0, 24.0, 28.0, 27.0, 25.0, 41.0, 26.0, 30.0, 42.0, 39.0, 51.0, 44.0, 43.0, 41.0, 38.0, 49.0, 40.0, 34.0, 27.0, 38.0, 29.0, 33.0, 31.0, 18.0, 17.0, 17.0, 14.0, 13.0, 12.0, 14.0, 7.0, 3.0, 3.0, 6.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.04365921020508, -40.749080657958984, -39.45450210571289, -38.1599235534668, -36.86534881591797, -35.570770263671875, -34.27619171142578, -32.98161315917969, -31.687034606933594, -30.3924560546875, -29.097877502441406, -27.803300857543945, -26.50872230529785, -25.214143753051758, -23.919567108154297, -22.624988555908203, -21.33041000366211, -20.035831451416016, -18.741252899169922, -17.44667625427246, -16.152097702026367, -14.857519149780273, -13.562941551208496, -12.268363952636719, -10.973785400390625, -9.679206848144531, -8.384629249572754, -7.090051174163818, -5.795473098754883, -4.500895023345947, -3.2063169479370117, -1.9117393493652344, -0.6171646118164062, 0.6774134635925293, 1.9719915390014648, 3.2665696144104004, 4.561147689819336, 5.8557257652282715, 7.150303840637207, 8.444881439208984, 9.739459991455078, 11.034038543701172, 12.32861614227295, 13.623193740844727, 14.91777229309082, 16.212350845336914, 17.506927490234375, 18.80150604248047, 20.096084594726562, 21.390663146972656, 22.68524169921875, 23.97981834411621, 25.274396896362305, 26.5689754486084, 27.86355209350586, 29.158130645751953, 30.452709197998047, 31.74728775024414, 33.041866302490234, 34.33644485473633, 35.631019592285156, 36.92559814453125, 38.220176696777344, 39.51475524902344, 40.80933380126953]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 8.0, 2.0, 5.0, 4.0, 5.0, 10.0, 17.0, 18.0, 15.0, 28.0, 32.0, 51.0, 78.0, 116.0, 167.0, 312.0, 477.0, 857.0, 1489.0, 2837.0, 6100.0, 15277.0, 54169.0, 3418669.0, 623466.0, 45116.0, 13344.0, 5644.0, 2698.0, 1363.0, 778.0, 404.0, 250.0, 170.0, 99.0, 64.0, 43.0, 32.0, 25.0, 10.0, 11.0, 8.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.5078125, -9.24322509765625, -8.9786376953125, -8.71405029296875, -8.449462890625, -8.18487548828125, -7.9202880859375, -7.65570068359375, -7.39111328125, -7.12652587890625, -6.8619384765625, -6.59735107421875, -6.332763671875, -6.06817626953125, -5.8035888671875, -5.53900146484375, -5.2744140625, -5.00982666015625, -4.7452392578125, -4.48065185546875, -4.216064453125, -3.95147705078125, -3.6868896484375, -3.42230224609375, -3.15771484375, -2.89312744140625, -2.6285400390625, -2.36395263671875, -2.099365234375, -1.83477783203125, -1.5701904296875, -1.30560302734375, -1.041015625, -0.77642822265625, -0.5118408203125, -0.24725341796875, 0.017333984375, 0.28192138671875, 0.5465087890625, 0.81109619140625, 1.07568359375, 1.34027099609375, 1.6048583984375, 1.86944580078125, 2.134033203125, 2.39862060546875, 2.6632080078125, 2.92779541015625, 3.1923828125, 3.45697021484375, 3.7215576171875, 3.98614501953125, 4.250732421875, 4.51531982421875, 4.7799072265625, 5.04449462890625, 5.30908203125, 5.57366943359375, 5.8382568359375, 6.10284423828125, 6.367431640625, 6.63201904296875, 6.8966064453125, 7.16119384765625, 7.42578125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 5.0, 12.0, 9.0, 23.0, 15.0, 17.0, 29.0, 27.0, 29.0, 34.0, 42.0, 43.0, 40.0, 63.0, 43.0, 56.0, 57.0, 66.0, 47.0, 54.0, 41.0, 38.0, 38.0, 30.0, 20.0, 26.0, 14.0, 20.0, 10.0, 5.0, 9.0, 7.0, 9.0, 5.0, 6.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.154296875, -2.0908203125, -2.02734375, -1.9638671875, -1.900390625, -1.8369140625, -1.7734375, -1.7099609375, -1.646484375, -1.5830078125, -1.51953125, -1.4560546875, -1.392578125, -1.3291015625, -1.265625, -1.2021484375, -1.138671875, -1.0751953125, -1.01171875, -0.9482421875, -0.884765625, -0.8212890625, -0.7578125, -0.6943359375, -0.630859375, -0.5673828125, -0.50390625, -0.4404296875, -0.376953125, -0.3134765625, -0.25, -0.1865234375, -0.123046875, -0.0595703125, 0.00390625, 0.0673828125, 0.130859375, 0.1943359375, 0.2578125, 0.3212890625, 0.384765625, 0.4482421875, 0.51171875, 0.5751953125, 0.638671875, 0.7021484375, 0.765625, 0.8291015625, 0.892578125, 0.9560546875, 1.01953125, 1.0830078125, 1.146484375, 1.2099609375, 1.2734375, 1.3369140625, 1.400390625, 1.4638671875, 1.52734375, 1.5908203125, 1.654296875, 1.7177734375, 1.78125, 1.8447265625, 1.908203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 2.0, 4.0, 9.0, 15.0, 17.0, 36.0, 78.0, 129.0, 240.0, 618.0, 1535.0, 4202.0, 13363.0, 52642.0, 851526.0, 3185151.0, 62076.0, 15096.0, 4637.0, 1657.0, 638.0, 273.0, 146.0, 82.0, 31.0, 26.0, 10.0, 11.0, 5.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.5286865234375, -8.244873046875, -7.9610595703125, -7.67724609375, -7.3934326171875, -7.109619140625, -6.8258056640625, -6.5419921875, -6.2581787109375, -5.974365234375, -5.6905517578125, -5.40673828125, -5.1229248046875, -4.839111328125, -4.5552978515625, -4.271484375, -3.9876708984375, -3.703857421875, -3.4200439453125, -3.13623046875, -2.8524169921875, -2.568603515625, -2.2847900390625, -2.0009765625, -1.7171630859375, -1.433349609375, -1.1495361328125, -0.86572265625, -0.5819091796875, -0.298095703125, -0.0142822265625, 0.26953125, 0.5533447265625, 0.837158203125, 1.1209716796875, 1.40478515625, 1.6885986328125, 1.972412109375, 2.2562255859375, 2.5400390625, 2.8238525390625, 3.107666015625, 3.3914794921875, 3.67529296875, 3.9591064453125, 4.242919921875, 4.5267333984375, 4.810546875, 5.0943603515625, 5.378173828125, 5.6619873046875, 5.94580078125, 6.2296142578125, 6.513427734375, 6.7972412109375, 7.0810546875, 7.3648681640625, 7.648681640625, 7.9324951171875, 8.21630859375, 8.5001220703125, 8.783935546875, 9.0677490234375, 9.3515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 2.0, 9.0, 15.0, 16.0, 19.0, 18.0, 31.0, 37.0, 55.0, 91.0, 256.0, 2543.0, 548.0, 147.0, 77.0, 48.0, 38.0, 28.0, 20.0, 20.0, 4.0, 9.0, 1.0, 9.0, 5.0, 10.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.74609375, -4.6168212890625, -4.487548828125, -4.3582763671875, -4.22900390625, -4.0997314453125, -3.970458984375, -3.8411865234375, -3.7119140625, -3.5826416015625, -3.453369140625, -3.3240966796875, -3.19482421875, -3.0655517578125, -2.936279296875, -2.8070068359375, -2.677734375, -2.5484619140625, -2.419189453125, -2.2899169921875, -2.16064453125, -2.0313720703125, -1.902099609375, -1.7728271484375, -1.6435546875, -1.5142822265625, -1.385009765625, -1.2557373046875, -1.12646484375, -0.9971923828125, -0.867919921875, -0.7386474609375, -0.609375, -0.4801025390625, -0.350830078125, -0.2215576171875, -0.09228515625, 0.0369873046875, 0.166259765625, 0.2955322265625, 0.4248046875, 0.5540771484375, 0.683349609375, 0.8126220703125, 0.94189453125, 1.0711669921875, 1.200439453125, 1.3297119140625, 1.458984375, 1.5882568359375, 1.717529296875, 1.8468017578125, 1.97607421875, 2.1053466796875, 2.234619140625, 2.3638916015625, 2.4931640625, 2.6224365234375, 2.751708984375, 2.8809814453125, 3.01025390625, 3.1395263671875, 3.268798828125, 3.3980712890625, 3.52734375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 2.0, 10.0, 18.0, 30.0, 30.0, 85.0, 108.0, 145.0, 159.0, 143.0, 102.0, 70.0, 28.0, 27.0, 17.0, 10.0, 4.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.773128509521484, -14.130102157592773, -13.487074851989746, -12.844048500061035, -12.201021194458008, -11.557994842529297, -10.914968490600586, -10.271941184997559, -9.628913879394531, -8.98588752746582, -8.342860221862793, -7.699833869934082, -7.056806564331055, -6.413780212402344, -5.770753383636475, -5.1277265548706055, -4.4847002029418945, -3.8416733741760254, -3.1986465454101562, -2.555619955062866, -1.912593126296997, -1.269566297531128, -0.6265397071838379, 0.01648712158203125, 0.6595139503479004, 1.3025407791137695, 1.9455674886703491, 2.5885941982269287, 3.231621026992798, 3.874647855758667, 4.517674446105957, 5.160701274871826, 5.803728103637695, 6.4467549324035645, 7.089781761169434, 7.7328081130981445, 8.375835418701172, 9.018861770629883, 9.661888122558594, 10.304915428161621, 10.947942733764648, 11.59096908569336, 12.233996391296387, 12.877022743225098, 13.520050048828125, 14.163076400756836, 14.806102752685547, 15.449130058288574, 16.09215545654297, 16.73518180847168, 17.37820816040039, 18.021236419677734, 18.664262771606445, 19.307289123535156, 19.950315475463867, 20.593341827392578, 21.236370086669922, 21.879396438598633, 22.522422790527344, 23.165451049804688, 23.8084774017334, 24.45150375366211, 25.09453010559082, 25.73755645751953, 26.380584716796875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 11.0, 16.0, 9.0, 14.0, 19.0, 6.0, 27.0, 29.0, 37.0, 41.0, 26.0, 48.0, 42.0, 41.0, 42.0, 46.0, 55.0, 55.0, 38.0, 40.0, 39.0, 37.0, 44.0, 40.0, 32.0, 28.0, 18.0, 21.0, 19.0, 12.0, 15.0, 9.0, 14.0, 8.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.372135162353516, -12.018607139587402, -11.665079116821289, -11.311551094055176, -10.958023071289062, -10.604494094848633, -10.25096607208252, -9.897438049316406, -9.543910026550293, -9.19038200378418, -8.836853981018066, -8.483325958251953, -8.129796981811523, -7.776269435882568, -7.422740936279297, -7.069212913513184, -6.71568489074707, -6.362156867980957, -6.008628845214844, -5.655100345611572, -5.301572322845459, -4.948044300079346, -4.594515800476074, -4.240987777709961, -3.8874597549438477, -3.5339317321777344, -3.180403470993042, -2.8268752098083496, -2.4733471870422363, -2.119819164276123, -1.7662909030914307, -1.4127626419067383, -1.059234619140625, -0.7057064771652222, -0.35217833518981934, 0.001349806785583496, 0.35487794876098633, 0.7084060907363892, 1.061934232711792, 1.4154624938964844, 1.7689905166625977, 2.122518539428711, 2.4760468006134033, 2.8295750617980957, 3.183103084564209, 3.5366311073303223, 3.8901593685150146, 4.243687629699707, 4.59721565246582, 4.950743675231934, 5.304271697998047, 5.657800197601318, 6.011328220367432, 6.364856243133545, 6.718384742736816, 7.07191276550293, 7.425440788269043, 7.778968811035156, 8.13249683380127, 8.486024856567383, 8.839553833007812, 9.193081855773926, 9.546609878540039, 9.900137901306152, 10.253665924072266]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 12.0, 19.0, 25.0, 40.0, 66.0, 91.0, 122.0, 181.0, 306.0, 479.0, 784.0, 1392.0, 2506.0, 4863.0, 10040.0, 21601.0, 52698.0, 150715.0, 378893.0, 268016.0, 90829.0, 34812.0, 14757.0, 6991.0, 3598.0, 1938.0, 1131.0, 610.0, 359.0, 219.0, 160.0, 81.0, 67.0, 36.0, 26.0, 21.0, 20.0, 11.0, 8.0, 10.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0], "bins": [-6.82421875, -6.6334228515625, -6.442626953125, -6.2518310546875, -6.06103515625, -5.8702392578125, -5.679443359375, -5.4886474609375, -5.2978515625, -5.1070556640625, -4.916259765625, -4.7254638671875, -4.53466796875, -4.3438720703125, -4.153076171875, -3.9622802734375, -3.771484375, -3.5806884765625, -3.389892578125, -3.1990966796875, -3.00830078125, -2.8175048828125, -2.626708984375, -2.4359130859375, -2.2451171875, -2.0543212890625, -1.863525390625, -1.6727294921875, -1.48193359375, -1.2911376953125, -1.100341796875, -0.9095458984375, -0.71875, -0.5279541015625, -0.337158203125, -0.1463623046875, 0.04443359375, 0.2352294921875, 0.426025390625, 0.6168212890625, 0.8076171875, 0.9984130859375, 1.189208984375, 1.3800048828125, 1.57080078125, 1.7615966796875, 1.952392578125, 2.1431884765625, 2.333984375, 2.5247802734375, 2.715576171875, 2.9063720703125, 3.09716796875, 3.2879638671875, 3.478759765625, 3.6695556640625, 3.8603515625, 4.0511474609375, 4.241943359375, 4.4327392578125, 4.62353515625, 4.8143310546875, 5.005126953125, 5.1959228515625, 5.38671875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 7.0, 6.0, 9.0, 17.0, 10.0, 15.0, 25.0, 26.0, 20.0, 32.0, 31.0, 36.0, 48.0, 38.0, 47.0, 44.0, 51.0, 51.0, 50.0, 67.0, 58.0, 46.0, 32.0, 37.0, 29.0, 30.0, 26.0, 27.0, 13.0, 7.0, 11.0, 10.0, 5.0, 5.0, 9.0, 7.0, 2.0, 4.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.08203125, -2.0212249755859375, -1.960418701171875, -1.8996124267578125, -1.83880615234375, -1.7779998779296875, -1.717193603515625, -1.6563873291015625, -1.5955810546875, -1.5347747802734375, -1.473968505859375, -1.4131622314453125, -1.35235595703125, -1.2915496826171875, -1.230743408203125, -1.1699371337890625, -1.109130859375, -1.0483245849609375, -0.987518310546875, -0.9267120361328125, -0.86590576171875, -0.8050994873046875, -0.744293212890625, -0.6834869384765625, -0.6226806640625, -0.5618743896484375, -0.501068115234375, -0.4402618408203125, -0.37945556640625, -0.3186492919921875, -0.257843017578125, -0.1970367431640625, -0.13623046875, -0.0754241943359375, -0.014617919921875, 0.0461883544921875, 0.10699462890625, 0.1678009033203125, 0.228607177734375, 0.2894134521484375, 0.3502197265625, 0.4110260009765625, 0.471832275390625, 0.5326385498046875, 0.59344482421875, 0.6542510986328125, 0.715057373046875, 0.7758636474609375, 0.836669921875, 0.8974761962890625, 0.958282470703125, 1.0190887451171875, 1.07989501953125, 1.1407012939453125, 1.201507568359375, 1.2623138427734375, 1.3231201171875, 1.3839263916015625, 1.444732666015625, 1.5055389404296875, 1.56634521484375, 1.6271514892578125, 1.687957763671875, 1.7487640380859375, 1.8095703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 5.0, 6.0, 7.0, 6.0, 14.0, 14.0, 18.0, 21.0, 38.0, 37.0, 51.0, 106.0, 174.0, 365.0, 889.0, 2357.0, 8573.0, 37842.0, 281279.0, 604951.0, 88889.0, 16177.0, 4187.0, 1430.0, 510.0, 212.0, 125.0, 78.0, 54.0, 38.0, 30.0, 16.0, 11.0, 8.0, 9.0, 6.0, 7.0, 2.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6875, -9.3560791015625, -9.024658203125, -8.6932373046875, -8.36181640625, -8.0303955078125, -7.698974609375, -7.3675537109375, -7.0361328125, -6.7047119140625, -6.373291015625, -6.0418701171875, -5.71044921875, -5.3790283203125, -5.047607421875, -4.7161865234375, -4.384765625, -4.0533447265625, -3.721923828125, -3.3905029296875, -3.05908203125, -2.7276611328125, -2.396240234375, -2.0648193359375, -1.7333984375, -1.4019775390625, -1.070556640625, -0.7391357421875, -0.40771484375, -0.0762939453125, 0.255126953125, 0.5865478515625, 0.91796875, 1.2493896484375, 1.580810546875, 1.9122314453125, 2.24365234375, 2.5750732421875, 2.906494140625, 3.2379150390625, 3.5693359375, 3.9007568359375, 4.232177734375, 4.5635986328125, 4.89501953125, 5.2264404296875, 5.557861328125, 5.8892822265625, 6.220703125, 6.5521240234375, 6.883544921875, 7.2149658203125, 7.54638671875, 7.8778076171875, 8.209228515625, 8.5406494140625, 8.8720703125, 9.2034912109375, 9.534912109375, 9.8663330078125, 10.19775390625, 10.5291748046875, 10.860595703125, 11.1920166015625, 11.5234375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 0.0, 6.0, 11.0, 7.0, 9.0, 6.0, 12.0, 17.0, 20.0, 18.0, 19.0, 29.0, 32.0, 33.0, 51.0, 58.0, 46.0, 57.0, 59.0, 63.0, 53.0, 39.0, 50.0, 36.0, 45.0, 40.0, 36.0, 36.0, 20.0, 16.0, 13.0, 13.0, 8.0, 14.0, 5.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.9453125, -12.5782470703125, -12.211181640625, -11.8441162109375, -11.47705078125, -11.1099853515625, -10.742919921875, -10.3758544921875, -10.0087890625, -9.6417236328125, -9.274658203125, -8.9075927734375, -8.54052734375, -8.1734619140625, -7.806396484375, -7.4393310546875, -7.072265625, -6.7052001953125, -6.338134765625, -5.9710693359375, -5.60400390625, -5.2369384765625, -4.869873046875, -4.5028076171875, -4.1357421875, -3.7686767578125, -3.401611328125, -3.0345458984375, -2.66748046875, -2.3004150390625, -1.933349609375, -1.5662841796875, -1.19921875, -0.8321533203125, -0.465087890625, -0.0980224609375, 0.26904296875, 0.6361083984375, 1.003173828125, 1.3702392578125, 1.7373046875, 2.1043701171875, 2.471435546875, 2.8385009765625, 3.20556640625, 3.5726318359375, 3.939697265625, 4.3067626953125, 4.673828125, 5.0408935546875, 5.407958984375, 5.7750244140625, 6.14208984375, 6.5091552734375, 6.876220703125, 7.2432861328125, 7.6103515625, 7.9774169921875, 8.344482421875, 8.7115478515625, 9.07861328125, 9.4456787109375, 9.812744140625, 10.1798095703125, 10.546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 11.0, 14.0, 30.0, 34.0, 82.0, 177.0, 345.0, 790.0, 2444.0, 10737.0, 83184.0, 725916.0, 199049.0, 19835.0, 3858.0, 1167.0, 469.0, 188.0, 91.0, 54.0, 34.0, 8.0, 13.0, 8.0, 5.0, 0.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0859375, -4.92010498046875, -4.7542724609375, -4.58843994140625, -4.422607421875, -4.25677490234375, -4.0909423828125, -3.92510986328125, -3.75927734375, -3.59344482421875, -3.4276123046875, -3.26177978515625, -3.095947265625, -2.93011474609375, -2.7642822265625, -2.59844970703125, -2.4326171875, -2.26678466796875, -2.1009521484375, -1.93511962890625, -1.769287109375, -1.60345458984375, -1.4376220703125, -1.27178955078125, -1.10595703125, -0.94012451171875, -0.7742919921875, -0.60845947265625, -0.442626953125, -0.27679443359375, -0.1109619140625, 0.05487060546875, 0.220703125, 0.38653564453125, 0.5523681640625, 0.71820068359375, 0.884033203125, 1.04986572265625, 1.2156982421875, 1.38153076171875, 1.54736328125, 1.71319580078125, 1.8790283203125, 2.04486083984375, 2.210693359375, 2.37652587890625, 2.5423583984375, 2.70819091796875, 2.8740234375, 3.03985595703125, 3.2056884765625, 3.37152099609375, 3.537353515625, 3.70318603515625, 3.8690185546875, 4.03485107421875, 4.20068359375, 4.36651611328125, 4.5323486328125, 4.69818115234375, 4.864013671875, 5.02984619140625, 5.1956787109375, 5.36151123046875, 5.52734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 1.0, 10.0, 7.0, 15.0, 16.0, 20.0, 20.0, 40.0, 49.0, 61.0, 66.0, 90.0, 92.0, 86.0, 70.0, 86.0, 52.0, 55.0, 33.0, 23.0, 26.0, 19.0, 13.0, 11.0, 4.0, 10.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0004897117614746094, -0.0004757232964038849, -0.0004617348313331604, -0.0004477463662624359, -0.0004337579011917114, -0.00041976943612098694, -0.00040578097105026245, -0.00039179250597953796, -0.0003778040409088135, -0.000363815575838089, -0.0003498271107673645, -0.00033583864569664, -0.00032185018062591553, -0.00030786171555519104, -0.00029387325048446655, -0.00027988478541374207, -0.0002658963203430176, -0.0002519078552722931, -0.0002379193902015686, -0.00022393092513084412, -0.00020994246006011963, -0.00019595399498939514, -0.00018196552991867065, -0.00016797706484794617, -0.00015398859977722168, -0.0001400001347064972, -0.0001260116696357727, -0.00011202320456504822, -9.803473949432373e-05, -8.404627442359924e-05, -7.005780935287476e-05, -5.606934428215027e-05, -4.208087921142578e-05, -2.8092414140701294e-05, -1.4103949069976807e-05, -1.1548399925231934e-07, 1.3872981071472168e-05, 2.7861446142196655e-05, 4.184991121292114e-05, 5.583837628364563e-05, 6.982684135437012e-05, 8.38153064250946e-05, 9.780377149581909e-05, 0.00011179223656654358, 0.00012578070163726807, 0.00013976916670799255, 0.00015375763177871704, 0.00016774609684944153, 0.00018173456192016602, 0.0001957230269908905, 0.000209711492061615, 0.00022369995713233948, 0.00023768842220306396, 0.00025167688727378845, 0.00026566535234451294, 0.0002796538174152374, 0.0002936422824859619, 0.0003076307475566864, 0.0003216192126274109, 0.0003356076776981354, 0.00034959614276885986, 0.00036358460783958435, 0.00037757307291030884, 0.0003915615379810333, 0.0004055500030517578]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 10.0, 13.0, 21.0, 42.0, 49.0, 86.0, 165.0, 356.0, 906.0, 2785.0, 10861.0, 64573.0, 581839.0, 340207.0, 36244.0, 7089.0, 1970.0, 698.0, 277.0, 131.0, 67.0, 48.0, 34.0, 24.0, 13.0, 7.0, 9.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.765625, -4.61602783203125, -4.4664306640625, -4.31683349609375, -4.167236328125, -4.01763916015625, -3.8680419921875, -3.71844482421875, -3.56884765625, -3.41925048828125, -3.2696533203125, -3.12005615234375, -2.970458984375, -2.82086181640625, -2.6712646484375, -2.52166748046875, -2.3720703125, -2.22247314453125, -2.0728759765625, -1.92327880859375, -1.773681640625, -1.62408447265625, -1.4744873046875, -1.32489013671875, -1.17529296875, -1.02569580078125, -0.8760986328125, -0.72650146484375, -0.576904296875, -0.42730712890625, -0.2777099609375, -0.12811279296875, 0.021484375, 0.17108154296875, 0.3206787109375, 0.47027587890625, 0.619873046875, 0.76947021484375, 0.9190673828125, 1.06866455078125, 1.21826171875, 1.36785888671875, 1.5174560546875, 1.66705322265625, 1.816650390625, 1.96624755859375, 2.1158447265625, 2.26544189453125, 2.4150390625, 2.56463623046875, 2.7142333984375, 2.86383056640625, 3.013427734375, 3.16302490234375, 3.3126220703125, 3.46221923828125, 3.61181640625, 3.76141357421875, 3.9110107421875, 4.06060791015625, 4.210205078125, 4.35980224609375, 4.5093994140625, 4.65899658203125, 4.80859375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 12.0, 13.0, 17.0, 25.0, 34.0, 47.0, 75.0, 96.0, 111.0, 108.0, 97.0, 107.0, 66.0, 56.0, 34.0, 25.0, 19.0, 8.0, 16.0, 13.0, 6.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46484375, -4.308837890625, -4.15283203125, -3.996826171875, -3.8408203125, -3.684814453125, -3.52880859375, -3.372802734375, -3.216796875, -3.060791015625, -2.90478515625, -2.748779296875, -2.5927734375, -2.436767578125, -2.28076171875, -2.124755859375, -1.96875, -1.812744140625, -1.65673828125, -1.500732421875, -1.3447265625, -1.188720703125, -1.03271484375, -0.876708984375, -0.720703125, -0.564697265625, -0.40869140625, -0.252685546875, -0.0966796875, 0.059326171875, 0.21533203125, 0.371337890625, 0.52734375, 0.683349609375, 0.83935546875, 0.995361328125, 1.1513671875, 1.307373046875, 1.46337890625, 1.619384765625, 1.775390625, 1.931396484375, 2.08740234375, 2.243408203125, 2.3994140625, 2.555419921875, 2.71142578125, 2.867431640625, 3.0234375, 3.179443359375, 3.33544921875, 3.491455078125, 3.6474609375, 3.803466796875, 3.95947265625, 4.115478515625, 4.271484375, 4.427490234375, 4.58349609375, 4.739501953125, 4.8955078125, 5.051513671875, 5.20751953125, 5.363525390625, 5.51953125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 7.0, 17.0, 73.0, 258.0, 400.0, 189.0, 48.0, 15.0, 3.0, 0.0, 3.0], "bins": [-339.863037109375, -333.9338684082031, -328.0047302246094, -322.0755615234375, -316.1463928222656, -310.21722412109375, -304.2880859375, -298.3589172363281, -292.42974853515625, -286.5005798339844, -280.5714416503906, -274.64227294921875, -268.7131042480469, -262.783935546875, -256.85479736328125, -250.92562866210938, -244.99647521972656, -239.06732177734375, -233.13815307617188, -227.20899963378906, -221.2798309326172, -215.35067749023438, -209.4215087890625, -203.4923553466797, -197.56320190429688, -191.63404846191406, -185.7048797607422, -179.77572631835938, -173.8465576171875, -167.9174041748047, -161.98825073242188, -156.05908203125, -150.1299285888672, -144.20077514648438, -138.2716064453125, -132.3424530029297, -126.41328430175781, -120.484130859375, -114.55496978759766, -108.62580871582031, -102.69664001464844, -96.7674789428711, -90.83831787109375, -84.90916442871094, -78.97999572753906, -73.05084228515625, -67.1216812133789, -61.19252014160156, -55.263362884521484, -49.33420181274414, -43.40504455566406, -37.47588348388672, -31.546722412109375, -25.61756134033203, -19.688404083251953, -13.75924301147461, -7.830081939697266, -1.9009218215942383, 4.028238296508789, 9.9573974609375, 15.886558532714844, 21.815719604492188, 27.744876861572266, 33.67403793334961, 39.60319900512695]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 0.0, 3.0, 5.0, 2.0, 10.0, 14.0, 13.0, 21.0, 21.0, 29.0, 46.0, 60.0, 40.0, 62.0, 61.0, 60.0, 66.0, 63.0, 49.0, 64.0, 52.0, 38.0, 49.0, 26.0, 30.0, 27.0, 27.0, 19.0, 7.0, 12.0, 10.0, 2.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.37168884277344, -72.82408142089844, -70.27647399902344, -67.72886657714844, -65.18125915527344, -62.63365173339844, -60.08604431152344, -57.53843688964844, -54.99082946777344, -52.44322204589844, -49.89561462402344, -47.34800720214844, -44.80039978027344, -42.25279235839844, -39.70518493652344, -37.15757751464844, -34.60997009277344, -32.06236267089844, -29.514755249023438, -26.967147827148438, -24.419540405273438, -21.871932983398438, -19.324325561523438, -16.776718139648438, -14.229110717773438, -11.681503295898438, -9.133895874023438, -6.5862884521484375, -4.0386810302734375, -1.4910736083984375, 1.0565338134765625, 3.6041412353515625, 6.1517486572265625, 8.699356079101562, 11.246963500976562, 13.794570922851562, 16.342178344726562, 18.889785766601562, 21.437393188476562, 23.985000610351562, 26.532608032226562, 29.080215454101562, 31.627822875976562, 34.17543029785156, 36.72303771972656, 39.27064514160156, 41.81825256347656, 44.36585998535156, 46.91346740722656, 49.46107482910156, 52.00868225097656, 54.55628967285156, 57.10389709472656, 59.65150451660156, 62.19911193847656, 64.74671936035156, 67.29432678222656, 69.84193420410156, 72.38954162597656, 74.93714904785156, 77.48475646972656, 80.03236389160156, 82.57997131347656, 85.12757873535156, 87.67518615722656]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 4.0, 9.0, 12.0, 15.0, 21.0, 26.0, 41.0, 70.0, 125.0, 204.0, 292.0, 527.0, 1160.0, 2809.0, 10016.0, 4106526.0, 62021.0, 6311.0, 2057.0, 897.0, 477.0, 246.0, 162.0, 93.0, 39.0, 36.0, 38.0, 13.0, 11.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.1875, -27.47998046875, -26.7724609375, -26.06494140625, -25.357421875, -24.64990234375, -23.9423828125, -23.23486328125, -22.52734375, -21.81982421875, -21.1123046875, -20.40478515625, -19.697265625, -18.98974609375, -18.2822265625, -17.57470703125, -16.8671875, -16.15966796875, -15.4521484375, -14.74462890625, -14.037109375, -13.32958984375, -12.6220703125, -11.91455078125, -11.20703125, -10.49951171875, -9.7919921875, -9.08447265625, -8.376953125, -7.66943359375, -6.9619140625, -6.25439453125, -5.546875, -4.83935546875, -4.1318359375, -3.42431640625, -2.716796875, -2.00927734375, -1.3017578125, -0.59423828125, 0.11328125, 0.82080078125, 1.5283203125, 2.23583984375, 2.943359375, 3.65087890625, 4.3583984375, 5.06591796875, 5.7734375, 6.48095703125, 7.1884765625, 7.89599609375, 8.603515625, 9.31103515625, 10.0185546875, 10.72607421875, 11.43359375, 12.14111328125, 12.8486328125, 13.55615234375, 14.263671875, 14.97119140625, 15.6787109375, 16.38623046875, 17.09375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 16.0, 10.0, 11.0, 14.0, 16.0, 23.0, 23.0, 24.0, 34.0, 42.0, 57.0, 48.0, 55.0, 57.0, 49.0, 68.0, 66.0, 53.0, 60.0, 39.0, 53.0, 35.0, 28.0, 38.0, 13.0, 15.0, 16.0, 7.0, 6.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.45703125, -3.354949951171875, -3.25286865234375, -3.150787353515625, -3.0487060546875, -2.946624755859375, -2.84454345703125, -2.742462158203125, -2.640380859375, -2.538299560546875, -2.43621826171875, -2.334136962890625, -2.2320556640625, -2.129974365234375, -2.02789306640625, -1.925811767578125, -1.82373046875, -1.721649169921875, -1.61956787109375, -1.517486572265625, -1.4154052734375, -1.313323974609375, -1.21124267578125, -1.109161376953125, -1.007080078125, -0.904998779296875, -0.80291748046875, -0.700836181640625, -0.5987548828125, -0.496673583984375, -0.39459228515625, -0.292510986328125, -0.1904296875, -0.088348388671875, 0.01373291015625, 0.115814208984375, 0.2178955078125, 0.319976806640625, 0.42205810546875, 0.524139404296875, 0.626220703125, 0.728302001953125, 0.83038330078125, 0.932464599609375, 1.0345458984375, 1.136627197265625, 1.23870849609375, 1.340789794921875, 1.44287109375, 1.544952392578125, 1.64703369140625, 1.749114990234375, 1.8511962890625, 1.953277587890625, 2.05535888671875, 2.157440185546875, 2.259521484375, 2.361602783203125, 2.46368408203125, 2.565765380859375, 2.6678466796875, 2.769927978515625, 2.87200927734375, 2.974090576171875, 3.076171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 11.0, 13.0, 16.0, 15.0, 20.0, 32.0, 31.0, 49.0, 43.0, 90.0, 144.0, 202.0, 276.0, 408.0, 698.0, 1285.0, 2615.0, 5988.0, 22901.0, 4046749.0, 92431.0, 11680.0, 3979.0, 1761.0, 986.0, 628.0, 347.0, 262.0, 186.0, 108.0, 93.0, 64.0, 52.0, 35.0, 22.0, 22.0, 17.0, 8.0, 7.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.703125, -12.245849609375, -11.78857421875, -11.331298828125, -10.8740234375, -10.416748046875, -9.95947265625, -9.502197265625, -9.044921875, -8.587646484375, -8.13037109375, -7.673095703125, -7.2158203125, -6.758544921875, -6.30126953125, -5.843994140625, -5.38671875, -4.929443359375, -4.47216796875, -4.014892578125, -3.5576171875, -3.100341796875, -2.64306640625, -2.185791015625, -1.728515625, -1.271240234375, -0.81396484375, -0.356689453125, 0.1005859375, 0.557861328125, 1.01513671875, 1.472412109375, 1.9296875, 2.386962890625, 2.84423828125, 3.301513671875, 3.7587890625, 4.216064453125, 4.67333984375, 5.130615234375, 5.587890625, 6.045166015625, 6.50244140625, 6.959716796875, 7.4169921875, 7.874267578125, 8.33154296875, 8.788818359375, 9.24609375, 9.703369140625, 10.16064453125, 10.617919921875, 11.0751953125, 11.532470703125, 11.98974609375, 12.447021484375, 12.904296875, 13.361572265625, 13.81884765625, 14.276123046875, 14.7333984375, 15.190673828125, 15.64794921875, 16.105224609375, 16.5625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 10.0, 10.0, 21.0, 49.0, 3589.0, 281.0, 48.0, 23.0, 8.0, 5.0, 5.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4140625, -2.2862548828125, -2.158447265625, -2.0306396484375, -1.90283203125, -1.7750244140625, -1.647216796875, -1.5194091796875, -1.3916015625, -1.2637939453125, -1.135986328125, -1.0081787109375, -0.88037109375, -0.7525634765625, -0.624755859375, -0.4969482421875, -0.369140625, -0.2413330078125, -0.113525390625, 0.0142822265625, 0.14208984375, 0.2698974609375, 0.397705078125, 0.5255126953125, 0.6533203125, 0.7811279296875, 0.908935546875, 1.0367431640625, 1.16455078125, 1.2923583984375, 1.420166015625, 1.5479736328125, 1.67578125, 1.8035888671875, 1.931396484375, 2.0592041015625, 2.18701171875, 2.3148193359375, 2.442626953125, 2.5704345703125, 2.6982421875, 2.8260498046875, 2.953857421875, 3.0816650390625, 3.20947265625, 3.3372802734375, 3.465087890625, 3.5928955078125, 3.720703125, 3.8485107421875, 3.976318359375, 4.1041259765625, 4.23193359375, 4.3597412109375, 4.487548828125, 4.6153564453125, 4.7431640625, 4.8709716796875, 4.998779296875, 5.1265869140625, 5.25439453125, 5.3822021484375, 5.510009765625, 5.6378173828125, 5.765625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 13.0, 23.0, 95.0, 308.0, 335.0, 153.0, 53.0, 17.0, 10.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.341644287109375, -6.603427886962891, -5.8652119636535645, -5.126996040344238, -4.388779640197754, -3.6505634784698486, -2.9123473167419434, -2.174131393432617, -1.4359149932861328, -0.6976988315582275, 0.040517330169677734, 0.778733491897583, 1.5169496536254883, 2.2551658153533936, 2.993381977081299, 3.731597900390625, 4.469814300537109, 5.208030700683594, 5.94624662399292, 6.684462547302246, 7.4226789474487305, 8.160895347595215, 8.899110794067383, 9.637327194213867, 10.375543594360352, 11.113759994506836, 11.85197639465332, 12.590191841125488, 13.328408241271973, 14.066624641418457, 14.804840087890625, 15.54305648803711, 16.281272888183594, 17.019489288330078, 17.757705688476562, 18.495922088623047, 19.23413848876953, 19.972352981567383, 20.710569381713867, 21.44878578186035, 22.187002182006836, 22.92521858215332, 23.663434982299805, 24.40165138244629, 25.13986587524414, 25.878082275390625, 26.61629867553711, 27.354515075683594, 28.092731475830078, 28.830947875976562, 29.569164276123047, 30.30738067626953, 31.045597076416016, 31.783811569213867, 32.522029876708984, 33.26024627685547, 33.99845886230469, 34.73667526245117, 35.474891662597656, 36.21310806274414, 36.951324462890625, 37.68954086303711, 38.427757263183594, 39.16596984863281, 39.90419006347656]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 6.0, 8.0, 14.0, 8.0, 12.0, 18.0, 30.0, 25.0, 36.0, 33.0, 30.0, 51.0, 36.0, 47.0, 56.0, 40.0, 52.0, 48.0, 48.0, 48.0, 54.0, 33.0, 32.0, 29.0, 37.0, 31.0, 23.0, 27.0, 16.0, 15.0, 14.0, 11.0, 6.0, 5.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.634207248687744, -7.403158187866211, -7.172109603881836, -6.941060543060303, -6.710011959075928, -6.4789628982543945, -6.2479143142700195, -6.016865253448486, -5.785816192626953, -5.55476713180542, -5.323718547821045, -5.092669486999512, -4.861620903015137, -4.6305718421936035, -4.39952278137207, -4.168474197387695, -3.937425374984741, -3.706376552581787, -3.475327730178833, -3.244278907775879, -3.0132298469543457, -2.7821810245513916, -2.5511322021484375, -2.3200831413269043, -2.0890345573425293, -1.8579857349395752, -1.6269367933273315, -1.3958879709243774, -1.1648390293121338, -0.9337902069091797, -0.7027413845062256, -0.47169244289398193, -0.24064350128173828, -0.009594634175300598, 0.22145423293113708, 0.4525030851364136, 0.6835519671440125, 0.9146008491516113, 1.1456496715545654, 1.376698613166809, 1.6077474355697632, 1.8387962579727173, 2.069845199584961, 2.300894021987915, 2.531942844390869, 2.7629919052124023, 2.9940404891967773, 3.2250895500183105, 3.4561383724212646, 3.6871871948242188, 3.918236017227173, 4.149284839630127, 4.38033390045166, 4.611382484436035, 4.842431545257568, 5.073480606079102, 5.304529190063477, 5.53557825088501, 5.766626834869385, 5.997675895690918, 6.228724479675293, 6.459773540496826, 6.690822601318359, 6.921871185302734, 7.152920246124268]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 7.0, 2.0, 6.0, 13.0, 8.0, 20.0, 35.0, 40.0, 57.0, 121.0, 201.0, 363.0, 646.0, 1378.0, 3123.0, 7585.0, 20255.0, 63894.0, 216066.0, 434317.0, 206830.0, 60969.0, 19680.0, 7146.0, 2985.0, 1307.0, 654.0, 358.0, 177.0, 127.0, 72.0, 35.0, 38.0, 14.0, 6.0, 9.0, 5.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.859375, -8.60968017578125, -8.3599853515625, -8.11029052734375, -7.860595703125, -7.61090087890625, -7.3612060546875, -7.11151123046875, -6.86181640625, -6.61212158203125, -6.3624267578125, -6.11273193359375, -5.863037109375, -5.61334228515625, -5.3636474609375, -5.11395263671875, -4.8642578125, -4.61456298828125, -4.3648681640625, -4.11517333984375, -3.865478515625, -3.61578369140625, -3.3660888671875, -3.11639404296875, -2.86669921875, -2.61700439453125, -2.3673095703125, -2.11761474609375, -1.867919921875, -1.61822509765625, -1.3685302734375, -1.11883544921875, -0.869140625, -0.61944580078125, -0.3697509765625, -0.12005615234375, 0.129638671875, 0.37933349609375, 0.6290283203125, 0.87872314453125, 1.12841796875, 1.37811279296875, 1.6278076171875, 1.87750244140625, 2.127197265625, 2.37689208984375, 2.6265869140625, 2.87628173828125, 3.1259765625, 3.37567138671875, 3.6253662109375, 3.87506103515625, 4.124755859375, 4.37445068359375, 4.6241455078125, 4.87384033203125, 5.12353515625, 5.37322998046875, 5.6229248046875, 5.87261962890625, 6.122314453125, 6.37200927734375, 6.6217041015625, 6.87139892578125, 7.12109375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 2.0, 4.0, 11.0, 11.0, 9.0, 13.0, 15.0, 33.0, 21.0, 31.0, 25.0, 26.0, 36.0, 46.0, 53.0, 66.0, 50.0, 63.0, 61.0, 51.0, 48.0, 44.0, 38.0, 47.0, 34.0, 33.0, 29.0, 22.0, 18.0, 11.0, 11.0, 11.0, 8.0, 7.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41015625, -3.308624267578125, -3.20709228515625, -3.105560302734375, -3.0040283203125, -2.902496337890625, -2.80096435546875, -2.699432373046875, -2.597900390625, -2.496368408203125, -2.39483642578125, -2.293304443359375, -2.1917724609375, -2.090240478515625, -1.98870849609375, -1.887176513671875, -1.78564453125, -1.684112548828125, -1.58258056640625, -1.481048583984375, -1.3795166015625, -1.277984619140625, -1.17645263671875, -1.074920654296875, -0.973388671875, -0.871856689453125, -0.77032470703125, -0.668792724609375, -0.5672607421875, -0.465728759765625, -0.36419677734375, -0.262664794921875, -0.1611328125, -0.059600830078125, 0.04193115234375, 0.143463134765625, 0.2449951171875, 0.346527099609375, 0.44805908203125, 0.549591064453125, 0.651123046875, 0.752655029296875, 0.85418701171875, 0.955718994140625, 1.0572509765625, 1.158782958984375, 1.26031494140625, 1.361846923828125, 1.46337890625, 1.564910888671875, 1.66644287109375, 1.767974853515625, 1.8695068359375, 1.971038818359375, 2.07257080078125, 2.174102783203125, 2.275634765625, 2.377166748046875, 2.47869873046875, 2.580230712890625, 2.6817626953125, 2.783294677734375, 2.88482666015625, 2.986358642578125, 3.087890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 10.0, 19.0, 25.0, 52.0, 60.0, 87.0, 143.0, 237.0, 528.0, 1689.0, 7076.0, 43221.0, 489199.0, 455816.0, 40980.0, 6560.0, 1650.0, 563.0, 240.0, 135.0, 78.0, 52.0, 34.0, 28.0, 19.0, 15.0, 10.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.828125, -12.33447265625, -11.8408203125, -11.34716796875, -10.853515625, -10.35986328125, -9.8662109375, -9.37255859375, -8.87890625, -8.38525390625, -7.8916015625, -7.39794921875, -6.904296875, -6.41064453125, -5.9169921875, -5.42333984375, -4.9296875, -4.43603515625, -3.9423828125, -3.44873046875, -2.955078125, -2.46142578125, -1.9677734375, -1.47412109375, -0.98046875, -0.48681640625, 0.0068359375, 0.50048828125, 0.994140625, 1.48779296875, 1.9814453125, 2.47509765625, 2.96875, 3.46240234375, 3.9560546875, 4.44970703125, 4.943359375, 5.43701171875, 5.9306640625, 6.42431640625, 6.91796875, 7.41162109375, 7.9052734375, 8.39892578125, 8.892578125, 9.38623046875, 9.8798828125, 10.37353515625, 10.8671875, 11.36083984375, 11.8544921875, 12.34814453125, 12.841796875, 13.33544921875, 13.8291015625, 14.32275390625, 14.81640625, 15.31005859375, 15.8037109375, 16.29736328125, 16.791015625, 17.28466796875, 17.7783203125, 18.27197265625, 18.765625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 8.0, 14.0, 22.0, 20.0, 21.0, 26.0, 42.0, 37.0, 64.0, 62.0, 73.0, 81.0, 60.0, 61.0, 65.0, 60.0, 61.0, 40.0, 38.0, 32.0, 23.0, 24.0, 20.0, 8.0, 10.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.71875, -15.9462890625, -15.173828125, -14.4013671875, -13.62890625, -12.8564453125, -12.083984375, -11.3115234375, -10.5390625, -9.7666015625, -8.994140625, -8.2216796875, -7.44921875, -6.6767578125, -5.904296875, -5.1318359375, -4.359375, -3.5869140625, -2.814453125, -2.0419921875, -1.26953125, -0.4970703125, 0.275390625, 1.0478515625, 1.8203125, 2.5927734375, 3.365234375, 4.1376953125, 4.91015625, 5.6826171875, 6.455078125, 7.2275390625, 8.0, 8.7724609375, 9.544921875, 10.3173828125, 11.08984375, 11.8623046875, 12.634765625, 13.4072265625, 14.1796875, 14.9521484375, 15.724609375, 16.4970703125, 17.26953125, 18.0419921875, 18.814453125, 19.5869140625, 20.359375, 21.1318359375, 21.904296875, 22.6767578125, 23.44921875, 24.2216796875, 24.994140625, 25.7666015625, 26.5390625, 27.3115234375, 28.083984375, 28.8564453125, 29.62890625, 30.4013671875, 31.173828125, 31.9462890625, 32.71875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 13.0, 18.0, 57.0, 133.0, 459.0, 3251.0, 540737.0, 499908.0, 3280.0, 452.0, 131.0, 47.0, 25.0, 17.0, 12.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1953125, -14.4354248046875, -13.675537109375, -12.9156494140625, -12.15576171875, -11.3958740234375, -10.635986328125, -9.8760986328125, -9.1162109375, -8.3563232421875, -7.596435546875, -6.8365478515625, -6.07666015625, -5.3167724609375, -4.556884765625, -3.7969970703125, -3.037109375, -2.2772216796875, -1.517333984375, -0.7574462890625, 0.00244140625, 0.7623291015625, 1.522216796875, 2.2821044921875, 3.0419921875, 3.8018798828125, 4.561767578125, 5.3216552734375, 6.08154296875, 6.8414306640625, 7.601318359375, 8.3612060546875, 9.12109375, 9.8809814453125, 10.640869140625, 11.4007568359375, 12.16064453125, 12.9205322265625, 13.680419921875, 14.4403076171875, 15.2001953125, 15.9600830078125, 16.719970703125, 17.4798583984375, 18.23974609375, 18.9996337890625, 19.759521484375, 20.5194091796875, 21.279296875, 22.0391845703125, 22.799072265625, 23.5589599609375, 24.31884765625, 25.0787353515625, 25.838623046875, 26.5985107421875, 27.3583984375, 28.1182861328125, 28.878173828125, 29.6380615234375, 30.39794921875, 31.1578369140625, 31.917724609375, 32.6776123046875, 33.4375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 1.0, 7.0, 12.0, 15.0, 31.0, 54.0, 89.0, 161.0, 199.0, 168.0, 98.0, 72.0, 37.0, 19.0, 17.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001071929931640625, -0.0010380446910858154, -0.0010041594505310059, -0.0009702742099761963, -0.0009363889694213867, -0.0009025037288665771, -0.0008686184883117676, -0.000834733247756958, -0.0008008480072021484, -0.0007669627666473389, -0.0007330775260925293, -0.0006991922855377197, -0.0006653070449829102, -0.0006314218044281006, -0.000597536563873291, -0.0005636513233184814, -0.0005297660827636719, -0.0004958808422088623, -0.00046199560165405273, -0.00042811036109924316, -0.0003942251205444336, -0.000360339879989624, -0.00032645463943481445, -0.0002925693988800049, -0.0002586841583251953, -0.00022479891777038574, -0.00019091367721557617, -0.0001570284366607666, -0.00012314319610595703, -8.925795555114746e-05, -5.537271499633789e-05, -2.148747444152832e-05, 1.239776611328125e-05, 4.628300666809082e-05, 8.016824722290039e-05, 0.00011405348777770996, 0.00014793872833251953, 0.0001818239688873291, 0.00021570920944213867, 0.00024959444999694824, 0.0002834796905517578, 0.0003173649311065674, 0.00035125017166137695, 0.0003851354122161865, 0.0004190206527709961, 0.00045290589332580566, 0.00048679113388061523, 0.0005206763744354248, 0.0005545616149902344, 0.0005884468555450439, 0.0006223320960998535, 0.0006562173366546631, 0.0006901025772094727, 0.0007239878177642822, 0.0007578730583190918, 0.0007917582988739014, 0.0008256435394287109, 0.0008595287799835205, 0.0008934140205383301, 0.0009272992610931396, 0.0009611845016479492, 0.0009950697422027588, 0.0010289549827575684, 0.001062840223312378, 0.0010967254638671875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 11.0, 16.0, 25.0, 41.0, 104.0, 218.0, 522.0, 1616.0, 5891.0, 46392.0, 913704.0, 69892.0, 7173.0, 1903.0, 567.0, 229.0, 97.0, 58.0, 22.0, 21.0, 16.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8125, -9.4805908203125, -9.148681640625, -8.8167724609375, -8.48486328125, -8.1529541015625, -7.821044921875, -7.4891357421875, -7.1572265625, -6.8253173828125, -6.493408203125, -6.1614990234375, -5.82958984375, -5.4976806640625, -5.165771484375, -4.8338623046875, -4.501953125, -4.1700439453125, -3.838134765625, -3.5062255859375, -3.17431640625, -2.8424072265625, -2.510498046875, -2.1785888671875, -1.8466796875, -1.5147705078125, -1.182861328125, -0.8509521484375, -0.51904296875, -0.1871337890625, 0.144775390625, 0.4766845703125, 0.80859375, 1.1405029296875, 1.472412109375, 1.8043212890625, 2.13623046875, 2.4681396484375, 2.800048828125, 3.1319580078125, 3.4638671875, 3.7957763671875, 4.127685546875, 4.4595947265625, 4.79150390625, 5.1234130859375, 5.455322265625, 5.7872314453125, 6.119140625, 6.4510498046875, 6.782958984375, 7.1148681640625, 7.44677734375, 7.7786865234375, 8.110595703125, 8.4425048828125, 8.7744140625, 9.1063232421875, 9.438232421875, 9.7701416015625, 10.10205078125, 10.4339599609375, 10.765869140625, 11.0977783203125, 11.4296875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 10.0, 22.0, 32.0, 65.0, 111.0, 201.0, 198.0, 159.0, 76.0, 43.0, 27.0, 17.0, 5.0, 6.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.90625, -11.5772705078125, -11.248291015625, -10.9193115234375, -10.59033203125, -10.2613525390625, -9.932373046875, -9.6033935546875, -9.2744140625, -8.9454345703125, -8.616455078125, -8.2874755859375, -7.95849609375, -7.6295166015625, -7.300537109375, -6.9715576171875, -6.642578125, -6.3135986328125, -5.984619140625, -5.6556396484375, -5.32666015625, -4.9976806640625, -4.668701171875, -4.3397216796875, -4.0107421875, -3.6817626953125, -3.352783203125, -3.0238037109375, -2.69482421875, -2.3658447265625, -2.036865234375, -1.7078857421875, -1.37890625, -1.0499267578125, -0.720947265625, -0.3919677734375, -0.06298828125, 0.2659912109375, 0.594970703125, 0.9239501953125, 1.2529296875, 1.5819091796875, 1.910888671875, 2.2398681640625, 2.56884765625, 2.8978271484375, 3.226806640625, 3.5557861328125, 3.884765625, 4.2137451171875, 4.542724609375, 4.8717041015625, 5.20068359375, 5.5296630859375, 5.858642578125, 6.1876220703125, 6.5166015625, 6.8455810546875, 7.174560546875, 7.5035400390625, 7.83251953125, 8.1614990234375, 8.490478515625, 8.8194580078125, 9.1484375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 10.0, 27.0, 40.0, 101.0, 168.0, 252.0, 199.0, 123.0, 59.0, 18.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.962646484375, -111.98309326171875, -107.0035400390625, -102.02398681640625, -97.04443359375, -92.06488037109375, -87.0853271484375, -82.10577392578125, -77.126220703125, -72.14666748046875, -67.1671142578125, -62.18756103515625, -57.2080078125, -52.22845458984375, -47.248905181884766, -42.269351959228516, -37.28980255126953, -32.31024932861328, -27.33069610595703, -22.351144790649414, -17.371591567993164, -12.392038345336914, -7.412487030029297, -2.432933807373047, 2.546619415283203, 7.526172161102295, 12.505724906921387, 17.48527717590332, 22.46483039855957, 27.44438362121582, 32.42393493652344, 37.40348815917969, 42.38304138183594, 47.36259460449219, 52.34214782714844, 57.32170104980469, 62.30125427246094, 67.28080749511719, 72.26036071777344, 77.23991394042969, 82.21946716308594, 87.19902038574219, 92.17857360839844, 97.15812683105469, 102.13768005371094, 107.11723327636719, 112.09678649902344, 117.07633972167969, 122.0558853149414, 127.03543853759766, 132.01498413085938, 136.99453735351562, 141.97409057617188, 146.95364379882812, 151.93319702148438, 156.91275024414062, 161.89230346679688, 166.87185668945312, 171.85140991210938, 176.83096313476562, 181.81051635742188, 186.79006958007812, 191.76962280273438, 196.74917602539062, 201.72872924804688]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 2.0, 5.0, 5.0, 10.0, 11.0, 22.0, 8.0, 11.0, 15.0, 15.0, 17.0, 17.0, 22.0, 41.0, 38.0, 37.0, 45.0, 38.0, 34.0, 56.0, 68.0, 57.0, 44.0, 59.0, 60.0, 33.0, 32.0, 32.0, 32.0, 23.0, 18.0, 18.0, 17.0, 13.0, 6.0, 11.0, 8.0, 9.0, 3.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-94.8558120727539, -92.02425384521484, -89.19269561767578, -86.36113739013672, -83.52957153320312, -80.69801330566406, -77.866455078125, -75.03489685058594, -72.20333862304688, -69.37178039550781, -66.54022216796875, -63.70866012573242, -60.87710189819336, -58.0455436706543, -55.21398162841797, -52.382423400878906, -49.550865173339844, -46.71930694580078, -43.88774871826172, -41.05618667602539, -38.22462844848633, -35.393070220947266, -32.56150817871094, -29.729949951171875, -26.898391723632812, -24.06683349609375, -21.235273361206055, -18.40371322631836, -15.572154998779297, -12.740595817565918, -9.909036636352539, -7.077476501464844, -4.24591064453125, -1.414351463317871, 1.4172077178955078, 4.248766899108887, 7.080326080322266, 9.911885261535645, 12.743444442749023, 15.575004577636719, 18.40656280517578, 21.238121032714844, 24.06968116760254, 26.901241302490234, 29.732799530029297, 32.56435775756836, 35.39591979980469, 38.22747802734375, 41.05903625488281, 43.890594482421875, 46.72215270996094, 49.553714752197266, 52.38527297973633, 55.21683120727539, 58.04839324951172, 60.87995147705078, 63.711509704589844, 66.5430679321289, 69.37462615966797, 72.20618438720703, 75.03775024414062, 77.86930847167969, 80.70086669921875, 83.53242492675781, 86.36398315429688]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 8.0, 6.0, 8.0, 10.0, 11.0, 17.0, 14.0, 31.0, 43.0, 56.0, 117.0, 155.0, 265.0, 456.0, 790.0, 1693.0, 4271.0, 14183.0, 3999213.0, 154572.0, 11654.0, 3730.0, 1474.0, 623.0, 369.0, 188.0, 114.0, 67.0, 49.0, 22.0, 26.0, 8.0, 10.0, 10.0, 6.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.765625, -16.3115234375, -15.857421875, -15.4033203125, -14.94921875, -14.4951171875, -14.041015625, -13.5869140625, -13.1328125, -12.6787109375, -12.224609375, -11.7705078125, -11.31640625, -10.8623046875, -10.408203125, -9.9541015625, -9.5, -9.0458984375, -8.591796875, -8.1376953125, -7.68359375, -7.2294921875, -6.775390625, -6.3212890625, -5.8671875, -5.4130859375, -4.958984375, -4.5048828125, -4.05078125, -3.5966796875, -3.142578125, -2.6884765625, -2.234375, -1.7802734375, -1.326171875, -0.8720703125, -0.41796875, 0.0361328125, 0.490234375, 0.9443359375, 1.3984375, 1.8525390625, 2.306640625, 2.7607421875, 3.21484375, 3.6689453125, 4.123046875, 4.5771484375, 5.03125, 5.4853515625, 5.939453125, 6.3935546875, 6.84765625, 7.3017578125, 7.755859375, 8.2099609375, 8.6640625, 9.1181640625, 9.572265625, 10.0263671875, 10.48046875, 10.9345703125, 11.388671875, 11.8427734375, 12.296875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 2.0, 3.0, 5.0, 7.0, 11.0, 16.0, 19.0, 19.0, 29.0, 34.0, 44.0, 40.0, 53.0, 65.0, 61.0, 80.0, 78.0, 64.0, 66.0, 52.0, 69.0, 38.0, 23.0, 25.0, 26.0, 17.0, 19.0, 9.0, 9.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.8359375, -5.68206787109375, -5.5281982421875, -5.37432861328125, -5.220458984375, -5.06658935546875, -4.9127197265625, -4.75885009765625, -4.60498046875, -4.45111083984375, -4.2972412109375, -4.14337158203125, -3.989501953125, -3.83563232421875, -3.6817626953125, -3.52789306640625, -3.3740234375, -3.22015380859375, -3.0662841796875, -2.91241455078125, -2.758544921875, -2.60467529296875, -2.4508056640625, -2.29693603515625, -2.14306640625, -1.98919677734375, -1.8353271484375, -1.68145751953125, -1.527587890625, -1.37371826171875, -1.2198486328125, -1.06597900390625, -0.912109375, -0.75823974609375, -0.6043701171875, -0.45050048828125, -0.296630859375, -0.14276123046875, 0.0111083984375, 0.16497802734375, 0.31884765625, 0.47271728515625, 0.6265869140625, 0.78045654296875, 0.934326171875, 1.08819580078125, 1.2420654296875, 1.39593505859375, 1.5498046875, 1.70367431640625, 1.8575439453125, 2.01141357421875, 2.165283203125, 2.31915283203125, 2.4730224609375, 2.62689208984375, 2.78076171875, 2.93463134765625, 3.0885009765625, 3.24237060546875, 3.396240234375, 3.55010986328125, 3.7039794921875, 3.85784912109375, 4.01171875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 5.0, 11.0, 18.0, 19.0, 24.0, 25.0, 43.0, 72.0, 90.0, 124.0, 175.0, 303.0, 459.0, 728.0, 1304.0, 2732.0, 5883.0, 16169.0, 94510.0, 4011465.0, 40173.0, 10691.0, 4275.0, 2058.0, 1082.0, 665.0, 375.0, 252.0, 160.0, 102.0, 91.0, 54.0, 30.0, 21.0, 23.0, 15.0, 15.0, 11.0, 5.0, 5.0, 5.0, 6.0, 1.0, 2.0, 2.0], "bins": [-17.625, -17.1649169921875, -16.704833984375, -16.2447509765625, -15.78466796875, -15.3245849609375, -14.864501953125, -14.4044189453125, -13.9443359375, -13.4842529296875, -13.024169921875, -12.5640869140625, -12.10400390625, -11.6439208984375, -11.183837890625, -10.7237548828125, -10.263671875, -9.8035888671875, -9.343505859375, -8.8834228515625, -8.42333984375, -7.9632568359375, -7.503173828125, -7.0430908203125, -6.5830078125, -6.1229248046875, -5.662841796875, -5.2027587890625, -4.74267578125, -4.2825927734375, -3.822509765625, -3.3624267578125, -2.90234375, -2.4422607421875, -1.982177734375, -1.5220947265625, -1.06201171875, -0.6019287109375, -0.141845703125, 0.3182373046875, 0.7783203125, 1.2384033203125, 1.698486328125, 2.1585693359375, 2.61865234375, 3.0787353515625, 3.538818359375, 3.9989013671875, 4.458984375, 4.9190673828125, 5.379150390625, 5.8392333984375, 6.29931640625, 6.7593994140625, 7.219482421875, 7.6795654296875, 8.1396484375, 8.5997314453125, 9.059814453125, 9.5198974609375, 9.97998046875, 10.4400634765625, 10.900146484375, 11.3602294921875, 11.8203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 7.0, 6.0, 7.0, 17.0, 18.0, 32.0, 69.0, 2808.0, 988.0, 71.0, 20.0, 7.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.21295166015625, -4.0509033203125, -3.88885498046875, -3.726806640625, -3.56475830078125, -3.4027099609375, -3.24066162109375, -3.07861328125, -2.91656494140625, -2.7545166015625, -2.59246826171875, -2.430419921875, -2.26837158203125, -2.1063232421875, -1.94427490234375, -1.7822265625, -1.62017822265625, -1.4581298828125, -1.29608154296875, -1.134033203125, -0.97198486328125, -0.8099365234375, -0.64788818359375, -0.48583984375, -0.32379150390625, -0.1617431640625, 0.00030517578125, 0.162353515625, 0.32440185546875, 0.4864501953125, 0.64849853515625, 0.810546875, 0.97259521484375, 1.1346435546875, 1.29669189453125, 1.458740234375, 1.62078857421875, 1.7828369140625, 1.94488525390625, 2.10693359375, 2.26898193359375, 2.4310302734375, 2.59307861328125, 2.755126953125, 2.91717529296875, 3.0792236328125, 3.24127197265625, 3.4033203125, 3.56536865234375, 3.7274169921875, 3.88946533203125, 4.051513671875, 4.21356201171875, 4.3756103515625, 4.53765869140625, 4.69970703125, 4.86175537109375, 5.0238037109375, 5.18585205078125, 5.347900390625, 5.50994873046875, 5.6719970703125, 5.83404541015625, 5.99609375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 27.0, 299.0, 542.0, 127.0, 12.0], "bins": [-153.5853729248047, -151.08799743652344, -148.5906219482422, -146.09324645996094, -143.5958709716797, -141.09849548339844, -138.6011199951172, -136.10374450683594, -133.6063690185547, -131.10899353027344, -128.6116180419922, -126.11424255371094, -123.61686706542969, -121.11949157714844, -118.62211608886719, -116.12474060058594, -113.62737274169922, -111.12999725341797, -108.63262176513672, -106.13524627685547, -103.63787078857422, -101.14049530029297, -98.64311981201172, -96.145751953125, -93.64837646484375, -91.1510009765625, -88.65362548828125, -86.15625, -83.65887451171875, -81.1614990234375, -78.66412353515625, -76.166748046875, -73.66938018798828, -71.17200469970703, -68.67462921142578, -66.17725372314453, -63.67987823486328, -61.18250274658203, -58.68513107299805, -56.1877555847168, -53.69037628173828, -51.19300079345703, -48.69562530517578, -46.19824981689453, -43.70087432861328, -41.20349884033203, -38.70612716674805, -36.2087516784668, -33.71138000488281, -31.214004516601562, -28.716629028320312, -26.219255447387695, -23.721879959106445, -21.224504470825195, -18.727130889892578, -16.229755401611328, -13.732378005981445, -11.235002517700195, -8.737627983093262, -6.24025297164917, -3.742877960205078, -1.2455024719238281, 1.2518720626831055, 3.749246597290039, 6.246622085571289]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 8.0, 7.0, 6.0, 14.0, 12.0, 14.0, 18.0, 25.0, 31.0, 47.0, 47.0, 36.0, 54.0, 59.0, 50.0, 61.0, 52.0, 51.0, 48.0, 51.0, 46.0, 37.0, 42.0, 31.0, 26.0, 29.0, 25.0, 22.0, 13.0, 15.0, 4.0, 9.0, 8.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.21942710876465, -15.796246528625488, -15.373066902160645, -14.949886322021484, -14.526705741882324, -14.103525161743164, -13.68034553527832, -13.25716495513916, -12.833984375, -12.41080379486084, -11.987624168395996, -11.564443588256836, -11.141263008117676, -10.718082427978516, -10.294902801513672, -9.871722221374512, -9.448542594909668, -9.025362014770508, -8.602182388305664, -8.179001808166504, -7.755821228027344, -7.332641124725342, -6.90946102142334, -6.48628044128418, -6.063100337982178, -5.639920234680176, -5.216739654541016, -4.793559551239014, -4.370379447937012, -3.9471988677978516, -3.5240187644958496, -3.1008384227752686, -2.677657127380371, -2.25447678565979, -1.8312965631484985, -1.408116340637207, -0.984935998916626, -0.5617556571960449, -0.13857555389404297, 0.2846047878265381, 0.7077851295471191, 1.1309654712677002, 1.5541456937789917, 1.9773259162902832, 2.4005062580108643, 2.8236865997314453, 3.2468667030334473, 3.6700470447540283, 4.093227386474609, 4.516407489776611, 4.9395880699157715, 5.362768173217773, 5.785948753356934, 6.2091288566589355, 6.6323089599609375, 7.055489540100098, 7.4786696434021, 7.901849746704102, 8.325030326843262, 8.748210906982422, 9.171390533447266, 9.594571113586426, 10.017751693725586, 10.44093132019043, 10.86411190032959]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 11.0, 4.0, 18.0, 23.0, 33.0, 54.0, 102.0, 174.0, 324.0, 596.0, 1194.0, 2745.0, 7245.0, 21195.0, 75245.0, 313133.0, 452466.0, 123871.0, 32523.0, 10255.0, 4010.0, 1578.0, 791.0, 400.0, 221.0, 131.0, 67.0, 47.0, 34.0, 23.0, 10.0, 12.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5546875, -7.254638671875, -6.95458984375, -6.654541015625, -6.3544921875, -6.054443359375, -5.75439453125, -5.454345703125, -5.154296875, -4.854248046875, -4.55419921875, -4.254150390625, -3.9541015625, -3.654052734375, -3.35400390625, -3.053955078125, -2.75390625, -2.453857421875, -2.15380859375, -1.853759765625, -1.5537109375, -1.253662109375, -0.95361328125, -0.653564453125, -0.353515625, -0.053466796875, 0.24658203125, 0.546630859375, 0.8466796875, 1.146728515625, 1.44677734375, 1.746826171875, 2.046875, 2.346923828125, 2.64697265625, 2.947021484375, 3.2470703125, 3.547119140625, 3.84716796875, 4.147216796875, 4.447265625, 4.747314453125, 5.04736328125, 5.347412109375, 5.6474609375, 5.947509765625, 6.24755859375, 6.547607421875, 6.84765625, 7.147705078125, 7.44775390625, 7.747802734375, 8.0478515625, 8.347900390625, 8.64794921875, 8.947998046875, 9.248046875, 9.548095703125, 9.84814453125, 10.148193359375, 10.4482421875, 10.748291015625, 11.04833984375, 11.348388671875, 11.6484375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 4.0, 7.0, 11.0, 12.0, 19.0, 13.0, 20.0, 29.0, 24.0, 43.0, 45.0, 59.0, 64.0, 86.0, 70.0, 74.0, 71.0, 65.0, 59.0, 50.0, 37.0, 31.0, 26.0, 14.0, 11.0, 13.0, 10.0, 7.0, 8.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-6.09375, -5.93218994140625, -5.7706298828125, -5.60906982421875, -5.447509765625, -5.28594970703125, -5.1243896484375, -4.96282958984375, -4.80126953125, -4.63970947265625, -4.4781494140625, -4.31658935546875, -4.155029296875, -3.99346923828125, -3.8319091796875, -3.67034912109375, -3.5087890625, -3.34722900390625, -3.1856689453125, -3.02410888671875, -2.862548828125, -2.70098876953125, -2.5394287109375, -2.37786865234375, -2.21630859375, -2.05474853515625, -1.8931884765625, -1.73162841796875, -1.570068359375, -1.40850830078125, -1.2469482421875, -1.08538818359375, -0.923828125, -0.76226806640625, -0.6007080078125, -0.43914794921875, -0.277587890625, -0.11602783203125, 0.0455322265625, 0.20709228515625, 0.36865234375, 0.53021240234375, 0.6917724609375, 0.85333251953125, 1.014892578125, 1.17645263671875, 1.3380126953125, 1.49957275390625, 1.6611328125, 1.82269287109375, 1.9842529296875, 2.14581298828125, 2.307373046875, 2.46893310546875, 2.6304931640625, 2.79205322265625, 2.95361328125, 3.11517333984375, 3.2767333984375, 3.43829345703125, 3.599853515625, 3.76141357421875, 3.9229736328125, 4.08453369140625, 4.24609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 7.0, 12.0, 11.0, 29.0, 26.0, 59.0, 93.0, 212.0, 576.0, 2016.0, 12683.0, 243210.0, 750061.0, 34099.0, 3864.0, 910.0, 351.0, 137.0, 66.0, 39.0, 34.0, 15.0, 11.0, 5.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.328125, -30.548828125, -29.76953125, -28.990234375, -28.2109375, -27.431640625, -26.65234375, -25.873046875, -25.09375, -24.314453125, -23.53515625, -22.755859375, -21.9765625, -21.197265625, -20.41796875, -19.638671875, -18.859375, -18.080078125, -17.30078125, -16.521484375, -15.7421875, -14.962890625, -14.18359375, -13.404296875, -12.625, -11.845703125, -11.06640625, -10.287109375, -9.5078125, -8.728515625, -7.94921875, -7.169921875, -6.390625, -5.611328125, -4.83203125, -4.052734375, -3.2734375, -2.494140625, -1.71484375, -0.935546875, -0.15625, 0.623046875, 1.40234375, 2.181640625, 2.9609375, 3.740234375, 4.51953125, 5.298828125, 6.078125, 6.857421875, 7.63671875, 8.416015625, 9.1953125, 9.974609375, 10.75390625, 11.533203125, 12.3125, 13.091796875, 13.87109375, 14.650390625, 15.4296875, 16.208984375, 16.98828125, 17.767578125, 18.546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 2.0, 4.0, 3.0, 3.0, 4.0, 14.0, 4.0, 11.0, 17.0, 14.0, 23.0, 25.0, 27.0, 32.0, 45.0, 63.0, 49.0, 52.0, 56.0, 71.0, 62.0, 61.0, 54.0, 33.0, 49.0, 37.0, 43.0, 28.0, 24.0, 25.0, 19.0, 15.0, 6.0, 5.0, 8.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.125, -20.380859375, -19.63671875, -18.892578125, -18.1484375, -17.404296875, -16.66015625, -15.916015625, -15.171875, -14.427734375, -13.68359375, -12.939453125, -12.1953125, -11.451171875, -10.70703125, -9.962890625, -9.21875, -8.474609375, -7.73046875, -6.986328125, -6.2421875, -5.498046875, -4.75390625, -4.009765625, -3.265625, -2.521484375, -1.77734375, -1.033203125, -0.2890625, 0.455078125, 1.19921875, 1.943359375, 2.6875, 3.431640625, 4.17578125, 4.919921875, 5.6640625, 6.408203125, 7.15234375, 7.896484375, 8.640625, 9.384765625, 10.12890625, 10.873046875, 11.6171875, 12.361328125, 13.10546875, 13.849609375, 14.59375, 15.337890625, 16.08203125, 16.826171875, 17.5703125, 18.314453125, 19.05859375, 19.802734375, 20.546875, 21.291015625, 22.03515625, 22.779296875, 23.5234375, 24.267578125, 25.01171875, 25.755859375, 26.5]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 28.0, 45.0, 101.0, 300.0, 1114.0, 11519.0, 895618.0, 135531.0, 3401.0, 585.0, 162.0, 74.0, 28.0, 17.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.703125, -23.1617431640625, -22.620361328125, -22.0789794921875, -21.53759765625, -20.9962158203125, -20.454833984375, -19.9134521484375, -19.3720703125, -18.8306884765625, -18.289306640625, -17.7479248046875, -17.20654296875, -16.6651611328125, -16.123779296875, -15.5823974609375, -15.041015625, -14.4996337890625, -13.958251953125, -13.4168701171875, -12.87548828125, -12.3341064453125, -11.792724609375, -11.2513427734375, -10.7099609375, -10.1685791015625, -9.627197265625, -9.0858154296875, -8.54443359375, -8.0030517578125, -7.461669921875, -6.9202880859375, -6.37890625, -5.8375244140625, -5.296142578125, -4.7547607421875, -4.21337890625, -3.6719970703125, -3.130615234375, -2.5892333984375, -2.0478515625, -1.5064697265625, -0.965087890625, -0.4237060546875, 0.11767578125, 0.6590576171875, 1.200439453125, 1.7418212890625, 2.283203125, 2.8245849609375, 3.365966796875, 3.9073486328125, 4.44873046875, 4.9901123046875, 5.531494140625, 6.0728759765625, 6.6142578125, 7.1556396484375, 7.697021484375, 8.2384033203125, 8.77978515625, 9.3211669921875, 9.862548828125, 10.4039306640625, 10.9453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 8.0, 3.0, 12.0, 9.0, 22.0, 27.0, 42.0, 52.0, 87.0, 105.0, 131.0, 113.0, 121.0, 85.0, 50.0, 40.0, 27.0, 20.0, 12.0, 7.0, 5.0, 4.0, 2.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008401870727539062, -0.0008076578378677368, -0.0007751286029815674, -0.000742599368095398, -0.0007100701332092285, -0.0006775408983230591, -0.0006450116634368896, -0.0006124824285507202, -0.0005799531936645508, -0.0005474239587783813, -0.0005148947238922119, -0.0004823654890060425, -0.00044983625411987305, -0.0004173070192337036, -0.0003847777843475342, -0.00035224854946136475, -0.0003197193145751953, -0.0002871900796890259, -0.00025466084480285645, -0.000222131609916687, -0.00018960237503051758, -0.00015707314014434814, -0.0001245439052581787, -9.201467037200928e-05, -5.9485435485839844e-05, -2.695620059967041e-05, 5.5730342864990234e-06, 3.810226917266846e-05, 7.063150405883789e-05, 0.00010316073894500732, 0.00013568997383117676, 0.0001682192087173462, 0.00020074844360351562, 0.00023327767848968506, 0.0002658069133758545, 0.0002983361482620239, 0.00033086538314819336, 0.0003633946180343628, 0.0003959238529205322, 0.00042845308780670166, 0.0004609823226928711, 0.0004935115575790405, 0.00052604079246521, 0.0005585700273513794, 0.0005910992622375488, 0.0006236284971237183, 0.0006561577320098877, 0.0006886869668960571, 0.0007212162017822266, 0.000753745436668396, 0.0007862746715545654, 0.0008188039064407349, 0.0008513331413269043, 0.0008838623762130737, 0.0009163916110992432, 0.0009489208459854126, 0.000981450080871582, 0.0010139793157577515, 0.001046508550643921, 0.0010790377855300903, 0.0011115670204162598, 0.0011440962553024292, 0.0011766254901885986, 0.001209154725074768, 0.0012416839599609375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 18.0, 32.0, 105.0, 240.0, 1156.0, 38971.0, 995082.0, 11924.0, 716.0, 195.0, 58.0, 32.0, 21.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.86181640625, -19.2080078125, -18.55419921875, -17.900390625, -17.24658203125, -16.5927734375, -15.93896484375, -15.28515625, -14.63134765625, -13.9775390625, -13.32373046875, -12.669921875, -12.01611328125, -11.3623046875, -10.70849609375, -10.0546875, -9.40087890625, -8.7470703125, -8.09326171875, -7.439453125, -6.78564453125, -6.1318359375, -5.47802734375, -4.82421875, -4.17041015625, -3.5166015625, -2.86279296875, -2.208984375, -1.55517578125, -0.9013671875, -0.24755859375, 0.40625, 1.06005859375, 1.7138671875, 2.36767578125, 3.021484375, 3.67529296875, 4.3291015625, 4.98291015625, 5.63671875, 6.29052734375, 6.9443359375, 7.59814453125, 8.251953125, 8.90576171875, 9.5595703125, 10.21337890625, 10.8671875, 11.52099609375, 12.1748046875, 12.82861328125, 13.482421875, 14.13623046875, 14.7900390625, 15.44384765625, 16.09765625, 16.75146484375, 17.4052734375, 18.05908203125, 18.712890625, 19.36669921875, 20.0205078125, 20.67431640625, 21.328125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 11.0, 13.0, 37.0, 62.0, 97.0, 122.0, 150.0, 154.0, 156.0, 88.0, 39.0, 31.0, 16.0, 7.0, 7.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.45098876953125, -5.1090087890625, -4.76702880859375, -4.425048828125, -4.08306884765625, -3.7410888671875, -3.39910888671875, -3.05712890625, -2.71514892578125, -2.3731689453125, -2.03118896484375, -1.689208984375, -1.34722900390625, -1.0052490234375, -0.66326904296875, -0.3212890625, 0.02069091796875, 0.3626708984375, 0.70465087890625, 1.046630859375, 1.38861083984375, 1.7305908203125, 2.07257080078125, 2.41455078125, 2.75653076171875, 3.0985107421875, 3.44049072265625, 3.782470703125, 4.12445068359375, 4.4664306640625, 4.80841064453125, 5.150390625, 5.49237060546875, 5.8343505859375, 6.17633056640625, 6.518310546875, 6.86029052734375, 7.2022705078125, 7.54425048828125, 7.88623046875, 8.22821044921875, 8.5701904296875, 8.91217041015625, 9.254150390625, 9.59613037109375, 9.9381103515625, 10.28009033203125, 10.6220703125, 10.96405029296875, 11.3060302734375, 11.64801025390625, 11.989990234375, 12.33197021484375, 12.6739501953125, 13.01593017578125, 13.35791015625, 13.69989013671875, 14.0418701171875, 14.38385009765625, 14.725830078125, 15.06781005859375, 15.4097900390625, 15.75177001953125, 16.09375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 11.0, 41.0, 213.0, 431.0, 238.0, 53.0, 19.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-382.2702941894531, -370.532470703125, -358.79461669921875, -347.0567932128906, -335.3189697265625, -323.58111572265625, -311.8432922363281, -300.10546875, -288.36761474609375, -276.6297912597656, -264.8919372558594, -253.15411376953125, -241.41627502441406, -229.67843627929688, -217.94061279296875, -206.20277404785156, -194.46493530273438, -182.7270965576172, -170.9892578125, -159.25143432617188, -147.5135955810547, -135.7757568359375, -124.03792572021484, -112.30009460449219, -100.562255859375, -88.82441711425781, -77.08658599853516, -65.3487548828125, -53.61091613769531, -41.87308120727539, -30.13524627685547, -18.397415161132812, -6.6595458984375, 5.078289031982422, 16.816123962402344, 28.553958892822266, 40.29179382324219, 52.02962875366211, 63.76746368408203, 75.50529479980469, 87.24313354492188, 98.98097229003906, 110.71880340576172, 122.45663452148438, 134.19447326660156, 145.93231201171875, 157.67013549804688, 169.40797424316406, 181.14581298828125, 192.88365173339844, 204.62149047851562, 216.35931396484375, 228.09715270996094, 239.83499145507812, 251.57281494140625, 263.3106689453125, 275.0484924316406, 286.78631591796875, 298.524169921875, 310.2619934082031, 321.99981689453125, 333.7376708984375, 345.4754943847656, 357.21331787109375, 368.951171875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 1.0, 4.0, 11.0, 6.0, 8.0, 15.0, 11.0, 22.0, 22.0, 44.0, 28.0, 24.0, 32.0, 24.0, 41.0, 34.0, 33.0, 43.0, 52.0, 43.0, 49.0, 54.0, 52.0, 42.0, 41.0, 36.0, 25.0, 21.0, 24.0, 36.0, 18.0, 17.0, 18.0, 11.0, 8.0, 7.0, 9.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-76.63186645507812, -73.97627258300781, -71.32067108154297, -68.66506958007812, -66.00947570800781, -63.353878021240234, -60.698280334472656, -58.04268264770508, -55.3870849609375, -52.73148727416992, -50.075889587402344, -47.420291900634766, -44.76469421386719, -42.10909652709961, -39.45349884033203, -36.79790115356445, -34.142303466796875, -31.486705780029297, -28.83110809326172, -26.17551040649414, -23.519912719726562, -20.864315032958984, -18.208717346191406, -15.553119659423828, -12.89752197265625, -10.241924285888672, -7.586326599121094, -4.930728912353516, -2.2751312255859375, 0.3804664611816406, 3.0360641479492188, 5.691661834716797, 8.347259521484375, 11.002857208251953, 13.658454895019531, 16.31405258178711, 18.969650268554688, 21.625247955322266, 24.280845642089844, 26.936443328857422, 29.592041015625, 32.24763870239258, 34.903236389160156, 37.558834075927734, 40.21443176269531, 42.87002944946289, 45.52562713623047, 48.18122482299805, 50.836822509765625, 53.4924201965332, 56.14801788330078, 58.80361557006836, 61.45921325683594, 64.11480712890625, 66.7704086303711, 69.42601013183594, 72.08160400390625, 74.73719787597656, 77.3927993774414, 80.04840087890625, 82.70399475097656, 85.35958862304688, 88.01519012451172, 90.67079162597656, 93.32638549804688]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 5.0, 3.0, 9.0, 10.0, 17.0, 34.0, 34.0, 44.0, 93.0, 202.0, 418.0, 1419.0, 8226.0, 4171911.0, 9394.0, 1521.0, 495.0, 194.0, 106.0, 63.0, 33.0, 9.0, 9.0, 8.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0], "bins": [-51.59375, -50.38037109375, -49.1669921875, -47.95361328125, -46.740234375, -45.52685546875, -44.3134765625, -43.10009765625, -41.88671875, -40.67333984375, -39.4599609375, -38.24658203125, -37.033203125, -35.81982421875, -34.6064453125, -33.39306640625, -32.1796875, -30.96630859375, -29.7529296875, -28.53955078125, -27.326171875, -26.11279296875, -24.8994140625, -23.68603515625, -22.47265625, -21.25927734375, -20.0458984375, -18.83251953125, -17.619140625, -16.40576171875, -15.1923828125, -13.97900390625, -12.765625, -11.55224609375, -10.3388671875, -9.12548828125, -7.912109375, -6.69873046875, -5.4853515625, -4.27197265625, -3.05859375, -1.84521484375, -0.6318359375, 0.58154296875, 1.794921875, 3.00830078125, 4.2216796875, 5.43505859375, 6.6484375, 7.86181640625, 9.0751953125, 10.28857421875, 11.501953125, 12.71533203125, 13.9287109375, 15.14208984375, 16.35546875, 17.56884765625, 18.7822265625, 19.99560546875, 21.208984375, 22.42236328125, 23.6357421875, 24.84912109375, 26.0625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 10.0, 18.0, 10.0, 19.0, 20.0, 25.0, 34.0, 42.0, 64.0, 96.0, 87.0, 97.0, 81.0, 95.0, 68.0, 51.0, 42.0, 47.0, 28.0, 18.0, 21.0, 6.0, 5.0, 3.0, 5.0, 1.0, 2.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.81640625, -7.59197998046875, -7.3675537109375, -7.14312744140625, -6.918701171875, -6.69427490234375, -6.4698486328125, -6.24542236328125, -6.02099609375, -5.79656982421875, -5.5721435546875, -5.34771728515625, -5.123291015625, -4.89886474609375, -4.6744384765625, -4.45001220703125, -4.2255859375, -4.00115966796875, -3.7767333984375, -3.55230712890625, -3.327880859375, -3.10345458984375, -2.8790283203125, -2.65460205078125, -2.43017578125, -2.20574951171875, -1.9813232421875, -1.75689697265625, -1.532470703125, -1.30804443359375, -1.0836181640625, -0.85919189453125, -0.634765625, -0.41033935546875, -0.1859130859375, 0.03851318359375, 0.262939453125, 0.48736572265625, 0.7117919921875, 0.93621826171875, 1.16064453125, 1.38507080078125, 1.6094970703125, 1.83392333984375, 2.058349609375, 2.28277587890625, 2.5072021484375, 2.73162841796875, 2.9560546875, 3.18048095703125, 3.4049072265625, 3.62933349609375, 3.853759765625, 4.07818603515625, 4.3026123046875, 4.52703857421875, 4.75146484375, 4.97589111328125, 5.2003173828125, 5.42474365234375, 5.649169921875, 5.87359619140625, 6.0980224609375, 6.32244873046875, 6.546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 9.0, 8.0, 17.0, 17.0, 25.0, 27.0, 42.0, 77.0, 86.0, 100.0, 178.0, 248.0, 375.0, 563.0, 996.0, 1955.0, 4891.0, 19663.0, 4111820.0, 40541.0, 6982.0, 2471.0, 1235.0, 645.0, 401.0, 264.0, 179.0, 129.0, 89.0, 63.0, 51.0, 36.0, 25.0, 23.0, 14.0, 11.0, 5.0, 8.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0], "bins": [-26.484375, -25.79931640625, -25.1142578125, -24.42919921875, -23.744140625, -23.05908203125, -22.3740234375, -21.68896484375, -21.00390625, -20.31884765625, -19.6337890625, -18.94873046875, -18.263671875, -17.57861328125, -16.8935546875, -16.20849609375, -15.5234375, -14.83837890625, -14.1533203125, -13.46826171875, -12.783203125, -12.09814453125, -11.4130859375, -10.72802734375, -10.04296875, -9.35791015625, -8.6728515625, -7.98779296875, -7.302734375, -6.61767578125, -5.9326171875, -5.24755859375, -4.5625, -3.87744140625, -3.1923828125, -2.50732421875, -1.822265625, -1.13720703125, -0.4521484375, 0.23291015625, 0.91796875, 1.60302734375, 2.2880859375, 2.97314453125, 3.658203125, 4.34326171875, 5.0283203125, 5.71337890625, 6.3984375, 7.08349609375, 7.7685546875, 8.45361328125, 9.138671875, 9.82373046875, 10.5087890625, 11.19384765625, 11.87890625, 12.56396484375, 13.2490234375, 13.93408203125, 14.619140625, 15.30419921875, 15.9892578125, 16.67431640625, 17.359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 12.0, 13.0, 36.0, 101.0, 3813.0, 49.0, 11.0, 7.0, 9.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44921875, -5.26910400390625, -5.0889892578125, -4.90887451171875, -4.728759765625, -4.54864501953125, -4.3685302734375, -4.18841552734375, -4.00830078125, -3.82818603515625, -3.6480712890625, -3.46795654296875, -3.287841796875, -3.10772705078125, -2.9276123046875, -2.74749755859375, -2.5673828125, -2.38726806640625, -2.2071533203125, -2.02703857421875, -1.846923828125, -1.66680908203125, -1.4866943359375, -1.30657958984375, -1.12646484375, -0.94635009765625, -0.7662353515625, -0.58612060546875, -0.406005859375, -0.22589111328125, -0.0457763671875, 0.13433837890625, 0.314453125, 0.49456787109375, 0.6746826171875, 0.85479736328125, 1.034912109375, 1.21502685546875, 1.3951416015625, 1.57525634765625, 1.75537109375, 1.93548583984375, 2.1156005859375, 2.29571533203125, 2.475830078125, 2.65594482421875, 2.8360595703125, 3.01617431640625, 3.1962890625, 3.37640380859375, 3.5565185546875, 3.73663330078125, 3.916748046875, 4.09686279296875, 4.2769775390625, 4.45709228515625, 4.63720703125, 4.81732177734375, 4.9974365234375, 5.17755126953125, 5.357666015625, 5.53778076171875, 5.7178955078125, 5.89801025390625, 6.078125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 12.0, 18.0, 21.0, 46.0, 106.0, 201.0, 240.0, 186.0, 91.0, 45.0, 20.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.456344604492188, -26.650529861450195, -25.844715118408203, -25.03890037536621, -24.23308563232422, -23.427270889282227, -22.621456146240234, -21.815643310546875, -21.00982666015625, -20.204011917114258, -19.398197174072266, -18.592382431030273, -17.78656768798828, -16.98075294494629, -16.174938201904297, -15.369124412536621, -14.563310623168945, -13.757495880126953, -12.951681137084961, -12.145866394042969, -11.340051651000977, -10.534236907958984, -9.728423118591309, -8.922608375549316, -8.116793632507324, -7.310978889465332, -6.50516414642334, -5.699349880218506, -4.893535137176514, -4.0877203941345215, -3.2819061279296875, -2.4760913848876953, -1.6702747344970703, -0.8644601106643677, -0.05864548683166504, 0.747169017791748, 1.5529837608337402, 2.3587985038757324, 3.1646127700805664, 3.9704275131225586, 4.776242256164551, 5.582056999206543, 6.387871742248535, 7.193686008453369, 7.999500751495361, 8.805315017700195, 9.611129760742188, 10.41694450378418, 11.222759246826172, 12.028573989868164, 12.834388732910156, 13.640203475952148, 14.44601821899414, 15.251832962036133, 16.057647705078125, 16.863460540771484, 17.66927719116211, 18.4750919342041, 19.280906677246094, 20.086721420288086, 20.892536163330078, 21.69835090637207, 22.504165649414062, 23.309978485107422, 24.115793228149414]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 8.0, 5.0, 13.0, 15.0, 24.0, 20.0, 22.0, 27.0, 30.0, 36.0, 41.0, 36.0, 28.0, 45.0, 36.0, 41.0, 45.0, 37.0, 45.0, 51.0, 36.0, 43.0, 34.0, 32.0, 24.0, 25.0, 26.0, 31.0, 35.0, 20.0, 22.0, 21.0, 5.0, 8.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.653335571289062, -10.34294605255127, -10.032556533813477, -9.72216796875, -9.411778450012207, -9.101388931274414, -8.790999412536621, -8.480609893798828, -8.170221328735352, -7.859831809997559, -7.549442768096924, -7.239053249359131, -6.928664207458496, -6.618274688720703, -6.30788516998291, -5.997495651245117, -5.687106132507324, -5.376716613769531, -5.0663275718688965, -4.7559380531311035, -4.445549011230469, -4.135159492492676, -3.824769973754883, -3.514380693435669, -3.203991413116455, -2.893602132797241, -2.5832128524780273, -2.2728233337402344, -1.9624340534210205, -1.6520447731018066, -1.3416553735733032, -1.0312659740447998, -0.7208776473999023, -0.4104883074760437, -0.10009896755218506, 0.21029037237167358, 0.5206797122955322, 0.8310689926147461, 1.1414583921432495, 1.451847791671753, 1.7622370719909668, 2.0726263523101807, 2.3830156326293945, 2.6934051513671875, 3.0037944316864014, 3.3141837120056152, 3.624573230743408, 3.934962511062622, 4.245351791381836, 4.555741310119629, 4.866130352020264, 5.176519870758057, 5.486908912658691, 5.797298431396484, 6.107687950134277, 6.41807746887207, 6.728466510772705, 7.038856029510498, 7.349245071411133, 7.659634590148926, 7.970024108886719, 8.280412673950195, 8.590802192687988, 8.901191711425781, 9.211581230163574]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 3.0, 6.0, 12.0, 15.0, 16.0, 25.0, 48.0, 67.0, 102.0, 215.0, 350.0, 698.0, 1532.0, 4344.0, 14154.0, 65045.0, 380407.0, 470764.0, 84494.0, 17709.0, 4949.0, 1860.0, 801.0, 369.0, 198.0, 151.0, 77.0, 43.0, 24.0, 20.0, 23.0, 11.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4609375, -12.046630859375, -11.63232421875, -11.218017578125, -10.8037109375, -10.389404296875, -9.97509765625, -9.560791015625, -9.146484375, -8.732177734375, -8.31787109375, -7.903564453125, -7.4892578125, -7.074951171875, -6.66064453125, -6.246337890625, -5.83203125, -5.417724609375, -5.00341796875, -4.589111328125, -4.1748046875, -3.760498046875, -3.34619140625, -2.931884765625, -2.517578125, -2.103271484375, -1.68896484375, -1.274658203125, -0.8603515625, -0.446044921875, -0.03173828125, 0.382568359375, 0.796875, 1.211181640625, 1.62548828125, 2.039794921875, 2.4541015625, 2.868408203125, 3.28271484375, 3.697021484375, 4.111328125, 4.525634765625, 4.93994140625, 5.354248046875, 5.7685546875, 6.182861328125, 6.59716796875, 7.011474609375, 7.42578125, 7.840087890625, 8.25439453125, 8.668701171875, 9.0830078125, 9.497314453125, 9.91162109375, 10.325927734375, 10.740234375, 11.154541015625, 11.56884765625, 11.983154296875, 12.3974609375, 12.811767578125, 13.22607421875, 13.640380859375, 14.0546875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 9.0, 9.0, 15.0, 9.0, 15.0, 18.0, 27.0, 42.0, 41.0, 43.0, 54.0, 74.0, 76.0, 79.0, 84.0, 59.0, 72.0, 53.0, 47.0, 43.0, 34.0, 25.0, 16.0, 13.0, 11.0, 11.0, 8.0, 3.0, 3.0, 0.0, 2.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.296875, -8.083251953125, -7.86962890625, -7.656005859375, -7.4423828125, -7.228759765625, -7.01513671875, -6.801513671875, -6.587890625, -6.374267578125, -6.16064453125, -5.947021484375, -5.7333984375, -5.519775390625, -5.30615234375, -5.092529296875, -4.87890625, -4.665283203125, -4.45166015625, -4.238037109375, -4.0244140625, -3.810791015625, -3.59716796875, -3.383544921875, -3.169921875, -2.956298828125, -2.74267578125, -2.529052734375, -2.3154296875, -2.101806640625, -1.88818359375, -1.674560546875, -1.4609375, -1.247314453125, -1.03369140625, -0.820068359375, -0.6064453125, -0.392822265625, -0.17919921875, 0.034423828125, 0.248046875, 0.461669921875, 0.67529296875, 0.888916015625, 1.1025390625, 1.316162109375, 1.52978515625, 1.743408203125, 1.95703125, 2.170654296875, 2.38427734375, 2.597900390625, 2.8115234375, 3.025146484375, 3.23876953125, 3.452392578125, 3.666015625, 3.879638671875, 4.09326171875, 4.306884765625, 4.5205078125, 4.734130859375, 4.94775390625, 5.161376953125, 5.375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 9.0, 14.0, 25.0, 30.0, 40.0, 57.0, 74.0, 131.0, 202.0, 384.0, 905.0, 2743.0, 13602.0, 138337.0, 760018.0, 115733.0, 12051.0, 2497.0, 801.0, 331.0, 203.0, 103.0, 79.0, 61.0, 35.0, 20.0, 17.0, 7.0, 11.0, 12.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.734375, -16.146484375, -15.55859375, -14.970703125, -14.3828125, -13.794921875, -13.20703125, -12.619140625, -12.03125, -11.443359375, -10.85546875, -10.267578125, -9.6796875, -9.091796875, -8.50390625, -7.916015625, -7.328125, -6.740234375, -6.15234375, -5.564453125, -4.9765625, -4.388671875, -3.80078125, -3.212890625, -2.625, -2.037109375, -1.44921875, -0.861328125, -0.2734375, 0.314453125, 0.90234375, 1.490234375, 2.078125, 2.666015625, 3.25390625, 3.841796875, 4.4296875, 5.017578125, 5.60546875, 6.193359375, 6.78125, 7.369140625, 7.95703125, 8.544921875, 9.1328125, 9.720703125, 10.30859375, 10.896484375, 11.484375, 12.072265625, 12.66015625, 13.248046875, 13.8359375, 14.423828125, 15.01171875, 15.599609375, 16.1875, 16.775390625, 17.36328125, 17.951171875, 18.5390625, 19.126953125, 19.71484375, 20.302734375, 20.890625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 7.0, 11.0, 19.0, 27.0, 30.0, 42.0, 46.0, 65.0, 74.0, 74.0, 80.0, 79.0, 88.0, 87.0, 73.0, 69.0, 36.0, 35.0, 21.0, 15.0, 10.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.984375, -28.699951171875, -27.41552734375, -26.131103515625, -24.8466796875, -23.562255859375, -22.27783203125, -20.993408203125, -19.708984375, -18.424560546875, -17.14013671875, -15.855712890625, -14.5712890625, -13.286865234375, -12.00244140625, -10.718017578125, -9.43359375, -8.149169921875, -6.86474609375, -5.580322265625, -4.2958984375, -3.011474609375, -1.72705078125, -0.442626953125, 0.841796875, 2.126220703125, 3.41064453125, 4.695068359375, 5.9794921875, 7.263916015625, 8.54833984375, 9.832763671875, 11.1171875, 12.401611328125, 13.68603515625, 14.970458984375, 16.2548828125, 17.539306640625, 18.82373046875, 20.108154296875, 21.392578125, 22.677001953125, 23.96142578125, 25.245849609375, 26.5302734375, 27.814697265625, 29.09912109375, 30.383544921875, 31.66796875, 32.952392578125, 34.23681640625, 35.521240234375, 36.8056640625, 38.090087890625, 39.37451171875, 40.658935546875, 41.943359375, 43.227783203125, 44.51220703125, 45.796630859375, 47.0810546875, 48.365478515625, 49.64990234375, 50.934326171875, 52.21875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 1.0, 2.0, 6.0, 9.0, 7.0, 8.0, 15.0, 51.0, 101.0, 324.0, 2267.0, 143133.0, 897322.0, 4518.0, 525.0, 146.0, 55.0, 24.0, 15.0, 6.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.125, -18.42041015625, -17.7158203125, -17.01123046875, -16.306640625, -15.60205078125, -14.8974609375, -14.19287109375, -13.48828125, -12.78369140625, -12.0791015625, -11.37451171875, -10.669921875, -9.96533203125, -9.2607421875, -8.55615234375, -7.8515625, -7.14697265625, -6.4423828125, -5.73779296875, -5.033203125, -4.32861328125, -3.6240234375, -2.91943359375, -2.21484375, -1.51025390625, -0.8056640625, -0.10107421875, 0.603515625, 1.30810546875, 2.0126953125, 2.71728515625, 3.421875, 4.12646484375, 4.8310546875, 5.53564453125, 6.240234375, 6.94482421875, 7.6494140625, 8.35400390625, 9.05859375, 9.76318359375, 10.4677734375, 11.17236328125, 11.876953125, 12.58154296875, 13.2861328125, 13.99072265625, 14.6953125, 15.39990234375, 16.1044921875, 16.80908203125, 17.513671875, 18.21826171875, 18.9228515625, 19.62744140625, 20.33203125, 21.03662109375, 21.7412109375, 22.44580078125, 23.150390625, 23.85498046875, 24.5595703125, 25.26416015625, 25.96875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 9.0, 16.0, 21.0, 36.0, 63.0, 93.0, 148.0, 162.0, 147.0, 114.0, 65.0, 31.0, 29.0, 22.0, 15.0, 13.0, 3.0, 0.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0018987655639648438, -0.001857161521911621, -0.0018155574798583984, -0.0017739534378051758, -0.0017323493957519531, -0.0016907453536987305, -0.0016491413116455078, -0.0016075372695922852, -0.0015659332275390625, -0.0015243291854858398, -0.0014827251434326172, -0.0014411211013793945, -0.0013995170593261719, -0.0013579130172729492, -0.0013163089752197266, -0.001274704933166504, -0.0012331008911132812, -0.0011914968490600586, -0.001149892807006836, -0.0011082887649536133, -0.0010666847229003906, -0.001025080680847168, -0.0009834766387939453, -0.0009418725967407227, -0.0009002685546875, -0.0008586645126342773, -0.0008170604705810547, -0.000775456428527832, -0.0007338523864746094, -0.0006922483444213867, -0.0006506443023681641, -0.0006090402603149414, -0.0005674362182617188, -0.0005258321762084961, -0.00048422813415527344, -0.0004426240921020508, -0.0004010200500488281, -0.00035941600799560547, -0.0003178119659423828, -0.00027620792388916016, -0.0002346038818359375, -0.00019299983978271484, -0.0001513957977294922, -0.00010979175567626953, -6.818771362304688e-05, -2.658367156982422e-05, 1.5020370483398438e-05, 5.6624412536621094e-05, 9.822845458984375e-05, 0.0001398324966430664, 0.00018143653869628906, 0.00022304058074951172, 0.0002646446228027344, 0.00030624866485595703, 0.0003478527069091797, 0.00038945674896240234, 0.000431060791015625, 0.00047266483306884766, 0.0005142688751220703, 0.000555872917175293, 0.0005974769592285156, 0.0006390810012817383, 0.0006806850433349609, 0.0007222890853881836, 0.0007638931274414062]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 17.0, 28.0, 71.0, 112.0, 257.0, 729.0, 3766.0, 72610.0, 943925.0, 24024.0, 2108.0, 523.0, 187.0, 83.0, 38.0, 16.0, 18.0, 9.0, 6.0, 9.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.9375, -18.4796142578125, -18.021728515625, -17.5638427734375, -17.10595703125, -16.6480712890625, -16.190185546875, -15.7322998046875, -15.2744140625, -14.8165283203125, -14.358642578125, -13.9007568359375, -13.44287109375, -12.9849853515625, -12.527099609375, -12.0692138671875, -11.611328125, -11.1534423828125, -10.695556640625, -10.2376708984375, -9.77978515625, -9.3218994140625, -8.864013671875, -8.4061279296875, -7.9482421875, -7.4903564453125, -7.032470703125, -6.5745849609375, -6.11669921875, -5.6588134765625, -5.200927734375, -4.7430419921875, -4.28515625, -3.8272705078125, -3.369384765625, -2.9114990234375, -2.45361328125, -1.9957275390625, -1.537841796875, -1.0799560546875, -0.6220703125, -0.1641845703125, 0.293701171875, 0.7515869140625, 1.20947265625, 1.6673583984375, 2.125244140625, 2.5831298828125, 3.041015625, 3.4989013671875, 3.956787109375, 4.4146728515625, 4.87255859375, 5.3304443359375, 5.788330078125, 6.2462158203125, 6.7041015625, 7.1619873046875, 7.619873046875, 8.0777587890625, 8.53564453125, 8.9935302734375, 9.451416015625, 9.9093017578125, 10.3671875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 17.0, 15.0, 63.0, 159.0, 320.0, 256.0, 102.0, 43.0, 15.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.875, -18.16943359375, -17.4638671875, -16.75830078125, -16.052734375, -15.34716796875, -14.6416015625, -13.93603515625, -13.23046875, -12.52490234375, -11.8193359375, -11.11376953125, -10.408203125, -9.70263671875, -8.9970703125, -8.29150390625, -7.5859375, -6.88037109375, -6.1748046875, -5.46923828125, -4.763671875, -4.05810546875, -3.3525390625, -2.64697265625, -1.94140625, -1.23583984375, -0.5302734375, 0.17529296875, 0.880859375, 1.58642578125, 2.2919921875, 2.99755859375, 3.703125, 4.40869140625, 5.1142578125, 5.81982421875, 6.525390625, 7.23095703125, 7.9365234375, 8.64208984375, 9.34765625, 10.05322265625, 10.7587890625, 11.46435546875, 12.169921875, 12.87548828125, 13.5810546875, 14.28662109375, 14.9921875, 15.69775390625, 16.4033203125, 17.10888671875, 17.814453125, 18.52001953125, 19.2255859375, 19.93115234375, 20.63671875, 21.34228515625, 22.0478515625, 22.75341796875, 23.458984375, 24.16455078125, 24.8701171875, 25.57568359375, 26.28125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 11.0, 11.0, 29.0, 75.0, 161.0, 277.0, 208.0, 135.0, 66.0, 19.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.51182556152344, -116.6333999633789, -110.75497436523438, -104.87655639648438, -98.99813079833984, -93.11970520019531, -87.24128723144531, -81.36286163330078, -75.48443603515625, -69.60601043701172, -63.72758865356445, -57.84916687011719, -51.970741271972656, -46.092315673828125, -40.21389389038086, -34.335472106933594, -28.457046508789062, -22.578622817993164, -16.700199127197266, -10.821775436401367, -4.943351745605469, 0.9350719451904297, 6.813495635986328, 12.691917419433594, 18.570343017578125, 24.448766708374023, 30.327190399169922, 36.20561218261719, 42.08403778076172, 47.96246337890625, 53.840885162353516, 59.71930694580078, 65.59774780273438, 71.4761734008789, 77.35459899902344, 83.23301696777344, 89.11144256591797, 94.9898681640625, 100.8682861328125, 106.74671173095703, 112.62513732910156, 118.5035629272461, 124.38198852539062, 130.26040649414062, 136.13882446289062, 142.0172576904297, 147.8956756591797, 153.77410888671875, 159.65252685546875, 165.53094482421875, 171.4093780517578, 177.2877960205078, 183.16622924804688, 189.04464721679688, 194.92306518554688, 200.80148315429688, 206.67991638183594, 212.55833435058594, 218.436767578125, 224.315185546875, 230.193603515625, 236.07203674316406, 241.95045471191406, 247.82888793945312, 253.70730590820312]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 3.0, 8.0, 7.0, 9.0, 6.0, 9.0, 14.0, 16.0, 9.0, 17.0, 20.0, 22.0, 26.0, 27.0, 37.0, 38.0, 49.0, 45.0, 48.0, 63.0, 47.0, 39.0, 52.0, 54.0, 38.0, 38.0, 37.0, 32.0, 32.0, 18.0, 22.0, 16.0, 13.0, 11.0, 11.0, 11.0, 7.0, 12.0, 6.0, 4.0, 1.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-97.31277465820312, -94.21078491210938, -91.10879516601562, -88.00680541992188, -84.90481567382812, -81.80282592773438, -78.70083618164062, -75.59884643554688, -72.49685668945312, -69.39486694335938, -66.29287719726562, -63.190887451171875, -60.088897705078125, -56.986907958984375, -53.88492202758789, -50.78293228149414, -47.680946350097656, -44.578956604003906, -41.476966857910156, -38.374977111816406, -35.272987365722656, -32.170997619628906, -29.069011688232422, -25.967021942138672, -22.865032196044922, -19.763042449951172, -16.661052703857422, -13.559064865112305, -10.457075119018555, -7.355085372924805, -4.2530975341796875, -1.1511077880859375, 1.9508743286132812, 5.052863597869873, 8.154852867126465, 11.256841659545898, 14.358831405639648, 17.4608211517334, 20.562808990478516, 23.664798736572266, 26.766788482666016, 29.868778228759766, 32.970767974853516, 36.07275390625, 39.17474365234375, 42.2767333984375, 45.37872314453125, 48.480712890625, 51.58270263671875, 54.6846923828125, 57.78668212890625, 60.888671875, 63.99066162109375, 67.0926513671875, 70.19464111328125, 73.296630859375, 76.39862060546875, 79.5006103515625, 82.60260009765625, 85.70458984375, 88.80657958984375, 91.9085693359375, 95.01055908203125, 98.112548828125, 101.21453094482422]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 7.0, 8.0, 13.0, 17.0, 30.0, 38.0, 87.0, 169.0, 545.0, 2304.0, 25271.0, 4152350.0, 11390.0, 1444.0, 374.0, 134.0, 49.0, 23.0, 12.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.375, -56.1103515625, -54.845703125, -53.5810546875, -52.31640625, -51.0517578125, -49.787109375, -48.5224609375, -47.2578125, -45.9931640625, -44.728515625, -43.4638671875, -42.19921875, -40.9345703125, -39.669921875, -38.4052734375, -37.140625, -35.8759765625, -34.611328125, -33.3466796875, -32.08203125, -30.8173828125, -29.552734375, -28.2880859375, -27.0234375, -25.7587890625, -24.494140625, -23.2294921875, -21.96484375, -20.7001953125, -19.435546875, -18.1708984375, -16.90625, -15.6416015625, -14.376953125, -13.1123046875, -11.84765625, -10.5830078125, -9.318359375, -8.0537109375, -6.7890625, -5.5244140625, -4.259765625, -2.9951171875, -1.73046875, -0.4658203125, 0.798828125, 2.0634765625, 3.328125, 4.5927734375, 5.857421875, 7.1220703125, 8.38671875, 9.6513671875, 10.916015625, 12.1806640625, 13.4453125, 14.7099609375, 15.974609375, 17.2392578125, 18.50390625, 19.7685546875, 21.033203125, 22.2978515625, 23.5625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 24.0, 47.0, 69.0, 118.0, 175.0, 178.0, 155.0, 112.0, 55.0, 23.0, 20.0, 8.0, 7.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.734375, -16.297119140625, -15.85986328125, -15.422607421875, -14.9853515625, -14.548095703125, -14.11083984375, -13.673583984375, -13.236328125, -12.799072265625, -12.36181640625, -11.924560546875, -11.4873046875, -11.050048828125, -10.61279296875, -10.175537109375, -9.73828125, -9.301025390625, -8.86376953125, -8.426513671875, -7.9892578125, -7.552001953125, -7.11474609375, -6.677490234375, -6.240234375, -5.802978515625, -5.36572265625, -4.928466796875, -4.4912109375, -4.053955078125, -3.61669921875, -3.179443359375, -2.7421875, -2.304931640625, -1.86767578125, -1.430419921875, -0.9931640625, -0.555908203125, -0.11865234375, 0.318603515625, 0.755859375, 1.193115234375, 1.63037109375, 2.067626953125, 2.5048828125, 2.942138671875, 3.37939453125, 3.816650390625, 4.25390625, 4.691162109375, 5.12841796875, 5.565673828125, 6.0029296875, 6.440185546875, 6.87744140625, 7.314697265625, 7.751953125, 8.189208984375, 8.62646484375, 9.063720703125, 9.5009765625, 9.938232421875, 10.37548828125, 10.812744140625, 11.25]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 8.0, 24.0, 25.0, 31.0, 66.0, 76.0, 89.0, 136.0, 187.0, 261.0, 348.0, 543.0, 881.0, 1318.0, 2111.0, 3897.0, 8238.0, 21316.0, 105536.0, 3947124.0, 69034.0, 17124.0, 6931.0, 3325.0, 1926.0, 1205.0, 772.0, 496.0, 342.0, 234.0, 191.0, 139.0, 89.0, 54.0, 51.0, 37.0, 26.0, 19.0, 19.0, 15.0, 13.0, 3.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-13.2890625, -12.87890625, -12.46875, -12.05859375, -11.6484375, -11.23828125, -10.828125, -10.41796875, -10.0078125, -9.59765625, -9.1875, -8.77734375, -8.3671875, -7.95703125, -7.546875, -7.13671875, -6.7265625, -6.31640625, -5.90625, -5.49609375, -5.0859375, -4.67578125, -4.265625, -3.85546875, -3.4453125, -3.03515625, -2.625, -2.21484375, -1.8046875, -1.39453125, -0.984375, -0.57421875, -0.1640625, 0.24609375, 0.65625, 1.06640625, 1.4765625, 1.88671875, 2.296875, 2.70703125, 3.1171875, 3.52734375, 3.9375, 4.34765625, 4.7578125, 5.16796875, 5.578125, 5.98828125, 6.3984375, 6.80859375, 7.21875, 7.62890625, 8.0390625, 8.44921875, 8.859375, 9.26953125, 9.6796875, 10.08984375, 10.5, 10.91015625, 11.3203125, 11.73046875, 12.140625, 12.55078125, 12.9609375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 16.0, 22.0, 36.0, 53.0, 205.0, 3457.0, 140.0, 50.0, 30.0, 15.0, 8.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.234375, -8.9305419921875, -8.626708984375, -8.3228759765625, -8.01904296875, -7.7152099609375, -7.411376953125, -7.1075439453125, -6.8037109375, -6.4998779296875, -6.196044921875, -5.8922119140625, -5.58837890625, -5.2845458984375, -4.980712890625, -4.6768798828125, -4.373046875, -4.0692138671875, -3.765380859375, -3.4615478515625, -3.15771484375, -2.8538818359375, -2.550048828125, -2.2462158203125, -1.9423828125, -1.6385498046875, -1.334716796875, -1.0308837890625, -0.72705078125, -0.4232177734375, -0.119384765625, 0.1844482421875, 0.48828125, 0.7921142578125, 1.095947265625, 1.3997802734375, 1.70361328125, 2.0074462890625, 2.311279296875, 2.6151123046875, 2.9189453125, 3.2227783203125, 3.526611328125, 3.8304443359375, 4.13427734375, 4.4381103515625, 4.741943359375, 5.0457763671875, 5.349609375, 5.6534423828125, 5.957275390625, 6.2611083984375, 6.56494140625, 6.8687744140625, 7.172607421875, 7.4764404296875, 7.7802734375, 8.0841064453125, 8.387939453125, 8.6917724609375, 8.99560546875, 9.2994384765625, 9.603271484375, 9.9071044921875, 10.2109375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 7.0, 9.0, 11.0, 26.0, 37.0, 36.0, 46.0, 77.0, 95.0, 84.0, 124.0, 130.0, 97.0, 57.0, 47.0, 31.0, 28.0, 12.0, 8.0, 10.0, 5.0, 8.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.505218505859375, -15.768282890319824, -15.031346321105957, -14.294410705566406, -13.557475090026855, -12.820539474487305, -12.083602905273438, -11.346667289733887, -10.609731674194336, -9.872796058654785, -9.135859489440918, -8.398923873901367, -7.661988258361816, -6.925052165985107, -6.188116073608398, -5.451180458068848, -4.7142438888549805, -3.9773080348968506, -3.2403721809387207, -2.5034360885620117, -1.7665002346038818, -1.029564380645752, -0.29262828826904297, 0.4443073272705078, 1.1812434196472168, 1.9181792736053467, 2.6551151275634766, 3.3920512199401855, 4.1289873123168945, 4.865922927856445, 5.602859020233154, 6.339794635772705, 7.076730728149414, 7.813666820526123, 8.550602912902832, 9.287538528442383, 10.024474143981934, 10.761409759521484, 11.498346328735352, 12.235281944274902, 12.972217559814453, 13.709153175354004, 14.446089744567871, 15.183025360107422, 15.919960975646973, 16.656896591186523, 17.39383316040039, 18.130767822265625, 18.867706298828125, 19.604642868041992, 20.341577529907227, 21.078514099121094, 21.81545066833496, 22.552385330200195, 23.289321899414062, 24.026256561279297, 24.763193130493164, 25.50012969970703, 26.237064361572266, 26.974000930786133, 27.7109375, 28.447872161865234, 29.1848087310791, 29.92174530029297, 30.658679962158203]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 6.0, 6.0, 8.0, 10.0, 16.0, 28.0, 23.0, 31.0, 39.0, 57.0, 51.0, 59.0, 49.0, 63.0, 63.0, 58.0, 66.0, 36.0, 42.0, 45.0, 39.0, 34.0, 32.0, 26.0, 17.0, 18.0, 18.0, 16.0, 7.0, 14.0, 9.0, 6.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.03154754638672, -24.31671142578125, -23.60187530517578, -22.887041091918945, -22.172204971313477, -21.457368850708008, -20.742534637451172, -20.027698516845703, -19.312862396240234, -18.598026275634766, -17.883190155029297, -17.16835594177246, -16.453519821166992, -15.738683700561523, -15.023848533630371, -14.309013366699219, -13.59417724609375, -12.879341125488281, -12.164505958557129, -11.449670791625977, -10.734834671020508, -10.019998550415039, -9.305163383483887, -8.590328216552734, -7.875492095947266, -7.160656452178955, -6.4458208084106445, -5.730985164642334, -5.016149520874023, -4.301313877105713, -3.5864782333374023, -2.871642589569092, -2.1568050384521484, -1.441969394683838, -0.7271337509155273, -0.012298107147216797, 0.7025375366210938, 1.4173731803894043, 2.132208824157715, 2.8470444679260254, 3.561880111694336, 4.2767157554626465, 4.991551399230957, 5.706387042999268, 6.421222686767578, 7.136058330535889, 7.850893974304199, 8.565729141235352, 9.28056526184082, 9.995401382446289, 10.710236549377441, 11.425071716308594, 12.139907836914062, 12.854743957519531, 13.569579124450684, 14.284414291381836, 14.999250411987305, 15.714086532592773, 16.42892074584961, 17.143756866455078, 17.858592987060547, 18.573429107666016, 19.288265228271484, 20.00309944152832, 20.71793556213379]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 6.0, 9.0, 6.0, 18.0, 34.0, 55.0, 117.0, 235.0, 599.0, 2628.0, 26751.0, 626293.0, 373154.0, 15920.0, 1853.0, 476.0, 199.0, 79.0, 43.0, 33.0, 27.0, 10.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5625, -14.7392578125, -13.916015625, -13.0927734375, -12.26953125, -11.4462890625, -10.623046875, -9.7998046875, -8.9765625, -8.1533203125, -7.330078125, -6.5068359375, -5.68359375, -4.8603515625, -4.037109375, -3.2138671875, -2.390625, -1.5673828125, -0.744140625, 0.0791015625, 0.90234375, 1.7255859375, 2.548828125, 3.3720703125, 4.1953125, 5.0185546875, 5.841796875, 6.6650390625, 7.48828125, 8.3115234375, 9.134765625, 9.9580078125, 10.78125, 11.6044921875, 12.427734375, 13.2509765625, 14.07421875, 14.8974609375, 15.720703125, 16.5439453125, 17.3671875, 18.1904296875, 19.013671875, 19.8369140625, 20.66015625, 21.4833984375, 22.306640625, 23.1298828125, 23.953125, 24.7763671875, 25.599609375, 26.4228515625, 27.24609375, 28.0693359375, 28.892578125, 29.7158203125, 30.5390625, 31.3623046875, 32.185546875, 33.0087890625, 33.83203125, 34.6552734375, 35.478515625, 36.3017578125, 37.125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 11.0, 9.0, 24.0, 42.0, 49.0, 67.0, 112.0, 124.0, 112.0, 131.0, 100.0, 67.0, 66.0, 34.0, 25.0, 10.0, 8.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.96875, -12.6409912109375, -12.313232421875, -11.9854736328125, -11.65771484375, -11.3299560546875, -11.002197265625, -10.6744384765625, -10.3466796875, -10.0189208984375, -9.691162109375, -9.3634033203125, -9.03564453125, -8.7078857421875, -8.380126953125, -8.0523681640625, -7.724609375, -7.3968505859375, -7.069091796875, -6.7413330078125, -6.41357421875, -6.0858154296875, -5.758056640625, -5.4302978515625, -5.1025390625, -4.7747802734375, -4.447021484375, -4.1192626953125, -3.79150390625, -3.4637451171875, -3.135986328125, -2.8082275390625, -2.48046875, -2.1527099609375, -1.824951171875, -1.4971923828125, -1.16943359375, -0.8416748046875, -0.513916015625, -0.1861572265625, 0.1416015625, 0.4693603515625, 0.797119140625, 1.1248779296875, 1.45263671875, 1.7803955078125, 2.108154296875, 2.4359130859375, 2.763671875, 3.0914306640625, 3.419189453125, 3.7469482421875, 4.07470703125, 4.4024658203125, 4.730224609375, 5.0579833984375, 5.3857421875, 5.7135009765625, 6.041259765625, 6.3690185546875, 6.69677734375, 7.0245361328125, 7.352294921875, 7.6800537109375, 8.0078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 7.0, 17.0, 23.0, 27.0, 57.0, 46.0, 103.0, 135.0, 290.0, 571.0, 1193.0, 3459.0, 16536.0, 149298.0, 733466.0, 123353.0, 14485.0, 3206.0, 1105.0, 488.0, 266.0, 144.0, 91.0, 45.0, 30.0, 29.0, 25.0, 10.0, 9.0, 3.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.78125, -18.219970703125, -17.65869140625, -17.097412109375, -16.5361328125, -15.974853515625, -15.41357421875, -14.852294921875, -14.291015625, -13.729736328125, -13.16845703125, -12.607177734375, -12.0458984375, -11.484619140625, -10.92333984375, -10.362060546875, -9.80078125, -9.239501953125, -8.67822265625, -8.116943359375, -7.5556640625, -6.994384765625, -6.43310546875, -5.871826171875, -5.310546875, -4.749267578125, -4.18798828125, -3.626708984375, -3.0654296875, -2.504150390625, -1.94287109375, -1.381591796875, -0.8203125, -0.259033203125, 0.30224609375, 0.863525390625, 1.4248046875, 1.986083984375, 2.54736328125, 3.108642578125, 3.669921875, 4.231201171875, 4.79248046875, 5.353759765625, 5.9150390625, 6.476318359375, 7.03759765625, 7.598876953125, 8.16015625, 8.721435546875, 9.28271484375, 9.843994140625, 10.4052734375, 10.966552734375, 11.52783203125, 12.089111328125, 12.650390625, 13.211669921875, 13.77294921875, 14.334228515625, 14.8955078125, 15.456787109375, 16.01806640625, 16.579345703125, 17.140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 7.0, 6.0, 7.0, 9.0, 15.0, 25.0, 15.0, 32.0, 37.0, 34.0, 41.0, 48.0, 60.0, 60.0, 66.0, 76.0, 52.0, 60.0, 54.0, 50.0, 36.0, 32.0, 33.0, 39.0, 25.0, 26.0, 8.0, 12.0, 11.0, 5.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.90625, -24.098388671875, -23.29052734375, -22.482666015625, -21.6748046875, -20.866943359375, -20.05908203125, -19.251220703125, -18.443359375, -17.635498046875, -16.82763671875, -16.019775390625, -15.2119140625, -14.404052734375, -13.59619140625, -12.788330078125, -11.98046875, -11.172607421875, -10.36474609375, -9.556884765625, -8.7490234375, -7.941162109375, -7.13330078125, -6.325439453125, -5.517578125, -4.709716796875, -3.90185546875, -3.093994140625, -2.2861328125, -1.478271484375, -0.67041015625, 0.137451171875, 0.9453125, 1.753173828125, 2.56103515625, 3.368896484375, 4.1767578125, 4.984619140625, 5.79248046875, 6.600341796875, 7.408203125, 8.216064453125, 9.02392578125, 9.831787109375, 10.6396484375, 11.447509765625, 12.25537109375, 13.063232421875, 13.87109375, 14.678955078125, 15.48681640625, 16.294677734375, 17.1025390625, 17.910400390625, 18.71826171875, 19.526123046875, 20.333984375, 21.141845703125, 21.94970703125, 22.757568359375, 23.5654296875, 24.373291015625, 25.18115234375, 25.989013671875, 26.796875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 12.0, 44.0, 80.0, 225.0, 948.0, 17365.0, 1012708.0, 15814.0, 944.0, 237.0, 95.0, 29.0, 19.0, 4.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9140625, -13.4422607421875, -12.970458984375, -12.4986572265625, -12.02685546875, -11.5550537109375, -11.083251953125, -10.6114501953125, -10.1396484375, -9.6678466796875, -9.196044921875, -8.7242431640625, -8.25244140625, -7.7806396484375, -7.308837890625, -6.8370361328125, -6.365234375, -5.8934326171875, -5.421630859375, -4.9498291015625, -4.47802734375, -4.0062255859375, -3.534423828125, -3.0626220703125, -2.5908203125, -2.1190185546875, -1.647216796875, -1.1754150390625, -0.70361328125, -0.2318115234375, 0.239990234375, 0.7117919921875, 1.18359375, 1.6553955078125, 2.127197265625, 2.5989990234375, 3.07080078125, 3.5426025390625, 4.014404296875, 4.4862060546875, 4.9580078125, 5.4298095703125, 5.901611328125, 6.3734130859375, 6.84521484375, 7.3170166015625, 7.788818359375, 8.2606201171875, 8.732421875, 9.2042236328125, 9.676025390625, 10.1478271484375, 10.61962890625, 11.0914306640625, 11.563232421875, 12.0350341796875, 12.5068359375, 12.9786376953125, 13.450439453125, 13.9222412109375, 14.39404296875, 14.8658447265625, 15.337646484375, 15.8094482421875, 16.28125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 10.0, 8.0, 16.0, 19.0, 38.0, 58.0, 117.0, 155.0, 194.0, 157.0, 88.0, 49.0, 32.0, 26.0, 15.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007524490356445312, -0.0007086843252182007, -0.0006649196147918701, -0.0006211549043655396, -0.000577390193939209, -0.0005336254835128784, -0.0004898607730865479, -0.0004460960626602173, -0.0004023313522338867, -0.00035856664180755615, -0.0003148019313812256, -0.000271037220954895, -0.00022727251052856445, -0.0001835078001022339, -0.00013974308967590332, -9.597837924957275e-05, -5.221366882324219e-05, -8.448958396911621e-06, 3.5315752029418945e-05, 7.908046245574951e-05, 0.00012284517288208008, 0.00016660988330841064, 0.0002103745937347412, 0.0002541393041610718, 0.00029790401458740234, 0.0003416687250137329, 0.0003854334354400635, 0.00042919814586639404, 0.0004729628562927246, 0.0005167275667190552, 0.0005604922771453857, 0.0006042569875717163, 0.0006480216979980469, 0.0006917864084243774, 0.000735551118850708, 0.0007793158292770386, 0.0008230805397033691, 0.0008668452501296997, 0.0009106099605560303, 0.0009543746709823608, 0.0009981393814086914, 0.001041904091835022, 0.0010856688022613525, 0.001129433512687683, 0.0011731982231140137, 0.0012169629335403442, 0.0012607276439666748, 0.0013044923543930054, 0.001348257064819336, 0.0013920217752456665, 0.001435786485671997, 0.0014795511960983276, 0.0015233159065246582, 0.0015670806169509888, 0.0016108453273773193, 0.00165461003780365, 0.0016983747482299805, 0.001742139458656311, 0.0017859041690826416, 0.0018296688795089722, 0.0018734335899353027, 0.0019171983003616333, 0.001960963010787964, 0.0020047277212142944, 0.002048492431640625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 9.0, 1.0, 6.0, 20.0, 33.0, 66.0, 111.0, 245.0, 579.0, 2129.0, 16937.0, 544365.0, 465631.0, 15361.0, 2018.0, 558.0, 253.0, 103.0, 58.0, 30.0, 12.0, 10.0, 6.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.4537353515625, -7.196533203125, -6.9393310546875, -6.68212890625, -6.4249267578125, -6.167724609375, -5.9105224609375, -5.6533203125, -5.3961181640625, -5.138916015625, -4.8817138671875, -4.62451171875, -4.3673095703125, -4.110107421875, -3.8529052734375, -3.595703125, -3.3385009765625, -3.081298828125, -2.8240966796875, -2.56689453125, -2.3096923828125, -2.052490234375, -1.7952880859375, -1.5380859375, -1.2808837890625, -1.023681640625, -0.7664794921875, -0.50927734375, -0.2520751953125, 0.005126953125, 0.2623291015625, 0.51953125, 0.7767333984375, 1.033935546875, 1.2911376953125, 1.54833984375, 1.8055419921875, 2.062744140625, 2.3199462890625, 2.5771484375, 2.8343505859375, 3.091552734375, 3.3487548828125, 3.60595703125, 3.8631591796875, 4.120361328125, 4.3775634765625, 4.634765625, 4.8919677734375, 5.149169921875, 5.4063720703125, 5.66357421875, 5.9207763671875, 6.177978515625, 6.4351806640625, 6.6923828125, 6.9495849609375, 7.206787109375, 7.4639892578125, 7.72119140625, 7.9783935546875, 8.235595703125, 8.4927978515625, 8.75]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 13.0, 9.0, 26.0, 29.0, 62.0, 91.0, 127.0, 156.0, 151.0, 125.0, 80.0, 52.0, 34.0, 12.0, 11.0, 17.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.885986328125, -7.63134765625, -7.376708984375, -7.1220703125, -6.867431640625, -6.61279296875, -6.358154296875, -6.103515625, -5.848876953125, -5.59423828125, -5.339599609375, -5.0849609375, -4.830322265625, -4.57568359375, -4.321044921875, -4.06640625, -3.811767578125, -3.55712890625, -3.302490234375, -3.0478515625, -2.793212890625, -2.53857421875, -2.283935546875, -2.029296875, -1.774658203125, -1.52001953125, -1.265380859375, -1.0107421875, -0.756103515625, -0.50146484375, -0.246826171875, 0.0078125, 0.262451171875, 0.51708984375, 0.771728515625, 1.0263671875, 1.281005859375, 1.53564453125, 1.790283203125, 2.044921875, 2.299560546875, 2.55419921875, 2.808837890625, 3.0634765625, 3.318115234375, 3.57275390625, 3.827392578125, 4.08203125, 4.336669921875, 4.59130859375, 4.845947265625, 5.1005859375, 5.355224609375, 5.60986328125, 5.864501953125, 6.119140625, 6.373779296875, 6.62841796875, 6.883056640625, 7.1376953125, 7.392333984375, 7.64697265625, 7.901611328125, 8.15625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 4.0, 7.0, 10.0, 27.0, 62.0, 147.0, 229.0, 231.0, 149.0, 71.0, 36.0, 22.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-200.08505249023438, -194.80789184570312, -189.53073120117188, -184.25357055664062, -178.97640991210938, -173.69924926757812, -168.42208862304688, -163.14492797851562, -157.86776733398438, -152.59060668945312, -147.31344604492188, -142.03628540039062, -136.75912475585938, -131.48196411132812, -126.2048110961914, -120.92765045166016, -115.65049743652344, -110.37333679199219, -105.09617614746094, -99.81901550292969, -94.54185485839844, -89.26469421386719, -83.98754119873047, -78.71038055419922, -73.43321990966797, -68.15605926513672, -62.87889862060547, -57.601741790771484, -52.324581146240234, -47.047420501708984, -41.770263671875, -36.49310302734375, -31.215957641601562, -25.938796997070312, -20.661638259887695, -15.384478569030762, -10.107318878173828, -4.830158233642578, 0.44700050354003906, 5.724159240722656, 11.001319885253906, 16.278480529785156, 21.555639266967773, 26.83279800415039, 32.10995864868164, 37.38711929321289, 42.664276123046875, 47.941436767578125, 53.218597412109375, 58.495758056640625, 63.772918701171875, 69.05007934570312, 74.32723999023438, 79.60440063476562, 84.88155364990234, 90.1587142944336, 95.43587493896484, 100.7130355834961, 105.99019622802734, 111.2673568725586, 116.54450988769531, 121.82167053222656, 127.09883117675781, 132.37599182128906, 137.6531524658203]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 8.0, 10.0, 17.0, 12.0, 20.0, 16.0, 20.0, 25.0, 32.0, 27.0, 40.0, 37.0, 42.0, 46.0, 42.0, 56.0, 43.0, 53.0, 47.0, 44.0, 48.0, 42.0, 37.0, 37.0, 34.0, 26.0, 16.0, 19.0, 21.0, 10.0, 14.0, 9.0, 9.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-89.7435073852539, -86.97896575927734, -84.21443176269531, -81.44989013671875, -78.68534851074219, -75.92080688476562, -73.1562728881836, -70.39173126220703, -67.627197265625, -64.86265563964844, -62.09811782836914, -59.333580017089844, -56.56903839111328, -53.804500579833984, -51.03996276855469, -48.275421142578125, -45.51087951660156, -42.746341705322266, -39.9818000793457, -37.217262268066406, -34.452720642089844, -31.688182830810547, -28.92364501953125, -26.15910530090332, -23.39456558227539, -20.63002586364746, -17.86548614501953, -15.100948333740234, -12.336408615112305, -9.571868896484375, -6.807331085205078, -4.042791366577148, -1.2782440185546875, 1.486295223236084, 4.2508344650268555, 7.015373229980469, 9.779912948608398, 12.544452667236328, 15.308990478515625, 18.073530197143555, 20.838069915771484, 23.602609634399414, 26.367149353027344, 29.13168716430664, 31.89622688293457, 34.6607666015625, 37.4253044128418, 40.189842224121094, 42.954383850097656, 45.71892166137695, 48.483463287353516, 51.24800109863281, 54.012542724609375, 56.77708053588867, 59.54161834716797, 62.30615997314453, 65.07069396972656, 67.83523559570312, 70.59976959228516, 73.36431121826172, 76.12885284423828, 78.89338684082031, 81.65792846679688, 84.42247009277344, 87.18701171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 5.0, 9.0, 13.0, 15.0, 22.0, 35.0, 31.0, 80.0, 114.0, 247.0, 480.0, 1085.0, 3044.0, 9883.0, 46322.0, 2670805.0, 1408793.0, 39374.0, 8814.0, 2893.0, 1167.0, 467.0, 259.0, 141.0, 59.0, 40.0, 26.0, 15.0, 12.0, 13.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8984375, -11.487548828125, -11.07666015625, -10.665771484375, -10.2548828125, -9.843994140625, -9.43310546875, -9.022216796875, -8.611328125, -8.200439453125, -7.78955078125, -7.378662109375, -6.9677734375, -6.556884765625, -6.14599609375, -5.735107421875, -5.32421875, -4.913330078125, -4.50244140625, -4.091552734375, -3.6806640625, -3.269775390625, -2.85888671875, -2.447998046875, -2.037109375, -1.626220703125, -1.21533203125, -0.804443359375, -0.3935546875, 0.017333984375, 0.42822265625, 0.839111328125, 1.25, 1.660888671875, 2.07177734375, 2.482666015625, 2.8935546875, 3.304443359375, 3.71533203125, 4.126220703125, 4.537109375, 4.947998046875, 5.35888671875, 5.769775390625, 6.1806640625, 6.591552734375, 7.00244140625, 7.413330078125, 7.82421875, 8.235107421875, 8.64599609375, 9.056884765625, 9.4677734375, 9.878662109375, 10.28955078125, 10.700439453125, 11.111328125, 11.522216796875, 11.93310546875, 12.343994140625, 12.7548828125, 13.165771484375, 13.57666015625, 13.987548828125, 14.3984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 4.0, 8.0, 12.0, 19.0, 16.0, 26.0, 32.0, 33.0, 42.0, 59.0, 74.0, 54.0, 61.0, 60.0, 70.0, 74.0, 60.0, 46.0, 45.0, 37.0, 36.0, 30.0, 24.0, 17.0, 14.0, 12.0, 8.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.30859375, -5.15228271484375, -4.9959716796875, -4.83966064453125, -4.683349609375, -4.52703857421875, -4.3707275390625, -4.21441650390625, -4.05810546875, -3.90179443359375, -3.7454833984375, -3.58917236328125, -3.432861328125, -3.27655029296875, -3.1202392578125, -2.96392822265625, -2.8076171875, -2.65130615234375, -2.4949951171875, -2.33868408203125, -2.182373046875, -2.02606201171875, -1.8697509765625, -1.71343994140625, -1.55712890625, -1.40081787109375, -1.2445068359375, -1.08819580078125, -0.931884765625, -0.77557373046875, -0.6192626953125, -0.46295166015625, -0.306640625, -0.15032958984375, 0.0059814453125, 0.16229248046875, 0.318603515625, 0.47491455078125, 0.6312255859375, 0.78753662109375, 0.94384765625, 1.10015869140625, 1.2564697265625, 1.41278076171875, 1.569091796875, 1.72540283203125, 1.8817138671875, 2.03802490234375, 2.1943359375, 2.35064697265625, 2.5069580078125, 2.66326904296875, 2.819580078125, 2.97589111328125, 3.1322021484375, 3.28851318359375, 3.44482421875, 3.60113525390625, 3.7574462890625, 3.91375732421875, 4.070068359375, 4.22637939453125, 4.3826904296875, 4.53900146484375, 4.6953125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 6.0, 14.0, 16.0, 24.0, 39.0, 56.0, 145.0, 328.0, 1218.0, 5621.0, 39623.0, 3559828.0, 560801.0, 21982.0, 3439.0, 728.0, 192.0, 84.0, 37.0, 23.0, 16.0, 17.0, 5.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -14.9930419921875, -14.337646484375, -13.6822509765625, -13.02685546875, -12.3714599609375, -11.716064453125, -11.0606689453125, -10.4052734375, -9.7498779296875, -9.094482421875, -8.4390869140625, -7.78369140625, -7.1282958984375, -6.472900390625, -5.8175048828125, -5.162109375, -4.5067138671875, -3.851318359375, -3.1959228515625, -2.54052734375, -1.8851318359375, -1.229736328125, -0.5743408203125, 0.0810546875, 0.7364501953125, 1.391845703125, 2.0472412109375, 2.70263671875, 3.3580322265625, 4.013427734375, 4.6688232421875, 5.32421875, 5.9796142578125, 6.635009765625, 7.2904052734375, 7.94580078125, 8.6011962890625, 9.256591796875, 9.9119873046875, 10.5673828125, 11.2227783203125, 11.878173828125, 12.5335693359375, 13.18896484375, 13.8443603515625, 14.499755859375, 15.1551513671875, 15.810546875, 16.4659423828125, 17.121337890625, 17.7767333984375, 18.43212890625, 19.0875244140625, 19.742919921875, 20.3983154296875, 21.0537109375, 21.7091064453125, 22.364501953125, 23.0198974609375, 23.67529296875, 24.3306884765625, 24.986083984375, 25.6414794921875, 26.296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 8.0, 4.0, 5.0, 9.0, 9.0, 8.0, 10.0, 16.0, 17.0, 17.0, 24.0, 32.0, 40.0, 55.0, 95.0, 126.0, 295.0, 674.0, 1237.0, 668.0, 275.0, 124.0, 84.0, 61.0, 45.0, 30.0, 19.0, 17.0, 13.0, 8.0, 10.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-11.90625, -11.59698486328125, -11.2877197265625, -10.97845458984375, -10.669189453125, -10.35992431640625, -10.0506591796875, -9.74139404296875, -9.43212890625, -9.12286376953125, -8.8135986328125, -8.50433349609375, -8.195068359375, -7.88580322265625, -7.5765380859375, -7.26727294921875, -6.9580078125, -6.64874267578125, -6.3394775390625, -6.03021240234375, -5.720947265625, -5.41168212890625, -5.1024169921875, -4.79315185546875, -4.48388671875, -4.17462158203125, -3.8653564453125, -3.55609130859375, -3.246826171875, -2.93756103515625, -2.6282958984375, -2.31903076171875, -2.009765625, -1.70050048828125, -1.3912353515625, -1.08197021484375, -0.772705078125, -0.46343994140625, -0.1541748046875, 0.15509033203125, 0.46435546875, 0.77362060546875, 1.0828857421875, 1.39215087890625, 1.701416015625, 2.01068115234375, 2.3199462890625, 2.62921142578125, 2.9384765625, 3.24774169921875, 3.5570068359375, 3.86627197265625, 4.175537109375, 4.48480224609375, 4.7940673828125, 5.10333251953125, 5.41259765625, 5.72186279296875, 6.0311279296875, 6.34039306640625, 6.649658203125, 6.95892333984375, 7.2681884765625, 7.57745361328125, 7.88671875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 21.0, 55.0, 186.0, 345.0, 230.0, 106.0, 27.0, 11.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-284.43719482421875, -278.4835510253906, -272.5299377441406, -266.5762939453125, -260.6226806640625, -254.66903686523438, -248.7154083251953, -242.76177978515625, -236.80813598632812, -230.85450744628906, -224.90087890625, -218.94723510742188, -212.9936065673828, -207.03997802734375, -201.0863494873047, -195.13272094726562, -189.17909240722656, -183.2254638671875, -177.27183532714844, -171.31820678710938, -165.36456298828125, -159.4109344482422, -153.45730590820312, -147.50367736816406, -141.550048828125, -135.59642028808594, -129.64279174804688, -123.68915557861328, -117.73551940917969, -111.78189086914062, -105.82826232910156, -99.8746337890625, -93.92097473144531, -87.96734619140625, -82.01371002197266, -76.0600814819336, -70.1064453125, -64.15281677246094, -58.199188232421875, -52.24555587768555, -46.29192352294922, -40.33829116821289, -34.38465881347656, -28.4310302734375, -22.477397918701172, -16.523765563964844, -10.570137023925781, -4.616504669189453, 1.337127685546875, 7.290759086608887, 13.244390487670898, 19.198020935058594, 25.151653289794922, 31.10528564453125, 37.05891418457031, 43.01254653930664, 48.96617889404297, 54.9198112487793, 60.873443603515625, 66.82707214355469, 72.78070068359375, 78.73433685302734, 84.6879653930664, 90.6416015625, 96.59523010253906]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 2.0, 7.0, 13.0, 14.0, 8.0, 23.0, 14.0, 21.0, 36.0, 44.0, 42.0, 39.0, 47.0, 52.0, 64.0, 63.0, 54.0, 51.0, 43.0, 65.0, 50.0, 44.0, 42.0, 28.0, 19.0, 22.0, 20.0, 14.0, 15.0, 9.0, 7.0, 6.0, 9.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.54485321044922, -53.62650680541992, -51.708160400390625, -49.78981018066406, -47.871463775634766, -45.95311737060547, -44.03477096557617, -42.116424560546875, -40.19807434082031, -38.279727935791016, -36.36138153076172, -34.443031311035156, -32.52468490600586, -30.606338500976562, -28.687992095947266, -26.769643783569336, -24.85129737854004, -22.932950973510742, -21.014602661132812, -19.096256256103516, -17.177907943725586, -15.259561538696289, -13.341214179992676, -11.422866821289062, -9.50451946258545, -7.586172103881836, -5.667824745178223, -3.7494778633117676, -1.8311305046081543, 0.08721637725830078, 2.005563735961914, 3.9239110946655273, 5.842258453369141, 7.760605812072754, 9.678953170776367, 11.597299575805664, 13.515647888183594, 15.43399429321289, 17.352340698242188, 19.270689010620117, 21.189037322998047, 23.107383728027344, 25.025732040405273, 26.94407844543457, 28.8624267578125, 30.780773162841797, 32.699119567871094, 34.617469787597656, 36.53581237792969, 38.454158782958984, 40.37250518798828, 42.290855407714844, 44.20920181274414, 46.12754821777344, 48.045894622802734, 49.96424102783203, 51.882591247558594, 53.80093765258789, 55.71928405761719, 57.63763427734375, 59.55598068237305, 61.474327087402344, 63.39267349243164, 65.31101989746094, 67.2293701171875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 10.0, 10.0, 15.0, 23.0, 30.0, 49.0, 79.0, 129.0, 194.0, 317.0, 564.0, 957.0, 1862.0, 3277.0, 6664.0, 14070.0, 31529.0, 76156.0, 189969.0, 344872.0, 219765.0, 89179.0, 36912.0, 15982.0, 7641.0, 3710.0, 1940.0, 1097.0, 615.0, 374.0, 216.0, 115.0, 91.0, 45.0, 35.0, 18.0, 17.0, 6.0, 7.0, 10.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53515625, -6.340576171875, -6.14599609375, -5.951416015625, -5.7568359375, -5.562255859375, -5.36767578125, -5.173095703125, -4.978515625, -4.783935546875, -4.58935546875, -4.394775390625, -4.2001953125, -4.005615234375, -3.81103515625, -3.616455078125, -3.421875, -3.227294921875, -3.03271484375, -2.838134765625, -2.6435546875, -2.448974609375, -2.25439453125, -2.059814453125, -1.865234375, -1.670654296875, -1.47607421875, -1.281494140625, -1.0869140625, -0.892333984375, -0.69775390625, -0.503173828125, -0.30859375, -0.114013671875, 0.08056640625, 0.275146484375, 0.4697265625, 0.664306640625, 0.85888671875, 1.053466796875, 1.248046875, 1.442626953125, 1.63720703125, 1.831787109375, 2.0263671875, 2.220947265625, 2.41552734375, 2.610107421875, 2.8046875, 2.999267578125, 3.19384765625, 3.388427734375, 3.5830078125, 3.777587890625, 3.97216796875, 4.166748046875, 4.361328125, 4.555908203125, 4.75048828125, 4.945068359375, 5.1396484375, 5.334228515625, 5.52880859375, 5.723388671875, 5.91796875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 7.0, 4.0, 5.0, 6.0, 11.0, 11.0, 11.0, 19.0, 26.0, 32.0, 28.0, 34.0, 47.0, 47.0, 49.0, 43.0, 47.0, 38.0, 32.0, 48.0, 51.0, 51.0, 50.0, 37.0, 41.0, 41.0, 31.0, 32.0, 17.0, 17.0, 16.0, 12.0, 12.0, 13.0, 8.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.181640625, -3.067840576171875, -2.95404052734375, -2.840240478515625, -2.7264404296875, -2.612640380859375, -2.49884033203125, -2.385040283203125, -2.271240234375, -2.157440185546875, -2.04364013671875, -1.929840087890625, -1.8160400390625, -1.702239990234375, -1.58843994140625, -1.474639892578125, -1.36083984375, -1.247039794921875, -1.13323974609375, -1.019439697265625, -0.9056396484375, -0.791839599609375, -0.67803955078125, -0.564239501953125, -0.450439453125, -0.336639404296875, -0.22283935546875, -0.109039306640625, 0.0047607421875, 0.118560791015625, 0.23236083984375, 0.346160888671875, 0.4599609375, 0.573760986328125, 0.68756103515625, 0.801361083984375, 0.9151611328125, 1.028961181640625, 1.14276123046875, 1.256561279296875, 1.370361328125, 1.484161376953125, 1.59796142578125, 1.711761474609375, 1.8255615234375, 1.939361572265625, 2.05316162109375, 2.166961669921875, 2.28076171875, 2.394561767578125, 2.50836181640625, 2.622161865234375, 2.7359619140625, 2.849761962890625, 2.96356201171875, 3.077362060546875, 3.191162109375, 3.304962158203125, 3.41876220703125, 3.532562255859375, 3.6463623046875, 3.760162353515625, 3.87396240234375, 3.987762451171875, 4.1015625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 4.0, 11.0, 14.0, 15.0, 20.0, 32.0, 43.0, 53.0, 91.0, 176.0, 231.0, 471.0, 812.0, 1618.0, 4509.0, 18500.0, 140388.0, 722515.0, 133335.0, 17888.0, 4247.0, 1687.0, 801.0, 398.0, 232.0, 170.0, 93.0, 74.0, 46.0, 22.0, 10.0, 16.0, 15.0, 4.0, 4.0, 3.0, 3.0], "bins": [-19.578125, -19.1380615234375, -18.697998046875, -18.2579345703125, -17.81787109375, -17.3778076171875, -16.937744140625, -16.4976806640625, -16.0576171875, -15.6175537109375, -15.177490234375, -14.7374267578125, -14.29736328125, -13.8572998046875, -13.417236328125, -12.9771728515625, -12.537109375, -12.0970458984375, -11.656982421875, -11.2169189453125, -10.77685546875, -10.3367919921875, -9.896728515625, -9.4566650390625, -9.0166015625, -8.5765380859375, -8.136474609375, -7.6964111328125, -7.25634765625, -6.8162841796875, -6.376220703125, -5.9361572265625, -5.49609375, -5.0560302734375, -4.615966796875, -4.1759033203125, -3.73583984375, -3.2957763671875, -2.855712890625, -2.4156494140625, -1.9755859375, -1.5355224609375, -1.095458984375, -0.6553955078125, -0.21533203125, 0.2247314453125, 0.664794921875, 1.1048583984375, 1.544921875, 1.9849853515625, 2.425048828125, 2.8651123046875, 3.30517578125, 3.7452392578125, 4.185302734375, 4.6253662109375, 5.0654296875, 5.5054931640625, 5.945556640625, 6.3856201171875, 6.82568359375, 7.2657470703125, 7.705810546875, 8.1458740234375, 8.5859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 8.0, 4.0, 8.0, 7.0, 2.0, 9.0, 12.0, 15.0, 18.0, 29.0, 26.0, 38.0, 34.0, 37.0, 37.0, 52.0, 35.0, 38.0, 43.0, 59.0, 61.0, 41.0, 57.0, 36.0, 34.0, 34.0, 30.0, 30.0, 30.0, 21.0, 15.0, 18.0, 17.0, 14.0, 9.0, 6.0, 5.0, 6.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0], "bins": [-17.484375, -16.982421875, -16.48046875, -15.978515625, -15.4765625, -14.974609375, -14.47265625, -13.970703125, -13.46875, -12.966796875, -12.46484375, -11.962890625, -11.4609375, -10.958984375, -10.45703125, -9.955078125, -9.453125, -8.951171875, -8.44921875, -7.947265625, -7.4453125, -6.943359375, -6.44140625, -5.939453125, -5.4375, -4.935546875, -4.43359375, -3.931640625, -3.4296875, -2.927734375, -2.42578125, -1.923828125, -1.421875, -0.919921875, -0.41796875, 0.083984375, 0.5859375, 1.087890625, 1.58984375, 2.091796875, 2.59375, 3.095703125, 3.59765625, 4.099609375, 4.6015625, 5.103515625, 5.60546875, 6.107421875, 6.609375, 7.111328125, 7.61328125, 8.115234375, 8.6171875, 9.119140625, 9.62109375, 10.123046875, 10.625, 11.126953125, 11.62890625, 12.130859375, 12.6328125, 13.134765625, 13.63671875, 14.138671875, 14.640625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 3.0, 6.0, 12.0, 17.0, 18.0, 41.0, 49.0, 79.0, 117.0, 241.0, 443.0, 1004.0, 2859.0, 13419.0, 154648.0, 796919.0, 66939.0, 8085.0, 2031.0, 789.0, 330.0, 188.0, 114.0, 58.0, 46.0, 26.0, 10.0, 10.0, 12.0, 10.0, 7.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.92578125, -6.72418212890625, -6.5225830078125, -6.32098388671875, -6.119384765625, -5.91778564453125, -5.7161865234375, -5.51458740234375, -5.31298828125, -5.11138916015625, -4.9097900390625, -4.70819091796875, -4.506591796875, -4.30499267578125, -4.1033935546875, -3.90179443359375, -3.7001953125, -3.49859619140625, -3.2969970703125, -3.09539794921875, -2.893798828125, -2.69219970703125, -2.4906005859375, -2.28900146484375, -2.08740234375, -1.88580322265625, -1.6842041015625, -1.48260498046875, -1.281005859375, -1.07940673828125, -0.8778076171875, -0.67620849609375, -0.474609375, -0.27301025390625, -0.0714111328125, 0.13018798828125, 0.331787109375, 0.53338623046875, 0.7349853515625, 0.93658447265625, 1.13818359375, 1.33978271484375, 1.5413818359375, 1.74298095703125, 1.944580078125, 2.14617919921875, 2.3477783203125, 2.54937744140625, 2.7509765625, 2.95257568359375, 3.1541748046875, 3.35577392578125, 3.557373046875, 3.75897216796875, 3.9605712890625, 4.16217041015625, 4.36376953125, 4.56536865234375, 4.7669677734375, 4.96856689453125, 5.170166015625, 5.37176513671875, 5.5733642578125, 5.77496337890625, 5.9765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 7.0, 11.0, 7.0, 15.0, 16.0, 20.0, 41.0, 35.0, 49.0, 57.0, 62.0, 79.0, 76.0, 92.0, 67.0, 76.0, 66.0, 46.0, 27.0, 27.0, 25.0, 23.0, 14.0, 13.0, 8.0, 10.0, 7.0, 2.0, 6.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0007061958312988281, -0.0006843134760856628, -0.0006624311208724976, -0.0006405487656593323, -0.000618666410446167, -0.0005967840552330017, -0.0005749017000198364, -0.0005530193448066711, -0.0005311369895935059, -0.0005092546343803406, -0.0004873722791671753, -0.00046548992395401, -0.0004436075687408447, -0.00042172521352767944, -0.00039984285831451416, -0.0003779605031013489, -0.0003560781478881836, -0.0003341957926750183, -0.00031231343746185303, -0.00029043108224868774, -0.00026854872703552246, -0.0002466663718223572, -0.0002247840166091919, -0.0002029016613960266, -0.00018101930618286133, -0.00015913695096969604, -0.00013725459575653076, -0.00011537224054336548, -9.34898853302002e-05, -7.160753011703491e-05, -4.972517490386963e-05, -2.7842819690704346e-05, -5.9604644775390625e-06, 1.592189073562622e-05, 3.7804245948791504e-05, 5.968660116195679e-05, 8.156895637512207e-05, 0.00010345131158828735, 0.00012533366680145264, 0.00014721602201461792, 0.0001690983772277832, 0.00019098073244094849, 0.00021286308765411377, 0.00023474544286727905, 0.00025662779808044434, 0.0002785101532936096, 0.0003003925085067749, 0.0003222748637199402, 0.00034415721893310547, 0.00036603957414627075, 0.00038792192935943604, 0.0004098042845726013, 0.0004316866397857666, 0.0004535689949989319, 0.00047545135021209717, 0.0004973337054252625, 0.0005192160606384277, 0.000541098415851593, 0.0005629807710647583, 0.0005848631262779236, 0.0006067454814910889, 0.0006286278367042542, 0.0006505101919174194, 0.0006723925471305847, 0.00069427490234375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 23.0, 28.0, 63.0, 185.0, 523.0, 2532.0, 34978.0, 945841.0, 60031.0, 3320.0, 688.0, 187.0, 81.0, 36.0, 14.0, 9.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9140625, -12.5609130859375, -12.207763671875, -11.8546142578125, -11.50146484375, -11.1483154296875, -10.795166015625, -10.4420166015625, -10.0888671875, -9.7357177734375, -9.382568359375, -9.0294189453125, -8.67626953125, -8.3231201171875, -7.969970703125, -7.6168212890625, -7.263671875, -6.9105224609375, -6.557373046875, -6.2042236328125, -5.85107421875, -5.4979248046875, -5.144775390625, -4.7916259765625, -4.4384765625, -4.0853271484375, -3.732177734375, -3.3790283203125, -3.02587890625, -2.6727294921875, -2.319580078125, -1.9664306640625, -1.61328125, -1.2601318359375, -0.906982421875, -0.5538330078125, -0.20068359375, 0.1524658203125, 0.505615234375, 0.8587646484375, 1.2119140625, 1.5650634765625, 1.918212890625, 2.2713623046875, 2.62451171875, 2.9776611328125, 3.330810546875, 3.6839599609375, 4.037109375, 4.3902587890625, 4.743408203125, 5.0965576171875, 5.44970703125, 5.8028564453125, 6.156005859375, 6.5091552734375, 6.8623046875, 7.2154541015625, 7.568603515625, 7.9217529296875, 8.27490234375, 8.6280517578125, 8.981201171875, 9.3343505859375, 9.6875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 10.0, 6.0, 13.0, 14.0, 19.0, 23.0, 36.0, 31.0, 48.0, 65.0, 70.0, 94.0, 71.0, 83.0, 89.0, 71.0, 61.0, 52.0, 31.0, 27.0, 21.0, 17.0, 11.0, 4.0, 8.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.20684814453125, -5.0426025390625, -4.87835693359375, -4.714111328125, -4.54986572265625, -4.3856201171875, -4.22137451171875, -4.05712890625, -3.89288330078125, -3.7286376953125, -3.56439208984375, -3.400146484375, -3.23590087890625, -3.0716552734375, -2.90740966796875, -2.7431640625, -2.57891845703125, -2.4146728515625, -2.25042724609375, -2.086181640625, -1.92193603515625, -1.7576904296875, -1.59344482421875, -1.42919921875, -1.26495361328125, -1.1007080078125, -0.93646240234375, -0.772216796875, -0.60797119140625, -0.4437255859375, -0.27947998046875, -0.115234375, 0.04901123046875, 0.2132568359375, 0.37750244140625, 0.541748046875, 0.70599365234375, 0.8702392578125, 1.03448486328125, 1.19873046875, 1.36297607421875, 1.5272216796875, 1.69146728515625, 1.855712890625, 2.01995849609375, 2.1842041015625, 2.34844970703125, 2.5126953125, 2.67694091796875, 2.8411865234375, 3.00543212890625, 3.169677734375, 3.33392333984375, 3.4981689453125, 3.66241455078125, 3.82666015625, 3.99090576171875, 4.1551513671875, 4.31939697265625, 4.483642578125, 4.64788818359375, 4.8121337890625, 4.97637939453125, 5.140625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 14.0, 30.0, 60.0, 184.0, 290.0, 237.0, 106.0, 48.0, 14.0, 11.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-171.00503540039062, -165.7771759033203, -160.54933166503906, -155.32147216796875, -150.0936279296875, -144.8657684326172, -139.63792419433594, -134.41006469726562, -129.18222045898438, -123.9543685913086, -118.72651672363281, -113.49866485595703, -108.27081298828125, -103.04295349121094, -97.81510162353516, -92.58724975585938, -87.35939025878906, -82.13153839111328, -76.9036865234375, -71.67583465576172, -66.44798278808594, -61.22012710571289, -55.992271423339844, -50.76441955566406, -45.53656768798828, -40.3087158203125, -35.08086395263672, -29.853008270263672, -24.62515640258789, -19.39730453491211, -14.169450759887695, -8.941596984863281, -3.7137451171875, 1.5141077041625977, 6.741960525512695, 11.969813346862793, 17.19766616821289, 22.425518035888672, 27.653371810913086, 32.8812255859375, 38.10907745361328, 43.33692932128906, 48.564781188964844, 53.79263687133789, 59.02048873901367, 64.24833679199219, 69.4761962890625, 74.70404815673828, 79.93190002441406, 85.15975189208984, 90.38760375976562, 95.6154556274414, 100.84330749511719, 106.0711669921875, 111.29901885986328, 116.52687072753906, 121.75472259521484, 126.98257446289062, 132.21043395996094, 137.4382781982422, 142.6661376953125, 147.89398193359375, 153.12184143066406, 158.34970092773438, 163.57754516601562]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 12.0, 16.0, 14.0, 18.0, 22.0, 28.0, 28.0, 51.0, 44.0, 49.0, 47.0, 54.0, 82.0, 86.0, 60.0, 64.0, 56.0, 40.0, 27.0, 37.0, 22.0, 25.0, 20.0, 23.0, 10.0, 19.0, 11.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-88.14323425292969, -85.63174438476562, -83.12025451660156, -80.60877227783203, -78.09728240966797, -75.5857925415039, -73.07430267333984, -70.56282043457031, -68.05133056640625, -65.53984069824219, -63.02835464477539, -60.51686477661133, -58.00537872314453, -55.49388885498047, -52.982398986816406, -50.47091293334961, -47.95942306518555, -45.447933197021484, -42.93644714355469, -40.424957275390625, -37.91347122192383, -35.401981353759766, -32.89049530029297, -30.379005432128906, -27.867517471313477, -25.356029510498047, -22.844541549682617, -20.333053588867188, -17.821563720703125, -15.310076713562012, -12.798587799072266, -10.287099838256836, -7.775611877441406, -5.264123916625977, -2.7526354789733887, -0.24114704132080078, 2.270340919494629, 4.781828880310059, 7.293317794799805, 9.804805755615234, 12.316293716430664, 14.827781677246094, 17.339269638061523, 19.850757598876953, 22.362247467041016, 24.873733520507812, 27.385223388671875, 29.896711349487305, 32.408199310302734, 34.9196891784668, 37.431175231933594, 39.942665100097656, 42.45415115356445, 44.965641021728516, 47.47712707519531, 49.988616943359375, 52.50010681152344, 55.0115966796875, 57.5230827331543, 60.03457260131836, 62.546058654785156, 65.05754852294922, 67.56903839111328, 70.08052062988281, 72.59201049804688]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 2.0, 8.0, 6.0, 10.0, 7.0, 15.0, 26.0, 38.0, 50.0, 99.0, 171.0, 327.0, 668.0, 1574.0, 4306.0, 15277.0, 99077.0, 3751084.0, 284730.0, 26355.0, 6654.0, 2197.0, 864.0, 353.0, 189.0, 98.0, 44.0, 22.0, 14.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0], "bins": [-15.328125, -14.99957275390625, -14.6710205078125, -14.34246826171875, -14.013916015625, -13.68536376953125, -13.3568115234375, -13.02825927734375, -12.69970703125, -12.37115478515625, -12.0426025390625, -11.71405029296875, -11.385498046875, -11.05694580078125, -10.7283935546875, -10.39984130859375, -10.0712890625, -9.74273681640625, -9.4141845703125, -9.08563232421875, -8.757080078125, -8.42852783203125, -8.0999755859375, -7.77142333984375, -7.44287109375, -7.11431884765625, -6.7857666015625, -6.45721435546875, -6.128662109375, -5.80010986328125, -5.4715576171875, -5.14300537109375, -4.814453125, -4.48590087890625, -4.1573486328125, -3.82879638671875, -3.500244140625, -3.17169189453125, -2.8431396484375, -2.51458740234375, -2.18603515625, -1.85748291015625, -1.5289306640625, -1.20037841796875, -0.871826171875, -0.54327392578125, -0.2147216796875, 0.11383056640625, 0.4423828125, 0.77093505859375, 1.0994873046875, 1.42803955078125, 1.756591796875, 2.08514404296875, 2.4136962890625, 2.74224853515625, 3.07080078125, 3.39935302734375, 3.7279052734375, 4.05645751953125, 4.385009765625, 4.71356201171875, 5.0421142578125, 5.37066650390625, 5.69921875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 10.0, 22.0, 18.0, 44.0, 69.0, 87.0, 121.0, 106.0, 114.0, 108.0, 102.0, 79.0, 39.0, 30.0, 20.0, 14.0, 9.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.0859375, -11.8291015625, -11.572265625, -11.3154296875, -11.05859375, -10.8017578125, -10.544921875, -10.2880859375, -10.03125, -9.7744140625, -9.517578125, -9.2607421875, -9.00390625, -8.7470703125, -8.490234375, -8.2333984375, -7.9765625, -7.7197265625, -7.462890625, -7.2060546875, -6.94921875, -6.6923828125, -6.435546875, -6.1787109375, -5.921875, -5.6650390625, -5.408203125, -5.1513671875, -4.89453125, -4.6376953125, -4.380859375, -4.1240234375, -3.8671875, -3.6103515625, -3.353515625, -3.0966796875, -2.83984375, -2.5830078125, -2.326171875, -2.0693359375, -1.8125, -1.5556640625, -1.298828125, -1.0419921875, -0.78515625, -0.5283203125, -0.271484375, -0.0146484375, 0.2421875, 0.4990234375, 0.755859375, 1.0126953125, 1.26953125, 1.5263671875, 1.783203125, 2.0400390625, 2.296875, 2.5537109375, 2.810546875, 3.0673828125, 3.32421875, 3.5810546875, 3.837890625, 4.0947265625, 4.3515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 3.0, 9.0, 13.0, 12.0, 21.0, 35.0, 59.0, 130.0, 224.0, 481.0, 1175.0, 3365.0, 10410.0, 40183.0, 322648.0, 3591863.0, 179997.0, 29620.0, 8568.0, 3102.0, 1241.0, 507.0, 253.0, 136.0, 85.0, 44.0, 29.0, 17.0, 19.0, 6.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.578125, -9.2730712890625, -8.968017578125, -8.6629638671875, -8.35791015625, -8.0528564453125, -7.747802734375, -7.4427490234375, -7.1376953125, -6.8326416015625, -6.527587890625, -6.2225341796875, -5.91748046875, -5.6124267578125, -5.307373046875, -5.0023193359375, -4.697265625, -4.3922119140625, -4.087158203125, -3.7821044921875, -3.47705078125, -3.1719970703125, -2.866943359375, -2.5618896484375, -2.2568359375, -1.9517822265625, -1.646728515625, -1.3416748046875, -1.03662109375, -0.7315673828125, -0.426513671875, -0.1214599609375, 0.18359375, 0.4886474609375, 0.793701171875, 1.0987548828125, 1.40380859375, 1.7088623046875, 2.013916015625, 2.3189697265625, 2.6240234375, 2.9290771484375, 3.234130859375, 3.5391845703125, 3.84423828125, 4.1492919921875, 4.454345703125, 4.7593994140625, 5.064453125, 5.3695068359375, 5.674560546875, 5.9796142578125, 6.28466796875, 6.5897216796875, 6.894775390625, 7.1998291015625, 7.5048828125, 7.8099365234375, 8.114990234375, 8.4200439453125, 8.72509765625, 9.0301513671875, 9.335205078125, 9.6402587890625, 9.9453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 6.0, 8.0, 10.0, 11.0, 16.0, 18.0, 18.0, 34.0, 46.0, 69.0, 105.0, 207.0, 417.0, 877.0, 1055.0, 518.0, 244.0, 126.0, 73.0, 54.0, 40.0, 25.0, 21.0, 17.0, 12.0, 8.0, 9.0, 3.0, 3.0, 4.0, 2.0, 5.0, 2.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6171875, -5.3516845703125, -5.086181640625, -4.8206787109375, -4.55517578125, -4.2896728515625, -4.024169921875, -3.7586669921875, -3.4931640625, -3.2276611328125, -2.962158203125, -2.6966552734375, -2.43115234375, -2.1656494140625, -1.900146484375, -1.6346435546875, -1.369140625, -1.1036376953125, -0.838134765625, -0.5726318359375, -0.30712890625, -0.0416259765625, 0.223876953125, 0.4893798828125, 0.7548828125, 1.0203857421875, 1.285888671875, 1.5513916015625, 1.81689453125, 2.0823974609375, 2.347900390625, 2.6134033203125, 2.87890625, 3.1444091796875, 3.409912109375, 3.6754150390625, 3.94091796875, 4.2064208984375, 4.471923828125, 4.7374267578125, 5.0029296875, 5.2684326171875, 5.533935546875, 5.7994384765625, 6.06494140625, 6.3304443359375, 6.595947265625, 6.8614501953125, 7.126953125, 7.3924560546875, 7.657958984375, 7.9234619140625, 8.18896484375, 8.4544677734375, 8.719970703125, 8.9854736328125, 9.2509765625, 9.5164794921875, 9.781982421875, 10.0474853515625, 10.31298828125, 10.5784912109375, 10.843994140625, 11.1094970703125, 11.375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 12.0, 18.0, 68.0, 196.0, 298.0, 219.0, 98.0, 44.0, 17.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.70344543457031, -67.45089721679688, -64.19835662841797, -60.94580841064453, -57.69326400756836, -54.44071960449219, -51.188175201416016, -47.935630798339844, -44.683082580566406, -41.430538177490234, -38.17799377441406, -34.925445556640625, -31.672901153564453, -28.42035675048828, -25.16781234741211, -21.915266036987305, -18.662723541259766, -15.410178184509277, -12.157632827758789, -8.905088424682617, -5.652543067932129, -2.3999977111816406, 0.8525466918945312, 4.105093002319336, 7.357637405395508, 10.610182762145996, 13.862728118896484, 17.115272521972656, 20.367816925048828, 23.620363235473633, 26.872907638549805, 30.12545394897461, 33.37799835205078, 36.63054275512695, 39.883087158203125, 43.13563537597656, 46.388179779052734, 49.640724182128906, 52.89326858520508, 56.14581298828125, 59.39836120605469, 62.65090560913086, 65.90345001220703, 69.15599822998047, 72.40853881835938, 75.66108703613281, 78.91363525390625, 82.16617584228516, 85.41871643066406, 88.6712646484375, 91.9238052368164, 95.17635345458984, 98.42889404296875, 101.68144226074219, 104.93399047851562, 108.18653106689453, 111.43907928466797, 114.6916275024414, 117.94416809082031, 121.19671630859375, 124.44925689697266, 127.7018051147461, 130.954345703125, 134.20689392089844, 137.45944213867188]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 8.0, 2.0, 9.0, 11.0, 14.0, 16.0, 33.0, 24.0, 35.0, 53.0, 42.0, 53.0, 58.0, 64.0, 64.0, 51.0, 74.0, 61.0, 61.0, 33.0, 38.0, 34.0, 27.0, 30.0, 22.0, 13.0, 15.0, 8.0, 13.0, 9.0, 10.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-47.14857482910156, -45.783138275146484, -44.417701721191406, -43.052268981933594, -41.686832427978516, -40.32139587402344, -38.955963134765625, -37.59052658081055, -36.22509002685547, -34.85965347290039, -33.49421691894531, -32.1287841796875, -30.763347625732422, -29.397911071777344, -28.0324764251709, -26.667041778564453, -25.301605224609375, -23.936168670654297, -22.57073402404785, -21.205299377441406, -19.839862823486328, -18.47442626953125, -17.108991622924805, -15.743556022644043, -14.378120422363281, -13.01268482208252, -11.647249221801758, -10.281813621520996, -8.916378021240234, -7.550942420959473, -6.185506820678711, -4.820071220397949, -3.4546356201171875, -2.089200019836426, -0.7237644195556641, 0.6416711807250977, 2.0071067810058594, 3.372542381286621, 4.737977981567383, 6.1034135818481445, 7.468849182128906, 8.834284782409668, 10.19972038269043, 11.565155982971191, 12.930591583251953, 14.296027183532715, 15.661462783813477, 17.026897430419922, 18.392333984375, 19.757770538330078, 21.123205184936523, 22.48863983154297, 23.854076385498047, 25.219512939453125, 26.58494758605957, 27.950382232666016, 29.315818786621094, 30.681255340576172, 32.04669189453125, 33.41212463378906, 34.77756118774414, 36.14299774169922, 37.50843048095703, 38.87386703491211, 40.23930358886719]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 9.0, 11.0, 10.0, 14.0, 15.0, 21.0, 30.0, 55.0, 57.0, 114.0, 167.0, 274.0, 409.0, 794.0, 1551.0, 2791.0, 6007.0, 13183.0, 31076.0, 80229.0, 217531.0, 378562.0, 193510.0, 71194.0, 27597.0, 11886.0, 5536.0, 2662.0, 1407.0, 732.0, 443.0, 244.0, 137.0, 112.0, 58.0, 32.0, 23.0, 24.0, 19.0, 10.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69921875, -5.49151611328125, -5.2838134765625, -5.07611083984375, -4.868408203125, -4.66070556640625, -4.4530029296875, -4.24530029296875, -4.03759765625, -3.82989501953125, -3.6221923828125, -3.41448974609375, -3.206787109375, -2.99908447265625, -2.7913818359375, -2.58367919921875, -2.3759765625, -2.16827392578125, -1.9605712890625, -1.75286865234375, -1.545166015625, -1.33746337890625, -1.1297607421875, -0.92205810546875, -0.71435546875, -0.50665283203125, -0.2989501953125, -0.09124755859375, 0.116455078125, 0.32415771484375, 0.5318603515625, 0.73956298828125, 0.947265625, 1.15496826171875, 1.3626708984375, 1.57037353515625, 1.778076171875, 1.98577880859375, 2.1934814453125, 2.40118408203125, 2.60888671875, 2.81658935546875, 3.0242919921875, 3.23199462890625, 3.439697265625, 3.64739990234375, 3.8551025390625, 4.06280517578125, 4.2705078125, 4.47821044921875, 4.6859130859375, 4.89361572265625, 5.101318359375, 5.30902099609375, 5.5167236328125, 5.72442626953125, 5.93212890625, 6.13983154296875, 6.3475341796875, 6.55523681640625, 6.762939453125, 6.97064208984375, 7.1783447265625, 7.38604736328125, 7.59375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 6.0, 17.0, 29.0, 39.0, 49.0, 56.0, 62.0, 77.0, 92.0, 80.0, 79.0, 93.0, 73.0, 50.0, 43.0, 35.0, 25.0, 22.0, 25.0, 10.0, 13.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -8.035369873046875, -7.85198974609375, -7.668609619140625, -7.4852294921875, -7.301849365234375, -7.11846923828125, -6.935089111328125, -6.751708984375, -6.568328857421875, -6.38494873046875, -6.201568603515625, -6.0181884765625, -5.834808349609375, -5.65142822265625, -5.468048095703125, -5.28466796875, -5.101287841796875, -4.91790771484375, -4.734527587890625, -4.5511474609375, -4.367767333984375, -4.18438720703125, -4.001007080078125, -3.817626953125, -3.634246826171875, -3.45086669921875, -3.267486572265625, -3.0841064453125, -2.900726318359375, -2.71734619140625, -2.533966064453125, -2.3505859375, -2.167205810546875, -1.98382568359375, -1.800445556640625, -1.6170654296875, -1.433685302734375, -1.25030517578125, -1.066925048828125, -0.883544921875, -0.700164794921875, -0.51678466796875, -0.333404541015625, -0.1500244140625, 0.033355712890625, 0.21673583984375, 0.400115966796875, 0.58349609375, 0.766876220703125, 0.95025634765625, 1.133636474609375, 1.3170166015625, 1.500396728515625, 1.68377685546875, 1.867156982421875, 2.050537109375, 2.233917236328125, 2.41729736328125, 2.600677490234375, 2.7840576171875, 2.967437744140625, 3.15081787109375, 3.334197998046875, 3.517578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 2.0, 7.0, 5.0, 6.0, 12.0, 14.0, 26.0, 29.0, 36.0, 43.0, 117.0, 166.0, 291.0, 489.0, 1017.0, 2590.0, 8605.0, 45653.0, 386251.0, 532650.0, 55438.0, 9963.0, 2702.0, 1166.0, 513.0, 273.0, 151.0, 102.0, 58.0, 42.0, 35.0, 29.0, 16.0, 12.0, 10.0, 9.0, 5.0, 6.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-15.1953125, -14.7738037109375, -14.352294921875, -13.9307861328125, -13.50927734375, -13.0877685546875, -12.666259765625, -12.2447509765625, -11.8232421875, -11.4017333984375, -10.980224609375, -10.5587158203125, -10.13720703125, -9.7156982421875, -9.294189453125, -8.8726806640625, -8.451171875, -8.0296630859375, -7.608154296875, -7.1866455078125, -6.76513671875, -6.3436279296875, -5.922119140625, -5.5006103515625, -5.0791015625, -4.6575927734375, -4.236083984375, -3.8145751953125, -3.39306640625, -2.9715576171875, -2.550048828125, -2.1285400390625, -1.70703125, -1.2855224609375, -0.864013671875, -0.4425048828125, -0.02099609375, 0.4005126953125, 0.822021484375, 1.2435302734375, 1.6650390625, 2.0865478515625, 2.508056640625, 2.9295654296875, 3.35107421875, 3.7725830078125, 4.194091796875, 4.6156005859375, 5.037109375, 5.4586181640625, 5.880126953125, 6.3016357421875, 6.72314453125, 7.1446533203125, 7.566162109375, 7.9876708984375, 8.4091796875, 8.8306884765625, 9.252197265625, 9.6737060546875, 10.09521484375, 10.5167236328125, 10.938232421875, 11.3597412109375, 11.78125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 14.0, 11.0, 26.0, 11.0, 25.0, 22.0, 26.0, 31.0, 34.0, 39.0, 43.0, 57.0, 54.0, 58.0, 44.0, 54.0, 45.0, 51.0, 52.0, 55.0, 32.0, 37.0, 44.0, 19.0, 22.0, 17.0, 14.0, 14.0, 11.0, 10.0, 8.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.2734375, -13.7938232421875, -13.314208984375, -12.8345947265625, -12.35498046875, -11.8753662109375, -11.395751953125, -10.9161376953125, -10.4365234375, -9.9569091796875, -9.477294921875, -8.9976806640625, -8.51806640625, -8.0384521484375, -7.558837890625, -7.0792236328125, -6.599609375, -6.1199951171875, -5.640380859375, -5.1607666015625, -4.68115234375, -4.2015380859375, -3.721923828125, -3.2423095703125, -2.7626953125, -2.2830810546875, -1.803466796875, -1.3238525390625, -0.84423828125, -0.3646240234375, 0.114990234375, 0.5946044921875, 1.07421875, 1.5538330078125, 2.033447265625, 2.5130615234375, 2.99267578125, 3.4722900390625, 3.951904296875, 4.4315185546875, 4.9111328125, 5.3907470703125, 5.870361328125, 6.3499755859375, 6.82958984375, 7.3092041015625, 7.788818359375, 8.2684326171875, 8.748046875, 9.2276611328125, 9.707275390625, 10.1868896484375, 10.66650390625, 11.1461181640625, 11.625732421875, 12.1053466796875, 12.5849609375, 13.0645751953125, 13.544189453125, 14.0238037109375, 14.50341796875, 14.9830322265625, 15.462646484375, 15.9422607421875, 16.421875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 7.0, 12.0, 10.0, 15.0, 19.0, 42.0, 56.0, 78.0, 160.0, 295.0, 594.0, 1758.0, 7500.0, 80561.0, 854527.0, 91751.0, 7923.0, 1849.0, 665.0, 300.0, 163.0, 89.0, 64.0, 31.0, 24.0, 21.0, 13.0, 7.0, 6.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9765625, -5.77410888671875, -5.5716552734375, -5.36920166015625, -5.166748046875, -4.96429443359375, -4.7618408203125, -4.55938720703125, -4.35693359375, -4.15447998046875, -3.9520263671875, -3.74957275390625, -3.547119140625, -3.34466552734375, -3.1422119140625, -2.93975830078125, -2.7373046875, -2.53485107421875, -2.3323974609375, -2.12994384765625, -1.927490234375, -1.72503662109375, -1.5225830078125, -1.32012939453125, -1.11767578125, -0.91522216796875, -0.7127685546875, -0.51031494140625, -0.307861328125, -0.10540771484375, 0.0970458984375, 0.29949951171875, 0.501953125, 0.70440673828125, 0.9068603515625, 1.10931396484375, 1.311767578125, 1.51422119140625, 1.7166748046875, 1.91912841796875, 2.12158203125, 2.32403564453125, 2.5264892578125, 2.72894287109375, 2.931396484375, 3.13385009765625, 3.3363037109375, 3.53875732421875, 3.7412109375, 3.94366455078125, 4.1461181640625, 4.34857177734375, 4.551025390625, 4.75347900390625, 4.9559326171875, 5.15838623046875, 5.36083984375, 5.56329345703125, 5.7657470703125, 5.96820068359375, 6.170654296875, 6.37310791015625, 6.5755615234375, 6.77801513671875, 6.98046875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 6.0, 13.0, 11.0, 20.0, 33.0, 42.0, 33.0, 85.0, 115.0, 116.0, 156.0, 97.0, 66.0, 74.0, 37.0, 33.0, 24.0, 9.0, 6.0, 6.0, 3.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010614395141601562, -0.0010262280702590942, -0.0009910166263580322, -0.0009558051824569702, -0.0009205937385559082, -0.0008853822946548462, -0.0008501708507537842, -0.0008149594068527222, -0.0007797479629516602, -0.0007445365190505981, -0.0007093250751495361, -0.0006741136312484741, -0.0006389021873474121, -0.0006036907434463501, -0.0005684792995452881, -0.0005332678556442261, -0.0004980564117431641, -0.00046284496784210205, -0.00042763352394104004, -0.00039242208003997803, -0.000357210636138916, -0.000321999192237854, -0.000286787748336792, -0.00025157630443573, -0.00021636486053466797, -0.00018115341663360596, -0.00014594197273254395, -0.00011073052883148193, -7.551908493041992e-05, -4.030764102935791e-05, -5.0961971282958984e-06, 3.0115246772766113e-05, 6.532669067382812e-05, 0.00010053813457489014, 0.00013574957847595215, 0.00017096102237701416, 0.00020617246627807617, 0.00024138391017913818, 0.0002765953540802002, 0.0003118067979812622, 0.0003470182418823242, 0.00038222968578338623, 0.00041744112968444824, 0.00045265257358551025, 0.00048786401748657227, 0.0005230754613876343, 0.0005582869052886963, 0.0005934983491897583, 0.0006287097930908203, 0.0006639212369918823, 0.0006991326808929443, 0.0007343441247940063, 0.0007695555686950684, 0.0008047670125961304, 0.0008399784564971924, 0.0008751899003982544, 0.0009104013442993164, 0.0009456127882003784, 0.0009808242321014404, 0.0010160356760025024, 0.0010512471199035645, 0.0010864585638046265, 0.0011216700077056885, 0.0011568814516067505, 0.0011920928955078125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 8.0, 8.0, 10.0, 17.0, 38.0, 50.0, 105.0, 188.0, 341.0, 933.0, 3192.0, 19878.0, 380733.0, 610784.0, 26454.0, 3897.0, 1065.0, 410.0, 191.0, 94.0, 51.0, 27.0, 23.0, 14.0, 10.0, 17.0, 11.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.24609375, -5.0447998046875, -4.843505859375, -4.6422119140625, -4.44091796875, -4.2396240234375, -4.038330078125, -3.8370361328125, -3.6357421875, -3.4344482421875, -3.233154296875, -3.0318603515625, -2.83056640625, -2.6292724609375, -2.427978515625, -2.2266845703125, -2.025390625, -1.8240966796875, -1.622802734375, -1.4215087890625, -1.22021484375, -1.0189208984375, -0.817626953125, -0.6163330078125, -0.4150390625, -0.2137451171875, -0.012451171875, 0.1888427734375, 0.39013671875, 0.5914306640625, 0.792724609375, 0.9940185546875, 1.1953125, 1.3966064453125, 1.597900390625, 1.7991943359375, 2.00048828125, 2.2017822265625, 2.403076171875, 2.6043701171875, 2.8056640625, 3.0069580078125, 3.208251953125, 3.4095458984375, 3.61083984375, 3.8121337890625, 4.013427734375, 4.2147216796875, 4.416015625, 4.6173095703125, 4.818603515625, 5.0198974609375, 5.22119140625, 5.4224853515625, 5.623779296875, 5.8250732421875, 6.0263671875, 6.2276611328125, 6.428955078125, 6.6302490234375, 6.83154296875, 7.0328369140625, 7.234130859375, 7.4354248046875, 7.63671875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 5.0, 7.0, 8.0, 16.0, 14.0, 16.0, 22.0, 24.0, 34.0, 39.0, 69.0, 75.0, 83.0, 92.0, 95.0, 96.0, 70.0, 53.0, 37.0, 30.0, 25.0, 28.0, 21.0, 10.0, 8.0, 4.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.83984375, -4.7049560546875, -4.570068359375, -4.4351806640625, -4.30029296875, -4.1654052734375, -4.030517578125, -3.8956298828125, -3.7607421875, -3.6258544921875, -3.490966796875, -3.3560791015625, -3.22119140625, -3.0863037109375, -2.951416015625, -2.8165283203125, -2.681640625, -2.5467529296875, -2.411865234375, -2.2769775390625, -2.14208984375, -2.0072021484375, -1.872314453125, -1.7374267578125, -1.6025390625, -1.4676513671875, -1.332763671875, -1.1978759765625, -1.06298828125, -0.9281005859375, -0.793212890625, -0.6583251953125, -0.5234375, -0.3885498046875, -0.253662109375, -0.1187744140625, 0.01611328125, 0.1510009765625, 0.285888671875, 0.4207763671875, 0.5556640625, 0.6905517578125, 0.825439453125, 0.9603271484375, 1.09521484375, 1.2301025390625, 1.364990234375, 1.4998779296875, 1.634765625, 1.7696533203125, 1.904541015625, 2.0394287109375, 2.17431640625, 2.3092041015625, 2.444091796875, 2.5789794921875, 2.7138671875, 2.8487548828125, 2.983642578125, 3.1185302734375, 3.25341796875, 3.3883056640625, 3.523193359375, 3.6580810546875, 3.79296875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 22.0, 45.0, 86.0, 187.0, 291.0, 184.0, 113.0, 40.0, 14.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-179.1162109375, -175.2705535888672, -171.42489624023438, -167.57923889160156, -163.73358154296875, -159.88792419433594, -156.04226684570312, -152.1966094970703, -148.3509521484375, -144.5052947998047, -140.65963745117188, -136.81398010253906, -132.96832275390625, -129.12266540527344, -125.27700805664062, -121.43135070800781, -117.58568572998047, -113.74002838134766, -109.89437103271484, -106.04871368408203, -102.20305633544922, -98.3573989868164, -94.51173400878906, -90.66607666015625, -86.82041931152344, -82.97476196289062, -79.12910461425781, -75.283447265625, -71.43778991699219, -67.59213256835938, -63.7464714050293, -59.900814056396484, -56.05516052246094, -52.209503173828125, -48.36384582519531, -44.5181884765625, -40.67253112792969, -36.826873779296875, -32.9812126159668, -29.135555267333984, -25.289897918701172, -21.44424057006836, -17.598583221435547, -13.752923965454102, -9.907266616821289, -6.061609268188477, -2.2159500122070312, 1.6297073364257812, 5.475364685058594, 9.321022033691406, 13.166680335998535, 17.012338638305664, 20.857995986938477, 24.70365333557129, 28.549312591552734, 32.39496994018555, 36.24062728881836, 40.08628463745117, 43.931941986083984, 47.77760314941406, 51.623260498046875, 55.46891784667969, 59.3145751953125, 63.16023254394531, 67.00588989257812]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 9.0, 5.0, 10.0, 18.0, 17.0, 16.0, 31.0, 34.0, 34.0, 43.0, 59.0, 56.0, 66.0, 77.0, 75.0, 89.0, 55.0, 58.0, 38.0, 37.0, 33.0, 29.0, 19.0, 22.0, 14.0, 20.0, 7.0, 11.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.52621078491211, -56.307403564453125, -54.088592529296875, -51.86978530883789, -49.650978088378906, -47.432167053222656, -45.21335983276367, -42.99455261230469, -40.77574157714844, -38.55693435668945, -36.3381233215332, -34.11931610107422, -31.9005069732666, -29.681697845458984, -27.462890625, -25.244081497192383, -23.025272369384766, -20.80646324157715, -18.58765411376953, -16.368846893310547, -14.15003776550293, -11.931228637695312, -9.712420463562012, -7.493612289428711, -5.274803161621094, -3.0559945106506348, -0.8371858596801758, 1.3816227912902832, 3.600431442260742, 5.819240570068359, 8.03804874420166, 10.256856918334961, 12.475669860839844, 14.694478988647461, 16.913288116455078, 19.132095336914062, 21.35090446472168, 23.569713592529297, 25.78852081298828, 28.0073299407959, 30.226139068603516, 32.4449462890625, 34.66375732421875, 36.882564544677734, 39.10137176513672, 41.32018280029297, 43.53899002075195, 45.75779724121094, 47.97660827636719, 50.19541549682617, 52.41422653198242, 54.633033752441406, 56.851844787597656, 59.07065200805664, 61.289459228515625, 63.508270263671875, 65.72708129882812, 67.94589233398438, 70.1646957397461, 72.38350677490234, 74.6023178100586, 76.82112121582031, 79.03993225097656, 81.25874328613281, 83.47754669189453]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 3.0, 5.0, 15.0, 13.0, 18.0, 23.0, 29.0, 49.0, 80.0, 120.0, 196.0, 350.0, 570.0, 1029.0, 1915.0, 3881.0, 7801.0, 17399.0, 46007.0, 172632.0, 1081602.0, 2291934.0, 428877.0, 87504.0, 29054.0, 11909.0, 5443.0, 2708.0, 1395.0, 693.0, 447.0, 219.0, 140.0, 79.0, 41.0, 28.0, 21.0, 15.0, 12.0, 6.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.60546875, -4.48187255859375, -4.3582763671875, -4.23468017578125, -4.111083984375, -3.98748779296875, -3.8638916015625, -3.74029541015625, -3.61669921875, -3.49310302734375, -3.3695068359375, -3.24591064453125, -3.122314453125, -2.99871826171875, -2.8751220703125, -2.75152587890625, -2.6279296875, -2.50433349609375, -2.3807373046875, -2.25714111328125, -2.133544921875, -2.00994873046875, -1.8863525390625, -1.76275634765625, -1.63916015625, -1.51556396484375, -1.3919677734375, -1.26837158203125, -1.144775390625, -1.02117919921875, -0.8975830078125, -0.77398681640625, -0.650390625, -0.52679443359375, -0.4031982421875, -0.27960205078125, -0.156005859375, -0.03240966796875, 0.0911865234375, 0.21478271484375, 0.33837890625, 0.46197509765625, 0.5855712890625, 0.70916748046875, 0.832763671875, 0.95635986328125, 1.0799560546875, 1.20355224609375, 1.3271484375, 1.45074462890625, 1.5743408203125, 1.69793701171875, 1.821533203125, 1.94512939453125, 2.0687255859375, 2.19232177734375, 2.31591796875, 2.43951416015625, 2.5631103515625, 2.68670654296875, 2.810302734375, 2.93389892578125, 3.0574951171875, 3.18109130859375, 3.3046875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 14.0, 12.0, 11.0, 12.0, 22.0, 21.0, 26.0, 32.0, 36.0, 39.0, 41.0, 48.0, 48.0, 42.0, 48.0, 53.0, 54.0, 48.0, 48.0, 61.0, 37.0, 44.0, 32.0, 21.0, 17.0, 25.0, 26.0, 16.0, 13.0, 8.0, 10.0, 6.0, 8.0, 4.0, 6.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.166015625, -3.06585693359375, -2.9656982421875, -2.86553955078125, -2.765380859375, -2.66522216796875, -2.5650634765625, -2.46490478515625, -2.36474609375, -2.26458740234375, -2.1644287109375, -2.06427001953125, -1.964111328125, -1.86395263671875, -1.7637939453125, -1.66363525390625, -1.5634765625, -1.46331787109375, -1.3631591796875, -1.26300048828125, -1.162841796875, -1.06268310546875, -0.9625244140625, -0.86236572265625, -0.76220703125, -0.66204833984375, -0.5618896484375, -0.46173095703125, -0.361572265625, -0.26141357421875, -0.1612548828125, -0.06109619140625, 0.0390625, 0.13922119140625, 0.2393798828125, 0.33953857421875, 0.439697265625, 0.53985595703125, 0.6400146484375, 0.74017333984375, 0.84033203125, 0.94049072265625, 1.0406494140625, 1.14080810546875, 1.240966796875, 1.34112548828125, 1.4412841796875, 1.54144287109375, 1.6416015625, 1.74176025390625, 1.8419189453125, 1.94207763671875, 2.042236328125, 2.14239501953125, 2.2425537109375, 2.34271240234375, 2.44287109375, 2.54302978515625, 2.6431884765625, 2.74334716796875, 2.843505859375, 2.94366455078125, 3.0438232421875, 3.14398193359375, 3.244140625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 5.0, 12.0, 11.0, 24.0, 39.0, 61.0, 125.0, 228.0, 700.0, 2457.0, 14915.0, 194561.0, 3804989.0, 159416.0, 13150.0, 2287.0, 683.0, 262.0, 159.0, 76.0, 39.0, 36.0, 13.0, 8.0, 5.0, 10.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4921875, -11.0582275390625, -10.624267578125, -10.1903076171875, -9.75634765625, -9.3223876953125, -8.888427734375, -8.4544677734375, -8.0205078125, -7.5865478515625, -7.152587890625, -6.7186279296875, -6.28466796875, -5.8507080078125, -5.416748046875, -4.9827880859375, -4.548828125, -4.1148681640625, -3.680908203125, -3.2469482421875, -2.81298828125, -2.3790283203125, -1.945068359375, -1.5111083984375, -1.0771484375, -0.6431884765625, -0.209228515625, 0.2247314453125, 0.65869140625, 1.0926513671875, 1.526611328125, 1.9605712890625, 2.39453125, 2.8284912109375, 3.262451171875, 3.6964111328125, 4.13037109375, 4.5643310546875, 4.998291015625, 5.4322509765625, 5.8662109375, 6.3001708984375, 6.734130859375, 7.1680908203125, 7.60205078125, 8.0360107421875, 8.469970703125, 8.9039306640625, 9.337890625, 9.7718505859375, 10.205810546875, 10.6397705078125, 11.07373046875, 11.5076904296875, 11.941650390625, 12.3756103515625, 12.8095703125, 13.2435302734375, 13.677490234375, 14.1114501953125, 14.54541015625, 14.9793701171875, 15.413330078125, 15.8472900390625, 16.28125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 0.0, 9.0, 12.0, 11.0, 16.0, 20.0, 31.0, 38.0, 60.0, 60.0, 87.0, 153.0, 215.0, 397.0, 722.0, 896.0, 558.0, 256.0, 187.0, 104.0, 74.0, 45.0, 36.0, 17.0, 17.0, 14.0, 8.0, 5.0, 6.0, 6.0, 5.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.24859619140625, -6.9620361328125, -6.67547607421875, -6.388916015625, -6.10235595703125, -5.8157958984375, -5.52923583984375, -5.24267578125, -4.95611572265625, -4.6695556640625, -4.38299560546875, -4.096435546875, -3.80987548828125, -3.5233154296875, -3.23675537109375, -2.9501953125, -2.66363525390625, -2.3770751953125, -2.09051513671875, -1.803955078125, -1.51739501953125, -1.2308349609375, -0.94427490234375, -0.65771484375, -0.37115478515625, -0.0845947265625, 0.20196533203125, 0.488525390625, 0.77508544921875, 1.0616455078125, 1.34820556640625, 1.634765625, 1.92132568359375, 2.2078857421875, 2.49444580078125, 2.781005859375, 3.06756591796875, 3.3541259765625, 3.64068603515625, 3.92724609375, 4.21380615234375, 4.5003662109375, 4.78692626953125, 5.073486328125, 5.36004638671875, 5.6466064453125, 5.93316650390625, 6.2197265625, 6.50628662109375, 6.7928466796875, 7.07940673828125, 7.365966796875, 7.65252685546875, 7.9390869140625, 8.22564697265625, 8.51220703125, 8.79876708984375, 9.0853271484375, 9.37188720703125, 9.658447265625, 9.94500732421875, 10.2315673828125, 10.51812744140625, 10.8046875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 20.0, 81.0, 356.0, 395.0, 104.0, 23.0, 3.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-219.24368286132812, -212.63424682617188, -206.0248260498047, -199.41539001464844, -192.80596923828125, -186.196533203125, -179.5871124267578, -172.97767639160156, -166.36825561523438, -159.75881958007812, -153.14939880371094, -146.5399627685547, -139.9305419921875, -133.32110595703125, -126.71168518066406, -120.10224914550781, -113.4928207397461, -106.88339233398438, -100.27396392822266, -93.66453552246094, -87.05510711669922, -80.4456787109375, -73.83624267578125, -67.22682189941406, -60.61738967895508, -54.00796127319336, -47.39853286743164, -40.789100646972656, -34.17967224121094, -27.57024383544922, -20.9608154296875, -14.351387023925781, -7.7419586181640625, -1.1325297355651855, 5.476899147033691, 12.086328506469727, 18.695756912231445, 25.305187225341797, 31.914615631103516, 38.524044036865234, 45.13347244262695, 51.74290084838867, 58.35232925415039, 64.96176147460938, 71.5711898803711, 78.18061828613281, 84.79004669189453, 91.39947509765625, 98.00890350341797, 104.61833190917969, 111.2277603149414, 117.83718872070312, 124.44661712646484, 131.05604553222656, 137.6654815673828, 144.27490234375, 150.88433837890625, 157.4937744140625, 164.1031951904297, 170.71263122558594, 177.32205200195312, 183.93148803710938, 190.54090881347656, 197.1503448486328, 203.759765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 6.0, 8.0, 11.0, 17.0, 19.0, 30.0, 47.0, 39.0, 43.0, 44.0, 59.0, 63.0, 56.0, 59.0, 56.0, 57.0, 66.0, 65.0, 45.0, 32.0, 43.0, 30.0, 26.0, 16.0, 17.0, 10.0, 9.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.18329620361328, -37.494407653808594, -35.80552291870117, -34.116634368896484, -32.4277458190918, -30.738861083984375, -29.049972534179688, -27.361085891723633, -25.672199249267578, -23.983312606811523, -22.294424057006836, -20.60553741455078, -18.916650772094727, -17.227764129638672, -15.538875579833984, -13.84998893737793, -12.161100387573242, -10.472212791442871, -8.783326148986816, -7.094438552856445, -5.405551433563232, -3.7166643142700195, -2.0277767181396484, -0.33889007568359375, 1.3499975204467773, 3.0388846397399902, 4.727771759033203, 6.416659355163574, 8.105546951293945, 9.79443359375, 11.483321189880371, 13.172207832336426, 14.861095428466797, 16.54998207092285, 18.23887062072754, 19.927757263183594, 21.61664390563965, 23.305530548095703, 24.99441909790039, 26.683305740356445, 28.3721923828125, 30.061079025268555, 31.749967575073242, 33.4388542175293, 35.127742767333984, 36.816627502441406, 38.505516052246094, 40.19440460205078, 41.88329315185547, 43.572181701660156, 45.26106643676758, 46.949954986572266, 48.63884353637695, 50.327728271484375, 52.01661682128906, 53.70550537109375, 55.39439010620117, 57.08327865600586, 58.77216339111328, 60.46105194091797, 62.149940490722656, 63.83882522583008, 65.5277099609375, 67.21659851074219, 68.90548706054688]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 10.0, 6.0, 24.0, 29.0, 37.0, 72.0, 113.0, 158.0, 285.0, 512.0, 1009.0, 2129.0, 4668.0, 10977.0, 25702.0, 61661.0, 147250.0, 309011.0, 273535.0, 122290.0, 51348.0, 21242.0, 8880.0, 3799.0, 1776.0, 894.0, 449.0, 248.0, 167.0, 95.0, 58.0, 38.0, 25.0, 26.0, 12.0, 10.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.6776123046875, -4.503662109375, -4.3297119140625, -4.15576171875, -3.9818115234375, -3.807861328125, -3.6339111328125, -3.4599609375, -3.2860107421875, -3.112060546875, -2.9381103515625, -2.76416015625, -2.5902099609375, -2.416259765625, -2.2423095703125, -2.068359375, -1.8944091796875, -1.720458984375, -1.5465087890625, -1.37255859375, -1.1986083984375, -1.024658203125, -0.8507080078125, -0.6767578125, -0.5028076171875, -0.328857421875, -0.1549072265625, 0.01904296875, 0.1929931640625, 0.366943359375, 0.5408935546875, 0.71484375, 0.8887939453125, 1.062744140625, 1.2366943359375, 1.41064453125, 1.5845947265625, 1.758544921875, 1.9324951171875, 2.1064453125, 2.2803955078125, 2.454345703125, 2.6282958984375, 2.80224609375, 2.9761962890625, 3.150146484375, 3.3240966796875, 3.498046875, 3.6719970703125, 3.845947265625, 4.0198974609375, 4.19384765625, 4.3677978515625, 4.541748046875, 4.7156982421875, 4.8896484375, 5.0635986328125, 5.237548828125, 5.4114990234375, 5.58544921875, 5.7593994140625, 5.933349609375, 6.1072998046875, 6.28125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 5.0, 9.0, 6.0, 15.0, 20.0, 19.0, 25.0, 21.0, 21.0, 37.0, 35.0, 43.0, 29.0, 34.0, 45.0, 32.0, 54.0, 53.0, 45.0, 45.0, 51.0, 50.0, 33.0, 28.0, 28.0, 31.0, 27.0, 27.0, 20.0, 15.0, 13.0, 19.0, 13.0, 9.0, 8.0, 5.0, 6.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8359375, -2.7464599609375, -2.656982421875, -2.5675048828125, -2.47802734375, -2.3885498046875, -2.299072265625, -2.2095947265625, -2.1201171875, -2.0306396484375, -1.941162109375, -1.8516845703125, -1.76220703125, -1.6727294921875, -1.583251953125, -1.4937744140625, -1.404296875, -1.3148193359375, -1.225341796875, -1.1358642578125, -1.04638671875, -0.9569091796875, -0.867431640625, -0.7779541015625, -0.6884765625, -0.5989990234375, -0.509521484375, -0.4200439453125, -0.33056640625, -0.2410888671875, -0.151611328125, -0.0621337890625, 0.02734375, 0.1168212890625, 0.206298828125, 0.2957763671875, 0.38525390625, 0.4747314453125, 0.564208984375, 0.6536865234375, 0.7431640625, 0.8326416015625, 0.922119140625, 1.0115966796875, 1.10107421875, 1.1905517578125, 1.280029296875, 1.3695068359375, 1.458984375, 1.5484619140625, 1.637939453125, 1.7274169921875, 1.81689453125, 1.9063720703125, 1.995849609375, 2.0853271484375, 2.1748046875, 2.2642822265625, 2.353759765625, 2.4432373046875, 2.53271484375, 2.6221923828125, 2.711669921875, 2.8011474609375, 2.890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 9.0, 4.0, 9.0, 22.0, 25.0, 34.0, 49.0, 79.0, 106.0, 146.0, 228.0, 395.0, 568.0, 841.0, 1544.0, 3269.0, 10230.0, 53703.0, 536931.0, 377075.0, 46997.0, 9402.0, 3039.0, 1457.0, 879.0, 510.0, 333.0, 214.0, 143.0, 96.0, 74.0, 37.0, 29.0, 27.0, 18.0, 17.0, 3.0, 2.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8828125, -10.507080078125, -10.13134765625, -9.755615234375, -9.3798828125, -9.004150390625, -8.62841796875, -8.252685546875, -7.876953125, -7.501220703125, -7.12548828125, -6.749755859375, -6.3740234375, -5.998291015625, -5.62255859375, -5.246826171875, -4.87109375, -4.495361328125, -4.11962890625, -3.743896484375, -3.3681640625, -2.992431640625, -2.61669921875, -2.240966796875, -1.865234375, -1.489501953125, -1.11376953125, -0.738037109375, -0.3623046875, 0.013427734375, 0.38916015625, 0.764892578125, 1.140625, 1.516357421875, 1.89208984375, 2.267822265625, 2.6435546875, 3.019287109375, 3.39501953125, 3.770751953125, 4.146484375, 4.522216796875, 4.89794921875, 5.273681640625, 5.6494140625, 6.025146484375, 6.40087890625, 6.776611328125, 7.15234375, 7.528076171875, 7.90380859375, 8.279541015625, 8.6552734375, 9.031005859375, 9.40673828125, 9.782470703125, 10.158203125, 10.533935546875, 10.90966796875, 11.285400390625, 11.6611328125, 12.036865234375, 12.41259765625, 12.788330078125, 13.1640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 6.0, 9.0, 4.0, 3.0, 6.0, 20.0, 16.0, 11.0, 21.0, 25.0, 19.0, 28.0, 26.0, 31.0, 29.0, 46.0, 42.0, 49.0, 54.0, 43.0, 36.0, 45.0, 44.0, 51.0, 49.0, 48.0, 44.0, 25.0, 24.0, 13.0, 24.0, 23.0, 15.0, 14.0, 12.0, 12.0, 8.0, 6.0, 7.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.5390625, -12.1136474609375, -11.688232421875, -11.2628173828125, -10.83740234375, -10.4119873046875, -9.986572265625, -9.5611572265625, -9.1357421875, -8.7103271484375, -8.284912109375, -7.8594970703125, -7.43408203125, -7.0086669921875, -6.583251953125, -6.1578369140625, -5.732421875, -5.3070068359375, -4.881591796875, -4.4561767578125, -4.03076171875, -3.6053466796875, -3.179931640625, -2.7545166015625, -2.3291015625, -1.9036865234375, -1.478271484375, -1.0528564453125, -0.62744140625, -0.2020263671875, 0.223388671875, 0.6488037109375, 1.07421875, 1.4996337890625, 1.925048828125, 2.3504638671875, 2.77587890625, 3.2012939453125, 3.626708984375, 4.0521240234375, 4.4775390625, 4.9029541015625, 5.328369140625, 5.7537841796875, 6.17919921875, 6.6046142578125, 7.030029296875, 7.4554443359375, 7.880859375, 8.3062744140625, 8.731689453125, 9.1571044921875, 9.58251953125, 10.0079345703125, 10.433349609375, 10.8587646484375, 11.2841796875, 11.7095947265625, 12.135009765625, 12.5604248046875, 12.98583984375, 13.4112548828125, 13.836669921875, 14.2620849609375, 14.6875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 7.0, 10.0, 14.0, 20.0, 49.0, 80.0, 204.0, 547.0, 2141.0, 19041.0, 810225.0, 206923.0, 7469.0, 1188.0, 348.0, 129.0, 71.0, 36.0, 21.0, 13.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0703125, -7.84503173828125, -7.6197509765625, -7.39447021484375, -7.169189453125, -6.94390869140625, -6.7186279296875, -6.49334716796875, -6.26806640625, -6.04278564453125, -5.8175048828125, -5.59222412109375, -5.366943359375, -5.14166259765625, -4.9163818359375, -4.69110107421875, -4.4658203125, -4.24053955078125, -4.0152587890625, -3.78997802734375, -3.564697265625, -3.33941650390625, -3.1141357421875, -2.88885498046875, -2.66357421875, -2.43829345703125, -2.2130126953125, -1.98773193359375, -1.762451171875, -1.53717041015625, -1.3118896484375, -1.08660888671875, -0.861328125, -0.63604736328125, -0.4107666015625, -0.18548583984375, 0.039794921875, 0.26507568359375, 0.4903564453125, 0.71563720703125, 0.94091796875, 1.16619873046875, 1.3914794921875, 1.61676025390625, 1.842041015625, 2.06732177734375, 2.2926025390625, 2.51788330078125, 2.7431640625, 2.96844482421875, 3.1937255859375, 3.41900634765625, 3.644287109375, 3.86956787109375, 4.0948486328125, 4.32012939453125, 4.54541015625, 4.77069091796875, 4.9959716796875, 5.22125244140625, 5.446533203125, 5.67181396484375, 5.8970947265625, 6.12237548828125, 6.34765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 5.0, 5.0, 11.0, 10.0, 20.0, 19.0, 23.0, 17.0, 28.0, 37.0, 49.0, 63.0, 67.0, 78.0, 94.0, 87.0, 70.0, 57.0, 50.0, 39.0, 34.0, 29.0, 15.0, 21.0, 7.0, 15.0, 12.0, 6.0, 6.0, 3.0, 2.0, 10.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006961822509765625, -0.0006748288869857788, -0.0006534755229949951, -0.0006321221590042114, -0.0006107687950134277, -0.000589415431022644, -0.0005680620670318604, -0.0005467087030410767, -0.000525355339050293, -0.0005040019750595093, -0.0004826486110687256, -0.0004612952470779419, -0.0004399418830871582, -0.0004185885190963745, -0.0003972351551055908, -0.00037588179111480713, -0.00035452842712402344, -0.00033317506313323975, -0.00031182169914245605, -0.00029046833515167236, -0.00026911497116088867, -0.000247761607170105, -0.0002264082431793213, -0.0002050548791885376, -0.0001837015151977539, -0.00016234815120697021, -0.00014099478721618652, -0.00011964142322540283, -9.828805923461914e-05, -7.693469524383545e-05, -5.558133125305176e-05, -3.4227967262268066e-05, -1.2874603271484375e-05, 8.478760719299316e-06, 2.9832124710083008e-05, 5.11854887008667e-05, 7.253885269165039e-05, 9.389221668243408e-05, 0.00011524558067321777, 0.00013659894466400146, 0.00015795230865478516, 0.00017930567264556885, 0.00020065903663635254, 0.00022201240062713623, 0.00024336576461791992, 0.0002647191286087036, 0.0002860724925994873, 0.000307425856590271, 0.0003287792205810547, 0.0003501325845718384, 0.00037148594856262207, 0.00039283931255340576, 0.00041419267654418945, 0.00043554604053497314, 0.00045689940452575684, 0.00047825276851654053, 0.0004996061325073242, 0.0005209594964981079, 0.0005423128604888916, 0.0005636662244796753, 0.000585019588470459, 0.0006063729524612427, 0.0006277263164520264, 0.0006490796804428101, 0.0006704330444335938]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 3.0, 8.0, 15.0, 19.0, 29.0, 28.0, 41.0, 81.0, 99.0, 185.0, 274.0, 549.0, 1070.0, 2491.0, 6974.0, 27908.0, 180371.0, 698499.0, 102512.0, 18332.0, 5054.0, 1907.0, 867.0, 474.0, 264.0, 150.0, 107.0, 79.0, 39.0, 34.0, 15.0, 18.0, 12.0, 8.0, 1.0, 8.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1953125, -3.08648681640625, -2.9776611328125, -2.86883544921875, -2.760009765625, -2.65118408203125, -2.5423583984375, -2.43353271484375, -2.32470703125, -2.21588134765625, -2.1070556640625, -1.99822998046875, -1.889404296875, -1.78057861328125, -1.6717529296875, -1.56292724609375, -1.4541015625, -1.34527587890625, -1.2364501953125, -1.12762451171875, -1.018798828125, -0.90997314453125, -0.8011474609375, -0.69232177734375, -0.58349609375, -0.47467041015625, -0.3658447265625, -0.25701904296875, -0.148193359375, -0.03936767578125, 0.0694580078125, 0.17828369140625, 0.287109375, 0.39593505859375, 0.5047607421875, 0.61358642578125, 0.722412109375, 0.83123779296875, 0.9400634765625, 1.04888916015625, 1.15771484375, 1.26654052734375, 1.3753662109375, 1.48419189453125, 1.593017578125, 1.70184326171875, 1.8106689453125, 1.91949462890625, 2.0283203125, 2.13714599609375, 2.2459716796875, 2.35479736328125, 2.463623046875, 2.57244873046875, 2.6812744140625, 2.79010009765625, 2.89892578125, 3.00775146484375, 3.1165771484375, 3.22540283203125, 3.334228515625, 3.44305419921875, 3.5518798828125, 3.66070556640625, 3.76953125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 18.0, 16.0, 26.0, 47.0, 69.0, 73.0, 110.0, 131.0, 101.0, 122.0, 84.0, 69.0, 50.0, 24.0, 17.0, 17.0, 12.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6953125, -6.51531982421875, -6.3353271484375, -6.15533447265625, -5.975341796875, -5.79534912109375, -5.6153564453125, -5.43536376953125, -5.25537109375, -5.07537841796875, -4.8953857421875, -4.71539306640625, -4.535400390625, -4.35540771484375, -4.1754150390625, -3.99542236328125, -3.8154296875, -3.63543701171875, -3.4554443359375, -3.27545166015625, -3.095458984375, -2.91546630859375, -2.7354736328125, -2.55548095703125, -2.37548828125, -2.19549560546875, -2.0155029296875, -1.83551025390625, -1.655517578125, -1.47552490234375, -1.2955322265625, -1.11553955078125, -0.935546875, -0.75555419921875, -0.5755615234375, -0.39556884765625, -0.215576171875, -0.03558349609375, 0.1444091796875, 0.32440185546875, 0.50439453125, 0.68438720703125, 0.8643798828125, 1.04437255859375, 1.224365234375, 1.40435791015625, 1.5843505859375, 1.76434326171875, 1.9443359375, 2.12432861328125, 2.3043212890625, 2.48431396484375, 2.664306640625, 2.84429931640625, 3.0242919921875, 3.20428466796875, 3.38427734375, 3.56427001953125, 3.7442626953125, 3.92425537109375, 4.104248046875, 4.28424072265625, 4.4642333984375, 4.64422607421875, 4.82421875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 9.0, 13.0, 59.0, 138.0, 299.0, 284.0, 107.0, 60.0, 18.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.42897033691406, -187.26351928710938, -183.0980682373047, -178.9326171875, -174.7671661376953, -170.60171508789062, -166.43626403808594, -162.27081298828125, -158.1053466796875, -153.9398956298828, -149.77444458007812, -145.60899353027344, -141.44354248046875, -137.27809143066406, -133.11264038085938, -128.94717407226562, -124.78173828125, -120.61628723144531, -116.45083618164062, -112.28538513183594, -108.11993408203125, -103.95448303222656, -99.78902435302734, -95.62357330322266, -91.45812225341797, -87.29267120361328, -83.1272201538086, -78.9617691040039, -74.79631042480469, -70.630859375, -66.46540832519531, -62.299957275390625, -58.134521484375, -53.96907043457031, -49.803619384765625, -45.63816452026367, -41.472713470458984, -37.3072624206543, -33.141807556152344, -28.976356506347656, -24.81090545654297, -20.64545440673828, -16.48000144958496, -12.314549446105957, -8.149097442626953, -3.9836463928222656, 0.1818065643310547, 4.347259521484375, 8.512710571289062, 12.678162574768066, 16.84361457824707, 21.00906753540039, 25.174518585205078, 29.339969635009766, 33.50542449951172, 37.670875549316406, 41.836326599121094, 46.00177764892578, 50.16722869873047, 54.33268356323242, 58.49813461303711, 62.6635856628418, 66.82904052734375, 70.99449157714844, 75.15994262695312]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 4.0, 9.0, 9.0, 15.0, 12.0, 17.0, 15.0, 19.0, 24.0, 28.0, 35.0, 32.0, 24.0, 30.0, 42.0, 39.0, 61.0, 73.0, 59.0, 58.0, 56.0, 41.0, 36.0, 24.0, 33.0, 28.0, 31.0, 26.0, 13.0, 20.0, 11.0, 11.0, 7.0, 13.0, 11.0, 2.0, 5.0, 6.0, 4.0, 1.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.667144775390625, -43.14491271972656, -41.622684478759766, -40.1004524230957, -38.578224182128906, -37.055992126464844, -35.53376007080078, -34.01152801513672, -32.48929977416992, -30.967069625854492, -29.444839477539062, -27.922607421875, -26.40037727355957, -24.87814712524414, -23.355915069580078, -21.83368492126465, -20.31145477294922, -18.78922462463379, -17.26699447631836, -15.744762420654297, -14.222532272338867, -12.700302124023438, -11.178071022033691, -9.655839920043945, -8.133609771728516, -6.611379146575928, -5.08914852142334, -3.566917896270752, -2.044687271118164, -0.5224566459655762, 0.9997739791870117, 2.522005081176758, 4.0442352294921875, 5.566465854644775, 7.088696479797363, 8.61092758178711, 10.133157730102539, 11.655387878417969, 13.177618980407715, 14.699850082397461, 16.22208023071289, 17.74431037902832, 19.26654052734375, 20.788772583007812, 22.311002731323242, 23.833232879638672, 25.355464935302734, 26.877695083618164, 28.399925231933594, 29.922155380249023, 31.444385528564453, 32.966617584228516, 34.48884582519531, 36.011077880859375, 37.53330993652344, 39.0555419921875, 40.5777702331543, 42.10000228881836, 43.622230529785156, 45.14446258544922, 46.66669464111328, 48.18892288208008, 49.71115493774414, 51.23338317871094, 52.755615234375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 7.0, 10.0, 14.0, 23.0, 36.0, 60.0, 92.0, 153.0, 277.0, 523.0, 927.0, 2073.0, 4675.0, 11208.0, 31371.0, 117581.0, 783722.0, 2567211.0, 544825.0, 86836.0, 25701.0, 9440.0, 3850.0, 1830.0, 849.0, 434.0, 232.0, 129.0, 65.0, 43.0, 37.0, 12.0, 12.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.93450927734375, -4.8026123046875, -4.67071533203125, -4.538818359375, -4.40692138671875, -4.2750244140625, -4.14312744140625, -4.01123046875, -3.87933349609375, -3.7474365234375, -3.61553955078125, -3.483642578125, -3.35174560546875, -3.2198486328125, -3.08795166015625, -2.9560546875, -2.82415771484375, -2.6922607421875, -2.56036376953125, -2.428466796875, -2.29656982421875, -2.1646728515625, -2.03277587890625, -1.90087890625, -1.76898193359375, -1.6370849609375, -1.50518798828125, -1.373291015625, -1.24139404296875, -1.1094970703125, -0.97760009765625, -0.845703125, -0.71380615234375, -0.5819091796875, -0.45001220703125, -0.318115234375, -0.18621826171875, -0.0543212890625, 0.07757568359375, 0.20947265625, 0.34136962890625, 0.4732666015625, 0.60516357421875, 0.737060546875, 0.86895751953125, 1.0008544921875, 1.13275146484375, 1.2646484375, 1.39654541015625, 1.5284423828125, 1.66033935546875, 1.792236328125, 1.92413330078125, 2.0560302734375, 2.18792724609375, 2.31982421875, 2.45172119140625, 2.5836181640625, 2.71551513671875, 2.847412109375, 2.97930908203125, 3.1112060546875, 3.24310302734375, 3.375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 0.0, 10.0, 10.0, 11.0, 10.0, 16.0, 18.0, 33.0, 32.0, 40.0, 41.0, 42.0, 38.0, 43.0, 39.0, 44.0, 55.0, 66.0, 61.0, 59.0, 51.0, 43.0, 47.0, 33.0, 31.0, 19.0, 25.0, 11.0, 11.0, 19.0, 11.0, 11.0, 7.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.0, -2.89654541015625, -2.7930908203125, -2.68963623046875, -2.586181640625, -2.48272705078125, -2.3792724609375, -2.27581787109375, -2.17236328125, -2.06890869140625, -1.9654541015625, -1.86199951171875, -1.758544921875, -1.65509033203125, -1.5516357421875, -1.44818115234375, -1.3447265625, -1.24127197265625, -1.1378173828125, -1.03436279296875, -0.930908203125, -0.82745361328125, -0.7239990234375, -0.62054443359375, -0.51708984375, -0.41363525390625, -0.3101806640625, -0.20672607421875, -0.103271484375, 0.00018310546875, 0.1036376953125, 0.20709228515625, 0.310546875, 0.41400146484375, 0.5174560546875, 0.62091064453125, 0.724365234375, 0.82781982421875, 0.9312744140625, 1.03472900390625, 1.13818359375, 1.24163818359375, 1.3450927734375, 1.44854736328125, 1.552001953125, 1.65545654296875, 1.7589111328125, 1.86236572265625, 1.9658203125, 2.06927490234375, 2.1727294921875, 2.27618408203125, 2.379638671875, 2.48309326171875, 2.5865478515625, 2.69000244140625, 2.79345703125, 2.89691162109375, 3.0003662109375, 3.10382080078125, 3.207275390625, 3.31072998046875, 3.4141845703125, 3.51763916015625, 3.62109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 6.0, 11.0, 12.0, 14.0, 26.0, 25.0, 38.0, 58.0, 87.0, 144.0, 231.0, 399.0, 683.0, 1399.0, 3071.0, 7998.0, 25060.0, 101206.0, 917087.0, 2845499.0, 226514.0, 43960.0, 12635.0, 4464.0, 1716.0, 817.0, 443.0, 230.0, 140.0, 93.0, 44.0, 43.0, 29.0, 27.0, 19.0, 9.0, 10.0, 8.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0], "bins": [-6.625, -6.43145751953125, -6.2379150390625, -6.04437255859375, -5.850830078125, -5.65728759765625, -5.4637451171875, -5.27020263671875, -5.07666015625, -4.88311767578125, -4.6895751953125, -4.49603271484375, -4.302490234375, -4.10894775390625, -3.9154052734375, -3.72186279296875, -3.5283203125, -3.33477783203125, -3.1412353515625, -2.94769287109375, -2.754150390625, -2.56060791015625, -2.3670654296875, -2.17352294921875, -1.97998046875, -1.78643798828125, -1.5928955078125, -1.39935302734375, -1.205810546875, -1.01226806640625, -0.8187255859375, -0.62518310546875, -0.431640625, -0.23809814453125, -0.0445556640625, 0.14898681640625, 0.342529296875, 0.53607177734375, 0.7296142578125, 0.92315673828125, 1.11669921875, 1.31024169921875, 1.5037841796875, 1.69732666015625, 1.890869140625, 2.08441162109375, 2.2779541015625, 2.47149658203125, 2.6650390625, 2.85858154296875, 3.0521240234375, 3.24566650390625, 3.439208984375, 3.63275146484375, 3.8262939453125, 4.01983642578125, 4.21337890625, 4.40692138671875, 4.6004638671875, 4.79400634765625, 4.987548828125, 5.18109130859375, 5.3746337890625, 5.56817626953125, 5.76171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 13.0, 15.0, 14.0, 19.0, 24.0, 41.0, 50.0, 75.0, 88.0, 136.0, 232.0, 391.0, 580.0, 747.0, 598.0, 365.0, 215.0, 139.0, 77.0, 53.0, 40.0, 40.0, 28.0, 12.0, 17.0, 10.0, 13.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.5625, -8.3338623046875, -8.105224609375, -7.8765869140625, -7.64794921875, -7.4193115234375, -7.190673828125, -6.9620361328125, -6.7333984375, -6.5047607421875, -6.276123046875, -6.0474853515625, -5.81884765625, -5.5902099609375, -5.361572265625, -5.1329345703125, -4.904296875, -4.6756591796875, -4.447021484375, -4.2183837890625, -3.98974609375, -3.7611083984375, -3.532470703125, -3.3038330078125, -3.0751953125, -2.8465576171875, -2.617919921875, -2.3892822265625, -2.16064453125, -1.9320068359375, -1.703369140625, -1.4747314453125, -1.24609375, -1.0174560546875, -0.788818359375, -0.5601806640625, -0.33154296875, -0.1029052734375, 0.125732421875, 0.3543701171875, 0.5830078125, 0.8116455078125, 1.040283203125, 1.2689208984375, 1.49755859375, 1.7261962890625, 1.954833984375, 2.1834716796875, 2.412109375, 2.6407470703125, 2.869384765625, 3.0980224609375, 3.32666015625, 3.5552978515625, 3.783935546875, 4.0125732421875, 4.2412109375, 4.4698486328125, 4.698486328125, 4.9271240234375, 5.15576171875, 5.3843994140625, 5.613037109375, 5.8416748046875, 6.0703125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 33.0, 67.0, 144.0, 236.0, 268.0, 145.0, 61.0, 19.0, 7.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-123.30146026611328, -119.98234558105469, -116.6632308959961, -113.3441162109375, -110.02500915527344, -106.70588684082031, -103.38677978515625, -100.06766510009766, -96.74855041503906, -93.42943572998047, -90.11032104492188, -86.79120635986328, -83.47209167480469, -80.15298461914062, -76.83386993408203, -73.51475524902344, -70.19564056396484, -66.87652587890625, -63.557411193847656, -60.23830032348633, -56.919185638427734, -53.60007095336914, -50.28096008300781, -46.96184539794922, -43.642730712890625, -40.32361602783203, -37.00450134277344, -33.68539047241211, -30.366275787353516, -27.047161102294922, -23.72804832458496, -20.408935546875, -17.089828491210938, -13.77071475982666, -10.451601028442383, -7.1324872970581055, -3.813373565673828, -0.4942588806152344, 2.8248538970947266, 6.1439666748046875, 9.463081359863281, 12.782195091247559, 16.101308822631836, 19.420421600341797, 22.73953628540039, 26.058650970458984, 29.377763748168945, 32.696876525878906, 36.0159912109375, 39.335105895996094, 42.65422058105469, 45.973331451416016, 49.29244613647461, 52.6115608215332, 55.93067169189453, 59.249786376953125, 62.56890106201172, 65.88801574707031, 69.2071304321289, 72.5262451171875, 75.84535217285156, 79.16447448730469, 82.48358154296875, 85.80269622802734, 89.12181091308594]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 6.0, 10.0, 14.0, 12.0, 12.0, 12.0, 18.0, 26.0, 25.0, 31.0, 28.0, 36.0, 40.0, 39.0, 36.0, 44.0, 49.0, 49.0, 59.0, 50.0, 60.0, 51.0, 46.0, 30.0, 32.0, 31.0, 33.0, 19.0, 20.0, 14.0, 13.0, 10.0, 16.0, 1.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-41.623390197753906, -40.47854232788086, -39.33369445800781, -38.188846588134766, -37.04399871826172, -35.89915084838867, -34.754302978515625, -33.60945510864258, -32.46460723876953, -31.319759368896484, -30.174911499023438, -29.03006362915039, -27.885215759277344, -26.740367889404297, -25.59552001953125, -24.450672149658203, -23.305824279785156, -22.16097640991211, -21.016128540039062, -19.871280670166016, -18.72643280029297, -17.581584930419922, -16.436737060546875, -15.291889190673828, -14.147041320800781, -13.002193450927734, -11.857345581054688, -10.71249771118164, -9.567649841308594, -8.422801971435547, -7.2779541015625, -6.133106231689453, -4.988254547119141, -3.8434066772460938, -2.698558807373047, -1.5537109375, -0.4088630676269531, 0.7359848022460938, 1.8808326721191406, 3.0256805419921875, 4.170528411865234, 5.315376281738281, 6.460224151611328, 7.605072021484375, 8.749919891357422, 9.894767761230469, 11.039615631103516, 12.184463500976562, 13.32931137084961, 14.474159240722656, 15.619007110595703, 16.76385498046875, 17.908702850341797, 19.053550720214844, 20.19839859008789, 21.343246459960938, 22.488094329833984, 23.63294219970703, 24.777790069580078, 25.922637939453125, 27.067485809326172, 28.21233367919922, 29.357181549072266, 30.502029418945312, 31.64687728881836]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 9.0, 12.0, 17.0, 16.0, 32.0, 54.0, 85.0, 140.0, 231.0, 348.0, 598.0, 1020.0, 1822.0, 3515.0, 6926.0, 15161.0, 33374.0, 75846.0, 179251.0, 328410.0, 225666.0, 96726.0, 42205.0, 18874.0, 8770.0, 4369.0, 2188.0, 1156.0, 684.0, 405.0, 237.0, 166.0, 78.0, 63.0, 45.0, 20.0, 10.0, 8.0, 9.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.0390625, -5.86962890625, -5.7001953125, -5.53076171875, -5.361328125, -5.19189453125, -5.0224609375, -4.85302734375, -4.68359375, -4.51416015625, -4.3447265625, -4.17529296875, -4.005859375, -3.83642578125, -3.6669921875, -3.49755859375, -3.328125, -3.15869140625, -2.9892578125, -2.81982421875, -2.650390625, -2.48095703125, -2.3115234375, -2.14208984375, -1.97265625, -1.80322265625, -1.6337890625, -1.46435546875, -1.294921875, -1.12548828125, -0.9560546875, -0.78662109375, -0.6171875, -0.44775390625, -0.2783203125, -0.10888671875, 0.060546875, 0.22998046875, 0.3994140625, 0.56884765625, 0.73828125, 0.90771484375, 1.0771484375, 1.24658203125, 1.416015625, 1.58544921875, 1.7548828125, 1.92431640625, 2.09375, 2.26318359375, 2.4326171875, 2.60205078125, 2.771484375, 2.94091796875, 3.1103515625, 3.27978515625, 3.44921875, 3.61865234375, 3.7880859375, 3.95751953125, 4.126953125, 4.29638671875, 4.4658203125, 4.63525390625, 4.8046875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 6.0, 5.0, 6.0, 11.0, 14.0, 17.0, 16.0, 17.0, 14.0, 30.0, 36.0, 22.0, 39.0, 40.0, 48.0, 34.0, 49.0, 41.0, 42.0, 60.0, 47.0, 42.0, 47.0, 56.0, 31.0, 21.0, 33.0, 26.0, 16.0, 26.0, 20.0, 18.0, 20.0, 9.0, 8.0, 7.0, 4.0, 6.0, 8.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.838165283203125, -2.74664306640625, -2.655120849609375, -2.5635986328125, -2.472076416015625, -2.38055419921875, -2.289031982421875, -2.197509765625, -2.105987548828125, -2.01446533203125, -1.922943115234375, -1.8314208984375, -1.739898681640625, -1.64837646484375, -1.556854248046875, -1.46533203125, -1.373809814453125, -1.28228759765625, -1.190765380859375, -1.0992431640625, -1.007720947265625, -0.91619873046875, -0.824676513671875, -0.733154296875, -0.641632080078125, -0.55010986328125, -0.458587646484375, -0.3670654296875, -0.275543212890625, -0.18402099609375, -0.092498779296875, -0.0009765625, 0.090545654296875, 0.18206787109375, 0.273590087890625, 0.3651123046875, 0.456634521484375, 0.54815673828125, 0.639678955078125, 0.731201171875, 0.822723388671875, 0.91424560546875, 1.005767822265625, 1.0972900390625, 1.188812255859375, 1.28033447265625, 1.371856689453125, 1.46337890625, 1.554901123046875, 1.64642333984375, 1.737945556640625, 1.8294677734375, 1.920989990234375, 2.01251220703125, 2.104034423828125, 2.195556640625, 2.287078857421875, 2.37860107421875, 2.470123291015625, 2.5616455078125, 2.653167724609375, 2.74468994140625, 2.836212158203125, 2.927734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 5.0, 3.0, 9.0, 11.0, 16.0, 30.0, 31.0, 38.0, 43.0, 81.0, 120.0, 165.0, 229.0, 351.0, 623.0, 1069.0, 2052.0, 5020.0, 18754.0, 112834.0, 714858.0, 156493.0, 24259.0, 6008.0, 2410.0, 1138.0, 657.0, 372.0, 281.0, 169.0, 119.0, 94.0, 46.0, 44.0, 30.0, 29.0, 16.0, 11.0, 10.0, 7.0, 5.0, 8.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5234375, -11.1466064453125, -10.769775390625, -10.3929443359375, -10.01611328125, -9.6392822265625, -9.262451171875, -8.8856201171875, -8.5087890625, -8.1319580078125, -7.755126953125, -7.3782958984375, -7.00146484375, -6.6246337890625, -6.247802734375, -5.8709716796875, -5.494140625, -5.1173095703125, -4.740478515625, -4.3636474609375, -3.98681640625, -3.6099853515625, -3.233154296875, -2.8563232421875, -2.4794921875, -2.1026611328125, -1.725830078125, -1.3489990234375, -0.97216796875, -0.5953369140625, -0.218505859375, 0.1583251953125, 0.53515625, 0.9119873046875, 1.288818359375, 1.6656494140625, 2.04248046875, 2.4193115234375, 2.796142578125, 3.1729736328125, 3.5498046875, 3.9266357421875, 4.303466796875, 4.6802978515625, 5.05712890625, 5.4339599609375, 5.810791015625, 6.1876220703125, 6.564453125, 6.9412841796875, 7.318115234375, 7.6949462890625, 8.07177734375, 8.4486083984375, 8.825439453125, 9.2022705078125, 9.5791015625, 9.9559326171875, 10.332763671875, 10.7095947265625, 11.08642578125, 11.4632568359375, 11.840087890625, 12.2169189453125, 12.59375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 1.0, 5.0, 4.0, 2.0, 6.0, 13.0, 17.0, 17.0, 21.0, 30.0, 41.0, 37.0, 50.0, 50.0, 59.0, 62.0, 74.0, 62.0, 65.0, 50.0, 57.0, 52.0, 37.0, 48.0, 25.0, 32.0, 13.0, 14.0, 17.0, 9.0, 6.0, 10.0, 5.0, 5.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0], "bins": [-19.25, -18.785888671875, -18.32177734375, -17.857666015625, -17.3935546875, -16.929443359375, -16.46533203125, -16.001220703125, -15.537109375, -15.072998046875, -14.60888671875, -14.144775390625, -13.6806640625, -13.216552734375, -12.75244140625, -12.288330078125, -11.82421875, -11.360107421875, -10.89599609375, -10.431884765625, -9.9677734375, -9.503662109375, -9.03955078125, -8.575439453125, -8.111328125, -7.647216796875, -7.18310546875, -6.718994140625, -6.2548828125, -5.790771484375, -5.32666015625, -4.862548828125, -4.3984375, -3.934326171875, -3.47021484375, -3.006103515625, -2.5419921875, -2.077880859375, -1.61376953125, -1.149658203125, -0.685546875, -0.221435546875, 0.24267578125, 0.706787109375, 1.1708984375, 1.635009765625, 2.09912109375, 2.563232421875, 3.02734375, 3.491455078125, 3.95556640625, 4.419677734375, 4.8837890625, 5.347900390625, 5.81201171875, 6.276123046875, 6.740234375, 7.204345703125, 7.66845703125, 8.132568359375, 8.5966796875, 9.060791015625, 9.52490234375, 9.989013671875, 10.453125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 4.0, 8.0, 3.0, 4.0, 14.0, 6.0, 24.0, 13.0, 35.0, 32.0, 68.0, 131.0, 184.0, 313.0, 634.0, 1377.0, 4035.0, 15973.0, 113243.0, 762083.0, 126052.0, 17210.0, 4149.0, 1421.0, 657.0, 319.0, 188.0, 118.0, 65.0, 62.0, 39.0, 21.0, 19.0, 12.0, 9.0, 4.0, 8.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.955078125, -3.833465576171875, -3.71185302734375, -3.590240478515625, -3.4686279296875, -3.347015380859375, -3.22540283203125, -3.103790283203125, -2.982177734375, -2.860565185546875, -2.73895263671875, -2.617340087890625, -2.4957275390625, -2.374114990234375, -2.25250244140625, -2.130889892578125, -2.00927734375, -1.887664794921875, -1.76605224609375, -1.644439697265625, -1.5228271484375, -1.401214599609375, -1.27960205078125, -1.157989501953125, -1.036376953125, -0.914764404296875, -0.79315185546875, -0.671539306640625, -0.5499267578125, -0.428314208984375, -0.30670166015625, -0.185089111328125, -0.0634765625, 0.058135986328125, 0.17974853515625, 0.301361083984375, 0.4229736328125, 0.544586181640625, 0.66619873046875, 0.787811279296875, 0.909423828125, 1.031036376953125, 1.15264892578125, 1.274261474609375, 1.3958740234375, 1.517486572265625, 1.63909912109375, 1.760711669921875, 1.88232421875, 2.003936767578125, 2.12554931640625, 2.247161865234375, 2.3687744140625, 2.490386962890625, 2.61199951171875, 2.733612060546875, 2.855224609375, 2.976837158203125, 3.09844970703125, 3.220062255859375, 3.3416748046875, 3.463287353515625, 3.58489990234375, 3.706512451171875, 3.828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 6.0, 6.0, 12.0, 13.0, 10.0, 23.0, 27.0, 33.0, 56.0, 70.0, 97.0, 89.0, 108.0, 114.0, 103.0, 59.0, 46.0, 36.0, 28.0, 21.0, 21.0, 11.0, 3.0, 5.0, 7.0, 2.0, 1.0, 3.0, 3.0, 1.0], "bins": [-0.0014476776123046875, -0.001416534185409546, -0.0013853907585144043, -0.0013542473316192627, -0.001323103904724121, -0.0012919604778289795, -0.0012608170509338379, -0.0012296736240386963, -0.0011985301971435547, -0.001167386770248413, -0.0011362433433532715, -0.0011050999164581299, -0.0010739564895629883, -0.0010428130626678467, -0.001011669635772705, -0.0009805262088775635, -0.0009493827819824219, -0.0009182393550872803, -0.0008870959281921387, -0.0008559525012969971, -0.0008248090744018555, -0.0007936656475067139, -0.0007625222206115723, -0.0007313787937164307, -0.0007002353668212891, -0.0006690919399261475, -0.0006379485130310059, -0.0006068050861358643, -0.0005756616592407227, -0.0005445182323455811, -0.0005133748054504395, -0.00048223137855529785, -0.00045108795166015625, -0.00041994452476501465, -0.00038880109786987305, -0.00035765767097473145, -0.00032651424407958984, -0.00029537081718444824, -0.00026422739028930664, -0.00023308396339416504, -0.00020194053649902344, -0.00017079710960388184, -0.00013965368270874023, -0.00010851025581359863, -7.736682891845703e-05, -4.622340202331543e-05, -1.5079975128173828e-05, 1.6063451766967773e-05, 4.7206878662109375e-05, 7.835030555725098e-05, 0.00010949373245239258, 0.00014063715934753418, 0.00017178058624267578, 0.00020292401313781738, 0.00023406744003295898, 0.0002652108669281006, 0.0002963542938232422, 0.0003274977207183838, 0.0003586411476135254, 0.000389784574508667, 0.0004209280014038086, 0.0004520714282989502, 0.0004832148551940918, 0.0005143582820892334, 0.000545501708984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 8.0, 12.0, 10.0, 5.0, 15.0, 10.0, 30.0, 33.0, 53.0, 66.0, 109.0, 192.0, 300.0, 498.0, 923.0, 1988.0, 4243.0, 11521.0, 49522.0, 588525.0, 334360.0, 38544.0, 9907.0, 3822.0, 1735.0, 841.0, 480.0, 305.0, 157.0, 109.0, 56.0, 44.0, 28.0, 26.0, 25.0, 15.0, 3.0, 8.0, 9.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.951171875, -3.834716796875, -3.71826171875, -3.601806640625, -3.4853515625, -3.368896484375, -3.25244140625, -3.135986328125, -3.01953125, -2.903076171875, -2.78662109375, -2.670166015625, -2.5537109375, -2.437255859375, -2.32080078125, -2.204345703125, -2.087890625, -1.971435546875, -1.85498046875, -1.738525390625, -1.6220703125, -1.505615234375, -1.38916015625, -1.272705078125, -1.15625, -1.039794921875, -0.92333984375, -0.806884765625, -0.6904296875, -0.573974609375, -0.45751953125, -0.341064453125, -0.224609375, -0.108154296875, 0.00830078125, 0.124755859375, 0.2412109375, 0.357666015625, 0.47412109375, 0.590576171875, 0.70703125, 0.823486328125, 0.93994140625, 1.056396484375, 1.1728515625, 1.289306640625, 1.40576171875, 1.522216796875, 1.638671875, 1.755126953125, 1.87158203125, 1.988037109375, 2.1044921875, 2.220947265625, 2.33740234375, 2.453857421875, 2.5703125, 2.686767578125, 2.80322265625, 2.919677734375, 3.0361328125, 3.152587890625, 3.26904296875, 3.385498046875, 3.501953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 4.0, 2.0, 6.0, 6.0, 4.0, 9.0, 7.0, 17.0, 17.0, 23.0, 30.0, 50.0, 66.0, 77.0, 54.0, 71.0, 84.0, 71.0, 63.0, 65.0, 61.0, 42.0, 42.0, 24.0, 19.0, 20.0, 15.0, 11.0, 9.0, 5.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.900543212890625, -2.79522705078125, -2.689910888671875, -2.5845947265625, -2.479278564453125, -2.37396240234375, -2.268646240234375, -2.163330078125, -2.058013916015625, -1.95269775390625, -1.847381591796875, -1.7420654296875, -1.636749267578125, -1.53143310546875, -1.426116943359375, -1.32080078125, -1.215484619140625, -1.11016845703125, -1.004852294921875, -0.8995361328125, -0.794219970703125, -0.68890380859375, -0.583587646484375, -0.478271484375, -0.372955322265625, -0.26763916015625, -0.162322998046875, -0.0570068359375, 0.048309326171875, 0.15362548828125, 0.258941650390625, 0.3642578125, 0.469573974609375, 0.57489013671875, 0.680206298828125, 0.7855224609375, 0.890838623046875, 0.99615478515625, 1.101470947265625, 1.206787109375, 1.312103271484375, 1.41741943359375, 1.522735595703125, 1.6280517578125, 1.733367919921875, 1.83868408203125, 1.944000244140625, 2.04931640625, 2.154632568359375, 2.25994873046875, 2.365264892578125, 2.4705810546875, 2.575897216796875, 2.68121337890625, 2.786529541015625, 2.891845703125, 2.997161865234375, 3.10247802734375, 3.207794189453125, 3.3131103515625, 3.418426513671875, 3.52374267578125, 3.629058837890625, 3.734375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 28.0, 95.0, 412.0, 345.0, 82.0, 17.0, 11.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-326.1297607421875, -319.8470764160156, -313.5644226074219, -307.28173828125, -300.9990539550781, -294.7164001464844, -288.4337158203125, -282.1510314941406, -275.86834716796875, -269.5856628417969, -263.3030090332031, -257.02032470703125, -250.73764038085938, -244.45497131347656, -238.17230224609375, -231.88961791992188, -225.60696411132812, -219.3242950439453, -213.04161071777344, -206.75894165039062, -200.47625732421875, -194.19358825683594, -187.91091918945312, -181.62823486328125, -175.34556579589844, -169.06289672851562, -162.78021240234375, -156.49754333496094, -150.21487426757812, -143.93218994140625, -137.64952087402344, -131.36685180664062, -125.08415222167969, -118.80147552490234, -112.518798828125, -106.23612976074219, -99.95345306396484, -93.6707763671875, -87.38810729980469, -81.10543060302734, -74.82275390625, -68.54007720947266, -62.25740432739258, -55.9747314453125, -49.692054748535156, -43.40937805175781, -37.126705169677734, -30.844032287597656, -24.561355590820312, -18.2786808013916, -11.99600601196289, -5.71333122253418, 0.5693435668945312, 6.852018356323242, 13.134693145751953, 19.41736602783203, 25.700042724609375, 31.982717514038086, 38.2653923034668, 44.548065185546875, 50.83074188232422, 57.11341857910156, 63.39609146118164, 69.67876434326172, 75.96144104003906]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 12.0, 9.0, 8.0, 16.0, 13.0, 17.0, 25.0, 32.0, 27.0, 31.0, 27.0, 25.0, 24.0, 51.0, 52.0, 62.0, 63.0, 53.0, 68.0, 63.0, 39.0, 42.0, 32.0, 26.0, 23.0, 15.0, 29.0, 13.0, 18.0, 14.0, 14.0, 10.0, 10.0, 5.0, 5.0, 2.0, 6.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-50.21049499511719, -48.77964401245117, -47.34879684448242, -45.917945861816406, -44.487098693847656, -43.05624771118164, -41.625396728515625, -40.194549560546875, -38.763702392578125, -37.33285140991211, -35.90200424194336, -34.471153259277344, -33.040306091308594, -31.609455108642578, -30.178606033325195, -28.747756958007812, -27.316905975341797, -25.886056900024414, -24.45520782470703, -23.024356842041016, -21.593509674072266, -20.16265869140625, -18.731809616088867, -17.300960540771484, -15.870111465454102, -14.439262390136719, -13.008413314819336, -11.577563285827637, -10.146714210510254, -8.715865135192871, -7.285015106201172, -5.854166030883789, -4.423316955566406, -2.9924676418304443, -1.5616183280944824, -0.1307687759399414, 1.3000802993774414, 2.730929374694824, 4.161779403686523, 5.592628479003906, 7.023477554321289, 8.454326629638672, 9.885175704956055, 11.316025733947754, 12.746874809265137, 14.17772388458252, 15.608573913574219, 17.0394229888916, 18.470272064208984, 19.901121139526367, 21.33197021484375, 22.762821197509766, 24.193668365478516, 25.62451934814453, 27.055368423461914, 28.486217498779297, 29.91706657409668, 31.347915649414062, 32.77876663208008, 34.20961380004883, 35.640464782714844, 37.071311950683594, 38.50216293334961, 39.933013916015625, 41.363861083984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 5.0, 7.0, 6.0, 12.0, 22.0, 21.0, 57.0, 99.0, 161.0, 256.0, 569.0, 1229.0, 2944.0, 8290.0, 33640.0, 279901.0, 2682023.0, 1071910.0, 87820.0, 16577.0, 5023.0, 1950.0, 877.0, 386.0, 238.0, 97.0, 56.0, 39.0, 22.0, 13.0, 12.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.06072998046875, -3.9144287109375, -3.76812744140625, -3.621826171875, -3.47552490234375, -3.3292236328125, -3.18292236328125, -3.03662109375, -2.89031982421875, -2.7440185546875, -2.59771728515625, -2.451416015625, -2.30511474609375, -2.1588134765625, -2.01251220703125, -1.8662109375, -1.71990966796875, -1.5736083984375, -1.42730712890625, -1.281005859375, -1.13470458984375, -0.9884033203125, -0.84210205078125, -0.69580078125, -0.54949951171875, -0.4031982421875, -0.25689697265625, -0.110595703125, 0.03570556640625, 0.1820068359375, 0.32830810546875, 0.474609375, 0.62091064453125, 0.7672119140625, 0.91351318359375, 1.059814453125, 1.20611572265625, 1.3524169921875, 1.49871826171875, 1.64501953125, 1.79132080078125, 1.9376220703125, 2.08392333984375, 2.230224609375, 2.37652587890625, 2.5228271484375, 2.66912841796875, 2.8154296875, 2.96173095703125, 3.1080322265625, 3.25433349609375, 3.400634765625, 3.54693603515625, 3.6932373046875, 3.83953857421875, 3.98583984375, 4.13214111328125, 4.2784423828125, 4.42474365234375, 4.571044921875, 4.71734619140625, 4.8636474609375, 5.00994873046875, 5.15625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 15.0, 9.0, 9.0, 7.0, 16.0, 19.0, 13.0, 32.0, 23.0, 31.0, 31.0, 34.0, 35.0, 33.0, 30.0, 42.0, 47.0, 41.0, 61.0, 48.0, 27.0, 44.0, 48.0, 39.0, 33.0, 33.0, 30.0, 21.0, 22.0, 20.0, 15.0, 12.0, 13.0, 19.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 4.0, 4.0, 6.0, 4.0, 1.0], "bins": [-2.962890625, -2.883270263671875, -2.80364990234375, -2.724029541015625, -2.6444091796875, -2.564788818359375, -2.48516845703125, -2.405548095703125, -2.325927734375, -2.246307373046875, -2.16668701171875, -2.087066650390625, -2.0074462890625, -1.927825927734375, -1.84820556640625, -1.768585205078125, -1.68896484375, -1.609344482421875, -1.52972412109375, -1.450103759765625, -1.3704833984375, -1.290863037109375, -1.21124267578125, -1.131622314453125, -1.052001953125, -0.972381591796875, -0.89276123046875, -0.813140869140625, -0.7335205078125, -0.653900146484375, -0.57427978515625, -0.494659423828125, -0.4150390625, -0.335418701171875, -0.25579833984375, -0.176177978515625, -0.0965576171875, -0.016937255859375, 0.06268310546875, 0.142303466796875, 0.221923828125, 0.301544189453125, 0.38116455078125, 0.460784912109375, 0.5404052734375, 0.620025634765625, 0.69964599609375, 0.779266357421875, 0.85888671875, 0.938507080078125, 1.01812744140625, 1.097747802734375, 1.1773681640625, 1.256988525390625, 1.33660888671875, 1.416229248046875, 1.495849609375, 1.575469970703125, 1.65509033203125, 1.734710693359375, 1.8143310546875, 1.893951416015625, 1.97357177734375, 2.053192138671875, 2.1328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 4.0, 14.0, 15.0, 25.0, 37.0, 61.0, 135.0, 264.0, 766.0, 2891.0, 18273.0, 522315.0, 3588072.0, 53396.0, 5722.0, 1303.0, 446.0, 219.0, 119.0, 70.0, 47.0, 31.0, 14.0, 16.0, 9.0, 7.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.65625, -10.2784423828125, -9.900634765625, -9.5228271484375, -9.14501953125, -8.7672119140625, -8.389404296875, -8.0115966796875, -7.6337890625, -7.2559814453125, -6.878173828125, -6.5003662109375, -6.12255859375, -5.7447509765625, -5.366943359375, -4.9891357421875, -4.611328125, -4.2335205078125, -3.855712890625, -3.4779052734375, -3.10009765625, -2.7222900390625, -2.344482421875, -1.9666748046875, -1.5888671875, -1.2110595703125, -0.833251953125, -0.4554443359375, -0.07763671875, 0.3001708984375, 0.677978515625, 1.0557861328125, 1.43359375, 1.8114013671875, 2.189208984375, 2.5670166015625, 2.94482421875, 3.3226318359375, 3.700439453125, 4.0782470703125, 4.4560546875, 4.8338623046875, 5.211669921875, 5.5894775390625, 5.96728515625, 6.3450927734375, 6.722900390625, 7.1007080078125, 7.478515625, 7.8563232421875, 8.234130859375, 8.6119384765625, 8.98974609375, 9.3675537109375, 9.745361328125, 10.1231689453125, 10.5009765625, 10.8787841796875, 11.256591796875, 11.6343994140625, 12.01220703125, 12.3900146484375, 12.767822265625, 13.1456298828125, 13.5234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 8.0, 18.0, 27.0, 37.0, 51.0, 84.0, 159.0, 316.0, 665.0, 1031.0, 783.0, 376.0, 196.0, 110.0, 62.0, 53.0, 30.0, 18.0, 14.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.60675048828125, -6.3267822265625, -6.04681396484375, -5.766845703125, -5.48687744140625, -5.2069091796875, -4.92694091796875, -4.64697265625, -4.36700439453125, -4.0870361328125, -3.80706787109375, -3.527099609375, -3.24713134765625, -2.9671630859375, -2.68719482421875, -2.4072265625, -2.12725830078125, -1.8472900390625, -1.56732177734375, -1.287353515625, -1.00738525390625, -0.7274169921875, -0.44744873046875, -0.16748046875, 0.11248779296875, 0.3924560546875, 0.67242431640625, 0.952392578125, 1.23236083984375, 1.5123291015625, 1.79229736328125, 2.072265625, 2.35223388671875, 2.6322021484375, 2.91217041015625, 3.192138671875, 3.47210693359375, 3.7520751953125, 4.03204345703125, 4.31201171875, 4.59197998046875, 4.8719482421875, 5.15191650390625, 5.431884765625, 5.71185302734375, 5.9918212890625, 6.27178955078125, 6.5517578125, 6.83172607421875, 7.1116943359375, 7.39166259765625, 7.671630859375, 7.95159912109375, 8.2315673828125, 8.51153564453125, 8.79150390625, 9.07147216796875, 9.3514404296875, 9.63140869140625, 9.911376953125, 10.19134521484375, 10.4713134765625, 10.75128173828125, 11.03125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 6.0, 22.0, 32.0, 121.0, 239.0, 274.0, 171.0, 73.0, 21.0, 17.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.64287185668945, -60.75640869140625, -57.86994171142578, -54.98347854614258, -52.097015380859375, -49.210548400878906, -46.3240852355957, -43.4376220703125, -40.55115509033203, -37.66469192504883, -34.77822494506836, -31.891761779785156, -29.005298614501953, -26.118833541870117, -23.23236846923828, -20.345905303955078, -17.459442138671875, -14.572978019714355, -11.686513900756836, -8.800048828125, -5.9135847091674805, -3.027120590209961, -0.140655517578125, 2.745807647705078, 5.632272720336914, 8.518736839294434, 11.405200958251953, 14.291666030883789, 17.178131103515625, 20.064594268798828, 22.951059341430664, 25.837522506713867, 28.72399139404297, 31.610456466674805, 34.49692153930664, 37.383384704589844, 40.26984786987305, 43.15631103515625, 46.04277801513672, 48.92924118041992, 51.815704345703125, 54.70216751098633, 57.5886344909668, 60.47509765625, 63.3615608215332, 66.2480239868164, 69.13449096679688, 72.02095031738281, 74.90742492675781, 77.79389190673828, 80.68035125732422, 83.56681823730469, 86.45328521728516, 89.3397445678711, 92.22621154785156, 95.1126708984375, 97.99913787841797, 100.88560485839844, 103.77206420898438, 106.65853118896484, 109.54499816894531, 112.43145751953125, 115.31792449951172, 118.20439147949219, 121.09085083007812]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 5.0, 11.0, 21.0, 16.0, 15.0, 24.0, 31.0, 40.0, 36.0, 51.0, 38.0, 40.0, 50.0, 40.0, 56.0, 59.0, 65.0, 46.0, 43.0, 53.0, 31.0, 39.0, 45.0, 27.0, 15.0, 23.0, 14.0, 12.0, 17.0, 14.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.672576904296875, -35.61730194091797, -34.56203079223633, -33.50675964355469, -32.45148468017578, -31.396211624145508, -30.340938568115234, -29.28566551208496, -28.230392456054688, -27.175119400024414, -26.11984634399414, -25.064573287963867, -24.009300231933594, -22.95402717590332, -21.898754119873047, -20.843481063842773, -19.7882080078125, -18.732934951782227, -17.677661895751953, -16.62238883972168, -15.567115783691406, -14.511842727661133, -13.45656967163086, -12.401296615600586, -11.346023559570312, -10.290750503540039, -9.235477447509766, -8.180204391479492, -7.124931335449219, -6.069658279418945, -5.014385223388672, -3.9591121673583984, -2.9038429260253906, -1.8485698699951172, -0.7932968139648438, 0.2619762420654297, 1.3172492980957031, 2.3725223541259766, 3.42779541015625, 4.483068466186523, 5.538341522216797, 6.59361457824707, 7.648887634277344, 8.704160690307617, 9.75943374633789, 10.814706802368164, 11.869979858398438, 12.925252914428711, 13.980525970458984, 15.035799026489258, 16.09107208251953, 17.146345138549805, 18.201618194580078, 19.25689125061035, 20.312164306640625, 21.3674373626709, 22.422710418701172, 23.477983474731445, 24.53325653076172, 25.588529586791992, 26.643802642822266, 27.69907569885254, 28.754348754882812, 29.809621810913086, 30.86489486694336]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 7.0, 4.0, 12.0, 7.0, 17.0, 12.0, 26.0, 43.0, 48.0, 108.0, 141.0, 239.0, 456.0, 655.0, 1117.0, 1896.0, 3591.0, 7110.0, 14522.0, 32316.0, 75194.0, 172212.0, 297121.0, 239227.0, 112091.0, 48371.0, 20951.0, 9832.0, 4975.0, 2599.0, 1466.0, 850.0, 508.0, 301.0, 153.0, 138.0, 87.0, 52.0, 35.0, 22.0, 11.0, 7.0, 13.0, 6.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.265625, -4.1171875, -3.96875, -3.8203125, -3.671875, -3.5234375, -3.375, -3.2265625, -3.078125, -2.9296875, -2.78125, -2.6328125, -2.484375, -2.3359375, -2.1875, -2.0390625, -1.890625, -1.7421875, -1.59375, -1.4453125, -1.296875, -1.1484375, -1.0, -0.8515625, -0.703125, -0.5546875, -0.40625, -0.2578125, -0.109375, 0.0390625, 0.1875, 0.3359375, 0.484375, 0.6328125, 0.78125, 0.9296875, 1.078125, 1.2265625, 1.375, 1.5234375, 1.671875, 1.8203125, 1.96875, 2.1171875, 2.265625, 2.4140625, 2.5625, 2.7109375, 2.859375, 3.0078125, 3.15625, 3.3046875, 3.453125, 3.6015625, 3.75, 3.8984375, 4.046875, 4.1953125, 4.34375, 4.4921875, 4.640625, 4.7890625, 4.9375, 5.0859375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 1.0, 6.0, 6.0, 8.0, 11.0, 11.0, 19.0, 13.0, 16.0, 20.0, 22.0, 22.0, 32.0, 44.0, 29.0, 36.0, 41.0, 40.0, 45.0, 41.0, 54.0, 52.0, 36.0, 50.0, 44.0, 36.0, 31.0, 21.0, 33.0, 34.0, 22.0, 21.0, 20.0, 10.0, 15.0, 8.0, 11.0, 9.0, 10.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.72265625, -2.636138916015625, -2.54962158203125, -2.463104248046875, -2.3765869140625, -2.290069580078125, -2.20355224609375, -2.117034912109375, -2.030517578125, -1.944000244140625, -1.85748291015625, -1.770965576171875, -1.6844482421875, -1.597930908203125, -1.51141357421875, -1.424896240234375, -1.33837890625, -1.251861572265625, -1.16534423828125, -1.078826904296875, -0.9923095703125, -0.905792236328125, -0.81927490234375, -0.732757568359375, -0.646240234375, -0.559722900390625, -0.47320556640625, -0.386688232421875, -0.3001708984375, -0.213653564453125, -0.12713623046875, -0.040618896484375, 0.0458984375, 0.132415771484375, 0.21893310546875, 0.305450439453125, 0.3919677734375, 0.478485107421875, 0.56500244140625, 0.651519775390625, 0.738037109375, 0.824554443359375, 0.91107177734375, 0.997589111328125, 1.0841064453125, 1.170623779296875, 1.25714111328125, 1.343658447265625, 1.43017578125, 1.516693115234375, 1.60321044921875, 1.689727783203125, 1.7762451171875, 1.862762451171875, 1.94927978515625, 2.035797119140625, 2.122314453125, 2.208831787109375, 2.29534912109375, 2.381866455078125, 2.4683837890625, 2.554901123046875, 2.64141845703125, 2.727935791015625, 2.814453125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 0.0, 2.0, 2.0, 7.0, 5.0, 9.0, 22.0, 40.0, 53.0, 101.0, 203.0, 387.0, 1048.0, 3910.0, 32937.0, 717499.0, 272287.0, 16123.0, 2495.0, 716.0, 324.0, 158.0, 98.0, 46.0, 27.0, 19.0, 13.0, 11.0, 8.0, 5.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9140625, -15.3983154296875, -14.882568359375, -14.3668212890625, -13.85107421875, -13.3353271484375, -12.819580078125, -12.3038330078125, -11.7880859375, -11.2723388671875, -10.756591796875, -10.2408447265625, -9.72509765625, -9.2093505859375, -8.693603515625, -8.1778564453125, -7.662109375, -7.1463623046875, -6.630615234375, -6.1148681640625, -5.59912109375, -5.0833740234375, -4.567626953125, -4.0518798828125, -3.5361328125, -3.0203857421875, -2.504638671875, -1.9888916015625, -1.47314453125, -0.9573974609375, -0.441650390625, 0.0740966796875, 0.58984375, 1.1055908203125, 1.621337890625, 2.1370849609375, 2.65283203125, 3.1685791015625, 3.684326171875, 4.2000732421875, 4.7158203125, 5.2315673828125, 5.747314453125, 6.2630615234375, 6.77880859375, 7.2945556640625, 7.810302734375, 8.3260498046875, 8.841796875, 9.3575439453125, 9.873291015625, 10.3890380859375, 10.90478515625, 11.4205322265625, 11.936279296875, 12.4520263671875, 12.9677734375, 13.4835205078125, 13.999267578125, 14.5150146484375, 15.03076171875, 15.5465087890625, 16.062255859375, 16.5780029296875, 17.09375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 5.0, 13.0, 17.0, 20.0, 29.0, 33.0, 50.0, 47.0, 69.0, 78.0, 69.0, 92.0, 83.0, 68.0, 69.0, 68.0, 45.0, 32.0, 27.0, 18.0, 18.0, 17.0, 7.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.7578125, -15.2427978515625, -14.727783203125, -14.2127685546875, -13.69775390625, -13.1827392578125, -12.667724609375, -12.1527099609375, -11.6376953125, -11.1226806640625, -10.607666015625, -10.0926513671875, -9.57763671875, -9.0626220703125, -8.547607421875, -8.0325927734375, -7.517578125, -7.0025634765625, -6.487548828125, -5.9725341796875, -5.45751953125, -4.9425048828125, -4.427490234375, -3.9124755859375, -3.3974609375, -2.8824462890625, -2.367431640625, -1.8524169921875, -1.33740234375, -0.8223876953125, -0.307373046875, 0.2076416015625, 0.72265625, 1.2376708984375, 1.752685546875, 2.2677001953125, 2.78271484375, 3.2977294921875, 3.812744140625, 4.3277587890625, 4.8427734375, 5.3577880859375, 5.872802734375, 6.3878173828125, 6.90283203125, 7.4178466796875, 7.932861328125, 8.4478759765625, 8.962890625, 9.4779052734375, 9.992919921875, 10.5079345703125, 11.02294921875, 11.5379638671875, 12.052978515625, 12.5679931640625, 13.0830078125, 13.5980224609375, 14.113037109375, 14.6280517578125, 15.14306640625, 15.6580810546875, 16.173095703125, 16.6881103515625, 17.203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 5.0, 7.0, 8.0, 14.0, 15.0, 17.0, 16.0, 27.0, 37.0, 48.0, 65.0, 107.0, 165.0, 229.0, 378.0, 694.0, 1447.0, 3742.0, 11342.0, 43844.0, 232735.0, 627173.0, 94399.0, 21136.0, 6230.0, 2297.0, 992.0, 495.0, 276.0, 180.0, 112.0, 78.0, 50.0, 44.0, 32.0, 35.0, 19.0, 10.0, 7.0, 11.0, 8.0, 6.0, 4.0, 3.0, 5.0, 4.0, 1.0, 7.0], "bins": [-3.642578125, -3.544769287109375, -3.44696044921875, -3.349151611328125, -3.2513427734375, -3.153533935546875, -3.05572509765625, -2.957916259765625, -2.860107421875, -2.762298583984375, -2.66448974609375, -2.566680908203125, -2.4688720703125, -2.371063232421875, -2.27325439453125, -2.175445556640625, -2.07763671875, -1.979827880859375, -1.88201904296875, -1.784210205078125, -1.6864013671875, -1.588592529296875, -1.49078369140625, -1.392974853515625, -1.295166015625, -1.197357177734375, -1.09954833984375, -1.001739501953125, -0.9039306640625, -0.806121826171875, -0.70831298828125, -0.610504150390625, -0.5126953125, -0.414886474609375, -0.31707763671875, -0.219268798828125, -0.1214599609375, -0.023651123046875, 0.07415771484375, 0.171966552734375, 0.269775390625, 0.367584228515625, 0.46539306640625, 0.563201904296875, 0.6610107421875, 0.758819580078125, 0.85662841796875, 0.954437255859375, 1.05224609375, 1.150054931640625, 1.24786376953125, 1.345672607421875, 1.4434814453125, 1.541290283203125, 1.63909912109375, 1.736907958984375, 1.834716796875, 1.932525634765625, 2.03033447265625, 2.128143310546875, 2.2259521484375, 2.323760986328125, 2.42156982421875, 2.519378662109375, 2.6171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 9.0, 10.0, 13.0, 11.0, 14.0, 22.0, 28.0, 26.0, 43.0, 67.0, 68.0, 72.0, 104.0, 73.0, 75.0, 79.0, 62.0, 52.0, 27.0, 28.0, 18.0, 18.0, 23.0, 9.0, 10.0, 6.0, 7.0, 6.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0008630752563476562, -0.0008385926485061646, -0.0008141100406646729, -0.0007896274328231812, -0.0007651448249816895, -0.0007406622171401978, -0.0007161796092987061, -0.0006916970014572144, -0.0006672143936157227, -0.000642731785774231, -0.0006182491779327393, -0.0005937665700912476, -0.0005692839622497559, -0.0005448013544082642, -0.0005203187465667725, -0.0004958361387252808, -0.00047135353088378906, -0.00044687092304229736, -0.00042238831520080566, -0.00039790570735931396, -0.00037342309951782227, -0.00034894049167633057, -0.00032445788383483887, -0.00029997527599334717, -0.00027549266815185547, -0.00025101006031036377, -0.00022652745246887207, -0.00020204484462738037, -0.00017756223678588867, -0.00015307962894439697, -0.00012859702110290527, -0.00010411441326141357, -7.963180541992188e-05, -5.5149197578430176e-05, -3.0666589736938477e-05, -6.183981895446777e-06, 1.8298625946044922e-05, 4.278123378753662e-05, 6.726384162902832e-05, 9.174644947052002e-05, 0.00011622905731201172, 0.00014071166515350342, 0.00016519427299499512, 0.00018967688083648682, 0.00021415948867797852, 0.00023864209651947021, 0.0002631247043609619, 0.0002876073122024536, 0.0003120899200439453, 0.000336572527885437, 0.0003610551357269287, 0.0003855377435684204, 0.0004100203514099121, 0.0004345029592514038, 0.0004589855670928955, 0.0004834681749343872, 0.0005079507827758789, 0.0005324333906173706, 0.0005569159984588623, 0.000581398606300354, 0.0006058812141418457, 0.0006303638219833374, 0.0006548464298248291, 0.0006793290376663208, 0.0007038116455078125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 7.0, 8.0, 5.0, 11.0, 22.0, 53.0, 72.0, 153.0, 297.0, 641.0, 1808.0, 6419.0, 37543.0, 564189.0, 393419.0, 34912.0, 6024.0, 1736.0, 621.0, 289.0, 136.0, 64.0, 47.0, 21.0, 13.0, 15.0, 5.0, 8.0, 8.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3984375, -4.2564697265625, -4.114501953125, -3.9725341796875, -3.83056640625, -3.6885986328125, -3.546630859375, -3.4046630859375, -3.2626953125, -3.1207275390625, -2.978759765625, -2.8367919921875, -2.69482421875, -2.5528564453125, -2.410888671875, -2.2689208984375, -2.126953125, -1.9849853515625, -1.843017578125, -1.7010498046875, -1.55908203125, -1.4171142578125, -1.275146484375, -1.1331787109375, -0.9912109375, -0.8492431640625, -0.707275390625, -0.5653076171875, -0.42333984375, -0.2813720703125, -0.139404296875, 0.0025634765625, 0.14453125, 0.2864990234375, 0.428466796875, 0.5704345703125, 0.71240234375, 0.8543701171875, 0.996337890625, 1.1383056640625, 1.2802734375, 1.4222412109375, 1.564208984375, 1.7061767578125, 1.84814453125, 1.9901123046875, 2.132080078125, 2.2740478515625, 2.416015625, 2.5579833984375, 2.699951171875, 2.8419189453125, 2.98388671875, 3.1258544921875, 3.267822265625, 3.4097900390625, 3.5517578125, 3.6937255859375, 3.835693359375, 3.9776611328125, 4.11962890625, 4.2615966796875, 4.403564453125, 4.5455322265625, 4.6875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 13.0, 11.0, 18.0, 15.0, 31.0, 35.0, 42.0, 44.0, 52.0, 74.0, 104.0, 70.0, 80.0, 84.0, 67.0, 47.0, 43.0, 33.0, 29.0, 22.0, 19.0, 14.0, 12.0, 8.0, 11.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.64453125, -2.5421142578125, -2.439697265625, -2.3372802734375, -2.23486328125, -2.1324462890625, -2.030029296875, -1.9276123046875, -1.8251953125, -1.7227783203125, -1.620361328125, -1.5179443359375, -1.41552734375, -1.3131103515625, -1.210693359375, -1.1082763671875, -1.005859375, -0.9034423828125, -0.801025390625, -0.6986083984375, -0.59619140625, -0.4937744140625, -0.391357421875, -0.2889404296875, -0.1865234375, -0.0841064453125, 0.018310546875, 0.1207275390625, 0.22314453125, 0.3255615234375, 0.427978515625, 0.5303955078125, 0.6328125, 0.7352294921875, 0.837646484375, 0.9400634765625, 1.04248046875, 1.1448974609375, 1.247314453125, 1.3497314453125, 1.4521484375, 1.5545654296875, 1.656982421875, 1.7593994140625, 1.86181640625, 1.9642333984375, 2.066650390625, 2.1690673828125, 2.271484375, 2.3739013671875, 2.476318359375, 2.5787353515625, 2.68115234375, 2.7835693359375, 2.885986328125, 2.9884033203125, 3.0908203125, 3.1932373046875, 3.295654296875, 3.3980712890625, 3.50048828125, 3.6029052734375, 3.705322265625, 3.8077392578125, 3.91015625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 11.0, 10.0, 28.0, 55.0, 106.0, 173.0, 337.0, 146.0, 75.0, 27.0, 17.0, 7.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-136.14776611328125, -133.1521453857422, -130.1565399169922, -127.16091918945312, -124.1653060913086, -121.16969299316406, -118.174072265625, -115.17845916748047, -112.18284606933594, -109.1872329711914, -106.19161224365234, -103.19599914550781, -100.20038604736328, -97.20477294921875, -94.20915222167969, -91.21353912353516, -88.2179183959961, -85.22230529785156, -82.2266845703125, -79.23107147216797, -76.23545837402344, -73.23983764648438, -70.24422454833984, -67.24861145019531, -64.25299072265625, -61.25737380981445, -58.26176071166992, -55.266143798828125, -52.270530700683594, -49.2749137878418, -46.279296875, -43.28368377685547, -40.28807067871094, -37.29245376586914, -34.29684066772461, -31.301223754882812, -28.30560874938965, -25.309993743896484, -22.314376831054688, -19.318761825561523, -16.32314682006836, -13.327531814575195, -10.331915855407715, -7.336299896240234, -4.34068489074707, -1.3450698852539062, 1.6505470275878906, 4.646162033081055, 7.641777038574219, 10.637392044067383, 13.633008003234863, 16.628623962402344, 19.624238967895508, 22.619853973388672, 25.61547088623047, 28.611085891723633, 31.606700897216797, 34.602317810058594, 37.597930908203125, 40.59354782104492, 43.58916473388672, 46.58477783203125, 49.58039474487305, 52.576011657714844, 55.571624755859375]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 5.0, 8.0, 10.0, 7.0, 12.0, 22.0, 17.0, 24.0, 21.0, 20.0, 36.0, 31.0, 46.0, 40.0, 46.0, 73.0, 72.0, 83.0, 62.0, 43.0, 42.0, 32.0, 31.0, 24.0, 29.0, 28.0, 17.0, 24.0, 13.0, 12.0, 11.0, 11.0, 9.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.79401397705078, -40.435062408447266, -39.076114654541016, -37.7171630859375, -36.35821533203125, -34.999263763427734, -33.64031219482422, -32.28136444091797, -30.922412872314453, -29.56346321105957, -28.204513549804688, -26.845561981201172, -25.48661231994629, -24.127662658691406, -22.768712997436523, -21.40976333618164, -20.050813674926758, -18.691864013671875, -17.332914352416992, -15.973963737487793, -14.615013122558594, -13.256063461303711, -11.897113800048828, -10.538163185119629, -9.179213523864746, -7.820263385772705, -6.461313247680664, -5.102363586425781, -3.7434134483337402, -2.384463310241699, -1.0255136489868164, 0.3334369659423828, 1.6923866271972656, 3.0513367652893066, 4.410286903381348, 5.7692365646362305, 7.1281867027282715, 8.487136840820312, 9.846086502075195, 11.205037117004395, 12.563986778259277, 13.92293643951416, 15.28188705444336, 16.640836715698242, 17.999786376953125, 19.35873794555664, 20.71768569946289, 22.076637268066406, 23.43558692932129, 24.794536590576172, 26.153486251831055, 27.512435913085938, 28.871387481689453, 30.230337142944336, 31.58928680419922, 32.948238372802734, 34.307186126708984, 35.6661376953125, 37.02508544921875, 38.384037017822266, 39.742984771728516, 41.10193634033203, 42.46088409423828, 43.8198356628418, 45.17878723144531]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 11.0, 13.0, 16.0, 14.0, 17.0, 33.0, 70.0, 102.0, 181.0, 323.0, 623.0, 1368.0, 3490.0, 11476.0, 60895.0, 818798.0, 2961883.0, 291663.0, 30859.0, 7567.0, 2526.0, 1083.0, 556.0, 301.0, 154.0, 91.0, 57.0, 42.0, 13.0, 10.0, 5.0, 9.0, 5.0, 6.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.87890625, -5.717041015625, -5.55517578125, -5.393310546875, -5.2314453125, -5.069580078125, -4.90771484375, -4.745849609375, -4.583984375, -4.422119140625, -4.26025390625, -4.098388671875, -3.9365234375, -3.774658203125, -3.61279296875, -3.450927734375, -3.2890625, -3.127197265625, -2.96533203125, -2.803466796875, -2.6416015625, -2.479736328125, -2.31787109375, -2.156005859375, -1.994140625, -1.832275390625, -1.67041015625, -1.508544921875, -1.3466796875, -1.184814453125, -1.02294921875, -0.861083984375, -0.69921875, -0.537353515625, -0.37548828125, -0.213623046875, -0.0517578125, 0.110107421875, 0.27197265625, 0.433837890625, 0.595703125, 0.757568359375, 0.91943359375, 1.081298828125, 1.2431640625, 1.405029296875, 1.56689453125, 1.728759765625, 1.890625, 2.052490234375, 2.21435546875, 2.376220703125, 2.5380859375, 2.699951171875, 2.86181640625, 3.023681640625, 3.185546875, 3.347412109375, 3.50927734375, 3.671142578125, 3.8330078125, 3.994873046875, 4.15673828125, 4.318603515625, 4.48046875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 3.0, 11.0, 9.0, 16.0, 15.0, 20.0, 15.0, 17.0, 27.0, 23.0, 28.0, 25.0, 30.0, 30.0, 33.0, 44.0, 47.0, 53.0, 45.0, 47.0, 42.0, 57.0, 38.0, 31.0, 33.0, 34.0, 32.0, 22.0, 26.0, 24.0, 23.0, 19.0, 12.0, 15.0, 8.0, 10.0, 4.0, 6.0, 8.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.705078125, -2.62042236328125, -2.5357666015625, -2.45111083984375, -2.366455078125, -2.28179931640625, -2.1971435546875, -2.11248779296875, -2.02783203125, -1.94317626953125, -1.8585205078125, -1.77386474609375, -1.689208984375, -1.60455322265625, -1.5198974609375, -1.43524169921875, -1.3505859375, -1.26593017578125, -1.1812744140625, -1.09661865234375, -1.011962890625, -0.92730712890625, -0.8426513671875, -0.75799560546875, -0.67333984375, -0.58868408203125, -0.5040283203125, -0.41937255859375, -0.334716796875, -0.25006103515625, -0.1654052734375, -0.08074951171875, 0.00390625, 0.08856201171875, 0.1732177734375, 0.25787353515625, 0.342529296875, 0.42718505859375, 0.5118408203125, 0.59649658203125, 0.68115234375, 0.76580810546875, 0.8504638671875, 0.93511962890625, 1.019775390625, 1.10443115234375, 1.1890869140625, 1.27374267578125, 1.3583984375, 1.44305419921875, 1.5277099609375, 1.61236572265625, 1.697021484375, 1.78167724609375, 1.8663330078125, 1.95098876953125, 2.03564453125, 2.12030029296875, 2.2049560546875, 2.28961181640625, 2.374267578125, 2.45892333984375, 2.5435791015625, 2.62823486328125, 2.712890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 6.0, 10.0, 6.0, 17.0, 25.0, 21.0, 39.0, 49.0, 65.0, 106.0, 174.0, 351.0, 836.0, 2197.0, 6708.0, 29559.0, 316398.0, 3625931.0, 180992.0, 21895.0, 5424.0, 1893.0, 707.0, 322.0, 184.0, 107.0, 63.0, 51.0, 27.0, 30.0, 16.0, 16.0, 10.0, 7.0, 11.0, 3.0, 5.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-8.28125, -8.0257568359375, -7.770263671875, -7.5147705078125, -7.25927734375, -7.0037841796875, -6.748291015625, -6.4927978515625, -6.2373046875, -5.9818115234375, -5.726318359375, -5.4708251953125, -5.21533203125, -4.9598388671875, -4.704345703125, -4.4488525390625, -4.193359375, -3.9378662109375, -3.682373046875, -3.4268798828125, -3.17138671875, -2.9158935546875, -2.660400390625, -2.4049072265625, -2.1494140625, -1.8939208984375, -1.638427734375, -1.3829345703125, -1.12744140625, -0.8719482421875, -0.616455078125, -0.3609619140625, -0.10546875, 0.1500244140625, 0.405517578125, 0.6610107421875, 0.91650390625, 1.1719970703125, 1.427490234375, 1.6829833984375, 1.9384765625, 2.1939697265625, 2.449462890625, 2.7049560546875, 2.96044921875, 3.2159423828125, 3.471435546875, 3.7269287109375, 3.982421875, 4.2379150390625, 4.493408203125, 4.7489013671875, 5.00439453125, 5.2598876953125, 5.515380859375, 5.7708740234375, 6.0263671875, 6.2818603515625, 6.537353515625, 6.7928466796875, 7.04833984375, 7.3038330078125, 7.559326171875, 7.8148193359375, 8.0703125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 9.0, 6.0, 12.0, 11.0, 12.0, 14.0, 27.0, 38.0, 47.0, 60.0, 95.0, 155.0, 250.0, 427.0, 632.0, 769.0, 567.0, 354.0, 183.0, 101.0, 82.0, 53.0, 41.0, 28.0, 26.0, 18.0, 13.0, 8.0, 5.0, 4.0, 5.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.82421875, -5.62530517578125, -5.4263916015625, -5.22747802734375, -5.028564453125, -4.82965087890625, -4.6307373046875, -4.43182373046875, -4.23291015625, -4.03399658203125, -3.8350830078125, -3.63616943359375, -3.437255859375, -3.23834228515625, -3.0394287109375, -2.84051513671875, -2.6416015625, -2.44268798828125, -2.2437744140625, -2.04486083984375, -1.845947265625, -1.64703369140625, -1.4481201171875, -1.24920654296875, -1.05029296875, -0.85137939453125, -0.6524658203125, -0.45355224609375, -0.254638671875, -0.05572509765625, 0.1431884765625, 0.34210205078125, 0.541015625, 0.73992919921875, 0.9388427734375, 1.13775634765625, 1.336669921875, 1.53558349609375, 1.7344970703125, 1.93341064453125, 2.13232421875, 2.33123779296875, 2.5301513671875, 2.72906494140625, 2.927978515625, 3.12689208984375, 3.3258056640625, 3.52471923828125, 3.7236328125, 3.92254638671875, 4.1214599609375, 4.32037353515625, 4.519287109375, 4.71820068359375, 4.9171142578125, 5.11602783203125, 5.31494140625, 5.51385498046875, 5.7127685546875, 5.91168212890625, 6.110595703125, 6.30950927734375, 6.5084228515625, 6.70733642578125, 6.90625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 16.0, 25.0, 37.0, 96.0, 142.0, 204.0, 188.0, 138.0, 66.0, 38.0, 18.0, 11.0, 2.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-50.72591018676758, -48.6863899230957, -46.64686965942383, -44.60734558105469, -42.56782531738281, -40.52830505371094, -38.48878479003906, -36.44926452636719, -34.40974426269531, -32.37022399902344, -30.33070182800293, -28.291181564331055, -26.251659393310547, -24.212139129638672, -22.172618865966797, -20.133098602294922, -18.09357452392578, -16.054054260253906, -14.014532089233398, -11.975011825561523, -9.935490608215332, -7.895969390869141, -5.856449127197266, -3.816927909851074, -1.7774066925048828, 0.2621142864227295, 2.301635265350342, 4.341156005859375, 6.380677223205566, 8.420198440551758, 10.459718704223633, 12.499239921569824, 14.53875732421875, 16.578277587890625, 18.617799758911133, 20.657320022583008, 22.696842193603516, 24.73636245727539, 26.775882720947266, 28.81540298461914, 30.85492515563965, 32.894447326660156, 34.93396759033203, 36.973487854003906, 39.01300811767578, 41.052528381347656, 43.09204864501953, 45.13157272338867, 47.17109298706055, 49.21061325073242, 51.2501335144043, 53.28965759277344, 55.32917785644531, 57.36869812011719, 59.40821838378906, 61.44773864746094, 63.48725891113281, 65.52677917480469, 67.56629943847656, 69.60581970214844, 71.64533996582031, 73.68486022949219, 75.72438049316406, 77.76390838623047, 79.80342864990234]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 9.0, 7.0, 3.0, 7.0, 13.0, 8.0, 12.0, 12.0, 15.0, 24.0, 21.0, 19.0, 20.0, 30.0, 33.0, 38.0, 54.0, 33.0, 43.0, 46.0, 39.0, 45.0, 37.0, 47.0, 47.0, 36.0, 42.0, 32.0, 34.0, 27.0, 28.0, 19.0, 18.0, 13.0, 9.0, 19.0, 13.0, 6.0, 7.0, 7.0, 6.0, 10.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.080543518066406, -23.26055145263672, -22.44055938720703, -21.620567321777344, -20.80057716369629, -19.9805850982666, -19.160593032836914, -18.340600967407227, -17.520610809326172, -16.700618743896484, -15.880627632141113, -15.060635566711426, -14.240644454956055, -13.420652389526367, -12.60066032409668, -11.780668258666992, -10.960676193237305, -10.140684127807617, -9.320693016052246, -8.500700950622559, -7.680709362030029, -6.8607177734375, -6.0407257080078125, -5.220734119415283, -4.400742530822754, -3.5807509422302246, -2.760759115219116, -1.9407672882080078, -1.1207756996154785, -0.3007841110229492, 0.5192079544067383, 1.3391995429992676, 2.159191131591797, 2.979182720184326, 3.7991745471954346, 4.619166374206543, 5.439157962799072, 6.259149551391602, 7.079141616821289, 7.899133205413818, 8.719124794006348, 9.539116859436035, 10.359107971191406, 11.179100036621094, 11.999092102050781, 12.819083213806152, 13.63907527923584, 14.459066390991211, 15.279058456420898, 16.099050521850586, 16.919042587280273, 17.739032745361328, 18.559024810791016, 19.379016876220703, 20.19900894165039, 21.019001007080078, 21.838993072509766, 22.658985137939453, 23.47897720336914, 24.298969268798828, 25.118959426879883, 25.93895149230957, 26.758943557739258, 27.578935623168945, 28.39892578125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 14.0, 13.0, 25.0, 30.0, 43.0, 69.0, 122.0, 163.0, 288.0, 446.0, 698.0, 1241.0, 2080.0, 3679.0, 6902.0, 13673.0, 28635.0, 61661.0, 137061.0, 274580.0, 268986.0, 132074.0, 59588.0, 27448.0, 13396.0, 6876.0, 3546.0, 2080.0, 1173.0, 711.0, 411.0, 299.0, 150.0, 127.0, 86.0, 43.0, 45.0, 34.0, 14.0, 15.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.046875, -3.924163818359375, -3.80145263671875, -3.678741455078125, -3.5560302734375, -3.433319091796875, -3.31060791015625, -3.187896728515625, -3.065185546875, -2.942474365234375, -2.81976318359375, -2.697052001953125, -2.5743408203125, -2.451629638671875, -2.32891845703125, -2.206207275390625, -2.08349609375, -1.960784912109375, -1.83807373046875, -1.715362548828125, -1.5926513671875, -1.469940185546875, -1.34722900390625, -1.224517822265625, -1.101806640625, -0.979095458984375, -0.85638427734375, -0.733673095703125, -0.6109619140625, -0.488250732421875, -0.36553955078125, -0.242828369140625, -0.1201171875, 0.002593994140625, 0.12530517578125, 0.248016357421875, 0.3707275390625, 0.493438720703125, 0.61614990234375, 0.738861083984375, 0.861572265625, 0.984283447265625, 1.10699462890625, 1.229705810546875, 1.3524169921875, 1.475128173828125, 1.59783935546875, 1.720550537109375, 1.84326171875, 1.965972900390625, 2.08868408203125, 2.211395263671875, 2.3341064453125, 2.456817626953125, 2.57952880859375, 2.702239990234375, 2.824951171875, 2.947662353515625, 3.07037353515625, 3.193084716796875, 3.3157958984375, 3.438507080078125, 3.56121826171875, 3.683929443359375, 3.806640625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 7.0, 0.0, 10.0, 16.0, 8.0, 15.0, 19.0, 22.0, 23.0, 38.0, 31.0, 29.0, 32.0, 35.0, 39.0, 39.0, 42.0, 50.0, 49.0, 48.0, 53.0, 42.0, 39.0, 40.0, 41.0, 37.0, 30.0, 26.0, 27.0, 19.0, 14.0, 10.0, 15.0, 8.0, 6.0, 10.0, 2.0, 9.0, 5.0, 1.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.05859375, -2.96533203125, -2.8720703125, -2.77880859375, -2.685546875, -2.59228515625, -2.4990234375, -2.40576171875, -2.3125, -2.21923828125, -2.1259765625, -2.03271484375, -1.939453125, -1.84619140625, -1.7529296875, -1.65966796875, -1.56640625, -1.47314453125, -1.3798828125, -1.28662109375, -1.193359375, -1.10009765625, -1.0068359375, -0.91357421875, -0.8203125, -0.72705078125, -0.6337890625, -0.54052734375, -0.447265625, -0.35400390625, -0.2607421875, -0.16748046875, -0.07421875, 0.01904296875, 0.1123046875, 0.20556640625, 0.298828125, 0.39208984375, 0.4853515625, 0.57861328125, 0.671875, 0.76513671875, 0.8583984375, 0.95166015625, 1.044921875, 1.13818359375, 1.2314453125, 1.32470703125, 1.41796875, 1.51123046875, 1.6044921875, 1.69775390625, 1.791015625, 1.88427734375, 1.9775390625, 2.07080078125, 2.1640625, 2.25732421875, 2.3505859375, 2.44384765625, 2.537109375, 2.63037109375, 2.7236328125, 2.81689453125, 2.91015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 2.0, 6.0, 12.0, 16.0, 26.0, 36.0, 48.0, 62.0, 122.0, 185.0, 248.0, 483.0, 1048.0, 2654.0, 9930.0, 62222.0, 741320.0, 199638.0, 22318.0, 4828.0, 1627.0, 745.0, 377.0, 212.0, 124.0, 75.0, 60.0, 37.0, 30.0, 22.0, 9.0, 14.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-12.2109375, -11.8594970703125, -11.508056640625, -11.1566162109375, -10.80517578125, -10.4537353515625, -10.102294921875, -9.7508544921875, -9.3994140625, -9.0479736328125, -8.696533203125, -8.3450927734375, -7.99365234375, -7.6422119140625, -7.290771484375, -6.9393310546875, -6.587890625, -6.2364501953125, -5.885009765625, -5.5335693359375, -5.18212890625, -4.8306884765625, -4.479248046875, -4.1278076171875, -3.7763671875, -3.4249267578125, -3.073486328125, -2.7220458984375, -2.37060546875, -2.0191650390625, -1.667724609375, -1.3162841796875, -0.96484375, -0.6134033203125, -0.261962890625, 0.0894775390625, 0.44091796875, 0.7923583984375, 1.143798828125, 1.4952392578125, 1.8466796875, 2.1981201171875, 2.549560546875, 2.9010009765625, 3.25244140625, 3.6038818359375, 3.955322265625, 4.3067626953125, 4.658203125, 5.0096435546875, 5.361083984375, 5.7125244140625, 6.06396484375, 6.4154052734375, 6.766845703125, 7.1182861328125, 7.4697265625, 7.8211669921875, 8.172607421875, 8.5240478515625, 8.87548828125, 9.2269287109375, 9.578369140625, 9.9298095703125, 10.28125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 11.0, 7.0, 14.0, 5.0, 11.0, 17.0, 27.0, 37.0, 29.0, 49.0, 45.0, 49.0, 69.0, 74.0, 81.0, 79.0, 60.0, 55.0, 59.0, 40.0, 40.0, 35.0, 30.0, 22.0, 15.0, 12.0, 8.0, 6.0, 7.0, 5.0, 0.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.265625, -13.7822265625, -13.298828125, -12.8154296875, -12.33203125, -11.8486328125, -11.365234375, -10.8818359375, -10.3984375, -9.9150390625, -9.431640625, -8.9482421875, -8.46484375, -7.9814453125, -7.498046875, -7.0146484375, -6.53125, -6.0478515625, -5.564453125, -5.0810546875, -4.59765625, -4.1142578125, -3.630859375, -3.1474609375, -2.6640625, -2.1806640625, -1.697265625, -1.2138671875, -0.73046875, -0.2470703125, 0.236328125, 0.7197265625, 1.203125, 1.6865234375, 2.169921875, 2.6533203125, 3.13671875, 3.6201171875, 4.103515625, 4.5869140625, 5.0703125, 5.5537109375, 6.037109375, 6.5205078125, 7.00390625, 7.4873046875, 7.970703125, 8.4541015625, 8.9375, 9.4208984375, 9.904296875, 10.3876953125, 10.87109375, 11.3544921875, 11.837890625, 12.3212890625, 12.8046875, 13.2880859375, 13.771484375, 14.2548828125, 14.73828125, 15.2216796875, 15.705078125, 16.1884765625, 16.671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 6.0, 13.0, 16.0, 23.0, 25.0, 39.0, 64.0, 87.0, 151.0, 285.0, 553.0, 1241.0, 3036.0, 8990.0, 36419.0, 258214.0, 662881.0, 56629.0, 12745.0, 4025.0, 1558.0, 672.0, 321.0, 178.0, 113.0, 93.0, 49.0, 33.0, 24.0, 12.0, 13.0, 8.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.837890625, -2.740478515625, -2.64306640625, -2.545654296875, -2.4482421875, -2.350830078125, -2.25341796875, -2.156005859375, -2.05859375, -1.961181640625, -1.86376953125, -1.766357421875, -1.6689453125, -1.571533203125, -1.47412109375, -1.376708984375, -1.279296875, -1.181884765625, -1.08447265625, -0.987060546875, -0.8896484375, -0.792236328125, -0.69482421875, -0.597412109375, -0.5, -0.402587890625, -0.30517578125, -0.207763671875, -0.1103515625, -0.012939453125, 0.08447265625, 0.181884765625, 0.279296875, 0.376708984375, 0.47412109375, 0.571533203125, 0.6689453125, 0.766357421875, 0.86376953125, 0.961181640625, 1.05859375, 1.156005859375, 1.25341796875, 1.350830078125, 1.4482421875, 1.545654296875, 1.64306640625, 1.740478515625, 1.837890625, 1.935302734375, 2.03271484375, 2.130126953125, 2.2275390625, 2.324951171875, 2.42236328125, 2.519775390625, 2.6171875, 2.714599609375, 2.81201171875, 2.909423828125, 3.0068359375, 3.104248046875, 3.20166015625, 3.299072265625, 3.396484375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 7.0, 7.0, 13.0, 17.0, 32.0, 30.0, 55.0, 63.0, 100.0, 131.0, 153.0, 110.0, 80.0, 42.0, 43.0, 23.0, 16.0, 16.0, 12.0, 16.0, 6.0, 6.0, 4.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000759124755859375, -0.0007290393114089966, -0.0006989538669586182, -0.0006688684225082397, -0.0006387829780578613, -0.0006086975336074829, -0.0005786120891571045, -0.0005485266447067261, -0.0005184412002563477, -0.0004883557558059692, -0.0004582703113555908, -0.0004281848669052124, -0.000398099422454834, -0.00036801397800445557, -0.00033792853355407715, -0.00030784308910369873, -0.0002777576446533203, -0.0002476722002029419, -0.00021758675575256348, -0.00018750131130218506, -0.00015741586685180664, -0.00012733042240142822, -9.72449779510498e-05, -6.715953350067139e-05, -3.707408905029297e-05, -6.988644599914551e-06, 2.3096799850463867e-05, 5.3182244300842285e-05, 8.32676887512207e-05, 0.00011335313320159912, 0.00014343857765197754, 0.00017352402210235596, 0.00020360946655273438, 0.0002336949110031128, 0.0002637803554534912, 0.00029386579990386963, 0.00032395124435424805, 0.00035403668880462646, 0.0003841221332550049, 0.0004142075777053833, 0.0004442930221557617, 0.00047437846660614014, 0.0005044639110565186, 0.000534549355506897, 0.0005646347999572754, 0.0005947202444076538, 0.0006248056888580322, 0.0006548911333084106, 0.0006849765777587891, 0.0007150620222091675, 0.0007451474666595459, 0.0007752329111099243, 0.0008053183555603027, 0.0008354038000106812, 0.0008654892444610596, 0.000895574688911438, 0.0009256601333618164, 0.0009557455778121948, 0.0009858310222625732, 0.0010159164667129517, 0.00104600191116333, 0.0010760873556137085, 0.001106172800064087, 0.0011362582445144653, 0.0011663436889648438]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 12.0, 10.0, 10.0, 33.0, 32.0, 50.0, 104.0, 160.0, 250.0, 452.0, 1001.0, 2153.0, 6158.0, 25836.0, 216264.0, 727336.0, 52568.0, 10281.0, 3133.0, 1305.0, 621.0, 326.0, 161.0, 103.0, 66.0, 38.0, 19.0, 20.0, 14.0, 11.0, 7.0, 5.0, 0.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.384765625, -3.279632568359375, -3.17449951171875, -3.069366455078125, -2.9642333984375, -2.859100341796875, -2.75396728515625, -2.648834228515625, -2.543701171875, -2.438568115234375, -2.33343505859375, -2.228302001953125, -2.1231689453125, -2.018035888671875, -1.91290283203125, -1.807769775390625, -1.70263671875, -1.597503662109375, -1.49237060546875, -1.387237548828125, -1.2821044921875, -1.176971435546875, -1.07183837890625, -0.966705322265625, -0.861572265625, -0.756439208984375, -0.65130615234375, -0.546173095703125, -0.4410400390625, -0.335906982421875, -0.23077392578125, -0.125640869140625, -0.0205078125, 0.084625244140625, 0.18975830078125, 0.294891357421875, 0.4000244140625, 0.505157470703125, 0.61029052734375, 0.715423583984375, 0.820556640625, 0.925689697265625, 1.03082275390625, 1.135955810546875, 1.2410888671875, 1.346221923828125, 1.45135498046875, 1.556488037109375, 1.66162109375, 1.766754150390625, 1.87188720703125, 1.977020263671875, 2.0821533203125, 2.187286376953125, 2.29241943359375, 2.397552490234375, 2.502685546875, 2.607818603515625, 2.71295166015625, 2.818084716796875, 2.9232177734375, 3.028350830078125, 3.13348388671875, 3.238616943359375, 3.34375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 14.0, 10.0, 6.0, 22.0, 12.0, 13.0, 28.0, 37.0, 50.0, 59.0, 80.0, 98.0, 93.0, 108.0, 89.0, 71.0, 51.0, 34.0, 26.0, 20.0, 20.0, 11.0, 9.0, 8.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.869140625, -2.783538818359375, -2.69793701171875, -2.612335205078125, -2.5267333984375, -2.441131591796875, -2.35552978515625, -2.269927978515625, -2.184326171875, -2.098724365234375, -2.01312255859375, -1.927520751953125, -1.8419189453125, -1.756317138671875, -1.67071533203125, -1.585113525390625, -1.49951171875, -1.413909912109375, -1.32830810546875, -1.242706298828125, -1.1571044921875, -1.071502685546875, -0.98590087890625, -0.900299072265625, -0.814697265625, -0.729095458984375, -0.64349365234375, -0.557891845703125, -0.4722900390625, -0.386688232421875, -0.30108642578125, -0.215484619140625, -0.1298828125, -0.044281005859375, 0.04132080078125, 0.126922607421875, 0.2125244140625, 0.298126220703125, 0.38372802734375, 0.469329833984375, 0.554931640625, 0.640533447265625, 0.72613525390625, 0.811737060546875, 0.8973388671875, 0.982940673828125, 1.06854248046875, 1.154144287109375, 1.23974609375, 1.325347900390625, 1.41094970703125, 1.496551513671875, 1.5821533203125, 1.667755126953125, 1.75335693359375, 1.838958740234375, 1.924560546875, 2.010162353515625, 2.09576416015625, 2.181365966796875, 2.2669677734375, 2.352569580078125, 2.43817138671875, 2.523773193359375, 2.609375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 5.0, 16.0, 49.0, 75.0, 155.0, 383.0, 166.0, 87.0, 34.0, 10.0, 5.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.68077087402344, -102.86898040771484, -100.05718994140625, -97.24539947509766, -94.43360900878906, -91.62181854248047, -88.81002807617188, -85.99822998046875, -83.18644714355469, -80.3746566772461, -77.5628662109375, -74.7510757446289, -71.93928527832031, -69.12749481201172, -66.31570434570312, -63.503910064697266, -60.692115783691406, -57.88032531738281, -55.06853485107422, -52.256744384765625, -49.44495391845703, -46.63316345214844, -43.82136917114258, -41.009578704833984, -38.19778823852539, -35.3859977722168, -32.5742073059082, -29.762414932250977, -26.950624465942383, -24.13883399963379, -21.327041625976562, -18.51525115966797, -15.703453063964844, -12.89166259765625, -10.07987117767334, -7.26807975769043, -4.456289291381836, -1.6444988250732422, 1.1672935485839844, 3.979084014892578, 6.790874481201172, 9.602664947509766, 12.414456367492676, 15.226247787475586, 18.03803825378418, 20.849828720092773, 23.66162109375, 26.473411560058594, 29.285202026367188, 32.09699249267578, 34.908782958984375, 37.72057342529297, 40.53236389160156, 43.344154357910156, 46.155948638916016, 48.96773910522461, 51.7795295715332, 54.5913200378418, 57.40311050415039, 60.21490478515625, 63.026695251464844, 65.83848571777344, 68.65027618408203, 71.46206665039062, 74.27385711669922]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 3.0, 8.0, 5.0, 10.0, 8.0, 12.0, 13.0, 19.0, 17.0, 20.0, 26.0, 28.0, 27.0, 28.0, 39.0, 41.0, 47.0, 81.0, 112.0, 77.0, 54.0, 50.0, 35.0, 28.0, 26.0, 25.0, 24.0, 27.0, 20.0, 13.0, 17.0, 11.0, 10.0, 10.0, 6.0, 6.0, 3.0, 4.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.03126907348633, -37.74959945678711, -36.46792984008789, -35.18626022338867, -33.90459060668945, -32.622920989990234, -31.341249465942383, -30.059579849243164, -28.777910232543945, -27.496240615844727, -26.214570999145508, -24.93290138244629, -23.651229858398438, -22.36956024169922, -21.087890625, -19.80622100830078, -18.524551391601562, -17.242881774902344, -15.961212158203125, -14.67954158782959, -13.397871971130371, -12.116202354431152, -10.834531784057617, -9.552862167358398, -8.27119255065918, -6.989522933959961, -5.707852840423584, -4.426182746887207, -3.1445131301879883, -1.8628435134887695, -0.5811734199523926, 0.7004966735839844, 1.9821662902832031, 3.263836145401001, 4.545506000518799, 5.827176094055176, 7.1088457107543945, 8.390515327453613, 9.672185897827148, 10.953855514526367, 12.235525131225586, 13.517194747924805, 14.798864364624023, 16.080533981323242, 17.362205505371094, 18.643875122070312, 19.92554473876953, 21.20721435546875, 22.48888397216797, 23.770553588867188, 25.052223205566406, 26.333892822265625, 27.615562438964844, 28.897232055664062, 30.178903579711914, 31.460573196411133, 32.74224090576172, 34.02391052246094, 35.305580139160156, 36.587249755859375, 37.868919372558594, 39.15058898925781, 40.43225860595703, 41.71392822265625, 42.995601654052734]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 10.0, 12.0, 23.0, 28.0, 49.0, 98.0, 120.0, 248.0, 587.0, 1803.0, 18862.0, 2691219.0, 1466504.0, 12158.0, 1461.0, 488.0, 232.0, 138.0, 77.0, 54.0, 34.0, 18.0, 13.0, 11.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.15625, -10.7706298828125, -10.385009765625, -9.9993896484375, -9.61376953125, -9.2281494140625, -8.842529296875, -8.4569091796875, -8.0712890625, -7.6856689453125, -7.300048828125, -6.9144287109375, -6.52880859375, -6.1431884765625, -5.757568359375, -5.3719482421875, -4.986328125, -4.6007080078125, -4.215087890625, -3.8294677734375, -3.44384765625, -3.0582275390625, -2.672607421875, -2.2869873046875, -1.9013671875, -1.5157470703125, -1.130126953125, -0.7445068359375, -0.35888671875, 0.0267333984375, 0.412353515625, 0.7979736328125, 1.18359375, 1.5692138671875, 1.954833984375, 2.3404541015625, 2.72607421875, 3.1116943359375, 3.497314453125, 3.8829345703125, 4.2685546875, 4.6541748046875, 5.039794921875, 5.4254150390625, 5.81103515625, 6.1966552734375, 6.582275390625, 6.9678955078125, 7.353515625, 7.7391357421875, 8.124755859375, 8.5103759765625, 8.89599609375, 9.2816162109375, 9.667236328125, 10.0528564453125, 10.4384765625, 10.8240966796875, 11.209716796875, 11.5953369140625, 11.98095703125, 12.3665771484375, 12.752197265625, 13.1378173828125, 13.5234375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 7.0, 10.0, 9.0, 17.0, 20.0, 21.0, 26.0, 22.0, 18.0, 35.0, 35.0, 42.0, 42.0, 34.0, 41.0, 50.0, 44.0, 40.0, 60.0, 54.0, 52.0, 39.0, 45.0, 38.0, 29.0, 32.0, 18.0, 20.0, 17.0, 10.0, 13.0, 7.0, 11.0, 7.0, 5.0, 9.0, 3.0, 0.0, 0.0, 9.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.015625, -2.92144775390625, -2.8272705078125, -2.73309326171875, -2.638916015625, -2.54473876953125, -2.4505615234375, -2.35638427734375, -2.26220703125, -2.16802978515625, -2.0738525390625, -1.97967529296875, -1.885498046875, -1.79132080078125, -1.6971435546875, -1.60296630859375, -1.5087890625, -1.41461181640625, -1.3204345703125, -1.22625732421875, -1.132080078125, -1.03790283203125, -0.9437255859375, -0.84954833984375, -0.75537109375, -0.66119384765625, -0.5670166015625, -0.47283935546875, -0.378662109375, -0.28448486328125, -0.1903076171875, -0.09613037109375, -0.001953125, 0.09222412109375, 0.1864013671875, 0.28057861328125, 0.374755859375, 0.46893310546875, 0.5631103515625, 0.65728759765625, 0.75146484375, 0.84564208984375, 0.9398193359375, 1.03399658203125, 1.128173828125, 1.22235107421875, 1.3165283203125, 1.41070556640625, 1.5048828125, 1.59906005859375, 1.6932373046875, 1.78741455078125, 1.881591796875, 1.97576904296875, 2.0699462890625, 2.16412353515625, 2.25830078125, 2.35247802734375, 2.4466552734375, 2.54083251953125, 2.635009765625, 2.72918701171875, 2.8233642578125, 2.91754150390625, 3.01171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 8.0, 23.0, 27.0, 37.0, 59.0, 104.0, 183.0, 464.0, 1161.0, 3728.0, 21904.0, 1272511.0, 2855222.0, 31568.0, 4667.0, 1448.0, 526.0, 265.0, 132.0, 70.0, 48.0, 34.0, 20.0, 17.0, 10.0, 8.0, 5.0, 3.0, 3.0, 4.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.6875, -11.298828125, -10.91015625, -10.521484375, -10.1328125, -9.744140625, -9.35546875, -8.966796875, -8.578125, -8.189453125, -7.80078125, -7.412109375, -7.0234375, -6.634765625, -6.24609375, -5.857421875, -5.46875, -5.080078125, -4.69140625, -4.302734375, -3.9140625, -3.525390625, -3.13671875, -2.748046875, -2.359375, -1.970703125, -1.58203125, -1.193359375, -0.8046875, -0.416015625, -0.02734375, 0.361328125, 0.75, 1.138671875, 1.52734375, 1.916015625, 2.3046875, 2.693359375, 3.08203125, 3.470703125, 3.859375, 4.248046875, 4.63671875, 5.025390625, 5.4140625, 5.802734375, 6.19140625, 6.580078125, 6.96875, 7.357421875, 7.74609375, 8.134765625, 8.5234375, 8.912109375, 9.30078125, 9.689453125, 10.078125, 10.466796875, 10.85546875, 11.244140625, 11.6328125, 12.021484375, 12.41015625, 12.798828125, 13.1875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 7.0, 8.0, 15.0, 14.0, 22.0, 25.0, 41.0, 58.0, 86.0, 162.0, 269.0, 456.0, 703.0, 790.0, 536.0, 345.0, 184.0, 113.0, 69.0, 43.0, 36.0, 20.0, 11.0, 18.0, 8.0, 8.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.44921875, -7.20233154296875, -6.9554443359375, -6.70855712890625, -6.461669921875, -6.21478271484375, -5.9678955078125, -5.72100830078125, -5.47412109375, -5.22723388671875, -4.9803466796875, -4.73345947265625, -4.486572265625, -4.23968505859375, -3.9927978515625, -3.74591064453125, -3.4990234375, -3.25213623046875, -3.0052490234375, -2.75836181640625, -2.511474609375, -2.26458740234375, -2.0177001953125, -1.77081298828125, -1.52392578125, -1.27703857421875, -1.0301513671875, -0.78326416015625, -0.536376953125, -0.28948974609375, -0.0426025390625, 0.20428466796875, 0.451171875, 0.69805908203125, 0.9449462890625, 1.19183349609375, 1.438720703125, 1.68560791015625, 1.9324951171875, 2.17938232421875, 2.42626953125, 2.67315673828125, 2.9200439453125, 3.16693115234375, 3.413818359375, 3.66070556640625, 3.9075927734375, 4.15447998046875, 4.4013671875, 4.64825439453125, 4.8951416015625, 5.14202880859375, 5.388916015625, 5.63580322265625, 5.8826904296875, 6.12957763671875, 6.37646484375, 6.62335205078125, 6.8702392578125, 7.11712646484375, 7.364013671875, 7.61090087890625, 7.8577880859375, 8.10467529296875, 8.3515625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 13.0, 32.0, 159.0, 330.0, 300.0, 100.0, 34.0, 13.0, 7.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.35205078125, -63.04004669189453, -58.72804260253906, -54.416038513183594, -50.104034423828125, -45.792030334472656, -41.48002624511719, -37.16802215576172, -32.85601806640625, -28.54401397705078, -24.232009887695312, -19.920005798339844, -15.608001708984375, -11.295997619628906, -6.9839935302734375, -2.6719894409179688, 1.6400146484375, 5.952018737792969, 10.264022827148438, 14.576026916503906, 18.888031005859375, 23.200035095214844, 27.512039184570312, 31.82404327392578, 36.13604736328125, 40.44805145263672, 44.76005554199219, 49.072059631347656, 53.384063720703125, 57.696067810058594, 62.00807189941406, 66.32007598876953, 70.63209533691406, 74.94409942626953, 79.256103515625, 83.56810760498047, 87.88011169433594, 92.1921157836914, 96.50411987304688, 100.81612396240234, 105.12812805175781, 109.44013214111328, 113.75213623046875, 118.06414031982422, 122.37614440917969, 126.68814849853516, 131.00015258789062, 135.31216430664062, 139.62416076660156, 143.9361572265625, 148.2481689453125, 152.5601806640625, 156.87217712402344, 161.18417358398438, 165.49618530273438, 169.80819702148438, 174.1201934814453, 178.43218994140625, 182.74420166015625, 187.05621337890625, 191.3682098388672, 195.68020629882812, 199.99221801757812, 204.30422973632812, 208.61622619628906]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 12.0, 10.0, 15.0, 16.0, 18.0, 24.0, 39.0, 36.0, 38.0, 52.0, 56.0, 49.0, 56.0, 61.0, 48.0, 57.0, 46.0, 60.0, 47.0, 37.0, 41.0, 40.0, 27.0, 16.0, 19.0, 16.0, 14.0, 15.0, 6.0, 8.0, 7.0, 8.0, 1.0, 2.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.37263488769531, -41.01166534423828, -39.65069580078125, -38.289730072021484, -36.92876052856445, -35.56779098510742, -34.20682144165039, -32.845855712890625, -31.484886169433594, -30.123916625976562, -28.762948989868164, -27.401979446411133, -26.041011810302734, -24.680042266845703, -23.319072723388672, -21.958105087280273, -20.597135543823242, -19.23616600036621, -17.875198364257812, -16.51422882080078, -15.153261184692383, -13.792291641235352, -12.431323051452637, -11.070354461669922, -9.709385871887207, -8.348417282104492, -6.987448692321777, -5.626479625701904, -4.2655110359191895, -2.9045424461364746, -1.5435733795166016, -0.18260478973388672, 1.1783638000488281, 2.539332389831543, 3.900301218032837, 5.261270046234131, 6.622238636016846, 7.9832072257995605, 9.344176292419434, 10.705144882202148, 12.066113471984863, 13.427082061767578, 14.788050651550293, 16.149019241333008, 17.50998878479004, 18.870956420898438, 20.23192596435547, 21.5928955078125, 22.9538631439209, 24.31483268737793, 25.675800323486328, 27.03676986694336, 28.397737503051758, 29.75870704650879, 31.119674682617188, 32.48064422607422, 33.84161376953125, 35.20258331298828, 36.56355285644531, 37.92451858520508, 39.28548812866211, 40.64645767211914, 42.00742721557617, 43.36839294433594, 44.72936248779297]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 6.0, 2.0, 3.0, 18.0, 21.0, 30.0, 34.0, 38.0, 75.0, 102.0, 144.0, 222.0, 368.0, 520.0, 742.0, 1162.0, 1875.0, 2945.0, 4768.0, 7621.0, 12625.0, 22177.0, 39697.0, 74283.0, 142221.0, 243626.0, 221978.0, 122620.0, 64401.0, 34700.0, 19411.0, 11396.0, 6855.0, 4193.0, 2709.0, 1666.0, 1064.0, 761.0, 495.0, 317.0, 226.0, 162.0, 91.0, 59.0, 34.0, 32.0, 26.0, 13.0, 7.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-3.58203125, -3.473114013671875, -3.36419677734375, -3.255279541015625, -3.1463623046875, -3.037445068359375, -2.92852783203125, -2.819610595703125, -2.710693359375, -2.601776123046875, -2.49285888671875, -2.383941650390625, -2.2750244140625, -2.166107177734375, -2.05718994140625, -1.948272705078125, -1.83935546875, -1.730438232421875, -1.62152099609375, -1.512603759765625, -1.4036865234375, -1.294769287109375, -1.18585205078125, -1.076934814453125, -0.968017578125, -0.859100341796875, -0.75018310546875, -0.641265869140625, -0.5323486328125, -0.423431396484375, -0.31451416015625, -0.205596923828125, -0.0966796875, 0.012237548828125, 0.12115478515625, 0.230072021484375, 0.3389892578125, 0.447906494140625, 0.55682373046875, 0.665740966796875, 0.774658203125, 0.883575439453125, 0.99249267578125, 1.101409912109375, 1.2103271484375, 1.319244384765625, 1.42816162109375, 1.537078857421875, 1.64599609375, 1.754913330078125, 1.86383056640625, 1.972747802734375, 2.0816650390625, 2.190582275390625, 2.29949951171875, 2.408416748046875, 2.517333984375, 2.626251220703125, 2.73516845703125, 2.844085693359375, 2.9530029296875, 3.061920166015625, 3.17083740234375, 3.279754638671875, 3.388671875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 10.0, 10.0, 17.0, 21.0, 27.0, 24.0, 22.0, 33.0, 26.0, 36.0, 32.0, 32.0, 43.0, 30.0, 59.0, 47.0, 47.0, 46.0, 43.0, 45.0, 42.0, 40.0, 40.0, 33.0, 28.0, 25.0, 21.0, 25.0, 13.0, 14.0, 10.0, 8.0, 8.0, 7.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0546875, -2.953369140625, -2.85205078125, -2.750732421875, -2.6494140625, -2.548095703125, -2.44677734375, -2.345458984375, -2.244140625, -2.142822265625, -2.04150390625, -1.940185546875, -1.8388671875, -1.737548828125, -1.63623046875, -1.534912109375, -1.43359375, -1.332275390625, -1.23095703125, -1.129638671875, -1.0283203125, -0.927001953125, -0.82568359375, -0.724365234375, -0.623046875, -0.521728515625, -0.42041015625, -0.319091796875, -0.2177734375, -0.116455078125, -0.01513671875, 0.086181640625, 0.1875, 0.288818359375, 0.39013671875, 0.491455078125, 0.5927734375, 0.694091796875, 0.79541015625, 0.896728515625, 0.998046875, 1.099365234375, 1.20068359375, 1.302001953125, 1.4033203125, 1.504638671875, 1.60595703125, 1.707275390625, 1.80859375, 1.909912109375, 2.01123046875, 2.112548828125, 2.2138671875, 2.315185546875, 2.41650390625, 2.517822265625, 2.619140625, 2.720458984375, 2.82177734375, 2.923095703125, 3.0244140625, 3.125732421875, 3.22705078125, 3.328369140625, 3.4296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 6.0, 5.0, 9.0, 10.0, 11.0, 13.0, 16.0, 20.0, 35.0, 50.0, 71.0, 89.0, 149.0, 243.0, 377.0, 658.0, 1249.0, 2914.0, 11947.0, 114775.0, 843770.0, 59317.0, 7902.0, 2335.0, 1057.0, 546.0, 356.0, 207.0, 128.0, 75.0, 69.0, 41.0, 20.0, 28.0, 11.0, 12.0, 10.0, 12.0, 3.0, 3.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2734375, -11.8409423828125, -11.408447265625, -10.9759521484375, -10.54345703125, -10.1109619140625, -9.678466796875, -9.2459716796875, -8.8134765625, -8.3809814453125, -7.948486328125, -7.5159912109375, -7.08349609375, -6.6510009765625, -6.218505859375, -5.7860107421875, -5.353515625, -4.9210205078125, -4.488525390625, -4.0560302734375, -3.62353515625, -3.1910400390625, -2.758544921875, -2.3260498046875, -1.8935546875, -1.4610595703125, -1.028564453125, -0.5960693359375, -0.16357421875, 0.2689208984375, 0.701416015625, 1.1339111328125, 1.56640625, 1.9989013671875, 2.431396484375, 2.8638916015625, 3.29638671875, 3.7288818359375, 4.161376953125, 4.5938720703125, 5.0263671875, 5.4588623046875, 5.891357421875, 6.3238525390625, 6.75634765625, 7.1888427734375, 7.621337890625, 8.0538330078125, 8.486328125, 8.9188232421875, 9.351318359375, 9.7838134765625, 10.21630859375, 10.6488037109375, 11.081298828125, 11.5137939453125, 11.9462890625, 12.3787841796875, 12.811279296875, 13.2437744140625, 13.67626953125, 14.1087646484375, 14.541259765625, 14.9737548828125, 15.40625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 8.0, 11.0, 7.0, 13.0, 14.0, 23.0, 21.0, 29.0, 33.0, 30.0, 44.0, 58.0, 71.0, 63.0, 63.0, 63.0, 58.0, 60.0, 51.0, 41.0, 55.0, 39.0, 22.0, 17.0, 20.0, 30.0, 8.0, 11.0, 8.0, 6.0, 4.0, 1.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.2734375, -14.7833251953125, -14.293212890625, -13.8031005859375, -13.31298828125, -12.8228759765625, -12.332763671875, -11.8426513671875, -11.3525390625, -10.8624267578125, -10.372314453125, -9.8822021484375, -9.39208984375, -8.9019775390625, -8.411865234375, -7.9217529296875, -7.431640625, -6.9415283203125, -6.451416015625, -5.9613037109375, -5.47119140625, -4.9810791015625, -4.490966796875, -4.0008544921875, -3.5107421875, -3.0206298828125, -2.530517578125, -2.0404052734375, -1.55029296875, -1.0601806640625, -0.570068359375, -0.0799560546875, 0.41015625, 0.9002685546875, 1.390380859375, 1.8804931640625, 2.37060546875, 2.8607177734375, 3.350830078125, 3.8409423828125, 4.3310546875, 4.8211669921875, 5.311279296875, 5.8013916015625, 6.29150390625, 6.7816162109375, 7.271728515625, 7.7618408203125, 8.251953125, 8.7420654296875, 9.232177734375, 9.7222900390625, 10.21240234375, 10.7025146484375, 11.192626953125, 11.6827392578125, 12.1728515625, 12.6629638671875, 13.153076171875, 13.6431884765625, 14.13330078125, 14.6234130859375, 15.113525390625, 15.6036376953125, 16.09375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 8.0, 10.0, 17.0, 40.0, 78.0, 140.0, 318.0, 712.0, 2091.0, 7537.0, 43550.0, 795970.0, 173488.0, 18377.0, 4055.0, 1248.0, 481.0, 215.0, 91.0, 48.0, 23.0, 21.0, 13.0, 3.0, 3.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.810546875, -3.69427490234375, -3.5780029296875, -3.46173095703125, -3.345458984375, -3.22918701171875, -3.1129150390625, -2.99664306640625, -2.88037109375, -2.76409912109375, -2.6478271484375, -2.53155517578125, -2.415283203125, -2.29901123046875, -2.1827392578125, -2.06646728515625, -1.9501953125, -1.83392333984375, -1.7176513671875, -1.60137939453125, -1.485107421875, -1.36883544921875, -1.2525634765625, -1.13629150390625, -1.02001953125, -0.90374755859375, -0.7874755859375, -0.67120361328125, -0.554931640625, -0.43865966796875, -0.3223876953125, -0.20611572265625, -0.08984375, 0.02642822265625, 0.1427001953125, 0.25897216796875, 0.375244140625, 0.49151611328125, 0.6077880859375, 0.72406005859375, 0.84033203125, 0.95660400390625, 1.0728759765625, 1.18914794921875, 1.305419921875, 1.42169189453125, 1.5379638671875, 1.65423583984375, 1.7705078125, 1.88677978515625, 2.0030517578125, 2.11932373046875, 2.235595703125, 2.35186767578125, 2.4681396484375, 2.58441162109375, 2.70068359375, 2.81695556640625, 2.9332275390625, 3.04949951171875, 3.165771484375, 3.28204345703125, 3.3983154296875, 3.51458740234375, 3.630859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 6.0, 8.0, 9.0, 7.0, 8.0, 12.0, 10.0, 26.0, 34.0, 62.0, 50.0, 73.0, 100.0, 118.0, 98.0, 71.0, 69.0, 54.0, 33.0, 31.0, 21.0, 19.0, 22.0, 12.0, 13.0, 8.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008864402770996094, -0.0008594244718551636, -0.0008324086666107178, -0.000805392861366272, -0.0007783770561218262, -0.0007513612508773804, -0.0007243454456329346, -0.0006973296403884888, -0.000670313835144043, -0.0006432980298995972, -0.0006162822246551514, -0.0005892664194107056, -0.0005622506141662598, -0.000535234808921814, -0.0005082190036773682, -0.00048120319843292236, -0.00045418739318847656, -0.00042717158794403076, -0.00040015578269958496, -0.00037313997745513916, -0.00034612417221069336, -0.00031910836696624756, -0.00029209256172180176, -0.00026507675647735596, -0.00023806095123291016, -0.00021104514598846436, -0.00018402934074401855, -0.00015701353549957275, -0.00012999773025512695, -0.00010298192501068115, -7.596611976623535e-05, -4.895031452178955e-05, -2.193450927734375e-05, 5.081295967102051e-06, 3.209710121154785e-05, 5.911290645599365e-05, 8.612871170043945e-05, 0.00011314451694488525, 0.00014016032218933105, 0.00016717612743377686, 0.00019419193267822266, 0.00022120773792266846, 0.00024822354316711426, 0.00027523934841156006, 0.00030225515365600586, 0.00032927095890045166, 0.00035628676414489746, 0.00038330256938934326, 0.00041031837463378906, 0.00043733417987823486, 0.00046434998512268066, 0.0004913657903671265, 0.0005183815956115723, 0.0005453974008560181, 0.0005724132061004639, 0.0005994290113449097, 0.0006264448165893555, 0.0006534606218338013, 0.0006804764270782471, 0.0007074922323226929, 0.0007345080375671387, 0.0007615238428115845, 0.0007885396480560303, 0.0008155554533004761, 0.0008425712585449219]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 6.0, 7.0, 12.0, 25.0, 24.0, 48.0, 80.0, 121.0, 228.0, 545.0, 1173.0, 3419.0, 15907.0, 164603.0, 800621.0, 50771.0, 7329.0, 2105.0, 747.0, 352.0, 173.0, 111.0, 64.0, 31.0, 22.0, 14.0, 9.0, 8.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5546875, -3.456695556640625, -3.35870361328125, -3.260711669921875, -3.1627197265625, -3.064727783203125, -2.96673583984375, -2.868743896484375, -2.770751953125, -2.672760009765625, -2.57476806640625, -2.476776123046875, -2.3787841796875, -2.280792236328125, -2.18280029296875, -2.084808349609375, -1.98681640625, -1.888824462890625, -1.79083251953125, -1.692840576171875, -1.5948486328125, -1.496856689453125, -1.39886474609375, -1.300872802734375, -1.202880859375, -1.104888916015625, -1.00689697265625, -0.908905029296875, -0.8109130859375, -0.712921142578125, -0.61492919921875, -0.516937255859375, -0.4189453125, -0.320953369140625, -0.22296142578125, -0.124969482421875, -0.0269775390625, 0.071014404296875, 0.16900634765625, 0.266998291015625, 0.364990234375, 0.462982177734375, 0.56097412109375, 0.658966064453125, 0.7569580078125, 0.854949951171875, 0.95294189453125, 1.050933837890625, 1.14892578125, 1.246917724609375, 1.34490966796875, 1.442901611328125, 1.5408935546875, 1.638885498046875, 1.73687744140625, 1.834869384765625, 1.932861328125, 2.030853271484375, 2.12884521484375, 2.226837158203125, 2.3248291015625, 2.422821044921875, 2.52081298828125, 2.618804931640625, 2.716796875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 7.0, 7.0, 7.0, 13.0, 14.0, 18.0, 18.0, 32.0, 54.0, 52.0, 68.0, 79.0, 100.0, 107.0, 97.0, 86.0, 55.0, 38.0, 45.0, 27.0, 23.0, 14.0, 9.0, 8.0, 6.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.630859375, -2.54901123046875, -2.4671630859375, -2.38531494140625, -2.303466796875, -2.22161865234375, -2.1397705078125, -2.05792236328125, -1.97607421875, -1.89422607421875, -1.8123779296875, -1.73052978515625, -1.648681640625, -1.56683349609375, -1.4849853515625, -1.40313720703125, -1.3212890625, -1.23944091796875, -1.1575927734375, -1.07574462890625, -0.993896484375, -0.91204833984375, -0.8302001953125, -0.74835205078125, -0.66650390625, -0.58465576171875, -0.5028076171875, -0.42095947265625, -0.339111328125, -0.25726318359375, -0.1754150390625, -0.09356689453125, -0.01171875, 0.07012939453125, 0.1519775390625, 0.23382568359375, 0.315673828125, 0.39752197265625, 0.4793701171875, 0.56121826171875, 0.64306640625, 0.72491455078125, 0.8067626953125, 0.88861083984375, 0.970458984375, 1.05230712890625, 1.1341552734375, 1.21600341796875, 1.2978515625, 1.37969970703125, 1.4615478515625, 1.54339599609375, 1.625244140625, 1.70709228515625, 1.7889404296875, 1.87078857421875, 1.95263671875, 2.03448486328125, 2.1163330078125, 2.19818115234375, 2.280029296875, 2.36187744140625, 2.4437255859375, 2.52557373046875, 2.607421875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 12.0, 6.0, 16.0, 34.0, 65.0, 129.0, 317.0, 274.0, 79.0, 30.0, 25.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-112.8205795288086, -109.77059173583984, -106.7206039428711, -103.67061614990234, -100.62062072753906, -97.57063293457031, -94.52064514160156, -91.47065734863281, -88.42066955566406, -85.37068176269531, -82.32069396972656, -79.27070617675781, -76.22071838378906, -73.17072296142578, -70.12073516845703, -67.07074737548828, -64.02075958251953, -60.97077178955078, -57.92078399658203, -54.870792388916016, -51.820804595947266, -48.770816802978516, -45.7208251953125, -42.67083740234375, -39.620849609375, -36.57086181640625, -33.5208740234375, -30.470882415771484, -27.420894622802734, -24.370906829833984, -21.3209171295166, -18.27092742919922, -15.220947265625, -12.170958518981934, -9.120969772338867, -6.070981025695801, -3.0209922790527344, 0.02899646759033203, 3.0789852142333984, 6.128974914550781, 9.178962707519531, 12.228951454162598, 15.278940200805664, 18.328929901123047, 21.378917694091797, 24.428905487060547, 27.47889518737793, 30.528884887695312, 33.57887268066406, 36.62886047363281, 39.67884826660156, 42.72883987426758, 45.77882766723633, 48.82881546020508, 51.878807067871094, 54.928794860839844, 57.978782653808594, 61.028770446777344, 64.0787582397461, 67.12874603271484, 70.17874145507812, 73.22872924804688, 76.27871704101562, 79.32870483398438, 82.37869262695312]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 5.0, 6.0, 9.0, 8.0, 11.0, 10.0, 20.0, 16.0, 15.0, 13.0, 16.0, 27.0, 21.0, 24.0, 26.0, 25.0, 40.0, 47.0, 100.0, 133.0, 81.0, 44.0, 41.0, 20.0, 30.0, 25.0, 23.0, 19.0, 25.0, 19.0, 17.0, 8.0, 6.0, 11.0, 9.0, 7.0, 10.0, 8.0, 5.0, 3.0, 5.0, 5.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-41.20676803588867, -39.891212463378906, -38.575660705566406, -37.260108947753906, -35.94455337524414, -34.628997802734375, -33.313446044921875, -31.997892379760742, -30.68233871459961, -29.366785049438477, -28.051231384277344, -26.73567771911621, -25.420124053955078, -24.104570388793945, -22.789016723632812, -21.47346305847168, -20.157909393310547, -18.842355728149414, -17.52680206298828, -16.21124839782715, -14.895694732666016, -13.580141067504883, -12.26458740234375, -10.949033737182617, -9.633480072021484, -8.317926406860352, -7.002372741699219, -5.686819076538086, -4.371265411376953, -3.0557117462158203, -1.7401580810546875, -0.4246044158935547, 0.8909530639648438, 2.2065067291259766, 3.5220603942871094, 4.837614059448242, 6.153167724609375, 7.468721389770508, 8.78427505493164, 10.099828720092773, 11.415382385253906, 12.730936050415039, 14.046489715576172, 15.362043380737305, 16.677597045898438, 17.99315071105957, 19.308704376220703, 20.624258041381836, 21.93981170654297, 23.2553653717041, 24.570919036865234, 25.886472702026367, 27.2020263671875, 28.517580032348633, 29.833133697509766, 31.1486873626709, 32.46424102783203, 33.77979278564453, 35.0953483581543, 36.41090393066406, 37.72645568847656, 39.04200744628906, 40.35756301879883, 41.673118591308594, 42.988670349121094]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 5.0, 4.0, 6.0, 17.0, 19.0, 42.0, 52.0, 115.0, 171.0, 312.0, 615.0, 1255.0, 2795.0, 7271.0, 27220.0, 166877.0, 1314677.0, 2220905.0, 383903.0, 49074.0, 11493.0, 3976.0, 1718.0, 752.0, 404.0, 243.0, 148.0, 74.0, 46.0, 40.0, 21.0, 9.0, 8.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75, -5.55303955078125, -5.3560791015625, -5.15911865234375, -4.962158203125, -4.76519775390625, -4.5682373046875, -4.37127685546875, -4.17431640625, -3.97735595703125, -3.7803955078125, -3.58343505859375, -3.386474609375, -3.18951416015625, -2.9925537109375, -2.79559326171875, -2.5986328125, -2.40167236328125, -2.2047119140625, -2.00775146484375, -1.810791015625, -1.61383056640625, -1.4168701171875, -1.21990966796875, -1.02294921875, -0.82598876953125, -0.6290283203125, -0.43206787109375, -0.235107421875, -0.03814697265625, 0.1588134765625, 0.35577392578125, 0.552734375, 0.74969482421875, 0.9466552734375, 1.14361572265625, 1.340576171875, 1.53753662109375, 1.7344970703125, 1.93145751953125, 2.12841796875, 2.32537841796875, 2.5223388671875, 2.71929931640625, 2.916259765625, 3.11322021484375, 3.3101806640625, 3.50714111328125, 3.7041015625, 3.90106201171875, 4.0980224609375, 4.29498291015625, 4.491943359375, 4.68890380859375, 4.8858642578125, 5.08282470703125, 5.27978515625, 5.47674560546875, 5.6737060546875, 5.87066650390625, 6.067626953125, 6.26458740234375, 6.4615478515625, 6.65850830078125, 6.85546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 11.0, 6.0, 7.0, 13.0, 18.0, 17.0, 22.0, 31.0, 33.0, 30.0, 32.0, 35.0, 43.0, 40.0, 31.0, 53.0, 47.0, 51.0, 36.0, 49.0, 44.0, 43.0, 43.0, 44.0, 37.0, 31.0, 36.0, 19.0, 25.0, 22.0, 11.0, 12.0, 7.0, 4.0, 5.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9375, -2.83831787109375, -2.7391357421875, -2.63995361328125, -2.540771484375, -2.44158935546875, -2.3424072265625, -2.24322509765625, -2.14404296875, -2.04486083984375, -1.9456787109375, -1.84649658203125, -1.747314453125, -1.64813232421875, -1.5489501953125, -1.44976806640625, -1.3505859375, -1.25140380859375, -1.1522216796875, -1.05303955078125, -0.953857421875, -0.85467529296875, -0.7554931640625, -0.65631103515625, -0.55712890625, -0.45794677734375, -0.3587646484375, -0.25958251953125, -0.160400390625, -0.06121826171875, 0.0379638671875, 0.13714599609375, 0.236328125, 0.33551025390625, 0.4346923828125, 0.53387451171875, 0.633056640625, 0.73223876953125, 0.8314208984375, 0.93060302734375, 1.02978515625, 1.12896728515625, 1.2281494140625, 1.32733154296875, 1.426513671875, 1.52569580078125, 1.6248779296875, 1.72406005859375, 1.8232421875, 1.92242431640625, 2.0216064453125, 2.12078857421875, 2.219970703125, 2.31915283203125, 2.4183349609375, 2.51751708984375, 2.61669921875, 2.71588134765625, 2.8150634765625, 2.91424560546875, 3.013427734375, 3.11260986328125, 3.2117919921875, 3.31097412109375, 3.41015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 13.0, 21.0, 39.0, 57.0, 82.0, 192.0, 367.0, 1014.0, 3942.0, 77410.0, 4084710.0, 22732.0, 2393.0, 671.0, 283.0, 150.0, 94.0, 37.0, 24.0, 11.0, 13.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.65625, -32.779052734375, -31.90185546875, -31.024658203125, -30.1474609375, -29.270263671875, -28.39306640625, -27.515869140625, -26.638671875, -25.761474609375, -24.88427734375, -24.007080078125, -23.1298828125, -22.252685546875, -21.37548828125, -20.498291015625, -19.62109375, -18.743896484375, -17.86669921875, -16.989501953125, -16.1123046875, -15.235107421875, -14.35791015625, -13.480712890625, -12.603515625, -11.726318359375, -10.84912109375, -9.971923828125, -9.0947265625, -8.217529296875, -7.34033203125, -6.463134765625, -5.5859375, -4.708740234375, -3.83154296875, -2.954345703125, -2.0771484375, -1.199951171875, -0.32275390625, 0.554443359375, 1.431640625, 2.308837890625, 3.18603515625, 4.063232421875, 4.9404296875, 5.817626953125, 6.69482421875, 7.572021484375, 8.44921875, 9.326416015625, 10.20361328125, 11.080810546875, 11.9580078125, 12.835205078125, 13.71240234375, 14.589599609375, 15.466796875, 16.343994140625, 17.22119140625, 18.098388671875, 18.9755859375, 19.852783203125, 20.72998046875, 21.607177734375, 22.484375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 7.0, 8.0, 7.0, 5.0, 16.0, 18.0, 51.0, 73.0, 91.0, 157.0, 270.0, 414.0, 765.0, 902.0, 499.0, 306.0, 197.0, 116.0, 65.0, 36.0, 20.0, 23.0, 11.0, 12.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.578125, -20.1231689453125, -19.668212890625, -19.2132568359375, -18.75830078125, -18.3033447265625, -17.848388671875, -17.3934326171875, -16.9384765625, -16.4835205078125, -16.028564453125, -15.5736083984375, -15.11865234375, -14.6636962890625, -14.208740234375, -13.7537841796875, -13.298828125, -12.8438720703125, -12.388916015625, -11.9339599609375, -11.47900390625, -11.0240478515625, -10.569091796875, -10.1141357421875, -9.6591796875, -9.2042236328125, -8.749267578125, -8.2943115234375, -7.83935546875, -7.3843994140625, -6.929443359375, -6.4744873046875, -6.01953125, -5.5645751953125, -5.109619140625, -4.6546630859375, -4.19970703125, -3.7447509765625, -3.289794921875, -2.8348388671875, -2.3798828125, -1.9249267578125, -1.469970703125, -1.0150146484375, -0.56005859375, -0.1051025390625, 0.349853515625, 0.8048095703125, 1.259765625, 1.7147216796875, 2.169677734375, 2.6246337890625, 3.07958984375, 3.5345458984375, 3.989501953125, 4.4444580078125, 4.8994140625, 5.3543701171875, 5.809326171875, 6.2642822265625, 6.71923828125, 7.1741943359375, 7.629150390625, 8.0841064453125, 8.5390625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 13.0, 21.0, 57.0, 127.0, 257.0, 280.0, 141.0, 55.0, 23.0, 12.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-271.49066162109375, -265.58349609375, -259.6763000488281, -253.7691192626953, -247.8619384765625, -241.95477294921875, -236.04757690429688, -230.14041137695312, -224.2332305908203, -218.3260498046875, -212.4188690185547, -206.51168823242188, -200.60450744628906, -194.69732666015625, -188.7901611328125, -182.8829803466797, -176.97579956054688, -171.06861877441406, -165.16143798828125, -159.25425720214844, -153.34707641601562, -147.43991088867188, -141.53271484375, -135.62554931640625, -129.71835327148438, -123.81117248535156, -117.90399169921875, -111.99681091308594, -106.08963775634766, -100.18245697021484, -94.27527618408203, -88.36810302734375, -82.46092224121094, -76.55374145507812, -70.64656066894531, -64.7393798828125, -58.83220672607422, -52.925025939941406, -47.017845153808594, -41.11066818237305, -35.203487396240234, -29.296308517456055, -23.389129638671875, -17.481948852539062, -11.574769973754883, -5.667591094970703, 0.23958969116210938, 6.146766662597656, 12.053947448730469, 17.96112632751465, 23.868305206298828, 29.77548599243164, 35.68266296386719, 41.58984375, 47.49702453613281, 53.40420150756836, 59.31138229370117, 65.21855926513672, 71.12574005126953, 77.03292083740234, 82.94010162353516, 88.84727478027344, 94.75445556640625, 100.66163635253906, 106.56881713867188]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 12.0, 4.0, 2.0, 11.0, 7.0, 14.0, 20.0, 21.0, 30.0, 25.0, 31.0, 49.0, 37.0, 45.0, 58.0, 59.0, 72.0, 80.0, 60.0, 70.0, 48.0, 37.0, 34.0, 30.0, 25.0, 29.0, 19.0, 16.0, 11.0, 11.0, 9.0, 6.0, 4.0, 2.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.94343566894531, -62.73412322998047, -60.52481460571289, -58.31550216674805, -56.1061897277832, -53.896881103515625, -51.68756866455078, -49.47825622558594, -47.268943786621094, -45.05963134765625, -42.85032272338867, -40.64101028442383, -38.431697845458984, -36.222389221191406, -34.01307678222656, -31.80376434326172, -29.59445571899414, -27.38514518737793, -25.175832748413086, -22.966522216796875, -20.75720977783203, -18.54789924621582, -16.33858871459961, -14.129277229309082, -11.919965744018555, -9.710654258728027, -7.501343250274658, -5.292032241821289, -3.0827207565307617, -0.8734092712402344, 1.3359012603759766, 3.545212745666504, 5.754524230957031, 7.963835716247559, 10.173147201538086, 12.382457733154297, 14.591769218444824, 16.80108070373535, 19.010391235351562, 21.219703674316406, 23.429014205932617, 25.638324737548828, 27.847637176513672, 30.056947708129883, 32.266258239746094, 34.47557067871094, 36.68488311767578, 38.89419174194336, 41.1035041809082, 43.31281661987305, 45.522125244140625, 47.73143768310547, 49.94075012207031, 52.150062561035156, 54.359371185302734, 56.56868362426758, 58.777992248535156, 60.9873046875, 63.19661331176758, 65.40592956542969, 67.615234375, 69.82454681396484, 72.03385925292969, 74.24317169189453, 76.45248413085938]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 13.0, 21.0, 54.0, 83.0, 162.0, 380.0, 1052.0, 2877.0, 10171.0, 55326.0, 672194.0, 266555.0, 29923.0, 6438.0, 1983.0, 718.0, 313.0, 118.0, 74.0, 30.0, 19.0, 11.0, 11.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.09375, -8.7548828125, -8.416015625, -8.0771484375, -7.73828125, -7.3994140625, -7.060546875, -6.7216796875, -6.3828125, -6.0439453125, -5.705078125, -5.3662109375, -5.02734375, -4.6884765625, -4.349609375, -4.0107421875, -3.671875, -3.3330078125, -2.994140625, -2.6552734375, -2.31640625, -1.9775390625, -1.638671875, -1.2998046875, -0.9609375, -0.6220703125, -0.283203125, 0.0556640625, 0.39453125, 0.7333984375, 1.072265625, 1.4111328125, 1.75, 2.0888671875, 2.427734375, 2.7666015625, 3.10546875, 3.4443359375, 3.783203125, 4.1220703125, 4.4609375, 4.7998046875, 5.138671875, 5.4775390625, 5.81640625, 6.1552734375, 6.494140625, 6.8330078125, 7.171875, 7.5107421875, 7.849609375, 8.1884765625, 8.52734375, 8.8662109375, 9.205078125, 9.5439453125, 9.8828125, 10.2216796875, 10.560546875, 10.8994140625, 11.23828125, 11.5771484375, 11.916015625, 12.2548828125, 12.59375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 3.0, 7.0, 11.0, 7.0, 7.0, 10.0, 23.0, 20.0, 43.0, 31.0, 41.0, 59.0, 49.0, 61.0, 52.0, 69.0, 69.0, 69.0, 57.0, 54.0, 49.0, 45.0, 30.0, 34.0, 24.0, 16.0, 17.0, 11.0, 8.0, 8.0, 4.0, 6.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.400390625, -3.252532958984375, -3.10467529296875, -2.956817626953125, -2.8089599609375, -2.661102294921875, -2.51324462890625, -2.365386962890625, -2.217529296875, -2.069671630859375, -1.92181396484375, -1.773956298828125, -1.6260986328125, -1.478240966796875, -1.33038330078125, -1.182525634765625, -1.03466796875, -0.886810302734375, -0.73895263671875, -0.591094970703125, -0.4432373046875, -0.295379638671875, -0.14752197265625, 0.000335693359375, 0.148193359375, 0.296051025390625, 0.44390869140625, 0.591766357421875, 0.7396240234375, 0.887481689453125, 1.03533935546875, 1.183197021484375, 1.3310546875, 1.478912353515625, 1.62677001953125, 1.774627685546875, 1.9224853515625, 2.070343017578125, 2.21820068359375, 2.366058349609375, 2.513916015625, 2.661773681640625, 2.80963134765625, 2.957489013671875, 3.1053466796875, 3.253204345703125, 3.40106201171875, 3.548919677734375, 3.69677734375, 3.844635009765625, 3.99249267578125, 4.140350341796875, 4.2882080078125, 4.436065673828125, 4.58392333984375, 4.731781005859375, 4.879638671875, 5.027496337890625, 5.17535400390625, 5.323211669921875, 5.4710693359375, 5.618927001953125, 5.76678466796875, 5.914642333984375, 6.0625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 1.0, 5.0, 3.0, 8.0, 15.0, 21.0, 19.0, 28.0, 42.0, 49.0, 70.0, 120.0, 202.0, 301.0, 483.0, 907.0, 2317.0, 8018.0, 52593.0, 902499.0, 66600.0, 9311.0, 2462.0, 1038.0, 491.0, 325.0, 188.0, 137.0, 80.0, 51.0, 32.0, 37.0, 31.0, 17.0, 10.0, 6.0, 6.0, 3.0, 3.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.328125, -10.990478515625, -10.65283203125, -10.315185546875, -9.9775390625, -9.639892578125, -9.30224609375, -8.964599609375, -8.626953125, -8.289306640625, -7.95166015625, -7.614013671875, -7.2763671875, -6.938720703125, -6.60107421875, -6.263427734375, -5.92578125, -5.588134765625, -5.25048828125, -4.912841796875, -4.5751953125, -4.237548828125, -3.89990234375, -3.562255859375, -3.224609375, -2.886962890625, -2.54931640625, -2.211669921875, -1.8740234375, -1.536376953125, -1.19873046875, -0.861083984375, -0.5234375, -0.185791015625, 0.15185546875, 0.489501953125, 0.8271484375, 1.164794921875, 1.50244140625, 1.840087890625, 2.177734375, 2.515380859375, 2.85302734375, 3.190673828125, 3.5283203125, 3.865966796875, 4.20361328125, 4.541259765625, 4.87890625, 5.216552734375, 5.55419921875, 5.891845703125, 6.2294921875, 6.567138671875, 6.90478515625, 7.242431640625, 7.580078125, 7.917724609375, 8.25537109375, 8.593017578125, 8.9306640625, 9.268310546875, 9.60595703125, 9.943603515625, 10.28125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 7.0, 10.0, 8.0, 13.0, 12.0, 14.0, 21.0, 27.0, 32.0, 33.0, 41.0, 43.0, 63.0, 73.0, 107.0, 92.0, 73.0, 58.0, 37.0, 33.0, 27.0, 31.0, 24.0, 26.0, 24.0, 12.0, 12.0, 7.0, 10.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.15625, -21.5711669921875, -20.986083984375, -20.4010009765625, -19.81591796875, -19.2308349609375, -18.645751953125, -18.0606689453125, -17.4755859375, -16.8905029296875, -16.305419921875, -15.7203369140625, -15.13525390625, -14.5501708984375, -13.965087890625, -13.3800048828125, -12.794921875, -12.2098388671875, -11.624755859375, -11.0396728515625, -10.45458984375, -9.8695068359375, -9.284423828125, -8.6993408203125, -8.1142578125, -7.5291748046875, -6.944091796875, -6.3590087890625, -5.77392578125, -5.1888427734375, -4.603759765625, -4.0186767578125, -3.43359375, -2.8485107421875, -2.263427734375, -1.6783447265625, -1.09326171875, -0.5081787109375, 0.076904296875, 0.6619873046875, 1.2470703125, 1.8321533203125, 2.417236328125, 3.0023193359375, 3.58740234375, 4.1724853515625, 4.757568359375, 5.3426513671875, 5.927734375, 6.5128173828125, 7.097900390625, 7.6829833984375, 8.26806640625, 8.8531494140625, 9.438232421875, 10.0233154296875, 10.6083984375, 11.1934814453125, 11.778564453125, 12.3636474609375, 12.94873046875, 13.5338134765625, 14.118896484375, 14.7039794921875, 15.2890625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 9.0, 8.0, 10.0, 15.0, 16.0, 33.0, 47.0, 50.0, 81.0, 158.0, 283.0, 629.0, 1409.0, 4342.0, 18704.0, 212302.0, 778880.0, 23226.0, 5166.0, 1636.0, 692.0, 309.0, 201.0, 113.0, 70.0, 45.0, 29.0, 22.0, 17.0, 11.0, 7.0, 12.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9453125, -2.8658447265625, -2.786376953125, -2.7069091796875, -2.62744140625, -2.5479736328125, -2.468505859375, -2.3890380859375, -2.3095703125, -2.2301025390625, -2.150634765625, -2.0711669921875, -1.99169921875, -1.9122314453125, -1.832763671875, -1.7532958984375, -1.673828125, -1.5943603515625, -1.514892578125, -1.4354248046875, -1.35595703125, -1.2764892578125, -1.197021484375, -1.1175537109375, -1.0380859375, -0.9586181640625, -0.879150390625, -0.7996826171875, -0.72021484375, -0.6407470703125, -0.561279296875, -0.4818115234375, -0.40234375, -0.3228759765625, -0.243408203125, -0.1639404296875, -0.08447265625, -0.0050048828125, 0.074462890625, 0.1539306640625, 0.2333984375, 0.3128662109375, 0.392333984375, 0.4718017578125, 0.55126953125, 0.6307373046875, 0.710205078125, 0.7896728515625, 0.869140625, 0.9486083984375, 1.028076171875, 1.1075439453125, 1.18701171875, 1.2664794921875, 1.345947265625, 1.4254150390625, 1.5048828125, 1.5843505859375, 1.663818359375, 1.7432861328125, 1.82275390625, 1.9022216796875, 1.981689453125, 2.0611572265625, 2.140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 8.0, 11.0, 13.0, 17.0, 15.0, 43.0, 48.0, 80.0, 180.0, 205.0, 150.0, 78.0, 47.0, 22.0, 21.0, 19.0, 15.0, 7.0, 8.0, 6.0, 1.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013322830200195312, -0.0012976229190826416, -0.001262962818145752, -0.0012283027172088623, -0.0011936426162719727, -0.001158982515335083, -0.0011243224143981934, -0.0010896623134613037, -0.001055002212524414, -0.0010203421115875244, -0.0009856820106506348, -0.0009510219097137451, -0.0009163618087768555, -0.0008817017078399658, -0.0008470416069030762, -0.0008123815059661865, -0.0007777214050292969, -0.0007430613040924072, -0.0007084012031555176, -0.0006737411022186279, -0.0006390810012817383, -0.0006044209003448486, -0.000569760799407959, -0.0005351006984710693, -0.0005004405975341797, -0.00046578049659729004, -0.0004311203956604004, -0.00039646029472351074, -0.0003618001937866211, -0.00032714009284973145, -0.0002924799919128418, -0.00025781989097595215, -0.0002231597900390625, -0.00018849968910217285, -0.0001538395881652832, -0.00011917948722839355, -8.45193862915039e-05, -4.985928535461426e-05, -1.519918441772461e-05, 1.946091651916504e-05, 5.412101745605469e-05, 8.878111839294434e-05, 0.00012344121932983398, 0.00015810132026672363, 0.00019276142120361328, 0.00022742152214050293, 0.0002620816230773926, 0.0002967417240142822, 0.0003314018249511719, 0.0003660619258880615, 0.00040072202682495117, 0.0004353821277618408, 0.00047004222869873047, 0.0005047023296356201, 0.0005393624305725098, 0.0005740225315093994, 0.0006086826324462891, 0.0006433427333831787, 0.0006780028343200684, 0.000712662935256958, 0.0007473230361938477, 0.0007819831371307373, 0.000816643238067627, 0.0008513033390045166, 0.0008859634399414062]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 8.0, 8.0, 7.0, 14.0, 11.0, 23.0, 36.0, 73.0, 112.0, 172.0, 269.0, 535.0, 1064.0, 2526.0, 6272.0, 21351.0, 135353.0, 818746.0, 44238.0, 10845.0, 3699.0, 1518.0, 721.0, 383.0, 226.0, 125.0, 79.0, 58.0, 27.0, 17.0, 8.0, 11.0, 11.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380859375, -1.3351898193359375, -1.289520263671875, -1.2438507080078125, -1.19818115234375, -1.1525115966796875, -1.106842041015625, -1.0611724853515625, -1.0155029296875, -0.9698333740234375, -0.924163818359375, -0.8784942626953125, -0.83282470703125, -0.7871551513671875, -0.741485595703125, -0.6958160400390625, -0.650146484375, -0.6044769287109375, -0.558807373046875, -0.5131378173828125, -0.46746826171875, -0.4217987060546875, -0.376129150390625, -0.3304595947265625, -0.2847900390625, -0.2391204833984375, -0.193450927734375, -0.1477813720703125, -0.10211181640625, -0.0564422607421875, -0.010772705078125, 0.0348968505859375, 0.08056640625, 0.1262359619140625, 0.171905517578125, 0.2175750732421875, 0.26324462890625, 0.3089141845703125, 0.354583740234375, 0.4002532958984375, 0.4459228515625, 0.4915924072265625, 0.537261962890625, 0.5829315185546875, 0.62860107421875, 0.6742706298828125, 0.719940185546875, 0.7656097412109375, 0.811279296875, 0.8569488525390625, 0.902618408203125, 0.9482879638671875, 0.99395751953125, 1.0396270751953125, 1.085296630859375, 1.1309661865234375, 1.1766357421875, 1.2223052978515625, 1.267974853515625, 1.3136444091796875, 1.35931396484375, 1.4049835205078125, 1.450653076171875, 1.4963226318359375, 1.5419921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 9.0, 24.0, 23.0, 26.0, 47.0, 74.0, 88.0, 115.0, 139.0, 126.0, 96.0, 73.0, 45.0, 28.0, 21.0, 12.0, 8.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.212890625, -3.13348388671875, -3.0540771484375, -2.97467041015625, -2.895263671875, -2.81585693359375, -2.7364501953125, -2.65704345703125, -2.57763671875, -2.49822998046875, -2.4188232421875, -2.33941650390625, -2.260009765625, -2.18060302734375, -2.1011962890625, -2.02178955078125, -1.9423828125, -1.86297607421875, -1.7835693359375, -1.70416259765625, -1.624755859375, -1.54534912109375, -1.4659423828125, -1.38653564453125, -1.30712890625, -1.22772216796875, -1.1483154296875, -1.06890869140625, -0.989501953125, -0.91009521484375, -0.8306884765625, -0.75128173828125, -0.671875, -0.59246826171875, -0.5130615234375, -0.43365478515625, -0.354248046875, -0.27484130859375, -0.1954345703125, -0.11602783203125, -0.03662109375, 0.04278564453125, 0.1221923828125, 0.20159912109375, 0.281005859375, 0.36041259765625, 0.4398193359375, 0.51922607421875, 0.5986328125, 0.67803955078125, 0.7574462890625, 0.83685302734375, 0.916259765625, 0.99566650390625, 1.0750732421875, 1.15447998046875, 1.23388671875, 1.31329345703125, 1.3927001953125, 1.47210693359375, 1.551513671875, 1.63092041015625, 1.7103271484375, 1.78973388671875, 1.869140625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 12.0, 18.0, 21.0, 61.0, 88.0, 490.0, 158.0, 64.0, 43.0, 21.0, 14.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-88.9464340209961, -86.31135559082031, -83.67626953125, -81.04119110107422, -78.40611267089844, -75.77102661132812, -73.13594818115234, -70.50086975097656, -67.86578369140625, -65.23070526123047, -62.59562301635742, -59.960540771484375, -57.325462341308594, -54.69038009643555, -52.0552978515625, -49.42021942138672, -46.78514099121094, -44.15005874633789, -41.51498031616211, -38.87989807128906, -36.24481964111328, -33.609737396240234, -30.974655151367188, -28.339574813842773, -25.70449447631836, -23.069414138793945, -20.43433380126953, -17.799251556396484, -15.16417121887207, -12.529090881347656, -9.894009590148926, -7.258928298950195, -4.623847961425781, -1.988767147064209, 0.6463136672973633, 3.2813944816589355, 5.916475296020508, 8.551555633544922, 11.186636924743652, 13.821718215942383, 16.456798553466797, 19.09187889099121, 21.726959228515625, 24.362041473388672, 26.997121810913086, 29.6322021484375, 32.26728439331055, 34.902366638183594, 37.537445068359375, 40.17252731323242, 42.8076057434082, 45.44268798828125, 48.07776641845703, 50.71284866333008, 53.347930908203125, 55.983009338378906, 58.61809158325195, 61.253173828125, 63.88825225830078, 66.52333068847656, 69.15841674804688, 71.79349517822266, 74.42857360839844, 77.06365966796875, 79.69873809814453]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 5.0, 10.0, 15.0, 9.0, 12.0, 14.0, 19.0, 18.0, 24.0, 28.0, 38.0, 29.0, 68.0, 250.0, 189.0, 43.0, 23.0, 30.0, 22.0, 27.0, 16.0, 16.0, 16.0, 14.0, 12.0, 7.0, 8.0, 10.0, 7.0, 10.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.42938232421875, -47.82673263549805, -46.224082946777344, -44.621437072753906, -43.0187873840332, -41.4161376953125, -39.81349182128906, -38.21084213256836, -36.608192443847656, -35.00554275512695, -33.40289306640625, -31.800247192382812, -30.19759750366211, -28.594947814941406, -26.992300033569336, -25.389652252197266, -23.787002563476562, -22.18435287475586, -20.58170509338379, -18.97905731201172, -17.376407623291016, -15.773758888244629, -14.171110153198242, -12.568461418151855, -10.965812683105469, -9.363163948059082, -7.760515213012695, -6.157866477966309, -4.555217742919922, -2.952569007873535, -1.3499202728271484, 0.2527284622192383, 1.855377197265625, 3.4580259323120117, 5.060674667358398, 6.663323402404785, 8.265972137451172, 9.868620872497559, 11.471269607543945, 13.073918342590332, 14.676567077636719, 16.279216766357422, 17.881864547729492, 19.484512329101562, 21.087162017822266, 22.68981170654297, 24.29245948791504, 25.89510726928711, 27.497756958007812, 29.100406646728516, 30.703054428100586, 32.305702209472656, 33.90835189819336, 35.51100158691406, 37.1136474609375, 38.7162971496582, 40.318946838378906, 41.92159652709961, 43.52424621582031, 45.12689208984375, 46.72954177856445, 48.332191467285156, 49.934837341308594, 51.5374870300293, 53.14013671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 4.0, 6.0, 11.0, 8.0, 7.0, 12.0, 10.0, 14.0, 14.0, 17.0, 22.0, 21.0, 26.0, 44.0, 36.0, 63.0, 199.0, 155.0, 63.0, 29.0, 43.0, 34.0, 22.0, 24.0, 20.0, 24.0, 8.0, 11.0, 14.0, 4.0, 6.0, 7.0, 3.0, 1.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17578125, -3.065704345703125, -2.95562744140625, -2.845550537109375, -2.7354736328125, -2.625396728515625, -2.51531982421875, -2.405242919921875, -2.295166015625, -2.185089111328125, -2.07501220703125, -1.964935302734375, -1.8548583984375, -1.744781494140625, -1.63470458984375, -1.524627685546875, -1.41455078125, -1.304473876953125, -1.19439697265625, -1.084320068359375, -0.9742431640625, -0.864166259765625, -0.75408935546875, -0.644012451171875, -0.533935546875, -0.423858642578125, -0.31378173828125, -0.203704833984375, -0.0936279296875, 0.016448974609375, 0.12652587890625, 0.236602783203125, 0.3466796875, 0.456756591796875, 0.56683349609375, 0.676910400390625, 0.7869873046875, 0.897064208984375, 1.00714111328125, 1.117218017578125, 1.227294921875, 1.337371826171875, 1.44744873046875, 1.557525634765625, 1.6676025390625, 1.777679443359375, 1.88775634765625, 1.997833251953125, 2.10791015625, 2.217987060546875, 2.32806396484375, 2.438140869140625, 2.5482177734375, 2.658294677734375, 2.76837158203125, 2.878448486328125, 2.988525390625, 3.098602294921875, 3.20867919921875, 3.318756103515625, 3.4288330078125, 3.538909912109375, 3.64898681640625, 3.759063720703125, 3.869140625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 5.0, 2.0, 3.0, 5.0, 6.0, 6.0, 8.0, 13.0, 14.0, 21.0, 17.0, 53.0, 78.0, 113.0, 259.0, 784.0, 3204.0, 37919.0, 8337056.0, 6906.0, 1259.0, 429.0, 144.0, 90.0, 53.0, 35.0, 22.0, 10.0, 5.0, 13.0, 9.0, 5.0, 11.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-43.5997200012207, -42.20271301269531, -40.805702209472656, -39.40869140625, -38.01168441772461, -36.61467742919922, -35.21766662597656, -33.820655822753906, -32.423648834228516, -31.026639938354492, -29.62963104248047, -28.232622146606445, -26.835613250732422, -25.4386043548584, -24.041595458984375, -22.64458656311035, -21.247577667236328, -19.850568771362305, -18.45355987548828, -17.056550979614258, -15.659542083740234, -14.262533187866211, -12.865524291992188, -11.468515396118164, -10.07150650024414, -8.674497604370117, -7.277488708496094, -5.88047981262207, -4.483470916748047, -3.0864620208740234, -1.689453125, -0.29244422912597656, 1.1045646667480469, 2.5015735626220703, 3.8985824584960938, 5.295591354370117, 6.692600250244141, 8.089609146118164, 9.486618041992188, 10.883626937866211, 12.280635833740234, 13.677644729614258, 15.074653625488281, 16.471662521362305, 17.868671417236328, 19.26568031311035, 20.662689208984375, 22.0596981048584, 23.456707000732422, 24.853715896606445, 26.25072479248047, 27.647733688354492, 29.044742584228516, 30.44175148010254, 31.838760375976562, 33.23577117919922, 34.63277816772461, 36.02978515625, 37.426795959472656, 38.82380676269531, 40.2208137512207, 41.617820739746094, 43.01483154296875, 44.411842346191406, 45.8088493347168]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0, 5.0, 5.0, 7.0, 2.0, 7.0, 5.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 5.0, 1.0, 8.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.25627136230469, -44.149169921875, -43.04207229614258, -41.93497085571289, -40.82787322998047, -39.72077178955078, -38.613670349121094, -37.50657272338867, -36.399471282958984, -35.2923698425293, -34.185272216796875, -33.07817077636719, -31.971071243286133, -30.863971710205078, -29.75687026977539, -28.649770736694336, -27.54267120361328, -26.435571670532227, -25.328472137451172, -24.221370697021484, -23.11427116394043, -22.007171630859375, -20.900070190429688, -19.792970657348633, -18.685871124267578, -17.578771591186523, -16.47167205810547, -15.364570617675781, -14.257471084594727, -13.150371551513672, -12.0432710647583, -10.93617057800293, -9.829071044921875, -8.72197151184082, -7.614871025085449, -6.507771015167236, -5.400671005249023, -4.2935709953308105, -3.1864709854125977, -2.0793709754943848, -0.9722709655761719, 0.13482904434204102, 1.241929054260254, 2.349029064178467, 3.4561290740966797, 4.563229084014893, 5.6703290939331055, 6.777429103851318, 7.884529113769531, 8.991628646850586, 10.098729133605957, 11.205829620361328, 12.312929153442383, 13.420028686523438, 14.527129173278809, 15.63422966003418, 16.741329193115234, 17.84842872619629, 18.955528259277344, 20.06262969970703, 21.169729232788086, 22.27682876586914, 23.383930206298828, 24.491029739379883, 25.598129272460938]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 9.0, 9.0, 9.0, 23.0, 27.0, 27.0, 57.0, 80.0, 127.0, 210.0, 391.0, 915.0, 2516.0, 9041.0, 36967.0, 175911.0, 228504.0, 51993.0, 11781.0, 3439.0, 1087.0, 466.0, 245.0, 142.0, 96.0, 52.0, 35.0, 30.0, 16.0, 15.0, 4.0, 6.0, 4.0, 3.0, 6.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-43.09375, -41.8662109375, -40.638671875, -39.4111328125, -38.18359375, -36.9560546875, -35.728515625, -34.5009765625, -33.2734375, -32.0458984375, -30.818359375, -29.5908203125, -28.36328125, -27.1357421875, -25.908203125, -24.6806640625, -23.453125, -22.2255859375, -20.998046875, -19.7705078125, -18.54296875, -17.3154296875, -16.087890625, -14.8603515625, -13.6328125, -12.4052734375, -11.177734375, -9.9501953125, -8.72265625, -7.4951171875, -6.267578125, -5.0400390625, -3.8125, -2.5849609375, -1.357421875, -0.1298828125, 1.09765625, 2.3251953125, 3.552734375, 4.7802734375, 6.0078125, 7.2353515625, 8.462890625, 9.6904296875, 10.91796875, 12.1455078125, 13.373046875, 14.6005859375, 15.828125, 17.0556640625, 18.283203125, 19.5107421875, 20.73828125, 21.9658203125, 23.193359375, 24.4208984375, 25.6484375, 26.8759765625, 28.103515625, 29.3310546875, 30.55859375, 31.7861328125, 33.013671875, 34.2412109375, 35.46875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 9.0, 8.0, 13.0, 14.0, 22.0, 22.0, 25.0, 30.0, 23.0, 36.0, 40.0, 44.0, 48.0, 60.0, 68.0, 72.0, 62.0, 66.0, 62.0, 52.0, 42.0, 27.0, 35.0, 19.0, 26.0, 17.0, 11.0, 9.0, 7.0, 12.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.1328125, -4.00396728515625, -3.8751220703125, -3.74627685546875, -3.617431640625, -3.48858642578125, -3.3597412109375, -3.23089599609375, -3.10205078125, -2.97320556640625, -2.8443603515625, -2.71551513671875, -2.586669921875, -2.45782470703125, -2.3289794921875, -2.20013427734375, -2.0712890625, -1.94244384765625, -1.8135986328125, -1.68475341796875, -1.555908203125, -1.42706298828125, -1.2982177734375, -1.16937255859375, -1.04052734375, -0.91168212890625, -0.7828369140625, -0.65399169921875, -0.525146484375, -0.39630126953125, -0.2674560546875, -0.13861083984375, -0.009765625, 0.11907958984375, 0.2479248046875, 0.37677001953125, 0.505615234375, 0.63446044921875, 0.7633056640625, 0.89215087890625, 1.02099609375, 1.14984130859375, 1.2786865234375, 1.40753173828125, 1.536376953125, 1.66522216796875, 1.7940673828125, 1.92291259765625, 2.0517578125, 2.18060302734375, 2.3094482421875, 2.43829345703125, 2.567138671875, 2.69598388671875, 2.8248291015625, 2.95367431640625, 3.08251953125, 3.21136474609375, 3.3402099609375, 3.46905517578125, 3.597900390625, 3.72674560546875, 3.8555908203125, 3.98443603515625, 4.11328125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 5.0, 5.0, 12.0, 24.0, 38.0, 67.0, 113.0, 92.0, 66.0, 29.0, 12.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.6678352355957, -44.37339401245117, -43.07895278930664, -41.784507751464844, -40.49006652832031, -39.19562530517578, -37.90118408203125, -36.60674285888672, -35.31230163574219, -34.017860412597656, -32.723419189453125, -31.42897605895996, -30.134532928466797, -28.840091705322266, -27.545650482177734, -26.251209259033203, -24.956764221191406, -23.662322998046875, -22.36787986755371, -21.07343864440918, -19.778995513916016, -18.484554290771484, -17.190113067626953, -15.895670890808105, -14.601228713989258, -13.30678653717041, -12.012344360351562, -10.717903137207031, -9.423460960388184, -8.129018783569336, -6.8345770835876465, -5.540135383605957, -4.245689392089844, -2.951247453689575, -1.6568055152893066, -0.3623635768890381, 0.9320783615112305, 2.226520538330078, 3.5209622383117676, 4.815403938293457, 6.109846115112305, 7.404288291931152, 8.69873046875, 9.993171691894531, 11.287613868713379, 12.582056045532227, 13.876497268676758, 15.170939445495605, 16.465381622314453, 17.759822845458984, 19.05426597595215, 20.34870719909668, 21.643150329589844, 22.937591552734375, 24.232032775878906, 25.526473999023438, 26.8209171295166, 28.115358352661133, 29.409801483154297, 30.704242706298828, 31.99868392944336, 33.293128967285156, 34.58757019042969, 35.88201141357422, 37.17645263671875]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 3.0, 7.0, 5.0, 3.0, 3.0, 4.0, 13.0, 24.0, 30.0, 50.0, 67.0, 78.0, 69.0, 39.0, 22.0, 18.0, 15.0, 5.0, 3.0, 5.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-27.61479949951172, -26.92591667175293, -26.237035751342773, -25.548152923583984, -24.859272003173828, -24.17038917541504, -23.481508255004883, -22.792625427246094, -22.103744506835938, -21.41486167907715, -20.725980758666992, -20.037097930908203, -19.348217010498047, -18.659334182739258, -17.9704532623291, -17.281570434570312, -16.592689514160156, -15.903807640075684, -15.214925765991211, -14.526043891906738, -13.837162017822266, -13.148280143737793, -12.45939826965332, -11.770515441894531, -11.081632614135742, -10.39275074005127, -9.703868865966797, -9.014986991882324, -8.326105117797852, -7.637223243713379, -6.948340892791748, -6.259459018707275, -5.570577621459961, -4.881695747375488, -4.192813873291016, -3.503931760787964, -2.815049886703491, -2.1261680126190186, -1.4372859001159668, -0.7484040260314941, -0.059522151947021484, 0.629359781742096, 1.3182417154312134, 2.0071237087249756, 2.6960055828094482, 3.384887456893921, 4.073769569396973, 4.762651443481445, 5.451533317565918, 6.140415191650391, 6.829297065734863, 7.518178939819336, 8.207060813903809, 8.895942687988281, 9.58482551574707, 10.273706436157227, 10.962589263916016, 11.651471138000488, 12.340353012084961, 13.029234886169434, 13.718116760253906, 14.406998634338379, 15.095880508422852, 15.78476333618164, 16.473644256591797]}, "eval/loss": 4.40821647644043, "eval/wer": 1.907457358191194, "eval/runtime": 786.867, "eval/samples_per_second": 3.358, "eval/steps_per_second": 0.281}